import requests
# Base URL of the Ensembl REST API (no trailing slash; do_request adds the
# separators). HTTPS is used so requests and responses are encrypted in transit.
ensembl_server = 'https://rest.ensembl.org'
def do_request(server, service, *args, **kwargs):
    """Send a GET request to a REST service and return the decoded JSON body.

    The URL is built as ``server/service[/arg1[/arg2 ...]]``. Keyword
    arguments are forwarded as query-string parameters.

    Args:
        server: Base URL of the REST server, without a trailing slash.
        service: Endpoint path relative to ``server`` (e.g. 'info/species').
        *args: Extra path segments appended in order. ``None`` entries are
            skipped; any other value is formatted with ``%s``, so
            non-string segments (e.g. integers) are accepted.
        **kwargs: Query parameters, passed to ``requests.get`` as ``params``.

    Returns:
        The response body parsed from JSON.

    Raises:
        requests.HTTPError: If the server replies with a 4xx/5xx status.
        requests.Timeout: If the server does not respond within the timeout.
    """
    # Seconds to wait for the server before giving up; without a timeout
    # requests would block indefinitely on a stalled connection.
    timeout_seconds = 60
    url_params = ''.join('/%s' % a for a in args if a is not None)
    req = requests.get(
        '%s/%s%s' % (server, service, url_params),
        params=kwargs,
        headers={'Content-Type': 'application/json'},
        timeout=timeout_seconds,
    )
    # raise_for_status() is a no-op for successful responses, so no explicit
    # ``req.ok`` guard is needed.
    req.raise_for_status()
    return req.json()
# Ask the server for its species catalogue and print every species name,
# one per line.
answer = do_request(ensembl_server, 'info/species')
species_entries = answer['species']
for sp in species_entries:
    print(sp['name'])
saccharomyces_cerevisiae ciona_savignyi myotis_lucifugus taeniopygia_guttata sorex_araneus otolemur_garnettii macropus_eugenii erinaceus_europaeus anolis_carolinensis gadus_morhua dasypus_novemcinctus chlorocebus_sabaeus tursiops_truncatus mus_musculus bos_taurus monodelphis_domestica choloepus_hoffmanni sus_scrofa rattus_norvegicus caenorhabditis_elegans pteropus_vampyrus microcebus_murinus sarcophilus_harrisii ovis_aries papio_anubis pelodiscus_sinensis equus_caballus xiphophorus_maculatus macaca_mulatta astyanax_mexicanus latimeria_chalumnae ficedula_albicollis gasterosteus_aculeatus gorilla_gorilla oryctolagus_cuniculus oreochromis_niloticus echinops_telfairi nomascus_leucogenys homo_sapiens dipodomys_ordii lepisosteus_oculatus anas_platyrhynchos canis_familiaris callithrix_jacchus pongo_abelii ornithorhynchus_anatinus tetraodon_nigroviridis mustela_putorius_furo tarsius_syrichta vicugna_pacos meleagris_gallopavo xenopus_tropicalis ictidomys_tridecemlineatus cavia_porcellus takifugu_rubripes ochotona_princeps pan_troglodytes petromyzon_marinus ailuropoda_melanoleuca felis_catus procavia_capensis oryzias_latipes danio_rerio gallus_gallus tupaia_belangeri ciona_intestinalis loxodonta_africana poecilia_formosa drosophila_melanogaster Ancestral sequences
# Query the 'info/external_dbs' endpoint for homo_sapiens, restricted by the
# 'HGNC%' filter pattern, and show the raw result.
ext_dbs = do_request(
    ensembl_server,
    'info/external_dbs',
    'homo_sapiens',
    filter='HGNC%',
)
print(ext_dbs)
[{u'release': u'1', u'display_name': u'HGNC Symbol', u'name': u'HGNC', u'description': None}, {u'release': u'1', u'display_name': u'HGNC (automatic)', u'name': u'HGNC_automatic_gene', u'description': None}, {u'release': u'1', u'display_name': u'HGNC (automatic)', u'name': u'HGNC_automatic_transcript', u'description': None}, {u'release': u'1', u'display_name': u'HGNC (curated)', u'name': u'HGNC_curated_gene', u'description': None}, {u'release': u'1', u'display_name': u'HGNC (curated)', u'name': u'HGNC_curated_transcript', u'description': None}, {u'release': u'1', u'display_name': u'HGNC transcript name', u'name': u'HGNC_trans_name', u'description': u'transcript name from HGNC'}]
# Look up the symbol 'LCT' for homo_sapiens, show the full record, then keep
# its identifier for the follow-up sequence request.
answer = do_request(
    ensembl_server,
    'lookup/symbol',
    'homo_sapiens',
    'LCT',
)
print(answer)
lct_id = answer['id']
{u'assembly_name': u'GRCh38', u'display_name': u'LCT', u'description': u'lactase [Source:HGNC Symbol;Acc:HGNC:6530]', u'seq_region_name': u'2', u'logic_name': u'ensembl_havana_gene', u'object_type': u'Gene', u'start': 135787840, u'id': u'ENSG00000115850', u'source': u'ensembl_havana', u'db_type': u'core', u'biotype': u'protein_coding', u'end': 135837180, u'species': u'homo_sapiens', u'strand': -1}
# Fetch the sequence record for the identifier obtained from the LCT lookup
# and print it.
lct_seq = do_request(
    ensembl_server,
    'sequence/id',
    lct_id,
)
print(lct_seq)
{u'molecule': u'dna', u'id': u'ENSG00000115850', u'seq': u'GTTCCTAGAAAATGGAGCTGTCTTGGCATGTAGTCTTTATTGCCCTGCTAAGTTTTTCATGCTGGGGGTCAGACTGGGAGTCTGATAGAAATTTCATTTCCACCGCTGGTCCTCTAACCAATGACTTGCTGCACAACCTGAGTGGTCTCCTGGGAGACCAGAGTTCTAACTTTGTAGCAGGGGACAAAGACATGTATGTTTGTCACCAGCCACTGCCCACTTTCCTGCCAGAATACTTCAGCAGTCTCCATGCCAGTCAGATCACCCATTATAAGGTATTTCTGTCATGGGCACAGCTCCTCCCAGCAGGAAGCACCCAGAATCCAGACGAGAAAACAGTGCAGTGCTACCGGCGACTCCTCAAGGCCCTCAAGACTGCACGGCTTCAGCCCATGGTCATCCTGCACCACCAGACCCTCCCTGCCAGCACCCTCCGGAGAACCGAAGCCTTTGCTGACCTCTTCGCCGACTATGCCACATTCGCCTTCCACTCCTTCGGGGACCTAGTTGGGATCTGGTTCACCTTCAGTGACTTGGAGGAAGTGATCAAGGAGCTTCCCCACCAGGAATCAAGAGCGTCACAACTCCAGACCCTCAGTGATGCCCACAGAAAAGCCTATGAGATTTACCACGAAAGCTATGCTTTTCAGGGTGAGTACACATTGACCTGATGGTGACCCCTCGGCAACCTTCATCACACACCTTCCCCATCCTCCTTAGAGCAGATTCGACATTTCTCCCAACTCACCTTCAGCAGTCCTCTTATGTCTGTGCATAGGGAGAAATTAATATTGTAAATTGATTTCCCACTGGCGATAGGAAGGGGTAGCTAACATGGCAAAACACTCAGCATTTCCTTTGAAAAATATCTTTGAGGCTCACGCCTGTAATCCTAGCACTTTGGGAGGCCGAGGTGGGCGGATCACTTGAAGTCAGGAGTTCGAGACCAGCCTGGCCAATATGGCAAAACCCCGTCTCTACTAAAAATACCAAAATTAGCCAGGGATGGTAGCAGGCGCCTGTGATCCCAGCTACTCGGGAGGCTTAGGCAGGAGAATTGCTTGAACCCAGGAGGCAGATGTTGCAGTGAGCCGAAATCATGCCACTGTACTACAGCCTGTGCGACAGAGCAAGACACAATCTCAAAAAAAAAAAATATGTATACATATATATATATATATATATATATATATATATATATATACACACATGTATTTTTGAAATACCCCTTGCCCAGTCTTGAGTTGTGCAAGCACTGATTGTCTTTCTGTCTTCCTTTCCGTCTATGTCCTGCTACCCTGACTTGGAGGCAAAGTTTCGTGGTTTCCTGTCCTTCCCCCTCGGCTCCCCTATACTTACATGTCTTAGTTGGAGCTTACATTGCAGCTTGGGAGACAGACAAATACAAGATGAAACAATTATATATCACAGGATGAGGAGAGCACAACTGTAACTGTTCACATTCCTGCCTCCTAGGGGACTTGAAGTTCTGATCTGTAGGCCTAGGCTGAACCAGGACATTTGTGATTATAATCAATTCCCTAAGTGTATGTTAGGTACACCAATTTTGAGAATCAATTTTGGATTATATATGCTTTCTTGTTTTTATTATATACCATATACATACATATTTGTATATATAGTACCTGATATATATATATATATATATATATATATATATATATATATATATATATACTTCTATGTTCTACTTTTTCATTTTAACATAGTTTATGACTATATTCTCATTTTATTAAAAACTTGAGCCAGGCATGGTGGCTCATGCCTATAATCCCAGCACGTTAGGAGGCCAAGGCAGGGGGATTGCTTGAGGCCAGGAGTTGGAGACCAGCCTGGGCAACATAGAGAGCCACTATCTCTAAAATAATATAATAATTTACTCCAGTGCTGGAATAGTATTGCTTAAAACAAAAGAAAAAC
TTGAAAGCATAACTTTCAATGGTCTTTTAGGTTCCCATTGTATAAATGGAGCATAAAGTTTAAGGTATTTTCCTTATTTTTGTATGTTTATTCTAATTTTCACTAGTTACAAGTTATGTTGCAATGACATTCCTATCTATAAACTATTTCCCACCTTCTGATAAATTCTTTCTGACAGAATCTTAGAATTGAAACTACTAGGTGAAAAGATCTGCATTCTTTAAGATTTTAAAGCATGGTACTAAATTATTTTCCAGAAAAGTTGTAATCATTTATACGAACAGTTATAAAATTACTCTCTGACCCCATTCTGTCAGTTTCAAATGCTATATTTTATTACTAATTTGACAGCTGAAAACAGCTTATTTTCATGTCTTGTTAATTTGCATGTATTTGATTATAGAGACGTTAAACATTTTTTTCTTCTTCTTTTTTTTTTTTTTTTTTTTTTTGAGATGGAGTCTCACTCTTTTGTCCAGGCTGGAGTGCAGTGGTGTGATCTCGGCTCACTGCAACCTCTGCCTCCCGAGTTCAAGCAATTCTCCTGCCTCAGCCTTCCCAGTAGCTGGGATTACAGGCACGCACCACCACATCTGGCTAATTTTTGTATTTTTAGTAGAGATGGGGTTTCACCGTGTTGGCCAGGCTGGACTCAAACTTCTGATCTCAGGTGATCCGCCCGCCTCGGACTCCCAAAATGCTGGGATTACAGGCGTGAGCCACCACGCCCGGCCTTAAACAAAAAAATAAAATAAGGCCAGGCGTGGTGGTTCACGCTTGTAATCCCAGCACTTTGGGAGGCTGAGGCAGGCGGGTCACAAGGTCAGAAGATCGAGACCATCCTGGCTAACACGGTGAAACCCCATCTCTACTAAAAATACAAAAAATTAGCGAGGCGTGGTAGCACGTGTCTGTAGTCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCGCTTGAACCTGGGAGGCGGAGGTTGCAGTGAGCCGAGACTGCGCCATTGCACTCCAGCCTGGGCGACAGAGCGAGACTCTGTCTCAAAAATAAATGAAAAATAAACTAGGACATCATAGCTGCCTTATTCACAATAGCCAAAAGGTGGAAGCAACCCAGATATCCACTGATGGATGAATGGATAAACGAGACGTGGCATAGACATAAAATGGAATATTACTCCACATTTATTAAAAAGGGAAGAAATCATCACATGCTACAACATGGATGAACCTTGAGGACATTATGCTATGTGAAATAAGCCAGACACAAAAAGACAAACGCTGTATGATTCCATGTATAGGAGGAAACTAGAGCAGTCGAATTCATGGAGAGAGGAAGGAGAATGGCAGAGGCCAGGGGCTGGGGTAGGGGAGAAATGGAGAGCTCTTTAATGGGAGTAGAATTTCTGTTCAGAAAAATGAAAAAGTTCTGGAGATTGGTTGCACAACAATGTGAATATACTTAATAATACTGAACTGTGCACTTAAAAATAGTTAAGATGGCCGGGCGCGGTGGCTCACGCCTGTAATCCCAACACTTTGGGAGGCCAAGGCGGGCAGATCATGAGGTCAGGAGATCGAGACCATCCTGGCTAACCCGGTGCAACTCCGTCTCTACCAAAAATGCAAAAAATTAGCCGGGCGTGGTGGCGGGCCCCTGTAGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGCGTGAACGCGGGAGGCGGAGCTTTCAGTGAGCCGAGATGGCACGACTGCACTCCAGCCTGGGCGACGGAGCGAGACTCCGTCTCAAAAAAAAAAAAAAAAAAAAAAAGAAGTTTAGGAAGGAGTTCTCTCCTTGCCAACTCTCCAACTGCTCTGCATTTCATAGTCCTGATTTTCACAAAACACTCTCTAAAGGAACATTATTTTTTTAAGCCACCTTGTCTTCTAAAATCTTTCAGCTAGAGTAAAGTCATTTGGATGATTTCTTCAGGTCCATAGGAAATGAATCCCCCAGTGGTTTCCACAGTCAG
AGCCTCCTGCCCTCGCTCACCTGCTGTTCGTGTCTCTGGTTGGTTTCAGGCGGAAAACTCTCTGTTGTCCTGCGAGCTGAAGATATCCCGGAGCTCCTGCTAGAACCACCCATATCTGCGCTTGCCCAGGTGACAGCAGCCCAAAAATATACCTGTAACATCTGAGGAGAGTTTGATTTTAATTTTTTAAAAACAAGAGAAGTTTTGGTCTATTGGTTTGACATTTCTGTAAATGCCTCAGAATGAGTGGTGTATGTTCTCCAGGTTCATAATTACCTTAAAAACAAAATCTTGAAGCTGCAGCTCCTGCTTGGTCAAGTGTCAGCTTCCCTGCAGGAAGAAGCCACTTGCCTCTGCTGGCTCTGATTTTTGAGTCCAAAATAGCTTATAGGATAAGAGATGAGATTATGGCAAAACAGGTACTAGGGTAAAGGGGTTTTTCAAAAATGTGCACCTGGCCAAACACGGTGGCTCACTTCTGTAATCCCAGCACTTTGGGAGGCGGAGATGGGAGGGTTGTTTGAGCCAGGAGTTTGAGACCAGCCTGGGCAACATGGCAAAACTCCTTCTTTGCTAAAAATACAAAAATTAGCAAGGCATGGTGATGCATGCCTGTAGTTCCAGCTGCTCGGGAGGATGAGGTGGGAGGATTGCTTGAGCCCTGGAGGTCAAGGCTGCAGTGAACTGTGATCATGTCACTGCACTCCAGCCTGGGTGACACAGCAAGACCCTGTCTTGAAAAAAAAAAATTAAAAATGTACGTATATCCTCTATCACTTTTTATTTTTTATTTTTATTTATTTATTTTTTTACAGACAGGGTCTTGTGGCCTTGCTCTGTCACCCAGGCCAGAGTGCAGTGGCATGATCACAGCTCACTGCAGCCTCTACTTCCAACTCCTGGCCTTGAGCAATCCTCCCACCTCAGCCTCCCAAAGTGTCAGGATTACAGGCATGAGCCACCACACCCAGCCAACTATCACTTTTTAACTATAATTTATATTTTTTATTTTATTTTTTTTTTGAGATGGAGTTTCATTCTTGTTGCCCAGGCTGGAGTGCAGTGGCACGATCTCGGCTCACTGCAACCTCTACACCCTGGATTCAAGTGATTCTCCTGCCTCAGCCTCCCAAGTAGCTGGGATTACAGGTGTGCACCACCACGCCCGGCTAATTTTGTATTTTTAGTAGAGATGGGGTTTCACCATGTTGGTCAGGCTTGTCTCAAACTCCTGACCTCAGGTAATCCACCTGCCTCGGCCTCCCAAAGTGCTGGAATTACAGGCTTGAGCCACCACGCCAGCCTTTAACTATAATTTTTAAAAGAAAAATTAAAATAATCTGGGAAGTGAACAGCTTTGGGCCCCCTTGGGCAGCTGGGCAGTCTGGAAGCCATGGGAACCACCGCCGGTCTCCGTAGTTCTGCAGCATCGCCCTGGTGCTGTAGAGATGTTGTGCTGCTCATTGGCGTCTGTGCGTTGATGGGGGCCCCAGGAGTCAGGGTCTGGTCTTCAGATTTTCCATTTCAAACACGATGGAACCAAGACTGATAAGGTTCTGGAGGGACAACTCCCAGGCTGATTGCACGGCCAGAATGGCACCTAAATTAGTTTACAGAGGGCGATAACTGCTATCAGTTATGAACGCAGGAGACCAAAGTGCTGATCAGAAAAATGCTTGTCGAGAAATAGCCTTTGTACTGGTCTATCTGCCCCAGTCCATGCTGTGAAATGCTTCTGGGTCATCTCCCAAAAGCACAGTTCTGACCAGTTACCTGCTGGGAAGCCACACTTCCGAGTGGGACGAATCCCACAGGACCCTCCAGTGCATGAACGTGTGGGCCTCTCTCTCTGTCTCTCTCTGGCCTCACCTCCTATTTTGTCCATGTGAGTGCTATGCTTGCTTCCTACCCTCCTGCATCCCCTACTGGACGTCCTTCCTGTCTTCCTGCCTTCCTCAAATCTCCTTCCAGCAAAATTTTCTCCATTGTTAATGTACACG
TAACTGTGCTCTCCAGCTGAGGCCTCGCTCAGTAACACTCCCTCACTCACCCTGATGCACTCTGTCCCCACCCGGACCCTTAGCCATTGCTTTAGACCAGTGGTTCCCAAGCTTGAGTGGGCATCAGAACCACCTAGAGAGCTAGGAGAGAGCACGGAGACCAAGACTTAATGTGGTGGGACCCACCTGGGCCTGCACAGGCATCCGAAGTCCCCAGGTGAGTCTAATCCCCAGCAAGGCATGAGAACCACTGGTGTGGGCTTCTTACAGCACTTCTAAATTTCTGTCTTCTCCTCGTGTGATTGGTGCATTTGCTAACCCTCCCTATTAAAGGTGTAAACCTCTGTGGATATTATTTATCTCTAAATGTGAATCCCTACCCACCATCCCCACACAGTGTGACTTTCAGAGGTAGGAACTCAGTGACGATGTGTTGTGCAGAACTGACAGACATAAGGAAGAGCTGCGAGAGTGGGCAGGGAATGCTGGAGTGATACCTGCCAGTGTGGTCTTTAGTGAACACTGATGACAACTTGACTGAGAAAGAAACAGGGAGCCAGTAGTGAACCACTTATTAACCCATTTATGCCTGAGGCTGCAATTTTTTGAACTTTTGCAATCAGACCTTAGCGAAGACCTTGAGCAGTAGGATATAAGTAACTTCCACAGGCTTAGCATTCCCATAATGGAACACTAGGCATTCACAGAGCACTTGGTTCTGACCAGGTGACAGTAACCATTAGTCCTTGTCTTGAAGAAGCAGATGATCAGTGGGAGGGATAAGACAGGTAATGATCTAATCAGGCCAAGGGTAGACAGGTACGGCCAGCCAGGCTCGTGGAGGGGAGCGCAGCACTGGGGGTGTTGGCATGGTCCTGTGTAGACTCTGTGAATCTGAAGTTCTTTGAGCACATGCAGGCCAGAGACAGGGCAGAGGGGACATCCTCATCAGAAGTGTGGATGGGGGTGTCGACGACCAGGACCATGAGGGTTGTCTCTGCTAAAGAGGAAGTCCCCAGTGCGTACTCCACAGGCCCTAGCTCTTGGCCTGGCTAGGGATAACTGGGGGTGGACTTCAAACGGTGGCCTGAAATTTAAACCAAAACCAAACACCCGGTAGGATTCACAGGGATGACTGTGGAGCCATGCGTGGCTGAAGGCTCCACCACCCCCATCCTGGCCAAATGTGAGGGTCTATGGAGGAAGCACCAGGGGCAGCACTGGCCTCTAACTGCCTCCCATTTCTGGCATACACACTCCTTCACGCATTCATTTAGCCATCAACACTGCGTGCTTTCTGTGTGCTGAGCACAGAGGCGCATGGATGAGCACATAGGTGATGCATTCCCAACAACATACAGGCACAGGCACCCCCCGCCCCCTACACACACACACACACACACACACACTTTCTCATTCCATCTCCATCTTTTCCTTTGGAAAATCCTGCTTTGGAATATTTGGTTTAGTGATAAGGGGAGAAACAAAAAAGCGTACTTCTGAGAGGCTGTTAGTCTTGACAGTGCTTAGGTTCTAATGACCCTATTTAACTACTATTTTCAGGACACGGTCGATTTCCTCTCTCTTGATTTGTCTTATGAATGCCAAAATGAGGCAAGTCTGCGGCAGAAGCTGAGTAAATTGCAGGTAATTTGAGCCCTTTTCCACATTAATGATGAATGCAGCGAAGGTTTCAGAGAGCAGATTAGACATTTAATGCTTTGGCTACTGCATAAACTGAACTTCCATCAACAGCAGAGACCGGCTGAGTTGTGTCTGGGGAGATTTCCATTGCAAGCATCCCTAGAGAACATCGGATGTTAGGCAGTCTTTCCTAGAAGGGATACAAGGGTTAGCTTGTTAAGGTGAATATTTACATAGATCCTCTGCTTGCTTGTGTAGAAATCTGCCGAGAATTGAGATTCTGGGGTTCATTCTGAGTTTTAAAAAGGCAACTCATCAATGGGGGTGATGGTTCCATAACGATAAGCGTCCACTTA
ACACCACTGAACTATACATTTAATGGTTATGATGGTAATTTTTTTTTTTGAGATGGAGTCTTCCTCGGTTGCCCAGGCTGGGGTGCAGTGGCGTGATCTTGGCTCACTGCAGCCTCCACCTCCCGGGTTCAAGCGATTCTCCTGCCTCAGCCTCTCCAGTAGCTGAGATGACAGGAACACACAAACACGCCTGGCTAATTTTTGTATTTTTGGTAGAGGCAAGGATTCACCATGTTGGTCACGTTGGTCTCAAACTCCTGACCTAAAGTGATCCGCCCACCTTGGCCTCCCAAAGTGTTGGGATTACAGGCGTGAGCCACCACACCTGGCCTGTAAATTTCTTCTTTATGTCTATTTTACCACATTTTTAAAAAAACAAACATTTCACACCCAGGTCTACTAAATCAGATCCCAGCTGTCTGGACCTTCCAGTAAGCTCAGTACTCCCTCCTGTACCCAGTACTGCTTTTCTCAAGTCTAATGATGCGGGCTCATTAGAGAAAGTGTGTTAGGAGCCTCCTATCCAACTACCAGGTTTCTCTCTTAGGCTTGGTCACTGCTGTGTGACTTACTTGCTTCATTCCCTGGAGTCCCAACTATTCTCCTGTGACAAGGTCTATCTGATGGTGCCCACGTTTTCTCCTGCACCTTCCGAGTGCTGGCAGTATTCCTATAACCCTGGAGAGCTGCCTTCCTGTGGGCCTTTCCAAGGATGTCTGGCCACTGGTATGCACCCACATTGGACCCCCTGCCTCTTCAGGTTTGGGCACAAAACCACTCCCCGCTGCTTTCAGCCTGTGCCTCCCATGAGGGAGGCAGAGCAGCCCCCTACACTCACCTGTGGTTTTGAATCCCACCATCTCCGTCACCAAGGAGGATGGTTTACCTGAGGAATTATCCCTTTAAAGGCCAAGTTTGGCTAGGCACAGTGGCTCATGCCTGTAATCCCAGCACTTTGGGAGGCCGAGGTGGGTGGATCATGAGATCAAGAGATTAAGACCATCCTGGCCAACATGGCAAAAACCCATCTCTACTAAAAATACAAAAATTAGATGGGTGTGGTGGCACGCACCTGTAGTCTCAGCTACTTGGGAGGTGGAGGCAGGAGAATCACTTGAACCTGGGAGGCGGAGGTTGCAGCGAGCCAAGATTTCGCCACTGCACTCCAGCCTGGTGACAGAGCGAGACTCCATCTCAAAAATAAAAATAAAAATAAAAGGCCAAGCTCAGGAATGTCAAACTGAGCTTCAGCTACATGGACCCTCCATTTTACCTGAGGCAGAGTGCTTGAAATGGACAAATTAGCACCAGTCCTATCCCAATGTCTGTGTGTTTCTAGCTGTCTGTGTAGTAGACACTGCTGCTTTTGTTATCTACAAATAATAAGATGATCTAATTTAGGGGTCCCCAGCCCCCAGGCGGAGCACCAGTACTGGTCCATGGCCTGTTAGGAACCTGGCTGCACAGCAGGAGGTGAGTGGCAGGCGAGCAAGCATTACCACCTGAGTTCCACCTCCTGTCAGATCAGCGACCATATTAGATAGGAGCACAAACCCTATTGTGAACTGCGCATGCGAGGGATCCAGGTTGCGTGCTCCTTATGAGAATCAAATGCCTGATAATCTGAGGTGGAACAATTTCATCCCCAAATCATCCCCATCATCCCCCCTACCTCCCCCAAGTCTGTGGAAAAATTGTCTTCCACGAAACCGGTCCCTGGTGCCAAGAATGTTGGGGACCACTGATCTAATCAAAGGTGACAGATGCAGCCACAAAGACATCTGAGTAACAGCTATTTTAGTGCTTGCTTATCCCAGACACCTGGGAGGCACTTCATTCTCACATCATCTCAACCTCTCAAAACACACCCTAAGGTTTAAACAATTTAACCAAGGTGGTGAGCTCCAGGGTTGGGATTTGAACTAGGGCTTTCTCATTCTAAGACACCACACTGTCTTTTCAAAAGAAAAATAAGTCTCACATCTGTAATCCCAGCACTT
TGGGAGGTTGAGGCAGGCGGATCACTTGAGGCCAGGAGTTCAAGACCAGCCTGCCCAACATGGCGAAACCCCGTCTCTACTAAAAATACAAAAATTAACCAAGTATAGTGGCACGAACCTGTAATCCCAGCTCCTTGGGAGGCTGAGGCACAACAATCGCTTGAACCCGGGAGGTGGAGGTTGCAGTGAGCCGAGATGGCGCCACTGCACTCCAGCCCAGGGGACAGAGAGAGACTTGTCTCAAAAAAAAATAAAGAAAAAGAAAAAGAAGTCCAAGGGTTTGGAACATGATAATGAGGGTGGTATTTTTTAAATCACATATGATCAGTTTCAGTTGTTTTTGTGAATGCCTCACCTGAACCTAAACTTGCTTGCTGCCCAGGGCCTGTGCTTGCGGGCTGGCTGACAAGGTTTCTGGGCCTTACGTAACACTCTAGGGTCTTCGAGGTCTGCTTGTGCCTGTGATGACTAAAGCTGCCTTTTGTCCTCCTCATGGAATTAAACCAGAGCTTGTTGCTAGGCTAATGGGTTCAGACAAAGCTGCCATTTTAAAACCATCTCTGTTGTGCGGAGGTGGCGTGCCTCTGACAGGCAGCAGAGGCACTGCATGGCTGGTACTTGAGGATGTGATTTTCAGTCTCTTCCCTTTTTCCATCACAACATTTTTTTTTTAAGATGGAGTCTCGCTCTGTCACCCAGGCTGGAGTGCCCCGTGGCATGATCTCGGCTCACTGCAACCTGCACCTCTGGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCAAGTAGCTGGGACTACAGGTGCCCGCCACCATGCCTAGCTTTTTTTTTTTTTTTTTGTATTTGTAGCAGATACAGTGTTTCACCATGTTGGCTAGGCTGGTCTCGAACTCCTGGCCTCAAGTGATCCACCACCCCCCTCGACCTCCTAAAGTGCTGAGATTACAGGCATGAGCCACTGCACCTGGCTACCACATTTTCAAGACACTTCTACCAGTGTCTGGGTAAAGCACTGAAACTTCAGTCTGTAGCTGGCCAGCCAAATAGTAAAACTCTCCCTGGACAAACTTAGCAGCCATTTATAAATGTTCTGCAATGGTTATCTATTCCTTTTACTTCCTTGGGTAGGGTTGGCCCCTCAGAGGCAGCCTCAAAGATTCGGAAATGACAGCTGACAACCCCTGAGCTGGAGAGCACACTGTTCCTTCCTGGGATTGTGGTCTCATGCCTGGTAGCATTTCCCATGCACAGTTACCACACCCAGGACAGGGAGAACAGCTGAGCCTGCCCTGAGAACAGGGGCTGAGTTGTGTCCACAGGAGCCTGAATCGTGCTGCCCACCTTCCCAGTGTCCCCTCCCTCCCTGTCCTGGAACCCCACCCTCCCCTTGAAGGGGCCTCTTCCTGTGGGCTGCGAGGGAAGAGGGCGAAAGCAGGGCAGGGAGGAGCAGGCACCTGCCCCCATTCCCACCCTCTCCCCGGAGCACCTGCACAGCCCTCTCTGAGCCTCAGGGGCCCTCAGCGGCCACTCCCCAACGGCACACAGCTGTCTGAGGGCCTGAGAACAGCCTCAAGCCCAGAAATGAAGAGCTGCGGCACACTCCAGGGTTCTCGGTTCTGCAGGAGGCACACGAGGAGGTCCCCCATCCACTTATCAGAAAAAGCTGTGCTCCCAGGGAGTTCTCCGCTTGGCAGAAGACAGGCTGGGGGCCTCCGAGGCTCCTCTAGCTCTCCAGCCCTGGGACATCACCGGCTGCCTCATGGCATATCCGTCTTTCAGGAAGGAGAAAACCCTTGCTTCCCTAAGCACGCCACCCTGGGTCATTTGTCCCCACTGCATTGACCCAGCACAGGGAGGGATGAGGACTGTGTGGAGTCACAGCTCCACTAACTGCGCAGTCATGGGCAACCCGCTCGGCCTCTCGAGCTTCTGACTCCCCATCTGTAAAGAAAGTCACAGGTGGCTATGAGAAAGTAAAGACTATGCCTGGCTCCTTTTAAAG
TGGTTACTATTGGTATCTTTTGGTAGCTTTTAGTTGCTCAGAGGAGGAAAAAGTTACTGTGAGTAAAATGACCAAACTCCAAGCCCCGCAAAAAAGGTAATTTAAAGTGAAGTCAAACAGCATGTCAGCCCTGAGACGTTTTCCTTGATACTGAAATGGCTAGAAATAAGAAGAGGAAATTACATTTGCTTCCATTTTAATGATAACAGCTAATATAACTTTTCTTTTTCTTTTTTTTTTTTTTTTTGAGATGGAGCCTGGCTCTTGTTGCCCAGACTGAAGTGCAGCGGTTCACTGCAACCTCTGCCTCTTGAGTTCGAGCGATTCTCCTGTCTCAGCCTCCCAAGTAGCTGATATTACAGGCGTGCACCACCAAGCCCAGCTAATTTTTGTATTTTTGATAAAGACAGGGTTTCACCATGTTGATCAGGCTGGTCTCAAACTCCTGACCTCAGGTGATCCGCCCGCCTCAACTTCCCAAAGTGCTGGGATTATAGGCGTGAGCCACCACACCCGCTGGGCTGCTGTAACTTTTTGTTTTGGAAAATTTCTAACATCCAAAAGTAAAAAGAATGATGAACCCCTACGAAGCCATCTCCAGCTGCAAGAGCTATTATTGGCTCATAGCTAATCTTCTTTCACCTAACCTATAACTTCTATCTCCCAAACTAGATTTTTAATTAAAAAAAATTTTTTTTAGAGACAGGATCTTGCTCTGTCACCCAGGCTGGAGTGCAGTGGTGCAATCATAGCTCACTGCAGCCTTAAACTCCTGGGCTCAAGCGATCCTCCTGGCTCAGCCTCCCAAGTAGCTGGAACTACAGGCATGCACCACCACACCCAGCTAACCAAACTGGATTATTTTGAAGCAAATCCCAGACATCCATAGATGGTGGCCTCTTAACTAAGCTTCTTAAGTAGCACAGGCTCTGGATGTGAGCAGTGGCCTTGTTCCTGATCCTAACACCGTGCCTGGCTCTAAGAGGTGCCCTGTAAGCCTGTGATGAAAGAAGAGGTGAAGGTGGGGGTTGGTGGGGAGGGTAGACTATGTTATTGAAAATTGTAGATCTTTCTCCTTCAGAGTCTAGAGTTGACTCCTTTAATTAACTGAGATACTTAGAGGTCATTTCCAAAGCCAGAGTAAGTGCCACAGCTTCTCATCTTGAAACTCTGTCCCTGTTATCAAGATGCTTTCCAGGAGGCTTCAGTTCACTTGCTGGTCCTTCTCTTTTTCAGACCATTGAGCCAAAAGTGAAAGTTTTCATCTTCAACCTAAAACTCCCAGACTGCCCCTCCACCATGAAGAACCCAGCCAGTCTGCTCTTCAGCCTTTTTGAAGGTGAGTGGGCCATTGCTGAAGAGGTTTTGAGTGACATCTGGTGCACTGGTGTGCTAGGTAGCAGTCTTGAAAGTCCGGGGTTCCAATGGGAGGAGGAGCATGGGAGGAAGACTAGTATAAAAGCCCACCCCAGACTGGGTTAGTGTACTATGCCTTCCTACTGATGGTCCCTTGCAACCATCCCCCATTGACCCAAGAAAGAGGAGAGGTTCGACACAAGGATGCCTCTTATGGACATAAAGATAGTTAGGCCTCAGCTGTGAGTTGTAAGCATGGAAAATCATCTTTGCCTCCTTTTATTACCTCTCCCTCCAAGGTCTCTCATCTCTGCTCCTCTTGGCAGGGCTTTCCTCTGCCCGTCTCTCTCCAGCCAGCCCTCTCCACTTACCCTTGTTCCATGTCCCCATTATCTCAGTTTGCACATGGCCCTGGTGGGTACCTGACCAAGATGCTAAGAACTTTCAAGTGTAGGACTCACAGCTCAAGGGCCATCTTCCTAGTGTCTCTTAGTTCAAATTCTTGAAAGTGAATCTGATTGTTGGCCATGGATCAGGAGGCTGCTTCTGGTCCAATCAAGTCAGGGGAAAGGTGGGGTCTATGATAGCATTGAGGCTGGCAGTCACTGGAGACTCTGCAAGAAGGGAGGAAGGGGCAGAGAGGA
ATGTGCCTGAGGGCCCTGATATTCACTCTTGTCTGTCTGTCACTCTTGTCCATAGGCCAGAGTATGGGAGAAGTCAGTAGTGTTCTTTCTACCACTGTGTCTTAGTCTGTCTTGTGTTGCTATAATAGAATACTCTAGACTGCGTAATTTATAGAGAAAAAAGGTTTATTTAGCTCATGGTTCTGGGGACTGGGAAGTTCAAGATCAGGCAGCCACATCTGGTCAGCTTCTGGTGAGGGCCTCATGCTGCATCCTAACCTGGCAGAGAAGTGGAAGGGGAAGGAAGTGCCTGCAAACAGATAAAACACCAGAAGCAGCCTCACTTTATAACAACCACTGTATGGTAACTAATCCAGTCCCACTAGAATGGGAACTCACTCACTCCCTGGAGACTGCACTAATCCCTGAAGGCGGATCCCTCATGACCCAAATGCCTCTTAAAAGTCCATAACCTCTCAATAATGTTACACTGGCAATTAAATTTCAACATGAGTTTTTGTAGGGACAAACCACATCCAAACCATAGCACACCTGGACCCCATCCCAGCAATGGGTTGGCTCCACAGGGCCCCTGAAGTTTATCCATAGATACCATTTAATAATGCTTATCTGAACTCACCTTTGATGGCATAACAATTTCTGTTCTTAGATCCCACCTCTCTCTAAGTGGTTAAAATTGTACCTTTTCTGTTTATGCGTATTTTACCACAATTTTAAAAATATTCCACCCCTTTCTGATCTTTGAGTTCTTCTAAATCAATTGTTCCCAAAGTTGTGGTCCCCAGACCAGCAGCATCAACATTAGCATCACCTGGGAGCTCATTAGAAATGCATATTCTTGAGCCCTACTTGAGACCTACTGCATCAGACACTCTTGGGGTGGGACCAGCAACCTGTGTTTTAACAAGCTCTACAGATGATTTTGATTCACCTTGAAGTTTGAGAACCACTTTTAAGTAATAAGTAAGTAGAATTCACTTCTAAGCTTTTAAAGTCGTTAGCCCATGGTATTTTCCAAAGGGGCTTGGAACCACTGCTTGGAGTTTGGGTGTGTCGTATGAGCGAGGAAAACTGTTGATTTCAGACTTGCATGTTCTTAGTTGGCATTTACATAGAGTTAATTCAATTTCTTCTCTTACAGCCATAAATAAAGACCAAGTGCTCACCATTGGGTTTGATATTAATGAGTTTCTGAGTTGTTCATCAAGTTCCAAGAAAAGGTAATGTCAGGTTGCCTATTGAACTATCAATAACTGATATTTGTAGAATACTCTGTTTCTTTTACATGTATAATCTTATAGGACTGTTGTCATCAACTCTTGGGCCACCAAGTTGTTTATTGCCATTCAATTGATGAGAAACAAAGACTCAGAAAGAAAGTAGGGAGTCTCTTACTGAGTGGGACTCACGAGGTTCTGCTTTCTCATCTGTCAGTTCGCCCAACTGTGCGCAACTAGCATGATGGCTCACACCTGTAATCCCAGCACTCTGGTAGGCAAAGGTGGGAAGATTGCTTGAGTCCAGGAGTTCAAGACTGGGCTGGGCAACATGGTGAAACTCTGTCTCTACAAAAAATTACAAAAATACAAAAATTAGCCAGGCATAGTGGTGCATGCCTATGGTCCCAGCTACTTGGGAGACTGAGGTCAGAGGATCGCTTGAGCCCAGGAGGCAGAAGGTGCTGTGAGCCGAGATTGTGCCACTGCACCAGCTAGGATTTGAACTCCTGCCTTCTAGTTTAAGATCTTGCTGGAGACAGTGTGAGCTTGTGGAAGAGTGGCCAGGTTAAAGATAGATCTGACCATCCCACTGAAGTTACATGATGAGTAAGAGAAATGGGTTCTCTGTGCCCATTTCCTCAATATGAAGGGTGAAACATCCTCCCTGGAAGGAGACAGCATAGACAGGAAAGCCAGCTGTTGCTGCAAGCCAGATGCCTAACTTGACAACATTCTAGGGACAGAGGTTTGAATCTATGGTGGGGTTGTAAATAATATCTT
ACTGAGTGACTCAAGTGCCAAAGTTTGCAAATGATATGCTTTAAAAAATTAGAGCAGATTGCCGGGCACGGTGGCTCACGCCTGTAATCCCAGAACTTTGGGAGGCTGAGGCGGGTGGATCACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACAGTGAAACCCCGTCTCTACTAAAAATACAAAAAAATTAGCCGGGCATGGTGGCGGGCGCCTGTATTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGTGTGAACCCTGGAGGCAGAGCTTGCAGTGAGCTGAGATCGCGCCATTGCACTCCAGCCTGGGTGATGGAGCGAGACTCCATCTCCAAAAAAAAAAAAAATTAGAGCAGGTTTTGAGGTTGTGCCCATAATTACATTGCTTTCATGCACGCATATCCCAATACGCTCTTGAGTGAATGAGAAAAGAATGGCATGGTAGCCAGCACTGGGAATTGCCCAGAACCTCAGCGCTCCTGGAGGGATGTTACATGCATGAAGTTCATGCACCATCCCTTAGGGTGGGACAAAAGCTGGAGACAATAATTGACTTCCAGACCTTCAACTAGAGTTCTCTTTGTCACTCACCTCTGATATTTCCAGTGCAGCCCTGTTCAGGGTCATTCAGTGCCAACACCTCTTTGTACCTTTCCTCTTCCAGTACTTGACTGTCCTGAGCCATATCCTCCTTCTATTGTTCCATCCTCTCAATCCACTTCAAATCAGCAGTTCAGATCAACAGACCCGCAGCAGCAGCTGTACCTCAGGCTTTGTGTGGCAGTGTAGACTTGCAATAGACAGACATGGGTTACCACTGCTTCCTGACCACACTTGGAGTCAGCCAAGAAGGACTGGCTGTGGCTTCACAAAAGAAAACTCAAGAAGCCGTAATAAAATGGGTTCCCTGAAAAGCCAGTGATTACAAGTGACACCAGCTCGGAGATTCTCTCAGCGCTTGGTGGTGCTTTGCCTGAAGGGGAGGGCCAACACAGGCTTACATTAAACGGACAGCCAGGGGCCCCTACTCAGGAGGATGTGGTTGGAGAACCCGCTGAATGCAGGGGCGGTGGGTGGGGAGTGATTCAGAAATGACTAACGTAGTTTTCTCCTTCAGAATTCTAGACCTTATAGGGGAGACAGAGCGGCCCCTGAACAACTCTCACATGAGAATGTGGCAGGAGACACACAGCACTGCACCCTAAAAAAGGGAGAACTTAGGAGCCCTGGGTGTGGAGCCTGAGGTGCCGTCATGTGCTAAATCCCTCTCCATGGCCGGCAAACCCAGGGTTCCCAGCTCCAAGCCTGTACAGCAAGTTCTGTTTCATCCCAGGGCAGTTTATTTGTTTCCTTAAAACTCTTCATGCAATCCAGGAGGACAGTCAGGGCCAGGAGGGCTGGGTAAGAGCGAGGTTCGGAGCAGCGGACGCTGTGTTTATGGGCACCGTGGATACGCAGAGGCTGAGCACCGAGGGGACGCGACACATCCCCAGCTGCGATCCACAGTCGCATATGTTTTGGGATCATCTACGAAGGAAAGGATCATTTCCCTTTCCCCCTAATCTAGCAAATGTCAGGGAGTTGATGCTGAGTGAAACAGAAGGCTCTTAGGTTCGGAAGACGCCTCCTGCTGGGTGACCCGGCCCCAGGCTTCGCTTTTTGAGAGGAAGATCCCTGTGCAGTGTTCCTGTCACTTCTCCCAGTTCTGCGCTGTGGGCCAGCCTGGTATAGGTGCCATCGGCTCTCCACACGATGGCTGTGTGACAGGGAGATGCTCTTGTACTCCACGTCCTTTTCCCCAGGCATGTGCCACACTCCTCAAGGCCGACCTCTGCTGGCTGTAATTTGCAGCATGCATGCTTTCCTGCCTGCATGACATGACTCAATTTAGAAGTTGGCAATCACAATTGAAAAAAAAGAAAGAAAAAAGAGGAAAGGAGAGTGGGAGGGAGGAAAATGGACTAGAATAAAATAGAAAAATCAGACCACAT
TTTGTATAAATGCAGCATGCACTTTTATGTGATGTTTTATTTCATATGCATATACATATGTACATGCATATACATGCACATAAACATGTATGTGTATGAGGTTAAAAGCACAGAATCTGCTCCACCACCTGCAAGCTGTGTGCAAGGAGAAGTTACTCATAATCACCAGGAATCCAGGCTCCTTTGTTGTTGCTTTGTCACCTTTAACAAGGTTTCTACCTCATGGTTCAGGATGGATGCTTGAGCTCCTGCCATTATGTCAGAAATCCAAGCAGCATGAAGAAAGGAAGCAGTAGCCAGGACTGATATTCAACTGGTCCACATCAGTGTACTTCTGTACCAGCTGATAAATAGCTGCTGGCTCCCTGAAATCAGGAAGTTTTCCATTTCTTTTTCTTTTTTTAGACGGAGTTTCACTCTTGTTGCCCAGGCTGGAGTGCAATGGCGTGATCTCAGCTCACCACAACCTCTGCCTCCCGGGTTCAAGTGATTCTCCTGCTTCAGCCTCCTGAGTAGCTGGGATTACAGGCCCCCACCACCACGCCTGGCTAATTTTGTATTTTTAGTAGAGACGGGGTTTCCCCATGTTGGTCAGTCTGGTCTCGAACTTCTGACCTCGTGATCCACCTGCCTCGGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCCACCACACCCAGCCCCCGTTTCTTTTAGTCTCAGTTTCCTCCTGTGTAGGATGAGGATAAATCATTGTAGTACCCATCTCATAAATTTGTTGGGAAAATTAAATGAGATAATACACATCCATTCTTATTACAGTGGCCAGCGCAGAATCAAGGCTCAATAAATTGGAGTCATTGTTATTATTAGCTATGTTTTACAAATAATGAATTATAAGAAGAATAAAGTATGGTACTAACACTGAAGACAATATTCAAGGGCAATCTAATACAGAGAACAGTAGCATTGTTCCTGTTTTAACCATGAAAGAGCAAGAATCACTCACCTCAGAAGGGGTAATAATAATAATTTTCCCATCTGCCAGTTACTTCCTGCCCATGGCTTTGCAGATATGACTTTTGACTCAGTGTTTCTGGAATCTTTTCTGATTAAACACAGTAGTCATCCGTAGGGGGCATTTGTAACTGCCAGCGTCATTCATTATTATGTCCCTTTTTGTCCCTTCAATCCTGCAGCATGTCTTGTTCTCTGACTGGCAGCCTGGCCCTTCAGCCTGACCAGCAGCAGGACCACGAGACCACGGACTCCTCTCCTGCCTCTGCCTATCAGAGAATCTGGGAAGCATTTGCCAATCAGTCCAGGGCGGAAAGGGATGCCTTCCTGCAGGATACTTTCCCTGAAGGCTTCCTCTGGGGTGCCTCCACAGGAGCCTTTAACGTGGAAGGAGGCTGGGCCGAGGGTGGGAGAGGGGTGAGCATCTGGGATCCACGCAGGCCCCTGAACACCACTGAGGGCCAAGCGACGCTGGAGGTGGCCAGCGACAGTTACCACAAGGTAGCCTCTGACGTCGCCCTGCTTTGCGGCCTCCGGGCTCAGGTGTACAAGTTCTCCATCTCCTGGTCCCGGATCTTCCCCATGGGGCACGGGAGCAGCCCCAGCCTCCCAGGCGTTGCCTACTACAACAAGCTGATTGACAGGCTACAGGATGCGGGCATCGAGCCCATGGCCACGCTGTTCCACTGGGACCTGCCTCAGGCCCTGCAGGATCATGGTGGATGGCAGAATGAGAGCGTGGTGGATGCCTTCCTGGACTATGCGGCCTTCTGCTTCTCCACATTTGGGGACCGTGTGAAGCTGTGGGTGACCTTCCATGAGCCGTGGGTGATGAGCTACGCAGGCTATGGCACCGGCCAGCACCCTCCCGGCATCTCTGACCCAGGAGTGGCCTCTTTTAAGGTACTTCCCAACCCTGCAGCTCCTACTAATTGGAGGAGAAAGGACATTGGCTGGAAGAAAGTCATTTTCTCTGTTTTCTTCCATCAGCAAGCCTTTACTTT
TTGTTCTTTCTTTAAAGGAAATCGGGGAGGGAAGGAACCATAAATTGTTAATTAAATTGTTAATCACCTGGCCAGGTGCAGTGGCTCATGCCAGTAATCTCTTCACTGTGGGAGGCCAAGGCAGGCAGATTTCTTGAGTCCAGGAGTTCGAGACCAGACTGGGCAACATGGCGAAATCTTGTCTCTGCAAAAAAAATACAAAAATTAGCTGGGCATAGTGTTGCACGCCTGTGATCCCACCTACCCAGGAGACTGAGGTGGGAGGATCGCTTGAGCCTGGTATGCAGAGGCTGCAGTGAGCCAAGATTTTGCCACTGCACTCCAGCCTGGTCAACAGAGCAAGACCCTGTCTCAAAAAAAAAAAAAAATTGTTAATCACCTTATTTTGTCCAGACCCTCTACTGGTACTTTTAAAATATAATAGTTATTACATACTCAGAATAGCACTGATGGATGAGTGAGGCTCAGACAGGATAAACAATGTGGTCATGATGACATTGCTAGTGAGTAGCCAGGTGGAAGTCAGGATTTGAGTCCGAGTCTTCTTGACTCCAAATCAAGTTCCTCATGTCAGTGACAAGTGACAGAAAGCTCAACCCAAAGTGACTTAAGCAAGGAGAGAATTTACACATTCAGGAGGTTGAAAATTCTTCATTTAGCCTGATCAGGGTGGAATTTGATCAGAGCACAAGCGATGCCACCAGGACCCAGTTCCTCTCCTGTTCCCCTCGTTGGCTTTATTCTTGGGCTACTTTGCAGCCAGATGGCAGCAGCCCTGTTTCTGTTATTTCATGACCAGTAGGGAAAAAAGCTCGGCTCTTTTCTGTCCTTCCCAACAGAAGTGTCCCTGTGTCTCATGGTCTCTCAGTGGGTCGCATACCCACCCTGAACTCATTGCTGGGTCCTGGCCAGGAGGCTGTGACAACTGACTGGTGTGGGCCAAGGACCCATGCTTTACTCCTCAATACGCTCACTGAGAGCTGAGGAGGCAGAGAGGGAAGAGGCAAGGAGGCATTGGCTTTCCAGACGCCAGTCAGGGCATCGTTTCAACAAGAAGGGGATGTATACACTTGGCACAAAATTTTAAATGGCTATAGGTCTTTTCCATTATTTCCCTTTTTCTTCGGAATCTCCCAGAAAACCCACCAGCTTTCTTTGGCAGCGTTCTTCAGGATGGACATGTTAGTCTGCCTTTTCCCTGTCACTGTTTGGGTTCCATTCTTAAAGATGAGTATTTCCGGCCGGGCATGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCAAGGCAGGCAGATCACCTGGGAGGTCAGGAGTTCAAGACCAGCCTGGCCAACATGGTGAAATCCTGTCTCTACTAAAATACAAAAATTAGCCAGATATGTTGGTGGGTGCCTGTAATCCCATCTACTTGGGAGGCTGAGGCAAGAGAATCACTTCATCCTGGGAGGCGGAGGTTGTAGTGAGCCGAGATTATGCCACTGCACTCCAGCCTGGGCAGCCTGGGTGACAAAGCGAGACTTTCATCTCAAAAATAATAATAATAATAATAATACTATTTCCTGTGTCCCGTGCTAGGTGTTAAAGAGGGGTCACAGCCATGCCCTGGACATGTTATAACCTTTTGGGGAAGATGACACTAACACACGTAGCAAAATTACAGAACTCTTCAAAAAGACCATTACTAGGGTGAGCTGGAACATCATGAATAAATAACTCAATGAAATGTCAAACATTGTAGCACGTAAGTCAGAGTTTCCATTCAGCTCTTGAGCAGCAAGTGACTGCACATATGGAGCCATTCCACCACCCACCTTCTGAAAATGGAAGGTTTGAAATCTTCTGTTTCACTCCTTGTTGTAAAACTTATCTAAACCTTTTCTTCTTAGGCTTTTCTTCCCCTTTGAACTGTGGCTCTTGAGATATCTTTACAGAGACTTTGATGAGAAAGTCCCCTTCACTCTTCTCCTTCAATTCTTCCCTTTATTTATTAGTTCA
ATGTTAGAATGCCATTGTCTTAGTGAGCTTGAGCTGCAATAACAAAACACCATAGACTGGTGGTTTAAACAACAGATATTTATTTCCCAGCATTCTGGAGCTGGGGAAGTCCAAGATCAAGGGACCAGCATGTTTGGGTTCTGGTGAGGGCTCTCTTCCTGGCCTGCAGGCAGCCACCTTCTTGCTGTCCTCATATAGGGGTGGTTGGAAGAACTCACTGGTATCTTTTCTTATAAGGACACTAATACCACCACCATGAGAGTCCCACCCTCACGACCTCCTCTAAATCTAATCACCCCTCAAAGGCCCTATCTCCAAATACCATCACATTGGGGATTAGGGCTTCAACATATGAATTTTGATGGGGGAACTAATTCAGTTCATAGCAACTATTAAGGAAAAAATTTAAAGAAAAAAATGTCTTGGGCCAGGCGCGGTGGCTCACACCTGTAATCTCAGCACTTTGGGAGGCCGAGGCGGGCGGATCACGAGATCAGGGGTTCGAGACCAGCCTGGCCAACATAGTGAAACCCTGTCTCTACTAAAAATACAAAAATTAGCCAGGCATGGTGGCGGGCACCTGTAGTCCCAGCTACTCTGGAGGATGAGGCAGGAAAATCGCTTGAACCTAGGAGGTAGAGGTTGTGGTGAGCCGAGATTGCGCCACTGCACTCCAGCCTGGTGACAGAGCGAGACTCCATCTCAAAAAAAAAAAAAAGGTATTTTATTATTTTAGAGTATTTCCTTCCAGTCTTGGCTTCTTTGCATTTATGATGTTGTCACAGGGCACCTCAGATTGTTGCTCACTGTTTACTTGATATCATGTCATTAGCACTTTTCCCTATTATTAAGCAGTTGTGATGACTGTTTTTGATGGTTGTCTAATATTCCACTGAGCTCCCTTCCTGACACTGGCTAATTTAGAAGAAAGACATCCTTGCTTTTGGGAAAGGAGCACAGTTTGCCATTCGAGTTTAGAACTCAACTAAAGACGAATATTTGGGATGTGAGAAGCAGCCAGGCGTTTTAGTGATTATGGCATATTTTGACATGAAATTCTTCAGAGGTAAGTGTCATCCTCTTCAGATGATAAAAAGGAAAAAGGAAAGCAAGCTAAGATTTAGCAAGCTCACTCCTGCTCTCTGAGTTTCTGCTCAATGCTTTATATACACGTATTTAATCATCCCAGATGGATCCATAATTACCCACTTCTTGCCAACAAGTAAGCTGAAGTTGAGAGAATAAATTGTCCAAGTTAACAAGTTAGTAACAGAGTCAAGATTTAAATCTAGGCTTGTTATATTTCAGACACCCTCCTTTTGCCCCTACTTCCCACAAAAAGCTGTTGCTGTTTGTAAGAGCATGAGTTAAGTCTACAAAGAAACTCCTAGTTTGGTTTTTCTTCCGAGATTCCATTAAATAGAAAGAAGAACAAATAAGCAAGAAAGAGCCCTCCTCTCCCTTGTGTGCTAATTAAAATAATCCTCCCCATGGACTAATTTCTCAAAAAGCACTTATTAAGGACAGAGGCAGAATAGCAGTGTGGGTAACAGTAACAGGCTTGGAATCAGACTGCCAGGGGCTTGTTCTCACTTTACTCCTGACTCTTGGCCTTGTGAAGTTACTACACAGCTCTGGATCTTGTTTTCACCATCTCTATAGTGGTGATAATAATTGTACCTGCCATATGAGGTTGTGGTGAGGATTACATGAGAGAATTCATTAAGTAGTAGGTGCCCAATATATGTTAGTTGTTATTGTTAATGTGGTTGTTGATGCTGTTATTTTGTTGACAATTTTGAAGAATTGCTGTTGACTTGTTGACTTTGTTGATGATATTGGTGTTGACTTGTTGACATTGTTGACTTGATATTGTTGACCTTTTCACATTGGTGTTCACTTGTTGATGCCGTTCATGTTGGTATTGATGTTGTTGACATCAACATCGTTGATATTATTGACTTGTTGACATTGGTTTGGATTTCTTGACATTGTTGACT
TGTTGACATTGTTAGTATCAGTCTTAACTTGTTGTTTATGTTGTTAACTTGTTAACTTTATTATTGACTTGTTAACATCATTGATGTTAGTGTCAACATTGTTATTTGTTGATGACTTGATGTTAACATTAGTGCTGATGTTGTCAATATTGACAATGTCAATGTTGTTGTTGTCTTTATTGACTTGTTGACATTGTTGTTGACTTGTTATTGGTTCATTAGTCCTGTTGTTGTCATTGTTATTATTACTAATCACTGTATTTCCTTCTTACTTTTTCACAAGGTGGCTCACTTGGTCCTCAAGGCTCATGCCAGAACTTGGCACCACTACAACAGCCATCATCGCCCACAGCAGCAGGGGCACGTGGGCATTGTGCTGAACTCAGACTGGGCAGAACCCCTGTCTCCAGAGAGGCCTGAGGACCTGAGAGCCTCTGAGCGCTTCTTGCACTTCATGCTGGGCTGGTTTGCACACCCCGTCTTTGTGGATGGAGACTACCCAGCCACCCTGAGGACCCAGATCCAACAGATGAACAGACAGTGCTCCCATCCTGTGGCTCAACTCCCCGAGTTCACAGAGGCAGAGAAGCAGCTCCTGAAAGGCTCTGCTGATTTTCTGGGTCTGTCGCATTACACCTCCCGCCTCATCAGCAACGCCCCACAAAACACCTGCATCCCTAGCTATGATACCATTGGAGGCTTCTCCCAACACGTGAACCATGTGTGGCCCCAGACCTCATCCTCTTGGATTCGTGTGGTGCCCTGGGGGATAAGGAGGCTGTTGCAGTTTGTATCCCTGGAATACACAAGAGGAAAAGTTCCAATATACCTTGCCGGGAATGGCATGCCCATAGGGGAAAGTGAAAATCTCTTTGATGATTCCTTAAGAGTAGACTACTTCAATCAATATATCAATGAGGTGCTCAAGGGTAAGAACAATGGATGTGCCAGTGATTGGAAGGTGGGTGGTACTTCTCCAAGTCTTCAAAGTTTCGTTTAATAAGACAAAGAAAGTCTCCTAGAGAAATGGAGCCAAAGAAAGCATAATAGTGGGGAGTCCTTCACGTCAGCTCCCTAACTCTCTTTCCCAAGGTTCATTCATGTCATTCACGTCTTTGCTCCTGTGGTTTTTTTGTTTTATTTTGTTTTGTTTTTGAGACAGGGTCTTGCTGTGTTGCCCGCTGGAGAGCTGGAGTGCGGTGGCATAAACATCGCTCACTGCAGCCTCAAAGTCCTAAGCTCAAGCCAACCTCCCACCTCAGCCTCTTGAGTAGCTGGGACCACAGTGCAAACCACTATGCGTGGCTTATTTTTTTTTTTTTTAGACATGGGGTCTCTTCACATTGCCCAGGCTGGTCTCAAACTCCTGGGCTCAAACAGTCTTCTCACTTCAATCCTCCCAAAGTGTTGGGACTACAGGCATGAGCCACCATGCCTGACCCAGTGTCCTTATTGCCTAGAATACCTCCCTCTACATTCTGCCCATCTGAGTCCTATGCAGTCATCAAGCCTCATTATCTTTTTTTTTTTTTTTTTTTAGAATCAGGGTCTTGCTTTGTCACATAGACTGGAATAGAGTGGCATGTTCATAGCTCACTTCAGCCTCAAACTCCTAGGCTCTAGTGATCCTCCGGACTCCAACCCATTAACTCTTCCCTCATTGCTCCAGCCACACTGGTCTTCATTTCCTTTAATTGGCTATAAAATCTACATTCTATGTCATTGATTTTGATCCAATTGATCCACATCTACGGTCTCATTCTTACCTGACATACTATTTCATATGTCTTTTTATTCCAATTGGAAAGGTATGGCAAATAGATTTCATCTCACAGGTCAGTCCTCAGTTAACCCAGGATGTTCTTATCTTGAGCTCATTAACTTAATTACATCTGCAAAGATCCTTTTTCCAAATAAGGTTATATTCACTGGCACCACGGGTTAGAATTTAGACATATCTTTCGGGGGTCACCATTCAATGCACTGTATCAGGGAATATA
TGTTTTAGGCTTTATTTATTTATTTATTTTAATTTTAATTTTTTTAGACAGGGTCTTGCTCTGAGGAGTACACTGACCTGATCTGAGCTCACTGCAGCCTTGACCTCCTGGGCTCAAGCGATTCTCCCACCTCAGCCTCCCAAGTGGCTGGGACTACAGGTGCACACCACCACACCAGGCTAATTTTCTTTTCTTTTTTCTTTTTTTTTTTTTGAGACGGAGTCTGGCTCTGTCGCCGAGGCTGGAGTGCAGTGGCGCGATCTCAGCTCACTGCAAGCTCCGCCTCCTGGGTTCACACCATTCTCCTGCCTCAGCCTCCTGAGTAGCTGGGACTACAGGCTCCCGTCACCACGCCCGGCTAATTTTTTTGTATTTTTAGTAGAGACAGGTTTTCACCATGTTAGCCAGGATGATCTCAATCTCCTGACCTCATGATCCGCCTGCCTCAGCCTCCCAAAGTACTGGGATTACAGGCGTGAGCCACCACGCCTGGCCACATTTTTTTTTTTTTCAATAGAGACAGAGTCTGGCCATGTTGCCCAGGCTGCTTTATTTCTTTTTTAAAATATGAAATATGTTGTCACTTAATGTCAATATTACTAAACATAAACAAGGAAAAGCAAAAGCATATTGTTAAAAGATTGATTTATGTATTTTATATAAAACCAAGACACCCTGGTGGTAACACATGGGACACATCCCCTCCACTATTTATTTGAAGATGGGGATGCTCCTTTGGTTTGAGATTTATGGCCACAAAAGTGGCCTGATGTTTTGTGAGGATCTTGTGGATTTTCCTTTTATCCATTCTGAGGAGGAAAAAGGATGAACATTTGGGGGGTAACCCAAGTCACCCCCAAAACTTTCATGTCAAAAGGAACACTTTTTAAAAGCAACATTAGTAACAGAGACTATACTTCTAATTTTTCAATAAAAACTATTTTATTGAAAAACAGTCCTCGCTGGTCCGAGGTAATAACTTATCTCAGTTGACTGTTCACAACCAGTTACAGATCAAACAGCTTCTAATACCCTTCTCCCCCTTCTCACTACTGCACTGACTAGTCTTTAAAAGATAAATAAATAAAATAATGGTGCACTAGCTCACTCCTGTAGTCAGTCCCAGCTACTTGGGAGGATCACTTGAGTCCAGGAGTTTGAGACCAGCCTGGGCAATACAGTGAGACCCCATCTCAATTAAATAAATCCATAAATAAATAAATCTAATTTTTATTTTTCTTCACAGCTATCAAGGAAGACTCTGTGGATGTTCGTTCCTACATTGCTCGTTCCCTCATTGATGGCTTCGAAGGCCCTTCTGGTTACAGCCAGCGGTTTGGCCTGCACCACGTCAACTTCAGCGACAGCAGCAAGTCAAGGACTCCCAGGAAATCTGCCTACTTTTTCACTAGCATCATAGAAAAGAACGGTTTCCTCACCAAGGGGGCAAAAAGACTGCTACCACCTAATACAGTAAACCTCCCCTCCAAAGTCAGAGCCTTCACTTTTCCATCTGAGGTGCCCTCCAAGGCTAAAGTCGTTTGGGAAAAGTTCTCCAGCCAACCCAAGTTCGAAAGAGATTTGTTCTACCACGGGACGTTTCGGGATGACTTTCTGTGGGGCGTGTCCTCTTCCGCTTATCAGATTGAAGGCGCGTGGGATGCCGATGGCAAAGGCCCCAGCATCTGGGATAACTTTACCCACACACCAGGGAGCAATGTGAAAGACAATGCCACTGGAGACATCGCCTGTGACAGCTATCACCAGCTGGATGCCGATCTGAATATGCTCCGAGCTTTGAAGGTGAAGGCCTACCGCTTCTCTATCTCCTGGTCTCGGATTTTCCCAACTGGGAGAAACAGCTCTATCAACAGTCATGGGGTTGATTATTACAACAGGCTGATCAATGGCTTGGTGGCAAGCAACATCTTTCCCATGGTGACATTGTTCCATTGGGACCTGCCCCAGGCCCTCCAGGATATCGGAGGCTGGGAGAATCC
TGCCTTGATTGACTTGTTTGACAGCTACGCAGACTTTTGTTTCCAGACCTTTGGTGATAGAGTCAAGTTTTGGATGACTTTTAATGAGCCCATGTACCTGGCATGGCTAGGTTATGGCTCAGGGGAATTTCCCCCAGGGGTGAAGGACCCAGGCTGGGCACCATATAGGATAGCCCACGCCGTCATCAAAGCCCATGCCAGAGTCTATCACACGTACGATGAGAAATACAGGCAGGAGCAGAAGGGGGTCATCTCGCTGAGCCTCAGTACACACTGGGCAGAGCCCAAGTCACCAGGGGTCCCCAGAGATGTGGAAGCCGCTGACCGAATGCTGCAGTTCTCCCTGGGCTGGTTTGCTCACCCCATTTTTAGAAACGGAGACTATCCTGACACCATGAAGTGGAAAGTGGGGAACAGGAGTGAACTGCAGCACTTAGCCACCTCCCGCCTGCCAAGCTTCACTGAGGAAGAGAAGAGGTTCATCAGGGCGACGGCCGACGTCTTCTGCCTCAACACGTACTACTCCAGAATCGTGCAGCACAAAACACCCAGGCTAAACCCACCCTCCTACGAAGACGACCAGGAGATGGCTGAGGAGGAGGACCCTTCGTGGCCTTCCACGGCAATGAACAGAGCTGCGCCCTGGGGGACGCGAAGGCTGCTGAACTGGATCAAGGAAGAGTATGGTGACATCCCCATTTACATCACCGAAAACGGAGTGGGGCTGACCAATCCGAACACGGAGGATACTGATAGGATATTTTACCACAAAACCTACATCAATGAGGCTTTGAAAGGTGTGTGAGGGTTCAGTTCCCCTTAAAGAAATCTTCCAACATTCCCTGGGTCATATGCCTGAAATGTTTTGCCGGGATGATTTATGAACCATCAATAGATCTCTCTCTTAGGTCCCAACTCCATAATTCTTTATCTGTTTGGGGGTTATATGTTCCTTGAGAAGCTGGGGGAAAAAAGGCTATGGTTGTCTCTGCAGAGGAAAAATACAAACACTACACACACAGGGTCCCTAGCAGAATATTCATATTGTCATGGGTCCATTCATTCATTACTGAGCAAGTTCTATTTTAGGTGCTGGGAATACAGCAATGAACAAAACACAAATTTCTGCCTTCGTAGAGCTTATCCCATGCACCCCAGAACAAGAAAGTTGTGTTAATTCAAACTTCCTTTTTTTTTTTTGAGATGGAGTCTTGCTCTGTTACCCAGGCTGGAGTGCAGTGGCCACCGTGCCCGGCTAATTTTTTTGTATTTTTGGTAGAGATGGGGTTTCACCATGTTGGCCAGGCTGGTTTCAAACTCCTGACCTCAAGTGATCCACCTGCCTTTGCCTCCCAAAGTGTTAGGATTACAGGCATGAGCCACTGTGCCCAGCCTAAAAATCAACTTTTTGTTTCATTGATTTTTTTTTTTTTGAGACAGTCTCACTCTGTTGCCCAGGCTGGAGTGCAATGGTGTGATCTCGGCTCACTGCAACCTCCATCTCCCGAGTTCAAGCAATTCTATTGCCTCAGCCTCCCCAGTAGCTAGGACTACAGATGCATTGGGCTTAACTTCCTAAGTGGGCTGAAGATCTTGAATTTGGGGCATGTTTCTTTACCCCAAGAGAAGAATTTGATTTGGAGATGATCAGTCATTAATGCTTGCTGTGGGGTCATAGGTACTGGCAGAAAAGTAAGATCAACAGATGATCTGTTGGTCTCTCAGGGTGTATGTCACTTTTAGGACCACAACCTTGAATTGAGGAGCTGGCAGTGGGTTGGGTGCATGGAGGTCCTGACTCCTGGTGTCAAGCTCTCCTCTGCTCCCTTTGGGATGTTCCCAGCCTACAGGCTCGATGGTATAGACCTTCGAGGGTATGTCGCCTGGTCTCTGATGGACAACTTTGAGTGGCTAAATGGCTACACGGTCAAGTTTGGACTGTACCATGTTGATTTCAACAACACGAACAGGCCTCGCACAGCAAGAGCCTCCGCCAGGTA
CTACACAGAGGTCATTACCAACAACGGCATGCCACTGGCCAGGGAGGATGAGTTTCTGTACGGACGGTTTCCTGAGGGCTTCATCTGGAGTGCAGCTTCTGCTGCATATCAGGTGAGGAGTTCAGGATGGTGGGACACCAGTGACTGCACACCTGCCCTGTGCCAGGCTCTGGGCTCAGTGCTGGGAAGGGCAGATGCATGAACAGGAGATTCCAGCAGACCCATGGAGGGGCAGCATGGGGTCTGGGAGGTCCTCTTCCAGACAGCCTGGCTTCTTCACACCCCCAAATTTACCCAGACCAGCATGGTGAGGCTCGCTGTCCTGAGATGGGTGCTTGCAGGGCCAGATGGAGCAGGGGGAGCCTGGGCAGAAGTACTTGGGCAAAGACACACAAATACAGTCACGCATTGCTCACAACAGGGATTTACTCTGAGAGATGTGATGTTAGGTGAGTTCATAGTTGTGTGAACATCACACAGAGTGCACTTACACACACCTAGATAGTGTAGCTTACTACACACCTAGGCTACATGGTATAGCCTAGTGCTCCTAGGCTACAAACCTGTACAGCCTGTTACTGTACTGAATGCTGTAGGCAGTTGTAACACAGTGGTATTTGTGTATCTAAATGTATCTAAATGTAGAAAGGCACAGTGAAAATATGGCATAAAAGCTGGACAGGGTACTCACCATGAATGGAGCCTGCTGGACTGGGAGTTGCTTTGGGTGAGTCAGTGGGTGAGGGGTGAGTGAATGGGAAGGCCTAGGCATTACTGTACACTACTGTGGACTTTATGAACACTGCACACTTAAGCTACACTAAGTTTATTTTTTAAATGTTTTTCTTTCTTCAATAACACATTAACCTTAGCTTACTGTAACATTTTTACTTTATTAACTTTTTAATTCTTTAAACTTTTTTACTCTTTTGTGATAATGCTTAGCTTAAAACAAGCACATTGGTCCAGGTGTGGTGGCTCATGCCTGCAATCCCAGTGCTATGGGAGGATCGCTCGAGACGAGGAGTTCAAAACCAGCCTGGGCAAGACATGGCAAAACCCTATCTCTATAAAAAAATCAAAAAAATTAGCCAAGTGTGGTGGTGTGCTCCTGTAGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGGATCACTCAGCCTCCCCATTAGCTGGGATTACATGCATATGCCACCACACCCAATGAATTTTTTATTTTTAATTTTTTTGTAGAGATGGGGGTCTTGCTATGTTGCTAGGGCTAGTCTGAACTCCTGGCCTCAAGTGATCCTCCTCCCTCAGCCTCCCAAAGTGCTGGAATTACAGGTCTGAGCCACAGCACCCGGCCTGCATGTGCTATACTTTTATACTGCTGGCCATACGGTAGATTTATTGACATGAGCACTGCCACAAGCATGAATAATGCAGTGCTCTACAACGTTATGATGGCTGCAAAGCACTAGGCAATAGGAATGTTTCAGCTCCATTATAATCTTATGGGACCACCATCATATATCAGGTCCGTCATTGACCAAAACACTGTTCTACAGCCCATGACTATGACCAGTCCCTGTTGGACCCCTTTATTCCCCAGCTAGATCCTTCCAAGCAGGCAGTTTGCTCACATTGGCTCTCAGCATGGGCCTGAGCTTATTCTGATGTCCTAAAAACATCACACCACTACTGTATTCATGCCAAAATGAGGCTTACTCATACAGAAAATAGGATGGTTTTATTTTGTGCAAGAAAAATGGAAAAGGCAAGAGTGACTTGCCTGGCAGTTAGTGGTGGTTCCTGCTTTCCATCTTCTGTCTGCGTCTGTCTCTGTGCAAGAGTGGGCCTGCCACATGCGTAGAGAAAGCCAGGGGAGTTCCGAGACTGAGCAGGGGCCAGAGCAGGCTCCCAGAGGAGGTAACCACACTTGGCTAATTTTTTTGATTTTTTTTATAGAGATGGGGTTTTGCCATGTTGCCCAGGCTGGTTTTGAACTCCTGGGCTCAAGC
GATCCTCCCATAGCGCTGGGGTTGCCGGCGTGAGCCACCACACATGGACCAATGTGCTTGTTTTAAGCTAAGCGTTATCACAAAAGAGTAAACGTCCTGACTTGAGACTCACCCAGTGAAAGAAAGGAGGCTGTGAGTGCTTGACTGAATGACTTAATAAGACCATGTCTTGTCATCTTGAGATTGAAGGTGCGTGGAGAGCAGATGGCAAAGGACTCAGCATTTGGGACACGTTTTCTCACACACCACTGAGGGTTGAGAACGATGCCATTGGAGACGTGGCCTGTGACAGTTATCACAAGATTGCTGAGGATCTGGTCACCCTGCAGAACCTGGGCGTGTCCCACTACCGTTTTTCCATCTCCTGGTCTCGCATCCTCCCTGATGGAACCACCAGGTACATCAATGAAGCGGGCCTGAACTACTACGTGAGGCTCATCGATACACTGCTGGCCGCCAGCATCCAGCCCCAGGTATGGTGGGTCCTGGCAAGGCCTTGGGAAAGTCCACATGCAGGAACCAGCAGGGCTGGGGGAGCACATTTATCATGTAAACAAAATGCTGGTTTCAAATTTAGCTTTTGTTGTTATTGTTGTTTTTGAGACGTAGTCTCGCTCTGTCACCCAGGCTGGAGTGCAGTGGCGGATCTCGTTTCTCAGCCTCCAGAGTAGCTGGGCTTATAGGCACGCATCACCATGCCCAGCTAATTTTTGTATTTTTAGTAGAGACGGGGTTTCACTGTGTTGGCCAGGCTGGTCTCAAACTCCTGGCCTCAAGTGATCCACCCGCCTCGGCCTCCCAAAGTGCTGAGATTATAGGTATGAGCCACCGTGCTCGACCTCAAATTTAACTTTTTAATTGTCAGTGAATTCATATGATGCAGAATTTGAAAAGCATAAAAGAGTTTCCTTCCCAACCTTGACCTCAGCCATCTAGTTCTCCCTGAAAGCAATTTACCCTTTTCCCAAAAGAAAAAGAAAAAAATCTTTGAGCCTTTTTGTCTCATAAGTCACTCTCAGGATTTGCAGCAGACGTTGATGCTGGCACATCTAACCTAGGGCTTCCCATGGAAAGCATGACTGATGCAACAGCTGATCTGGCTTCTTCCCAGGTGACCATTTACCACTGGGACCTACCACAGACGCTCCAAGATGTAGGAGGCTGGGAGAATGAGACCATCGTGCAGCGGTTTAAGGAGTATGCAGATGTGCTCTTCCAGAGGCTGGGAGACAAGGTGAAGTTTTGGATCACGCTGAATGAGCCCTTTGTCATTGCTTACCAGGGCTATGGCTACGGAACAGCAGCTCCAGGTAAGTCCCAGCCCTGGCTCATAGGCTCTTTGAATCATGGCATTCTTAGCACATCAAGAGTTGAAATCCAGATGGCACAGGACGAGGCAACCAAGAAAGCCCCATGGCAGAAACCCTGCCTCTTGCTCAGGGCTGTAGAGGTTTCCCTCCTGGCATTGCATTGTTAAACATGAATTTCACATCTCAATTCCTCAAGGTGGGTTCATTTCTTTGCTCTGTGACTCTGATCGGCCTCAGGTGGGAAGCTCTCTGAGATCAGAGATGTGGGCAAATTGATGTGGGGAAGGACAGTTTGTCAGGCTGTACAGGTCTACAGTCTATTTCCACAATTCCCAAACCCCAAAGTTTCTGACAATTGGTTTGGCTGACCTGAGCTCATTTAATAGTAGTGAAACCTGACTCAAACCAACAGGAGGCTGCTCATGGTCTTTATCGCACTGAGCAAACATTCCTAAGTTCTGCTGCAGAGATATCAGTGTGCTTGACTATGGAGAGCTAGCTGTCTGCGGCCCATGGGGCTGATAGGTACTTTTCTCAAAGGAAACATTTAATTCCAAAACACATCTGACCCTAAAAGATTTTTTTTCTTTTAACTTTGGTTGACATGCAATAATTGTACATATGTATGGAGTACAAAATATATTTTGATACATGTATACAATGTGTGATGATGAAATCAGAATAATTAGT
ATATTCATCACCTCAAACATTCATCATTTCTTTGTGTTGGGAAAATTCGGAGTCCTCTTTTCTAGCTTTTTGCAAATATACACTAAATTCTTTTGTATCATTATTTTTTATTCATTTTTTATTTTTTTGAGACAGAGTCTAGCTCTGTTGGCCACGCTGGAGTGCAGTGGTATGATACCAGCTCACTGCAACCTCCACCTCCTGGGCTCAAGCAATTCTCCTGCCTCAGCCTCCCAAGTAGCTGGGATTACAGGCATGTGTCACCATGCCCAGCTAATTTTTGTATTTTTAGTAGAAATGGGGTTTCATCATGTTGGCCAGGCTGGTCTCGAACTCGTGACCTCAGGTAATCCGCCCGCCTCAGCCTCCCAAAGTGCTGGGATTACAGATGTGAGCCACTGCACCCAGCCTAAATTATTGTTAACTACATTCACTCTACAGTGCCACACATCACTAGAACTTCATCTTCTTATCTAGCTTAACTTTGTATCCGTTAACCAACCTCTCCCTGTCCTCCCTCCCTACTACCCTTCCCATCCTCTAATAATCACAATTCTATTCTCTGCTGCTAGGAGCTCATCTTTTTAGCTCCCACATGTGAGTAAGAACATGCAGTATTTGCCTTTCTGTGCCTGACTTATTTCACTTTACATAATGACCTCCAGTTCCAGCGATGTTGTCACGAATGACAAGATTCATCCTTCTTTATGGCTGTATAGTATTCCATCATATATAGATGCCACATTTTCTTTATCCATTCATCTGTTGATGGACACTTAGGTTGATTCCATATCTTGGCCATTGTAACAGTGATGCAATAAACACAGAGGTCAAGGTATTGATTTGGTATTCTGACTTACTTTCCTTTGGATAAATACCCAAAAGTAAGATTGCGGGATCCCTTAGGGTTTTGAATAAGAAATTGTGGACCTATTTTTGTGCCTTGAGAACCATCCAGTTTCCCTTTTATCTAGTTCTGAGTTAATAAGAATAAATTTGTGTTCATTCATGTGATTCCTCAGAACACTGTGTAACAGCTGGAAAGAGCCACCAGGAGATGTGCCTCAAATCGTTATCAGAGGCATCTCCATTGGTCCTAGTTCGCCCCTTTGGTTTACACTCCTTCAACACATGAGAGGCGCCTCTCTTGCAGCATTCACTATCAGGGTATCTCCGTGTCAGCTGGTTGCATTAGCTACATTCTCCAACCCAAATGATCACAATGGGTCCCCAAGGAGCTCCAGATTATCAACTCCTGTCAATTCATTTGAGCCCAGGAGTTCAAGGCTGCCGTGAGCCATGCTCATGGCACCACTGCACTCCAGCCTGGATGACAGTGCATGACCCTGTCTCAAAAATAATCATAGGCCGAGTATGGTATCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCAAGACAGGTGGATCACCTGAGGTCAGGAGTTCAAGACCAGCCTGATCAATATGGTGAAACTCCACCTCTACTAAAAATACAAAAATTAACCAGATGTGGTGGCATGCGCCTGCAGTCCCAGCTACTCAGGAGGCTGAGACAGGAGAATTGTTTGAACCCCTCGGCTCACTGCAGTCTCCACCTCCTGGATTCGAGTGATTCTCCTGCCTCAGCCTCCTGAGTAGCTGGGATTACAGGCGCCTGCCACCACAGCTGGCTAATTTTTTGTATTTTTAGTAGAGACAGGTTTCACCATATTGGGCAAGTTGGTCTCAAACTCCTGACCTCAGGTGATCCACCTGCCTCAGCCTCCCAAAGTGCTGGGATTATGGGTGTGAGCCACCCTGCCTGGCCTGGGTTGTCTTTTAAGTTTTAAAAAATCATTTGTACATATAGTCCTTTCTGAATATAACATTGGTTTGAAGCTAACTCAATAGAAAGAAATTCCATCTCTTTAGTCTCTCTAGTTTGACTATAGTAGCTAACAGAGCTGGGCTGCAATGTCACACTTCACCTTTAGGTGCCACCATCTGATTTGATTTGCTCC
AGCCTAAGCATTTCTTAAATTGGGGGCTTTAGATTCTGCGATAGGTATCTCTATTATGGGTATTTTGCCTGAGACGTACGAGCCACTCTTCTGGAGGAGGGGAACAGAAGCCAACATTTATCAAGTGGCCTTCCCTCTTCCAGACACAGTGCTGCTGTGGGCGGGTTTCATACACTGTTTCATTTCCCTCTCACAAGCACTCTCTGCTGCCCATTTCACCAAGGAGGAAACTGAAAGGCTGAATTACTCACCCAAAGTTACACAGCCAGGTAATAAGAGGGAGAGCCAGGGTTTGAATTCCAGTTTTCCTAGTGTCAGAATCTACACCCCTTCTCCCAAACACAGAGGGGACATCTGCAGGCAGGGACTAACAATCTCAGTCACATCCATTCTATCCATTCTCTGTTGACATCCATGTGTATGTTTCCAGGAGTCTCCAATAGGCCTGGCACTGCCCCCTACATTGTTGGCCACAATCTAATAAAGGCTCATGCTGAGGCCTGGCATCTGTACAACGATGTGTACCGCGCCAGTCAAGGTGGCGTGATTTCCATCACCATCAGCAGTGACTGGGCTGAACCCAGAGATCCCTCTAACCAGGAGGATGTGGAGGCAGCCAGGAGATATGTTCAGGTCTGTTTTTCCTCTGGGCGCTTGTTCTTACTCTTGTCCATCTTTCCTTCCAGCCTAATGGAAACAGATTGTGAATCAAAGATTTAGGGTGTGGTGGCTCATGTCTATAATCCCAGCACTTTGGAAGTCTGAGGCAGGAGGATTTCTTGAGGCTAGGAGTTTGAGACTAGCCTGGGCAACATAGAAAGACCTTGTCTGTGAAGAAAAAAAAATTATTAGGGCATGGTGACACACACCTATAGTCCCAGCTGCTCAGGAGGCTAAGGTGGGAGCTTGAGTCCAGGAGGTCAAGGTTGCAGTGAGCCATGATTTCGGCACCATTAAACTCCAGGTGACAGAGGGAGACCACCCCCAACCCCCAAAAAGAAGAATTATTAGGATCTAAGCCTAGTTTTGCTATTGCCTGATTTTGTGAGCTTGGGAAAATCATCTAACTTTTTCGTACCTTAGTTTCCTCAACTTCAAACTGGAGATGTCCTGCCCACCTCAAAAGTTTGCTGTGATGAAAGTGATAAAGTCTGTGGGGTTAAGTTGTCTTTAAGTTTTTAAAAATCATTTGTACAGGTAATTCTTTCTGTAACATTGGTTTGAAGTTAACTCCTAGAGAGAAATTTCCATTTCTTCAGTCTCTCTGGTTTGACTATAGTAGCTAACAGAGCTGGGCTGCAGTGTCACACGTCACCTTTAGGTGTCACCATCTAATTTGATTTGCTCCAGCCTAGGCATTTCTTAAATTGGGGGCTTTAGATTCTGTGAAACTCATTAGTGCCCCTAATTTGCCAACTCAATGAGTTTAAGAACAGCATCTTTCAGTCATGGAATTTCACCCAAGGAAGTAGAGACATTACTAGGAAGCCGACTGGGCAAGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCTAAGGCAGGCTGATAACCTGAGGTCAGGAGTTCTAGACCAGCCTGGCCAACATGGTGAGACCCCATCTCTACTAAAAATATAAAAATTACCGAGGTGTGGTGGCACATGCCTGTAGTTCCAACTACTCTGGAGGCTAAGGCAGGAGAACCCAGAAGCTGAGATCACCATTGCACTACAGCCTGAGCAATGGAGAGAGACTCCATCTCCAAAAAAAAAAAAAAAGGAAGCAGGTGCCAGCATGGCCTACCTTTATTTCCACCTGAACCCCTGACTGACAAGAGGAGAGAAGGAAAAGAATGATCCTCGTTCACGGCACAGCTCCTCTGGCTCCTCCTAGAAAGGGATAGAAGGTGCTCTCTCCTACATTTTGCATCAGGAAGGAAAGGCAAGGGTTTCTCTCTGGATTGGTTCCCACTTTGGGCTCCGTGGAAGAGTCTGCCAACTGTGGCACTATAACTCTCT
CGGGGGAAACACCATGGGCCTTGGTTTGCCAAACTCTTCACAAGAGAACTTGACAAAGATAGTCAAATTAATAAATGCAACGAAGGGCTTAATTTTCTGGTCTGCTAGCCAGCTGGGGAAACAGTTTTGAAACAAAATTAATGTATCCCTCATTTCAGACTCACAGAACTGGTGATTTAGAACAACATTTCCTTTTTTCCTGAAATCAAAACTTCAAACGTCAGGAAACGTTAGGCTGTCATATCATTAGATTGAGCCACTTACTGGTGAACTGTGATACTGCAGCCATGGACTATGACAGATGCATCTCTTATTAGAATCAGCTTCCACGAAAATATCTAGTGTGTTACCTTGGAGTGGGTGCATTTAAGCCTCTTTACCAGGGCATGTGTGTTCCATGCCTCATCTCTGACCATGAGTGGAAGCTGCCCTCACCCCACATTCCCAGCAGCAGCCAGTGGGTGAGGAGAGGATTTGGAGAGACTACAGAAGGCTCTCAAACCCCCAGCATCATAGTGTTTGGGTGCCACGTATCCCCGCACATGATAAGGATGGCCTAGGCCTCATTAGAGAAAATAGGTCAAACGGTTCCCCACTCTGGGGCTGTGAAAGCCCATTAAGAGTTATACTTTGCCCGGAAAGTCAGGAAAGCCTTGCATTTCAGCCCTCCCCAGAAAGTTCTGTTTGCTCCTTGGGCACTTTGATGAGGAAGTGCAGCCGCTCAGTGGTGAGAAAGAGAACCGGGAGCCTGGAGGCTTGTGGGTTCTCCCTTCTCCTCTGCAGGACCCATCCAAGGGCAGCCAGGAAGCATTTGTTGAGCACCAGGGCCAGTGCCCAGGTCAGTTACTGTCACCTCAAGCTACAACTATGAAGAGGTGGCCCTGTCCTCAGTGCAACAGCAACTGAGCAAGCACAGACCCAGCTGGGAGACCTGTGGACACTGAAGCTGCAACAGGCAGGAGCCACAGGGAAGAGAGCTTAACCTGGGGGTCCAGGAAAAGGAGGGAGGTTGTGAGGCCAGGCACTTCTGAGCGGGGACGATGCTGTCTCTTGCTGTGCCCACCTGTAACGCCTGGGCTGTCTCCCCCACCCTACCCGCAGTTCATGGGAGGCTGGTTTGCACATCCTATTTTCAAGAATGGAGATTACAATGAGGTGATGAAGACGCGGATCCGTGACAGGAGCTTGGCTGCAGGCCTCAACAAGTCTCGGTAAGGGCCTGGTGCCCGCAGTGGTGAGGGCATGGGCGTCGGGGTCACAGAGGCATGTCTCGGGCAAGTTACCATGACTGAGCTTCTTTGCTTGCTGGGAAGTTACATGTGATCATATATGTAAAGCTTAGCCCAGCACCTGGCACTGCTATATGCTTGACAGAGGGGTTTGCTATTATGGTTATTATATTGTGGAACAGCCAGGAAATCTGTTCCAAGGCTATCCACCTCTGAGCAACCCCACTATGCCACTCCACAGACAAATCCCAGCTCATCCTATCCTATTTCATCACCGCACGTGTGAATGTGGGTGGCAGTGGCTGACAGTCAGGCGTGTGCTTTGCATCACTTGGCCAGCAGGTGGCGATGGTCTGCACCAAAGCGTCCTTCCTTACCCGCCCGCCCCTTCTTGTCAAGGAAGGAGTAGCAACATTAGCAGCCAACGTTTACCCATCTTCTGTTGGTATCTTTATTTCTATTTAAATACGAGTAAAGTGAGGCGCAAAGATTAGGGCAAGATCACCCAGCTATTAAGAGATAGAGCTGAGATTTGCAGCCAAGCTGTCGGCCCCCAGGGCGCATGCTGGGGGCTTGAGAATCATGCAGGTGGGGTGAGAGGTGTGGTGTGAGGAAGCGCAGGAAGCGGCAGTCACTGCCCACGGGAACATGCCCACCGCTCCAAGGCTGGCGGGAATCAAGTGTGAATTCCCAACATAGTCTTTGAGTCCTGCCCCTAGACGCCCCCATATAGTCCAGCTGAGGATTAAAAATCCAGCTCCCAGGCCGGGT
GCGGTGGCTCACACCTGTAATCCCAGCACTTTGGGAGGCCAAGGTGGGCGGATCACTTGAAGTCATGAGTTCAAGACCAGGCTGGCCAACATGGCGAAACCCTGTCTCTACTAAAAATACAAAAATTAGCTGGGTGCGGTGGCGGGGGCCTGTAATCCCAGCTACTTGGGAGGCTGAGGCCAGAGAATTGCTTGAGCTCGGGAGGCAGAGGTTGCAGTGAGCCGAGATCATGCCACTGCACTCCAGCCTGGACGATGGAGCAAGACTCTTTGTCTCAAAAAAAAAAAAAAAAAAAAAATCCAGCTCCCACCTCACAATGCACACCCTGGCCTAGTTAGGGTAAGTTCCCCAGAGCAGGCTGTGCCTAAAGGTCTGATCTGCGAACTGTGATCTCCAGCAAAACCGATGAGCGCCCGGCCCATCTGCACAACTTTGCCGAGCACCTACCATTTGCCCGAGCCAGGGCCAGGGGGAGGGGTCCATGGAAGGAGAGGATTCCATTCGGCTCCTCAAGCTGCTGACAGATCAGCTGGAAAGACAGTTCTCCATCCCATTCCCCAGGCTCTTCAGTACAAAGAAAACTCAGAAGATGAGATCAGGGTAGGCTGGGTAGACCCAGGAGATTTCATGGACAAGGCAGGACATCAGCTGAGCTGGGCCTTGACAGGGGATAGAATGTGGGGGATTGCAGGTCATTCTTTCCACGGGGCAGAGTTGTGAAGACAGGCCTAGAGGTAAGAATGAGTGGGGGTGCCAGAGCTGAGAGTGGGGAGACCAGCCCAGCAGCAGTGAAGGGGCTGAGGCCACATGGTGGAGGGCCTGGAAGCCAAGCACAGGGCCTTGGCTTTGGTGCCACAGGCCATTGCTGGCTTCTGAGCAGAAGCGTCAGGGACAGGAGGAGGCTGTGCTTTGGTTTTCTCCCATCATCTCAGAAACCCCAGGGAAGGAAGGTTCTTGATCCCTCAGGTTAATGGTAGCAGAAAGGTCAAGATGAAAGTGTCAGAGGCCTCAGCAGGGCATCTCTGGGCCACACCTAAACCAGAAGCCCCAGGTCTCCCTGTGGGCATGCGCATGCATTCAGGATCACCTGTACATGCTGCACACAAGTGTATTAGTCAGGTTCTACAGGAGAGGCTTTTCACTCAGAGTGCCTGGAAAATGCTCCATCTACAGGTTAAGAAGCCAAAGTTCCCAGGCTCACAAGTAATCTCAGCACTTTGGGAGGCTGAGGCAGGAGGATTGCTTGAGACCAGGAGTTCAAGACCAGCCTGGGCAATATAGTGAGACTTTGTCTTTACAAAAAATTTAAAAATTATCTAGGCATGGTGACGCACACCTATATTCCCAACTACTTGGGAGGCTGAGGTGAGAGGATTGCTTGAGCCCAGGAGACTGAGGTTGCAGTGAGCTATGATTGCACCACTGCACTCCAGCCTCAGGGGGCGTGCAGTGTCCTCAGGAGGACAGGGCGAGACCCTGTCTGGGAAAAAAAAAAGGAAGAAAGAAAACAAAGTTCAGTGAAATCGTGAGAACTGAGAAATTCAAACTCAAATACTCAATTTGCAAATTATTTCCCCTGCTACTTTGAAGATCTTGAAGCTATTATTATTATTATTATTATTATTATTATTATTAGAGTTGGAGAAAAGAGGCATGCCTAAACAAACCCCAAGAGGAGCAGAGAAACTTGGAAAGGGCAGAAAACGGAAATACAAATTACACAAGATACAGGGCCGGGTGTGGTGGCTCATGCCTGTAATCCCAACACTTTAGGAGGCTGAGGTGGGCGGATCACTTGAGGTCAGGAGTTCAAGACCAGCCTGGCCAACATGGTGAAACCCCATCTCTACCAAAAATATAAAAAATCAGCCAGGAGTTGTGGCAGGCGCTTGTAGTCCCAGCTACTTGGGAGGCTGAGGCAGGAGAATCACTTGAACCCAGGAGGCGGAGGTTGCAGTGAGCTGAGATCGCGCCACTGCACTCCAGCCTAGGTGACAGAG
CCAGACTCAGCCACAAAAAAAAAAAATTATACAAGATCTAACTTTACAAACATAGGGGAAGAGTCTCAGATATGTACCTCAGGCATGCTCTTGATTTTGAAATCTGTCATAGATGCTAAATATCAGAATTTGCATATGTTGTTTGAAGGAAATTAAAAACTGTTTATGCATGTGTGTGTGTGTGTGTGTGTGTGCGCGCGCGCGCGTGGGTGCGTGTGTGTGTGGTCCTTCAGGTTTCAGAGGCTCTTGTAGAGACCTAGGGAAGCCAGGTTTATGGTCTGGCTGGAGGAGCCGCAGTGCTTCCTGCACCGCCTGAAGGACCTCTTCTCCTTCCCTGCCAGTTTCCCCTACTCACTGCCAAGTGCCTGGGGTTCGGAGAGCTCCCCCGCCCCAGCCCTATGACGTTCTCTTCTCAAAGCATGGCTCTCCCTGAAGCCCTGCCCTCAATGGCTTCTTCCACCCAGGCTGCCAGAATTTACAGAGAGTGAGAAGAGGAGGATCAACGGCACCTATGACTTTTTTGGGTTCAATCACTACACCACTGTCCTCGCCTACAACCTCAACTATGCCACTGCCATCTCTTCTTTTGATGCAGACAGGTAAGTCCACCAACAGGGAGCCCGGAGCCATCTCTGGAAAAGGCAGAAAGGTGCCCTTGGCTGTGCTCTCTGAGGCCTGCCCAGCCTCAAAACAGGGCCTCCAACGCCGAATGTGCCGGGGTTTGCAAGATGCTCGCCACCCCACAGATCCCAAGGAAATCTCCAGCAAGCAAGAGGGAGAGAAGGCCGGGGTCTCCAGGGCACCTCCCATTAGGGCACATGTGCTTGGCTTTTTGTTTTTTTATTTCATTTTTAAAATTTATTTATTTTGCGTTCTTTTTCACAGGCTGCTTAACTCTAAAAATGCTTGGTTGTTAAAAAGGATTTTCAAGAAAAAAATTGTTTAGGTTTTATCAAAATTCGCTTTAATATTAATAAATATTACAATAATACAAGAGTAAAATTTTATTTTCTCTTTTTAAACAATGCTTTTATGAAGTAGAGATAGTAAAAGATTTTGGTTCACCTTTTAAGTAACAGTTTTTATTTTATTTATTTTTTTTGAGACAGAGTCTCGCTCTGTCACCAGGCTGGAGTGCAGTGGCACAATCTTGGCTCACTGCAACCTCCACCACCCGGGTTCCAGTGATTCCCCTGCCTCAGCCTCCAAGTAGCTGGGATTACAGGCGCGTACCTCCACGCCTGGCTAATTTTTTTTTTTTTTTTTTTGTATTTTAGCAGAGACGGGGTTTCATCATGTTGGCCAGAATGGTCTCGGCTAATTTTGTGTTTTTAGTAGAGACAGGGTTTCTCCATGTTGGTCAGGCTGGTCTCTATCTCCTGACCTCAGATGATCCCCTTGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGTGTGAGCCACTGCGCCCAGCCGATTGTCTTTTTCTTTATGATATCTATTTATCTAGAGACTTTTTCATCCATATCCTGTATTGTTTTTTAAATTTCTCTAAGTTAATTTTCACCTTTCTCTAGTACCTCCTTGAGTAGTTTAATAATCAACCTTCTGAATTCTTTATCTGGCAATTCAGAGATTTCTTCTTGGTTTGGATCCATAGCTGGAGAGTTAGTGCGACCTTTTGGGGGTCTTATAGAACCTTGTTTTGTCATATTACCAGAATTAACATTTCTGGTTCCTTCTCATTCAGGTAGACTGTTTCAGTGGAAAGATCTAGAACTCAAGGGCTGCCCCTCAGATCCTTTTGTCCCACAGGGTGATCCCTTGATGTGGTGCTCACCCCCTTTCCCTAAGGATGGGGCTTCCTGAGAGCCAGACTGCAGTGATTGCCATTGCCCTTCTGGGTCTATCCACCCAGCAGAATTACTGGGATCTGAACTGGTGCTGAGGAATGTCTGCAAAGAGTCCTGTGATGTGATCTGTCTTCAGGTCTCCCAGCCATGGATACCAGCACCTGCTCCA
GTGCAGGTGGCAGGGGACTTAAGTGGATTCTGTGAGGGTCCTTGGTTGTAGTTTTCTTTCGTGCACTGGTTTTCTCAAACGCTGGTTATGCGAGCAGTGAAGTTGTCATGTGGACAGACTCAGGACCTCTGGTTAGCCAGGATGTTGCAGGCAGTGGAATTAGTTGTTGTTTTCTCTTTCTTTGGAGCAGGGTTCTTCTGTTATGAGTTGCTATAATGGCGTGAGTTGGTTGGTCTCCAGCCAGGAGGTGGCACTTTCAAGAGAGGAGGTGGCACTTTTGAGGTGCTTTCCCCTTCCACTGCCACCAGCTGCGGTAGTAGAAGGGGGATTACAAGGTTGCCCTACGTTGGCCAGGGTATTTGGGTTTCTCAGGTTATGGGCGGGGCCATAGAGCTCCCAAGAGTTTATGTCTTTTGTCTTCAGCTACCAGCAAAGGTAGAGAAAGACCATCAGGTTGGGGCAGCATTAGGCATATCTGAGCTCAGACTCTCCTCGGGTGAGGCTTGCTGTGGCCACTGTGGGGGAATAGGGGGCTGGTTCTCAGGCCAGTGGAGTTCTGTTCCCAGGGGTATTATGGCTTCCTCTGCTGTGTCATACAGGTTGCTAGGGAAGTTGGGAAAGCTGGCAGTCACAAGCCTCACCTAGCTCCCATGCAGCCAGCAAGGCCAGTCTCACTCCTGCTGTGCCCTGCCAACAGTGCGCAGGGCAGAGATCTCACCCCAGGCCACAAGCCTTCTCTCTGAGAAAGCAAACAGGGCTTTCAGGCCTTGCCCCTCCCCACCTGCCCACACTGTTGGCTGTGGCTTCTGTGCTTTTATCTGCACTTCTTGTTTGCCCCCAAGATTCTGCTCAGGAAAATTCATGCTTCTAGTTGAAATTAATAAGTTGAGCTAGAAGCTTCCTTAATCCTGCCCCTCCCTAATTCCACTGGCTTCCTTCTACAAGGACCCCTGTAGGATAAAGTCAGGAATGGCTTCCCTGGGCTCAAGCTGGGGACAGGGAGTGGCTACAGGGCTCTTCCCACTGCTTCTTCTACTTTTACATTTCACTTGGCTCCCTAAATCCACTTGCGCTCTAGGTAAGGTTAAATCCTTCTCCTATGATCTGGATGTTCAGGTCCCCAGAGAGGATGTGTGTTCAGAGGCAGACTTTCCCCTTCTCACACTTTGGGAACTCACAGTTTTGCAGCTGTCTCATGGAGTTTGCAGTAGCATTCTGCTTCTTTCAAAGGTCTGTGAATTCTTTTGGTTTTTCTGGTATGTTCCAGCAGTAGTTCTTGGAGCAACAGTTAACAATGTGAGTCTCCACACACTGTTCTGTCCATCCAAGTGGGAGCTGTACCTAAGTCCTGTCTCTTATCTGCCATTTTCAGAAAATCTCATTTTGTTCCTTTTCCATCAAGCATCTTTCCACACCAGTAGCTCTGACTGTGTCCAGGTTCTTTCTTTGAAAACCAGCCCCTCCACTCCCACTGTATCCTGAAACCCCCAGAGTCAGGCTCACCAAGGGGGCTGAGGAGACTCCAGAACACCCCTCTACTCCTTCTGATTCTCCCTCCCTCTTATGAGCCCTGGGGCTGTCCCTGGGAAGACCTCCACTAGTGCTTATGAAATGGCCCACATTCAATTCAGCTGAGTCAGATAAATCCAGGTGCTGATAAAACCAACATTTTTTTTTTCCCTGAAAGATCTGAGTGTAGGAAGTGTCTAAATTCTTGGTTCTTATTTGACATATGTGACTACAGGTGATCAGGCTTCTGTGGCCTCCCCCAGCAGGCACCCCTGTGGCAGGAGCTGTCCACCTCCTCGTCCATCACTGAAGAGAGAGGCCAGGCTCTTGGACACTTGAAGGAGGTGCCAGCCTGTCTGCTGCCTGTCTTCACACAAAGCAGGGCCCCTACAAATATTCGTGCCTGTGGCCTCACCCGTGGTCTGCAAGTGGCATTGACTAGACATGGGTGACTTGGGGGAGCCCATTCTCTGAAGACACAGCACTGGCGT
CCATTGGAAGCCTGGAGCTGGGGACCCATAGCCTTTCATAGCTGGTGTAAGGAGCCATCTATTCAGAGTAGTGGAGGGCTGGGCTCCATGAGCAAGACCATTCTCTGCACAGGCAGAGAAATTGAAGGACGGAGAGCTGAGTGGCTTGTCCAATGCTATACAAGCACAGAGTGCAGGCAGCTAGAACCAGCGAAAGGAGGAGAATTTGAGGCAATTTGATTCTTCTGGGTTTAGTATGATTCTTAAGGCTAGACAAAACCTAAGGCTTTTCCTGGTCTAAGTCCTGTTTTGTGTTTCGTGTAAAGGGCCTCTTGAGATTTACAAAACAAGACCTCATCTTTAGTTTTTGAACTTGTAGAGGAGTTGCTTCCATCGCAGATCGCTCGTGGCCAGACTCTGGCTCCTTCTGGCTGAAGATGACGCCTTTTGGCTTCAGGAGGATCCTGAACTGGTTAAAGGAGGAATACAATGACCCTCCAATTTATGTCACAGAGAATGGAGTGTCCCAGCGGGAAGAAACAGACCTCAATGACACTGCAAGGATCTACTACCTTCGGACTTACATCAATGAGGCCCTCAAAGGTACGACGGGCCCGCCCTTCCCCAGCGTGCACCTTCCCCTGTTGGAAACATCTGCTATTTGCAGGAGTGTGATACAGCGTCCTTGGGCCACAGTAAGAAGAGAACGATAAGCCTTCTTGCTCCTGTGGGGGTTAAGCTTTGCTTTAGGGCCGCACTCTGAGTTTTTTTCCTTCCTATGTCTAAGCTCAGCAAGCAAGCCCAGTGGCCTGATGCCACCAAACCCTAGTTCCTGGCCTGAGTCACTTGCTCCCCTTGATCCTCCCTGATGTCGGAACAGCAGTGCCCTCCTGAGAATGGTCTGGGTAGGGCCCAGGAGGAGTAGGCTGTGTGGTTGCCTGTAGGGTCTCTTAGTCTCCGAGCAAAAGTTTGAGGCTCTTGGCTCAGCCCTAACAACTTGAGATGGGACCATGAGGATAAGAGAATGGAACAAATGCTGAGTAAAAGAGCAAGCAATGCACCAGCAAAGGAAATGATTAGAAAAATCCTACCCAGCTGAAATATATTCTATCTAAGGGCTATTTTCTACAGGGAGAAGCATTAACATTCTAAGGCACTGACCAAGATCATGGATAGAAGTGTAGGTGACCCAGGGAAATTAGTCCACCCATGTTCCCGACTCCCATTCAGGGCTGAGCCTTTCTAAAGATGCTGGTGGCTCTACATCTCCATCCACAGAGGACCCGCTAACAGTCACTGCATGCAAAGAAAGGGGCAGCTTTCTCACAGAGCTAAAGCCAAAGCTTACCGCCATCTGTGAAGGCGGTGGGGAGAGCAGTAGGCAGACCTGGCTTCCGAAGGCCTGGCAGGAAGCTGCCTTATGAGATAGGAAACTTATGCCTAGTCCTCTGTGTTTGAGCAGCTGTGCAGGACAAGGTGGACCTTCGAGGATACACAGTTTGGAGTGCGATGGACAATTTTGAGTGGGCCACAGGCTTTTCAGAGAGATTTGGTCTGCATTTTGTGAACTACAGTGACCCTTCTCTGCCAAGGATCCCCAAAGCATCAGCGAAGTTCTACGCCTCTGTGGTCCGATGCAATGGCTTCCCTGACCCCGCTACAGGGCCTCACGCTTGTCTCCACCAGCCAGGTGAGATGTGGCTCTGGGAGGGAATAAAGCCTAAGGGTGAAGGGCAGGTGGAAGGGCCTCTCTCAGTCTGTTTTCTTCTAGTTTATTACCCTCCTCTCTGCTGCCCCATCTCCTTCATTCATTCAACAAATGTTTATTTTCTTTGAATGCTCCAGACATTTCCTGGGGTGGAACAAAGGACACTTAGGGTCAATGTTACACCTAGAAACCAGAGCCCTGACCTGGGAATAAGCAGGTCTAGACTCTTCTTCCAGCCCTACCACTAACTTGCTGTGCACTCATAGATAAGAAACCAGGCACATGCTTCAGGGCAGTTATAAGGATCAAATAA
AGGGACCATGAAAGTACAATGCCTGCACCATGTGGGTGCCCCGTATTTGTTAAATGTAAGAGTATAAATCACTACACAAATGTAAATGACAATTATCCAGTTTCAATTATACAGGCTGAGAATCCTTCATCTGAAAATTCAAAATCCAAAATACTCCAAAATCTGAAACTTTTTGAGCATGACTGGCATGACAACACAAATGGAAAATTCAACACCTGACCCCATGTGACAGGTCGCAGTCAAAACACAGTTAAAGCTTTGTTTCATGCACACAATTATTTAACATATTGTATAGAATTACCTTCACACCACGTGGATAAGTTGCATATAAAACATATATGAATTTCATATTTAGACCTGGGTCCCATCCCCAAAATATCTCATTATGTATATGCAAATATTCCAAAATCTTAAAAAATCCCAAATCTGAAACACTTCTGATCCCAAGCAAGCATGTCAGATAAGGGATATTCAACCGTATTCTAATTGCTGATAGAGATGTTTAAAAAATACAACTGCTTAACTTCACTCAGAGGCTCCTGACACACAGTGAAAGGGGATGGGTACCTCCACCTCGGCATCCCGTCAATGGCTGTGCGGATTTGGGGTACCGTGCAGCCTCTGCTGGGGTCTCAGAGATCTGAGAACTCAAATCAGCGCCAGAGCACCAACCACCCTGTGTCACACTCTCCTAGATGCTGGACCCACCATCAGCCCCGTGAGACAGGAGGAGGTGCAGTTCCTGGGGCTAATGCTCGGCACCACAGAAGCACAGACAGCTTTGTACGTTCTCTTTTCTCTTGTGCTTCTTGGAGTCTGTGGCTTGGCATTTCTGTCATACAAGTACTGCAAGCGCTCTAAGCAAGGGAAAACACAACGAAGCCAACAGGAATTGAGCCCGGTGTCTTCATTCTGATGAGTTACCACCTCAAGTTCTATGAAGCAGGCCTAGTTTCTTCATCTATGTTTACCGGCCACCAAACACCTTAGGGTCTTAGACTCTGCTGATACTGGACTTCTCCATAAAGTCCTGCTGCACCGTTAGAGATGACTTTAATCTTGAATGATTTCGACTTGCTGAGTAAAATGGAAATATCTCCATCTTGCTCCAGTATCAGAGTTCATTTGGGCATTTGAGAAGCAAGTAGCTCTTGCGGAAACGTGTAGATACTGGTCTAGTGGGTCTGTGAACCACTTAATTGAACTTAACAGGGCTGTTTTAAGTTTCAGAGTTGTTAAGGGTTGTTAAGGGAGCAAAAACCGTAAAAATCCTTCCTATAAGAAGAAATCAACTCCATTGCATAGACTGCAATATCATCTCCTGCCCTTCTGCAAGCTCTCCCTAGCTTCACATCTTGTGTTTTCCAGAAAATAAAAACAGCAGACTGTCCTTTCTCCTA', u'desc': u'chromosome:GRCh38:2:135787840:135837180:-1'}
# Fetch the external cross-references (xrefs) registered for the gene
# identified by lct_id.
lct_xrefs = do_request(ensembl_server, 'xrefs/id', lct_id)
for xref in lct_xrefs:
    # First the display name of the source database, then the full record.
    print(xref['db_display_name'])
    print(xref)
Vega gene {u'display_id': u'OTTHUMG00000131738', u'description': None, u'db_display_name': u'Vega gene', u'info_text': u'Added during ensembl-vega production', u'info_type': u'NONE', u'primary_id': u'OTTHUMG00000131738', u'synonyms': [], u'version': u'2', u'dbname': u'Vega_gene'} Vega gene {u'display_id': u'LCT', u'description': None, u'db_display_name': u'Vega gene', u'info_text': u'', u'info_type': u'NONE', u'primary_id': u'OTTHUMG00000131738', u'synonyms': [], u'version': u'1', u'dbname': u'Vega_gene'} Havana gene {u'display_id': u'OTTHUMG00000131738', u'description': None, u'db_display_name': u'Havana gene', u'info_text': u'', u'info_type': u'NONE', u'primary_id': u'OTTHUMG00000131738', u'synonyms': [], u'version': u'0', u'dbname': u'OTTG'} Expression Atlas {u'display_id': u'ENSG00000115850', u'description': u'', u'db_display_name': u'Expression Atlas', u'info_text': u'', u'info_type': u'DIRECT', u'primary_id': u'ENSG00000115850', u'synonyms': [], u'version': u'0', u'dbname': u'ArrayExpress'} EntrezGene {u'display_id': u'LCT', u'description': u'lactase', u'db_display_name': u'EntrezGene', u'info_text': u'', u'info_type': u'DEPENDENT', u'primary_id': u'3938', u'synonyms': [u'LAC', u'LPH', u'LPH1'], u'version': u'0', u'dbname': u'EntrezGene'} HGNC Symbol {u'display_id': u'LCT', u'description': u'lactase', u'db_display_name': u'HGNC Symbol', u'info_text': u'Generated via ensembl_manual', u'info_type': u'DIRECT', u'primary_id': u'HGNC:6530', u'synonyms': [], u'version': u'0', u'dbname': u'HGNC'} MIM gene {u'display_id': u' LACTASE; LCT [*603202]', u'description': u' LACTASE; LCT\n;;LAC;;\nLACTASE-PHLORIZIN HYDROLASE; LPH\n', u'db_display_name': u'MIM gene', u'info_text': u'', u'info_type': u'DEPENDENT', u'primary_id': u'603202', u'synonyms': [], u'version': u'0', u'dbname': u'MIM_GENE'} MIM disease {u'display_id': u' LACTASE DEFICIENCY, CONGENITAL [#223000]', u'description': u' LACTASE DEFICIENCY, CONGENITAL\n;;ALACTASIA, CONGENITAL;;\nDISACCHARIDE INTOLERANCE 
II\n', u'db_display_name': u'MIM disease', u'info_text': u'', u'info_type': u'DEPENDENT', u'primary_id': u'223000', u'synonyms': [u'150220'], u'version': u'0', u'dbname': u'MIM_MORBID'} UniGene {u'ensembl_start': 1, u'xref_start': 1, u'display_id': u'Hs.551506', u'score': 31370, u'db_display_name': u'UniGene', u'xref_end': 6274, u'evalue': None, u'info_text': u'', u'info_type': u'SEQUENCE_MATCH', u'ensembl_end': 6274, u'primary_id': u'Hs.551506', u'ensembl_identity': 99, u'synonyms': [], u'version': u'0', u'cigar_line': u'6274M', u'xref_identity': 100, u'dbname': u'UniGene', u'description': u'Lactase'} UniProtKB Gene Name {u'display_id': u'LCT', u'description': u'', u'db_display_name': u'UniProtKB Gene Name', u'info_text': u'', u'info_type': u'DEPENDENT', u'primary_id': u'LCT', u'synonyms': [u'LPH'], u'version': u'0', u'dbname': u'Uniprot_gn'} WikiGene {u'display_id': u'LCT', u'description': u'lactase', u'db_display_name': u'WikiGene', u'info_text': u'', u'info_type': u'DEPENDENT', u'primary_id': u'3938', u'synonyms': [], u'version': u'0', u'dbname': u'WikiGene'}
# Same xrefs endpoint, restricted to the GO external database. The keyword
# arguments are forwarded by do_request as query-string parameters.
# NOTE(review): all_levels='1' presumably also pulls in xrefs attached to
# features linked to the gene -- confirm against the Ensembl REST docs.
refs = do_request(
    ensembl_server,
    'xrefs/id',
    lct_id,
    external_db='GO',
    all_levels='1')
print(lct_id, refs)
(u'ENSG00000115850', [{u'display_id': u'GO:0000016', u'description': u'lactase activity', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0000016', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0004553', u'description': u'hydrolase activity, hydrolyzing O-glycosyl compounds', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'IEA'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0004553', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0005886', u'description': u'plasma membrane', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0005886', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0005887', u'description': u'integral component of plasma membrane', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0005887', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0005975', u'description': u'carbohydrate metabolic process', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS', u'IEA'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0005975', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0009405', u'description': u'pathogenesis', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0009405', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0016020', u'description': u'membrane', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0016020', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, 
{u'display_id': u'GO:0016324', u'description': u'apical plasma membrane', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'IEA'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0016324', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0017042', u'description': u'glycosylceramidase activity', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'IEA'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0017042', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0044245', u'description': u'polysaccharide digestion', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0044245', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0044281', u'description': u'small molecule metabolic process', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'TAS'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0044281', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0004553', u'description': u'hydrolase activity, hydrolyzing O-glycosyl compounds', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'IEA'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0004553', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}, {u'display_id': u'GO:0005975', u'description': u'carbohydrate metabolic process', u'db_display_name': u'GO', u'info_text': u'Generated via main', u'linkage_types': [u'IEA'], u'info_type': u'DEPENDENT', u'primary_id': u'GO:0005975', u'synonyms': [], u'version': u'0', u'dbname': u'GO'}])
# Query the homology endpoint for lct_id, asking for orthologues only and
# passing sequence='none' in the query string.
hom_response = do_request(
    ensembl_server,
    'homology/id',
    lct_id,
    type='orthologues',
    sequence='none')
# Debug aid: print(hom_response['data'][0]['homologies'])
homologies = hom_response['data'][0]['homologies']
for homology in homologies:
    target = homology['target']
    # Every target species is listed; only the horse entry is shown in detail.
    print(target['species'])
    if target['species'] == 'equus_caballus':
        print(homology)
        print(homology['taxonomy_level'])
        # Remembered for the follow-up lookup of the horse gene.
        # NOTE(review): horse_id stays unbound if no horse entry is returned.
        horse_id = target['id']
pan_troglodytes gorilla_gorilla pongo_abelii nomascus_leucogenys papio_anubis macaca_mulatta chlorocebus_sabaeus callithrix_jacchus tarsius_syrichta otolemur_garnettii microcebus_murinus ictidomys_tridecemlineatus rattus_norvegicus oryctolagus_cuniculus oryctolagus_cuniculus ochotona_princeps dipodomys_ordii cavia_porcellus mus_musculus oryctolagus_cuniculus myotis_lucifugus ailuropoda_melanoleuca felis_catus canis_familiaris sus_scrofa sorex_araneus ovis_aries bos_taurus tursiops_truncatus sus_scrofa pteropus_vampyrus mustela_putorius_furo erinaceus_europaeus vicugna_pacos equus_caballus {u'taxonomy_level': u'Boreoeutheria', u'target': {u'perc_pos': 92, u'id': u'ENSECAG00000018594', u'protein_id': u'ENSECAP00000016483', u'perc_id': 86, u'cigar_line': u'329MD258MD1264MD76M', u'taxon_id': 9796, u'species': u'equus_caballus'}, u'source': {u'perc_pos': 92, u'id': u'ENSG00000115850', u'protein_id': u'ENSP00000264162', u'perc_id': 86, u'cigar_line': u'351M2D1503MD73M', u'taxon_id': 9606, u'species': u'homo_sapiens'}, u'method_link_type': u'ENSEMBL_ORTHOLOGUES', u'dn_ds': 0.22114, u'type': u'ortholog_one2one'} Boreoeutheria dasypus_novemcinctus choloepus_hoffmanni echinops_telfairi loxodonta_africana procavia_capensis tupaia_belangeri sarcophilus_harrisii macropus_eugenii monodelphis_domestica ornithorhynchus_anatinus ornithorhynchus_anatinus petromyzon_marinus meleagris_gallopavo anolis_carolinensis ficedula_albicollis pelodiscus_sinensis gallus_gallus taeniopygia_guttata anas_platyrhynchos latimeria_chalumnae astyanax_mexicanus oryzias_latipes takifugu_rubripes gasterosteus_aculeatus tetraodon_nigroviridis poecilia_formosa poecilia_formosa danio_rerio gadus_morhua xiphophorus_maculatus xiphophorus_maculatus oreochromis_niloticus danio_rerio lepisosteus_oculatus gasterosteus_aculeatus takifugu_rubripes tetraodon_nigroviridis takifugu_rubripes xenopus_tropicalis xenopus_tropicalis ciona_intestinalis ciona_savignyi ciona_savignyi drosophila_melanogaster 
caenorhabditis_elegans caenorhabditis_elegans
# Look up the record for the horse gene ID captured in the homology loop.
horse_req = do_request(
    ensembl_server,
    'lookup/id',
    horse_id)
print(horse_req)
{u'assembly_name': u'EquCab2', u'display_name': u'LCT', u'description': u'lactase [Source:HGNC Symbol;Acc:HGNC:6530]', u'seq_region_name': u'18', u'logic_name': u'ensembl', u'object_type': u'Gene', u'start': 19610968, u'id': u'ENSECAG00000018594', u'source': u'ensembl', u'db_type': u'core', u'biotype': u'protein_coding', u'end': 19657160, u'species': u'equus_caballus', u'strand': -1}
# TODO: maybe examine the synteny of MCM6 and LCT with horse (caballus) and gorilla