Last active
January 11, 2016 18:24
-
-
Save kescobo/3f9c663daafd79615b5f to your computer and use it in GitHub Desktop.
Files and code for Biopython issue #747
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
LOCUS BW77_ACAGTG.R1_(paired)_contig_93 233 bp DNA linear UNK | |
DEFINITION Contig BW77_ACAGTG.R1_(paired)_contig_93 from Arthrobacter sp. | |
BW77 | |
ACCESSION unknown | |
FEATURES Location/Qualifiers | |
source 1..233 | |
/mol_type="genomic DNA" | |
/db_xref="taxon: 6666666" | |
/genome_md5="" | |
/project="bewolfe_6666666" | |
/genome_id="6666666.134544" | |
/organism="Arthrobacter sp. BW77" | |
BASE COUNT 43 a 68 c 71 g 51 t | |
ORIGIN | |
1 tagtagtaca ccgccagcgg gccgttaggc cccgcgatca cctggaccgg ggtttcgaaa | |
61 acctcggaca ggatttcgtc attcatgatc cgttccggcg agccgaactg gacgaccttg | |
121 ccgtgcttca ttgcgcagat gtagtccgcg taatggccgg cgaagttaat atcgtgcagc | |
181 acgatcacga tggtgcggtt cagctcctgg gcggcccgct tcaggtgctg cat | |
// | |
LOCUS BW77_ACAGTG.R1_(paired)_contig_65 27499 bp DNA linear UNK | |
DEFINITION Contig BW77_ACAGTG.R1_(paired)_contig_65 from Arthrobacter sp. | |
BW77 | |
ACCESSION unknown | |
FEATURES Location/Qualifiers | |
source 1..27499 | |
/mol_type="genomic DNA" | |
/db_xref="taxon: 6666666" | |
/genome_md5="" | |
/project="bewolfe_6666666" | |
/genome_id="6666666.134544" | |
/organism="Arthrobacter sp. BW77" | |
CDS 256..387 | |
/db_xref="SEED:fig|6666666.134544.peg.3335" | |
/translation="MHAETNKSKTGKPVLDAPDGDAKTAARPAQYPFGHVDVKQKTV" | |
/product="hypothetical protein" | |
CDS complement(656..1228) | |
/db_xref="SEED:fig|6666666.134544.peg.3336" | |
/translation="MTGLDLVRDALIEVAVLITDSDLNIIDEGIQVVIKPSDAALAQM | |
GDFVRNMHQVSGLLMELDGGMQMEQAQRLVMDYIRKHVPEPNKALLGGNSVGTDKNFL | |
ARDMPEIIDHLHYRIIDVSTLKELSRRWFTKAHYAAPAKTGNHRALGDIQDSIDELRY | |
YRAAIMVPSPGPTTDQARKIATQISTIDEK" | |
/product="3'-to-5' oligoribonuclease (orn)" | |
CDS 1569..3005 | |
/db_xref="SEED:fig|6666666.134544.peg.3337" | |
/translation="MILFGSFGTGWLASVSPLNRDPFFIMVRTEAAGVTICVMLLTLG | |
CWLLFRAWWRLGQKLKTWGKGSLKIVQRAVMLWSIPMLIALPIMSRDVFAYIGQGRLV | |
DAGQDPYVDGISSLNNWFQLGADTMWAQDGTPYGPLFLTIEYIVVNIVGGSTDAAVLA | |
FRAIAVIGVLLCLRYVPKLAELHSVSGAKATWMTVANPLFLVNFVASAHNDALMTGLS | |
VWAVYLACKRHGFWAIVVLAASIGVKPITLVLLPFIGLLWAGPEAKWPRRFLYWFYSG | |
SIFLVLMTLVGWLNGYWFGWLSVLLNYTGTGVSVVAPLGMLTIALQGIFGSFGMETDW | |
VLSVIKNGGRLLGVGLAIVLMFRGKYSHLVQRMGIAYAAIVVLSPVIQPWYLLWLLPF | |
FAATGLRDDWQMLWLHLTTIFFLAYQAADQIFVWQFLQEDLVPRVQLISWGISILCAL | |
YLVFLDPKTKKICPELLSSTNWLKKKVK" | |
/product="POSSIBLE CONSERVED INTEGRAL MEMBRANE PROTEIN" | |
CDS 3002..4498 | |
/db_xref="SEED:fig|6666666.134544.peg.3338" | |
/translation="MSLLVQKLMRRGVSLKALGWQGFAASVMITVASWGIGWFPRSQL | |
SPLARSGFFIEFRTESWGVISCIILMAAGLAWLTRAWILARPLVDTAQLISSRQLAQL | |
FVKWTAPLMFSFPILSRDVYSYLAQGRMLHADKSPYHEGISALPGWFEGGSDGLWAQS | |
PSPYGPFFLVLSRIIYFVSNGVPEIGVGLLRITALLGVIGCFHFTAKLAKKMGQNPNW | |
ANWAIVGNPLFLLTMIGGAHNDALMIAGVFSAFALAYDRRPLVSTLALAIAVSVKPIV | |
LLVLPFIGLILLGRDKSLRAKCIVWLKVFCYCLIWLTIIGAVTNLWFGWLPAMFTAGD | |
AAFPYAPVGLIGWLLGMLVGVLGGSASLTQSIVVLIFQLVSVVIVAWLSLAKDISRPV | |
RLAAWALSAVILLAPIIQPWYILWMIALFAISHRVSWSSEKLMIYLASLILVVVFVDQ | |
LSIEQWHIVWLMRVFAAVLAVALFAGLFRFDPKTRTVLSGDTGPASIQ" | |
/product="POSSIBLE CONSERVED INTEGRAL MEMBRANE PROTEIN" | |
CDS 4583..5674 | |
/db_xref="SEED:fig|6666666.134544.peg.3339" | |
/translation="MFWPATIAMLGGVLFLGAAGIFLLAIQYHRHGRLSWRRTLTTGA | |
AVIYGFGLFSYTMLPLPETRNAFCRPGVAVPQLQPLNFLNDFALSYELGMRHFLTSFT | |
LWQVLFNVILFMPLGILAVRWLRGNVFLGTLIGLTASLAIELTQYTGIWGLYTCAYRV | |
ADVDDLLMNTFGALLGSIVAYLPIFAWLTGPREQSAAKSGPRKVTRLRRFMANGFDIA | |
FVLGLVMLTTFVLEIAEKLGAPQASYNLTQRWIPTISVLLVFLLPTLMPGRASLGQRC | |
AWIRVAGHGTCPAPAWQAVARSILGLGGISFAFQIADSIWAASPWAWLSALVLGYLLL | |
SSIFLLCDPAGRGIAGRLTGTRFIDRRIH" | |
/product="hypothetical protein" | |
CDS 5806..6585 | |
/db_xref="SEED:fig|6666666.134544.peg.3340" | |
/translation="MDTQQEIPHEPHRAVLGTAVGATVLIAIGAFVLSFAALTDLAER | |
SGIQANLAWIWPIIIDGMIVAATVAIVALNGFNRKAMIYPWSLLFFGAIVSTAANSTH | |
AILTVDSIVNGVPPLVSALVAAMPPIVLLAITHLTVHMYQKKSEAAKLRAAFDYDEEQ | |
INAEKYGVAYDDGYNSALSDAQQAEAERVAQLEQEHQDAIARARAEAIAQSRSEKVTP | |
LKQAQAPAAAPATAKPATATKQAGEDKAPLYEDMAKRLTRP" | |
/product="Phage excisionase # putative" | |
CDS 6644..7741 | |
/db_xref="SEED:fig|6666666.134544.peg.3341" | |
/translation="MDQLTSNTEPEQFSEQIDEAVSRFESVGQELDEVLRAMKSKIRS | |
LFIDSEVQPLFVTGRVKTAESFRAKASRQLQETPDSNPVLEFPNPLREIHDMVGLRII | |
VMLPHEIQQVATLIKAHREDFDCRSDREKDIGSVESGTYGYSSRHLLLKTRNEPSVSR | |
FQTALGKPVVPSGNFVFEVQIRTVLQHAWSEMEHDIRFKHPGEAAWNPQIDRHFTATA | |
AMLETVENYFTDIDDLYHRMNGYHDREGLGTEKLTGEKIGEIWQTLLPHVDRKRDDDW | |
SWAAELLGSHGIDQTWQLAELLDANVVTEVRAALDHRYSPGPDRLLDDVLLWRFGKAH | |
IDKTSGSDLKREASLRRRLIQMKDFRSTQRS" | |
/product="RelA/SpoT domain protein" | |
CDS 7906..9507 | |
/db_xref="SEED:fig|6666666.134544.peg.3342" | |
/db_xref="GO:0005524" | |
/db_xref="GO:0006810" | |
/db_xref="GO:0016021" | |
/db_xref="GO:0016887" | |
/translation="MISVANLELRVGARLLMDEVNFRIDKGDKIGLVGRNGAGKTTMT | |
KVLAGESQPASGNVSLKGSIGYLPQDPKTEDMEQLAKDRILAARGLDVVLNKLAKARD | |
EMASDDASVAKKAMGRYDRLEAEFMAAGGYSAESEAAAICSNLDLPERILEQPLRTLS | |
GGQRRRVELARILYSDAETLLLDEPTNHLDADSITWLRDFIKNYTGGVLMISHDTGLL | |
DATVNKVLFLDANRATVDVYNMNWKRYQTQRETDERARKRERGNIEKKASVLMAQANK | |
MKARASGASAAQSMLKRVDRMLSGLEEVRANDRVAALRFPDPAPCGKTPMMAEGLSKA | |
YGSLEIFTDVSLAIDRGSKVVILGLNGAGKTTLLRMLAGVSEPDTGTIIPGHGLKIGY | |
FAQEHDTLDPDATVLENMRRNAPDHLGDADVRSILGSFMFVGDDVSKPAGVLSGGEKT | |
RLALATIVASSANVLLLDEPTNNLDPASRAEVLGALSSFPGAVVMVSHDEGAVMALKP | |
ERVVILPDGDEDLFNEGYLELVSLT" | |
/product="ABC transporter ATP-binding protein" | |
CDS complement(9624..10532) | |
/db_xref="SEED:fig|6666666.134544.peg.3343" | |
/translation="MYRFLASTRWVGWLLLVVIFAAACAGLGKWQSDRRTEVLTSISH | |
VNNNYDATPVSGDQALDKFNSLPEEDTWMTVELTGQYLSDDTRIVRNRIKASRPGYEV | |
LVPFRTETGTTVIIDRGFLPIGNSEGGRPDTVPAAPAGTVTVNARLKAGEIKLDRGAP | |
DGQLASIHLPAYAAQLPYPISEGAYGIMYEEDPAPATAPQPLDAPDTDEGPHLSYEFQ | |
WYFFGILSFVGFWYAAKQQRKINAEDAAELAEAQALGFEEPIHRVRKLRAKEEKKFRR | |
DGSLTDEAYEDLMLDEDPPKDGDKPQ" | |
/product="Cytochrome oxidase biogenesis protein Surf1, | |
facilitates heme A insertion" | |
CDS complement(10533..10775) | |
/db_xref="SEED:fig|6666666.134544.peg.3344" | |
/translation="MDLLGSLAGASSAPTEVQCSRKGCRAPAAFQILWNNPKIHTPER | |
RKIWLACTEHREWLETYLKERLLYKETLPMGEGATQ" | |
/product="hypothetical protein" | |
CDS complement(10776..11180) | |
/db_xref="SEED:fig|6666666.134544.peg.3345" | |
/translation="MSHQHANHGPKDQPVHRITEARESHTSERDLRIRKYTISMTVRM | |
LCFILAFFFEGWVRWVLLAGAVILPYIAVVIANGGADLTRREPPAEFYSGKEPEQIEN | |
TVRPTVVDEPEIVIIEGTLTDTAPPSDTSKEA" | |
/product="hypothetical protein" | |
CDS 11390..12112 | |
/db_xref="SEED:fig|6666666.134544.peg.3346" | |
/db_xref="GO:0004316" | |
/translation="MSTETTNGRSVLVTGGNRGIGLAIARSFEANGDKVAITYRSGEV | |
PEGLLGVKADVTDSESIDAAFKEVEAAHGPVEVLIANAGVTKDTLLLRMSEDDFTSVI | |
DTNLTGAFRVIKRASKGMLRLKRGRVVLISSVVGLYGSPGQINYAASKAGLVGIARSL | |
TRELGSRNITANVVAPGFINTEMTAVLPEETQKSYLASIPANRFAEPEEVANVVRWVA | |
SDEAAYISGAVIPVDGGLGMGH" | |
/product="3-oxoacyl-[acyl-carrier protein] reductase (EC | |
1.1.1.100)" | |
/EC_number="1.1.1.100" | |
CDS 12152..12901 | |
/db_xref="SEED:fig|6666666.134544.peg.3347" | |
/db_xref="GO:0004319" | |
/translation="MSEYKGAIVTGSSRGIGAVTAQELAAEGLGVVINYRAKAPRANK | |
IVAAIEDKGGKAVAVGADLTTTEGPQALIDAAVENFGTLDVLVLNASGGMETSMGENY | |
ALRLNRDAQVAMLEAALPAMSEGGRVVFVTSHQAHFIKQVSTMEAYDQVAQSKRAGED | |
ALREFIPRLAEKNINFVVVSGDMIEGTITATLLNRMEPGAIDARREAAGKLYSVEEFG | |
AEVAKMVFADVETGHTELVGGAGDFLKQAEQ" | |
/product="Enoyl-[acyl-carrier-protein] reductase [NADPH] | |
(EC 1.3.1.10)" | |
/EC_number="1.3.1.10" | |
CDS complement(12994..13800) | |
/db_xref="SEED:fig|6666666.134544.peg.3348" | |
/translation="MQSLLAAEYLNIYDEQLRTDAETPSAVKVQRLGALRLINFTGGQ | |
GFITYPHIAHTSDTNLAALVGEALAYYLEQPEISDVEWKSRGHDHAPGLHEQLLAHGF | |
VADASESIMVGRAADLSTETPLPAGVTLRQIFSEDDVRAMTAMQDQTFGEAVSTRHAE | |
AILRRLATADGMQLWVAEDSTGTILSAGRLEPVPDTDFAGIWGGATVAAYRGQGIYRA | |
LTAARARAALELGKTLIHSDSTEYSRPILERYGLLKVSTTTPYRWSRTQH" | |
/product="FIG00512199: hypothetical protein" | |
CDS complement(13873..15612) | |
/db_xref="SEED:fig|6666666.134544.peg.3349" | |
/translation="MQTPSPDSSSSPSPSNRPKDQGRNKAKPWIITGSCVVAAAALYF | |
GGAALISAQVPANASIAGVNIGSMSQDDARAALNKSVVPLAAKPFEVQINSQSYKMDP | |
VKAGLSLNVDDTVADLTGYEANPVELIDRLTGKYTATASIDVDQDKLNSQLAALAKKA | |
DSKVTEGDITFAEGKAKLVKPVDGVSLKQDEAAKVLTSDWRIGAPAIELPSEIAKPEI | |
SEDTLQSFYDDKVKALLKDKVSLTSDKKKVDISAAAIAEAASYTPKDGAPAITLDDKK | |
LFKAATTNSEFSSTAKNARITLSGGKPTITKSTTGLALETKGLGAKVLAATETKERTA | |
KVVLKTSEADFTTADAKKLGIKEEIVEFSTPYPTYDKVRTKNLHAGSDRISGTVIKPG | |
ENFSLLQTLGPITVANGYFSSGVVESGFSTEAVGGGLSQISTQLYNVGFLAGYDDVTH | |
KPHSRWFERYPAGREATLWEGQVDMVWKNNTPYGVMIQAWVSGDRVHTRLWSTKYWKV | |
SQKSSGKYNMTNPETRYNPADKCVSESGGQKGFSIDITRNRSTIDGSKTLPPDVKSWT | |
YQPWHKVVCGEKP" | |
/product="Vancomycin B-type resistance protein VanW" | |
CDS complement(15773..16696) | |
/db_xref="SEED:fig|6666666.134544.peg.3350" | |
/db_xref="GO:0004647" | |
/translation="MASTLTLVSRPALPRDRFDELLAQLVNRLPAAAEAIFSVHESAT | |
RWVAKTRIENIDALDLRTEALASFDTLVDSGFFSADEACVTVLDSALTDAKRILLLMD | |
VDSTLIKQEVIELLAAHAGREQEVAAVTEAAMRGELDFAQSLIQRVATLKGLPESVLP | |
EVISRVIYSDGARELVQRMHAAGHIVGVVSGGFQQILDPLAQELKLDHALANTLGITD | |
GLLDGTVHGQIVDRAMKEKMLRAWAAEHGISMSATIAAGDGANDLDMVTAAGLGVAFN | |
AKPALREQAGARIDFSRLDVIADLVLDDFDA" | |
/product="Phosphoserine phosphatase (EC 3.1.3.3)" | |
/EC_number="3.1.3.3" | |
CDS 16805..17245 | |
/db_xref="SEED:fig|6666666.134544.peg.3351" | |
/translation="MTSSPPDAKLADDLLDAIYPLFGMLNKVRSISAGKLGILSLAEE | |
QGKITAAAMKDKLGVSQQAISLAAKELVEMELLVRTKDPGDLRRTWFALTDSGAQKLH | |
AERQLARAVLADVINKNLAPKQQESIRHAIDALTHISRGGHESN" | |
/product="Transcriptional regulator, MarR family" | |
CDS 17232..18623 | |
/db_xref="SEED:fig|6666666.134544.peg.3352" | |
/translation="MNRTNSNLVPTLIFAALSTAIVSSLGMLLVPSIAATYQISVSAA | |
QWMLTVNLLAGAVATPVMGRLSDGPHKKKLLLYSLVIILLGSILAALAPTFGIFLIGR | |
AMQGLTYGIVPVTIALARRYSDPKTVHHAISSLSVTVATGIGIGYPLTGVIAGMFSFQ | |
WAFWFAAVFVFIVIFVVLRIVPDGPDENVPRTKFDFAGALLLAAGLGLLLLGISEGSH | |
WGWISARTVLVLGVAIILLFIWVKTELRIAHPLINLRTLRQGEVLLANFAAIGLGAAL | |
YIGMSVASLVAQAPATTNFGLALPILWAGFVIMPLSVGSLVANRLVHRLGHRVGYPAL | |
LPIGATLFAAAATFLWLAHGALWELLLGMLVFGLGMGASYAAMPALIARSVAAEQLGS | |
SVSFNQVLRTVGSSFGTAVSAAIIAMHADSSGATTGQGVTLSFAVSAIGCILLGLALT | |
VHFFYRKQKSNES" | |
/product="Membrane transport protein" | |
CDS 18687..19478 | |
/db_xref="SEED:fig|6666666.134544.peg.3353" | |
/translation="MSEVLTFNDVSVVRGRKDLLKDVSWEVKEGQRWIVLGPNGAGKS | |
TLMNIAATRLHPTRGTAGILGETMGKVDVFELRPLIGLSSSLVANAIPANETALNVVL | |
TAAYGMTGRWREKYEKLDERRAFSMLHQWGMSTFMNQPFGKLSEGERKRVLIARALMT | |
DPELLILDEPAAGLDLAGREELVAQLTELAANEEAPALVLVTHHLEEIPPGFTHILML | |
NAGEVVAAGEIASTLTEENLKATYGMDLSVREVDGRYSAVARRVN" | |
/product="putative ABC transporter ATP-binding protein" | |
CDS 19494..20300 | |
/db_xref="SEED:fig|6666666.134544.peg.3354" | |
/translation="MIDFWREALILFGGLWAGTINTVVGSGTLVTFPILVALGFAPVN | |
AVVSNAMGLIAGGFSGAWGYRREAASVKKTLLKLVPVSLVGGLIGSLLLLNLPESVFG | |
VVAPVLLVCALVLVIFQPKLSAWAKTRQAQRGGNDPDDADRAKIPTILYVLVFVIGVY | |
GGYFTAAQGVLLMAVFGVFLQASLQQSNAIKVILSLMVNIVAAAMYLLIAPERIHWIV | |
VLLIAVGSLIGGFIGAKVGRKLSPGWLRVIIVILGGIALVNMVYKLVAGA" | |
/product="membrane protein, putative" | |
CDS 20293..21129 | |
/db_xref="SEED:fig|6666666.134544.peg.3355" | |
/translation="MPEIVNPERILHIADLQDARLDEYLRLSEAHLRMRSDVENGLYI | |
AESTTVVSRAINAGHVPRSFLLAEKHLDQLAQEFARFPDVPIFVGSDEQLQDLVGFHL | |
HRGAMASMNRPEPLNLSEVLERSSRIAILEDIADHTNLGAIMRSASGLGVDAVLITPK | |
CVDPWYRRSARVSMGTVFDLPWVRLTSWPQDINILKAHGYTMLAMELTEDAVSLAEVE | |
MTEGKKFAMILGNEGRGVTEETLSLVDQAVMIPMHREVSSLNVGAASAIAFWELCSST | |
PK" | |
/product="rRNA methyltransferase" | |
CDS 21265..21522 | |
/db_xref="SEED:fig|6666666.134544.peg.3356" | |
/db_xref="GO:0003735" | |
/db_xref="GO:0005622" | |
/db_xref="GO:0005840" | |
/db_xref="GO:0006412" | |
/translation="MKADIHPKYGPVVFNDLASGEQFLTRSTRSSDKTVEWADGNTYP | |
VIDVEISAASHPFYTGKQRIMDTAGRVERFNARFKGFGGKK" | |
/product="LSU ribosomal protein L31p" | |
CDS 21622..22677 | |
/db_xref="SEED:fig|6666666.134544.peg.3357" | |
/db_xref="GO:0003824" | |
/db_xref="GO:0006464" | |
/translation="MMHHGEYKVVGGKLVVVDLDSDNGVIVNASLNGDFFLEPDEALE | |
DLNAALNGLPTGASHGTIRDAVNNNLREGAVMFGFDADAVARAVRRSLGHATKWEDHQ | |
WEILGPEIIPVAEQVALDEVLTRQIGTGERKPTIRFWDWDESAVVIGSFQSLKNEVDM | |
EQATHHGIKVVRRISGGGAMFMEAGNCITYSLYAPDSLVDGMSFADSYPFLDAWVMQA | |
LKSLGINAYYKPLNDIATPSGKIGGAAQKRLAKGALLHHVTMSYDIDAQKMVQVLRIG | |
REKISDKGITSAVKRVDPLKSQTSEDRAQIISTMMDTFAARTNATVVELDDITRKAAQ | |
DLAQTKFDTEAWTARVP" | |
/product="Lipoate-protein ligase A" | |
CDS complement(22679..25324) | |
/db_xref="SEED:fig|6666666.134544.peg.3358" | |
/db_xref="GO:0004179" | |
/translation="MDTLERYAPNENLRRDEAAWRAANISWHYAAVELDLSNATQAQE | |
TSYTAITTLNFSSKSPQTFIDYIHESIESIVVNGAEISVADAVLDARIYLDGLRTDAA | |
NTVRITGRSSYSRSGEGLHRFVDPQDGQTYLYTQFEPSEARRVFACFEQPDLKTSYQF | |
TLTGPEDWHLASNQQIIDEMNHGDGTKTVACAPTGPISTYITAVLAGPYHVVRGTHVQ | |
KLADGESLDIEMAATCRASLAEHFDGEEILKLTSQGLDYFHELFDYPYPWGKYDSAFV | |
PEYNLGAMENPGLVTFTERYVFTSQATEAQYEQRANTLMHEMAHMWFGDLVTMAWWDD | |
LWLKESFADYIGTLANDEATEFTTAWTTFAARRKAWAYVADQMPTTHPIVADIPDLLA | |
ADQNFDGITYAKGASVLKQLAAFVGAEAFRDAARAYFRQHEYANTSLEDFLQALEKAS | |
GRDMRSWADAWLKTSGVPKLAVNYTVDDAGILTAANLEQHGIDPISGQAIVRPHVLTV | |
GAYTLTDGVLTRTATQRVELSGDSVALDFLVGQPLPDLILPNVGDETYALIEFDENSL | |
KTLLGNLGSLQESLPRATSWASLWDGVRQSKLASQTYVNAILEHAHTVTDSGVFAMLL | |
DQLVTSISKYVAPELRVSIRERAAEVLTGWLANFEAGSDQQTTTARTLARLARSGVAR | |
EVIDSFLAEEENPYRVTVDEQLRWASYIALAVAGGLDAQAEARMHQAAKRNPTSVAQN | |
AVRTALAARPDTDVKEAAFDTVLMGHDEHGPLSNDALSAIADGFAMGSASLLAGFQSR | |
YWAAILPVFETMSMEFATRVIEGLYPGSQDLTGEPEENPTLQAGNVWLEHHQGAPAAL | |
LRILIEQRAELERSLNAQQHSRASQ" | |
/product="Membrane alanine aminopeptidase N (EC | |
3.4.11.2)" | |
/EC_number="3.4.11.2" | |
CDS complement(25531..26430) | |
/db_xref="SEED:fig|6666666.134544.peg.3359" | |
/translation="MTETWAAKRLSSPDLNVDLRRCAINKGMVELTDSSQAMADETLE | |
WAQNADLVLIPGLGDFTATPPNQYLETIREAHQRGAVVASLCSGAFVLAQTGLLDGLT | |
ATTHWALTDELASRFLEINVDPAVLFVGESRVWTSAGVAAGIDLSIHLIGQFCGSSVA | |
STIARSMVMAPHRTGGQAQFLTTPVAVKHGDGQAMTTVRTLMMKDPTRTLTLSDFAGE | |
ACMSERTFLRRFLAETGSTPHQWAMSWRIDEACKLLEESHGSIAEVSAAVGFGTPVTF | |
RQRFRALKGVSPMEYRQAFRKPE" | |
/product="Transcriptional regulator, AraC family" | |
CDS complement(26622..27272) | |
/db_xref="SEED:fig|6666666.134544.peg.3360" | |
/translation="MYGELSGEGSLCDTLIYMSKIMVGYARVSTEEQDLTAQRDALAS | |
LGVEPERVYVDHGFTGRNKNRAGLHEALAACRAGDTFVVTKLDRLARSVRDAHEIADD | |
LARREIRLSIGGSVHDPTDPMGKLLFNVLAMIAEFEADLISMRTREGMKVAKANGRLR | |
GKQPKLTVKQETHLLELHDAGKHTMTEMAELFSISRSTIYRAVERDQRKKTGTITP" | |
/product="Mobile element protein" | |
tRNA complement(425..497) | |
/db_xref="SEED:fig|6666666.134544.rna.58" | |
/product="tRNA-His-GTG" | |
BASE COUNT 5778 a 7527 c 7776 g 6418 t | |
ORIGIN | |
1 tgagctatac ccaccatgat tacttagtga ctagtcggaa cgctagaagc tcccgaactg | |
61 atttcaagca acgagaaata ctatacatgc atctggggtg aaactaataa tcgggatgtt | |
121 agctacgttt ggggggtaag tcccaaaatg tgtgtacaga aacctctcaa aacaaataac | |
181 cactaggact aacaccacca gtacatgctt tgtaagcatg taccgtggca aaagttgcga | |
241 atcaacccgt ctgcgatgca tgcggaaaca aacaagtcaa aaacgggaaa accagtgctg | |
301 gacgcacccg atggcgatgc aaaaactgcg gcgcgtccag cacaatatcc gtttggacac | |
361 gttgacgtta aacaaaaaac ggtctgatcc aaaacttttg tttcgaatca gaccgtttgt | |
421 ctggggtgag taacggggct tgaacccgcg accttctgga ccacaaccag acgctctacc | |
481 aactgagcta tacccaccat gatcgcttcg acactagtca ctccgctttt gcgaaccaat | |
541 ttcgtatctg gcaacgagaa atactataca catatcgagg gggtgagtgc caacttgaaa | |
601 ggcccctaaa gtgctgtgtt gtgtatcacc tgcattttag gggtctgact agtgattact | |
661 tttcgtcgat ggtactgatc tgggtagcga ttttgcgtgc ctgatcggta gttggtccgg | |
721 gggagggcac catgatggcg gcccggtagt aacgaagctc gtcgattgag tcctggatat | |
781 cacctagcgc gcggtgattg cccgtcttgg cgggagccgc gtagtgcgcc ttggtgaacc | |
841 agcgtcgact caattccttc aaggtggaga cgtcgataat acggtagtgc aggtgatcaa | |
901 tgatctctgg catgtcgcgg gccaagaagt tcttatcggt gcctaccgag tttcctccaa | |
961 gcagggcttt gttgggctct gggacgtgtt tacggatgta atccatcacc agacgttgcg | |
1021 cctgctccat ttgcataccg ccgtccagtt ccatcaacaa gccggagacc tgatgcatat | |
1081 tgcgaacgaa gtcacccatc tgtgccagag ccgcatcgct aggcttgatg accacctgga | |
1141 taccctcgtc gatgatgttc aaatccgaat cggtaatcag taccgctacc tcgatcaatg | |
1201 catcacggac cagatctaaa ccggtcatct cgcaatcgat ccatacaatt ttttctgaat | |
1261 tactagccac ggaaccaatc taccctctgg acagcttgtg gggcagcgca cggcatgaaa | |
1321 gcatcagtga tcttagtgtc acgccggtaa gcacatagca ggcgatgcta aaatcatggg | |
1381 agatttcgtg acgttgaacg atgggcctac tgctggctaa ccggatgcaa cgtcaatctt | |
1441 tttaaacaaa ctttttgtcc aatccagcac gaggtgtcac ggtgtccgct agtaaggcag | |
1501 aagttctagc tccccaacca tacgctggtg taaataagac attgcttagc ggcataatcg | |
1561 gctcctcgat gatcctcttc ggatcctttg gtacgggctg gttggccagt gtttcaccgc | |
1621 tgaaccgcga tccatttttc atcatggtgc gaaccgaggc tgccggtgtc accatttgcg | |
1681 tgatgctctt gacgcttggt tgctggttgc ttttccgtgc gtggtggcgc ctaggacaga | |
1741 agctaaaaac ctggggcaaa ggatcgctca agattgtgca gcgcgcggtg atgctctgga | |
1801 gcattccaat gcttatcgcc cttcccatca tgagccgcga cgtttttgct tacattggac | |
1861 aaggccgtct agttgatgcc ggacaagatc cttacgtaga tggcatttca agtctgaata | |
1921 actggttcca gctaggtgcc gataccatgt gggctcaaga cgggaccccc tatggtccgc | |
1981 tgttcttgac cattgaatac atcgtcgtca acatcgttgg cgggtctacc gatgcggctg | |
2041 ttcttgcctt ccgcgccatc gcggtcatcg gtgtcctact atgcctgcga tatgtgccca | |
2101 agctggccga actacattcg gtttccggcg ccaaagcgac gtggatgacc gtggcgaacc | |
2161 cgctgttcct agtgaatttt gtggccagtg cgcataatga tgcgctgatg acgggtctat | |
2221 cggtgtgggc cgtgtacttg gcttgtaaac gacacggctt ttgggcgatt gtggtgctcg | |
2281 cggcctctat cggcgtcaag ccaataactc tggtattgct gccgtttatc ggtttgctct | |
2341 gggcaggtcc ggaggccaaa tggccgcgcc gattcctgta ttggttctac tccggttcca | |
2401 tattcttggt tctgatgacc cttgtgggct ggctgaatgg ctactggttt ggttggctca | |
2461 gtgtgttgct gaactacacc ggtactggtg tctctgttgt tgctcctcta gggatgttaa | |
2521 ccatcgcatt gcagggcatt tttgggtcat ttggcatgga aactgactgg gtactgtcgg | |
2581 tcataaaaaa tggtggccga ttgctcggtg tgggtcttgc tattgttctg atgttccgtg | |
2641 ggaagtactc acatctggtc caacgcatgg gcattgcata tgcggcaatt gtggtgcttt | |
2701 ctccggtaat ccagccatgg tatttgttgt ggttgttgcc cttcttcgcg gcgaccggat | |
2761 tacgtgatga ctggcagatg ctctggttgc acctcaccac gatattcttc ttggcctacc | |
2821 aagctgcgga tcaaattttt gtctggcagt tcctccaaga agacctggtg ccacgagtgc | |
2881 aattgatctc ctggggaatt tcgatcctct gtgcgctgta tctggtcttt ttagatccca | |
2941 agactaaaaa aatatgtccc gagctcctga gctccacaaa ctggctgaaa aagaaagtca | |
3001 agtgagtttg ctggtgcaaa aactaatgcg acgtggcgtg tcgctgaaag ctctgggctg | |
3061 gcaaggcttt gccgcttcgg tgatgatcac cgtggcttct tggggcatcg gctggtttcc | |
3121 gcgtagtcag ctctccccgc tcgctcgcag cggatttttt attgaattcc gcaccgaatc | |
3181 atggggtgtt attagttgca tcatcttgat ggcggcaggg ctggcatggc tgaccagagc | |
3241 ttggattctc gctcgtccgc tggttgatac tgcacaactg atcagctcac gacaattggc | |
3301 gcaactgttc gttaagtgga cggcgccatt gatgttttcc ttcccaattc tcagccgaga | |
3361 tgtttactcg tatctggcac aaggtcgaat gcttcatgcc gataagtctc catatcatga | |
3421 gggtatttcg gctttgcctg gctggtttga aggtggctcg gacgggctct gggcacaatc | |
3481 gccttccccc tatggtccat tcttcttggt actctcacga attatttatt ttgtctccaa | |
3541 cggggttcct gaaattggag tagggctgct gcgcattacc gcgttgctcg gggtcatcgg | |
3601 ctgttttcac ttcaccgcca aactagcgaa aaaaatgggg cagaatccaa actgggctaa | |
3661 ctgggccatt gtaggaaatc cactgttttt attgaccatg atcggtggcg cacacaacga | |
3721 cgcgttgatg attgccggag tgtttagcgc tttcgcattg gcctatgacc gtcgtccttt | |
3781 ggtatccacg ttggctctag ctatcgcggt gtctgtgaaa ccgattgtgc tcttggtgct | |
3841 gccatttata gggctgatct tgttaggtcg cgataagtca ttgcgcgcta aatgcatagt | |
3901 ttggctgaag gtattctgct attgcctgat ctggctaact atcattggcg cggtgacgaa | |
3961 cctctggttt ggatggttgc cggccatgtt caccgccgga gacgcagcct tcccctacgc | |
4021 tccggtgggc ttgattggtt ggttgcttgg catgctggtg ggagtgttgg gcggctcggc | |
4081 gagcctgaca cagagcatcg tggtgcttat ttttcagctt gtttctgtgg tgatcgtggc | |
4141 gtggctttca ttggctaaag atatttctcg gccggtgcgt ctggccgcgt gggcattatc | |
4201 tgcagtgata ttgctcgccc cgatcattca gccctggtac atcttgtgga tgatcgcgct | |
4261 cttcgcgatc tcacaccgtg tctcgtggtc ctccgagaag ctgatgatct atttggctag | |
4321 ccttattctt gtggtggtct tcgtggatca actatccatt gagcagtggc acatcgtgtg | |
4381 gttgatgcgg gtgtttgcgg cggtactggc ggtggcttta tttgccggcc ttttccgctt | |
4441 cgacccgaaa actcgcactg tcctgagtgg agacacagga ccagcttcca ttcagtaagc | |
4501 atccagccaa caatagctgg gctcacacca gacgtcacag gttgtgcgca tttttctcgg | |
4561 cttagataga aatatgcaaa cgatgttttg gcccgcgact atcgccatgc ttggcggtgt | |
4621 cctcttctta ggcgcagccg gtattttcct gctcgccatc cagtatcacc gccatggacg | |
4681 cctatcgtgg cgacggacgc tgaccaccgg tgccgcagta atctacgggt ttggcctctt | |
4741 cagctacacc atgctgccgc tacccgaaac acgtaacgca ttttgtcggc ccggggtagc | |
4801 cgttccgcag ctgcaaccgc tgaacttcct caatgacttt gcgctctcct acgaactggg | |
4861 gatgcgtcac tttttgacca gttttacgct ctggcaggtc ctttttaatg tgatcttgtt | |
4921 catgccgctc ggtatcctgg cggtccgctg gctgcgtggc aacgtatttc tgggcacgct | |
4981 catcgggctc accgccagtt tggccatcga actgactcag tacaccggaa tttggggcct | |
5041 gtatacctgc gcctaccgag ttgccgacgt cgatgatcta ctgatgaaca ccttcggtgc | |
5101 gctgcttgga tccatcgtgg cttacctgcc aatctttgcg tggcttaccg gaccacgaga | |
5161 acaaagtgcc gcgaagtccg gaccgcgtaa ggtcaccaga cttcgccgct ttatggccaa | |
5221 cggcttcgat atcgcttttg tccttgggct ggtgatgctc accaccttcg tgctggagat | |
5281 cgccgaaaaa cttggagccc cgcaggcctc ctacaacctg acgcagcggt ggattcccac | |
5341 gatctcggtg ctgctggtct tcttgcttcc aaccctgatg ccaggccgcg cgagcctagg | |
5401 gcagcgctgt gcctggattc gagtggccgg acatggcacg tgtccagcac ctgcatggca | |
5461 ggcagtggcg cgcagcattc tgggtctcgg cggaatctct ttcgctttcc aaattgccga | |
5521 cagcatctgg gctgcaagcc cctgggcctg gctcagtgca ctggtacttg gctacctgct | |
5581 gctgagctcg attttcctct tatgcgatcc ggccggccgc ggaatagccg gtaggctcac | |
5641 cggcaccaga ttcattgatc ggcgaattca ctaatcgttc accaccaagc tgtcagctga | |
5701 tggggctaaa atagtcccgg tggccggtac ccgatacgac tggcaaccac attcgcttct | |
5761 aagacgttcc gattcatctc tccaaagtta ggcctgcccc gcagtatgga tactcagcaa | |
5821 gaaattccgc acgaaccgca ccgcgccgtc cttggcaccg ccgtaggagc cacggtcctg | |
5881 atcgcgattg gtgcattcgt actatccttc gcggcgctaa ccgacttggc cgaacgctcc | |
5941 ggcattcagg cgaacctggc ctggatctgg ccaatcatca ttgacggcat gatcgtggcg | |
6001 gccaccgttg ccatcgtggc gctgaacggc ttcaatcgta aagccatgat ctacccgtgg | |
6061 tctttgctgt tcttcggcgc tatcgtctcg accgcagcaa actccaccca cgcgatcctt | |
6121 accgtggatt ccatcgttaa cggtgtgcca ccgctggtat cggccctcgt tgcggccatg | |
6181 ccacccatcg tgttgctggc catcacccac ctgaccgtgc acatgtacca gaagaagtct | |
6241 gaagctgcga agcttcgcgc cgccttcgac tatgacgaag agcagatcaa cgcagagaag | |
6301 tacggcgtcg cctacgacga cggttacaac tcggcacttt ctgatgcaca gcaggcggaa | |
6361 gccgagcgag tggctcagct ggaacaagag caccaggatg ccatcgcccg agcccgcgcc | |
6421 gaggccatcg ctcagtcgcg ctcggaaaag gtcaccccgc tgaagcaggc tcaagctcca | |
6481 gctgcggctc cggcaaccgc taagcctgcg accgctacta agcaggctgg cgaagacaaa | |
6541 gccccgttgt acgaggacat ggctaagcgc ctgactcgcc catagctagg acgcgcaccg | |
6601 catcgatcac ccacggcatt tcagcacatt aggaggcacc accatggatc aattgaccag | |
6661 caacaccgaa ccggaacagt tcagcgaaca aatcgacgag gcggtgtctc gttttgaaag | |
6721 cgtggggcag gaactcgatg aggtgctgcg ggcgatgaaa tcaaaaattc gctcgttatt | |
6781 tattgatagt gaagtgcaac ccttgtttgt gaccgggcgg gtgaaaaccg ccgagtcttt | |
6841 ccgcgccaag gcttcgcgcc agttacagga aactcctgat tcaaacccgg tattggagtt | |
6901 ccctaacccg ctccgggaaa tccacgacat ggtgggtttg cgcatcatcg tgatgcttcc | |
6961 ccatgaaatc cagcaggtag ccacgctgat caaggcgcac cgcgaggact ttgattgccg | |
7021 cagcgatcgt gagaaagaca tcggttcggt ggaatccgga acctatggtt actcctcacg | |
7081 gcacctgctg ctcaaaaccc gaaatgaacc gagcgtgtct aggttccaaa cggctttggg | |
7141 taaaccagtg gtacccagcg gcaacttcgt ttttgaggtg cagatccgca cggtgctcca | |
7201 gcacgcatgg agcgagatgg aacatgacat ccgctttaag catcctggag aagccgcgtg | |
7261 gaacccgcag atcgacaggc atttcaccgc caccgcggcc atgctcgaaa cggtggaaaa | |
7321 ctacttcacc gacatcgatg atctctacca tcggatgaat ggatatcacg accgtgaagg | |
7381 cttgggcacc gagaagctga ccggcgaaaa aatcggcgaa atctggcaga ccctgcttcc | |
7441 gcacgtggac cgcaagcgcg acgatgactg gtcctgggcc gccgaattgc tcggctccca | |
7501 tggcatcgat cagacctggc agctggctga acttttggat gcaaatgtag tcaccgaggt | |
7561 ccgtgccgca ctggatcacc ggtattctcc ggggccagat aggctgcttg acgacgtgtt | |
7621 gctttggcgt tttggcaagg cacatatcga taagaccagt ggctcggatt tgaaacgcga | |
7681 agcctcgctt cgtcgcagac tgatccaaat gaaagacttc cgctccacgc agcgcagcta | |
7741 gcacaactgc ccggcaccca atattgggtg ccgggcagtg agcgttaaga tgttggttcg | |
7801 cacacagtaa gcctgatccc gcctatacga ccggtaggat agacaagttg ccctttatat | |
7861 gggcgaatag tttttcctta ccccgttttg aaagggccac accatatgat ttccgtagcc | |
7921 aaccttgagc tacgcgtcgg cgcccgcttg ctgatggacg aagtaaattt ccgcatcgac | |
7981 aagggcgaca agatcggact ggtgggtcga aacggtgccg gtaagaccac catgaccaag | |
8041 gtcttggccg gagaatccca gccggctagc ggtaacgtct cgctgaaggg ttccattggc | |
8101 tacctgccac aggatccgaa gaccgaagac atggagcagc tggcgaagga ccgtatcctc | |
8161 gccgctcgtg gcctagacgt tgtactcaat aagctggcta aggcccgcga tgagatggct | |
8221 agcgatgacg cgtccgtagc gaagaaggcc atgggccgat atgaccgtct ggaagccgaa | |
8281 tttatggctg ccggcggcta ctccgccgaa tccgaagccg cggccatctg ttctaacctg | |
8341 gatttgccag aacgtattct tgagcagcca ttgcgcaccc tatccggtgg ccagcgccgc | |
8401 cgtgtggagc ttgcccgcat cctttactcg gacgccgaaa cgctgctgct cgatgagcca | |
8461 actaaccact tggatgccga ttccatcacc tggttacgtg acttcatcaa gaactacacc | |
8521 ggcggcgtgc tgatgatcag tcacgacacc ggcctgttgg atgccaccgt gaacaaggtg | |
8581 cttttccttg acgctaaccg cgccaccgtt gatgtgtaca acatgaactg gaagcgttac | |
8641 cagacccagc gcgaaaccga tgagcgtgct cgtaagcgcg agcgcggcaa cattgagaag | |
8701 aaggcttcgg tcttgatggc tcaggctaac aagatgaagg ctcgtgcttc cggtgcttcc | |
8761 gccgcgcaat cgatgctcaa gcgagttgac cgcatgcttt cgggcctgga agaagtgcgc | |
8821 gcgaacgacc gtgttgcagc tttgcgcttc ccggatcctg ccccttgtgg caagacccca | |
8881 atgatggccg agggcctatc caaggcctat ggatccctgg aaatcttcac cgatgtgtcg | |
8941 ctggctatcg accggggttc aaaggtagta atcctgggcc ttaacggcgc gggtaagacc | |
9001 accttgctgc gtatgcttgc cggagtttcg gagccagata ccggaacgat catcccggga | |
9061 cacggtttaa agatcggtta cttcgcacag gagcacgaca ccctggatcc agacgcgacg | |
9121 gtgcttgaaa atatgcgtcg caacgccccg gatcacctcg gtgatgccga cgtgcgttcg | |
9181 attcttggtt ccttcatgtt tgttggcgat gacgtctcga agccagccgg agtactctcc | |
9241 ggtggtgaga agacccgtct ggccttggcc accatcgtgg cttccagcgc taacgtgctg | |
9301 ttactcgatg agcctactaa caaccttgac ccggcctcgc gcgccgaggt acttggtgcg | |
9361 ctatccagct tcccaggcgc cgtagtgatg gtcagccacg atgagggcgc cgtgatggca | |
9421 ctgaagcccg agcgtgtggt catcctgcct gatggcgacg aggacctgtt caacgagggc | |
9481 tatctggaat tggtctcact gacctaagcc agtacagctt aaaagccgcg ggtcaccatt | |
9541 ctctaaggat ggtgacccgc ggcttttgtg ttgccctgat gctaaaggac aagcccacga | |
9601 ccggtggtcg tgggcttgtc gccttactgg ggtttgtcgc cgtccttcgg cggatcttca | |
9661 tcaagcatga gatcctcata ggcctcatcg gtcagcgacc cgtcgcgacg gaacttcttt | |
9721 tcttccttcg cacgtagctt gcggacccgg tgaattggtt cttcaaagcc caacgcctgc | |
9781 gcctcggcga gctcggcagc gtcttcggca ttgatcttgc gttgttgctt cgccgcgtac | |
9841 cagaagccga cgaaggataa gatcccaaag aagtaccact ggaactcata ggaaaggtgc | |
9901 ggaccttcat cggtgtccgg tgcatccaag ggctgtggtg ctgtggccgg agccggatct | |
9961 tcctcataca tgatgccgta ggcaccttcg gagatcgggt aggggagttg cgcggcgtag | |
10021 gcgggcagat gaatggatgc gagctggcca tcgggggccc cacgatccag tttgatctcg | |
10081 ccggccttca aacgtgcgtt cacggtgacc gttccggcag gagcagcggg aaccgtatcg | |
10141 gggcgaccgc cttcggaatt gccgataggt aggaagccac ggtcgataat taccgtagtg | |
10201 ccggtttcgg tgcggaacgg aaccagcacc tcataacccg ggcgggaggc cttaatccgg | |
10261 ttgcgcacga tacgcgtgtc atcgctgagg tactgaccgg tgagctcaac agtcatccag | |
10321 gtgtcttctt caggcaatga attaaacttg tccagcgcct gatcaccgga aacaggtgtg | |
10381 gcgtcgtagt tgttgttcac gtgggaaatg ctggtgagca cttcggtgcg acggtcagac | |
10441 tgccatttac ctagccccgc acaggctgca gcaaaaatga cgacgagtag caaccagcca | |
10501 acccagcggg tgctggccaa aaaacggtac atttactgag tagctccttc gcccatgggc | |
10561 agggtttcct tatagagcaa acgctccttc agataggttt ctaaccactc gcggtgctca | |
10621 gtacaggcca accagatctt tcggcgctcg ggagtatgaa tctttgggtt attccataaa | |
10681 atctgaaaag ctgccggcgc ccggcatccc ttacgcgagc attgaacttc ggtaggcgca | |
10741 gaactcgcgc ctgctaatga accgagaaga tccatttatg cctccttaga cgtatcggac | |
10801 gggggagcag tatcggtcag tgtgccctcg atgatcacga tctctggttc gtccaccaca | |
10861 gttggccgga ccgtattttc gatctgttcc ggctccttgc cactataaaa ttctgcggga | |
10921 ggttcgcgcc tagtcaggtc tgctccgcca ttggcgatga ctacggcaat atagggcagg | |
10981 atcactgctc cggcgagcag tacccaccgt acccaccctt caaagaagaa cgccaagatg | |
11041 aagcacagca tacgcacggt catggaaatc gtgtatttgc gtatgcgcag gtcacgctcc | |
11101 gaggtgtgtg actcgcgcgc ttcggtaata cggtgaaccg gctggtcctt cggaccatgg | |
11161 ttcgcatgct ggtgtgacat agctttcgaa cttcgctcaa cggggctatt tctgccttca | |
11221 ttctctcact tgtgcctgtg agaaccgaat ttctacgtgc cgtcgaagct gtaatactgc | |
11281 ggggtaacta ataggattgt tttcagacta gctactgacc taagcaaagt gtctgttttg | |
11341 gtgccccgta accgatggtg tgcgccgacg gcatggatgg agaattacat tgagcacgga | |
11401 aaccaccaac ggccgcagcg tactggtgac cggcggaaac cgcggaattg gcctagccat | |
11461 cgcgcgatcc ttcgaagcca acggtgacaa ggttgccatc acctaccgca gtggcgaggt | |
11521 tcccgaagga ctgctcggcg tgaaggccga tgtgaccgac agcgaatcaa tcgatgcagc | |
11581 attcaaagag gtcgaagcgg cccacggacc ggttgaagtg ctcatcgcca acgccggtgt | |
11641 aaccaaagac acgctgctgc tgcgcatgag tgaagatgac ttcacctcgg tgatcgacac | |
11701 caacctcacc ggcgccttcc gcgtgattaa acgagccagc aagggcatgc ttcgcctcaa | |
11761 gcgtggccgt gtggtgctga tctcttcggt ggttggactc tacggttcac cgggccagat | |
11821 caattacgct gcgtccaagg ccggtcttgt gggcattgcc cgctcactga cccgcgaact | |
11881 tggatcacgt aatatcaccg cgaacgtggt ggccccaggc tttatcaaca ccgaaatgac | |
11941 cgcggtactt ccagaagaaa ctcagaagtc ctacctcgcg tccattccgg ccaaccgctt | |
12001 tgccgagcca gaagaggtcg ctaacgtggt gcgctgggtt gctagcgatg aagcggccta | |
12061 catctccggg gcggttatcc cggttgatgg cggccttggc atgggccact aaaactaccc | |
12121 ccaatttttg atatacctaa ggagtaaaaa gttgagcgaa tacaagggtg caatagtcac | |
12181 cggctcgtcg cgcggaatcg gcgcggtcac cgcacaggaa ctggcagcag agggcctcgg | |
12241 agtggtcatc aactaccgcg ccaaggcacc acgtgcgaac aagattgtgg cagctattga | |
12301 agacaagggc ggcaaggccg ttgctgtagg cgccgacctg accaccaccg agggtccaca | |
12361 ggctctcatt gacgcagccg tggagaattt cggcacacta gacgtactgg tgctcaacgc | |
12421 ctccggcggc atggaaacct cgatggggga gaactacgcg ctgcgcttga accgcgacgc | |
12481 tcaggtagca atgctcgaag ccgcgctgcc agcgatgagc gagggcggcc gtgtcgtctt | |
12541 cgtgaccagc caccaggcgc acttcatcaa acaggtttcc accatggaag cctacgacca | |
12601 ggttgcgcag tccaagcgcg ccggtgaaga tgccttacgc gaattcattc caaggctcgc | |
12661 agagaagaat atcaactttg ttgtcgtctc cggtgacatg atcgagggca ccatcaccgc | |
12721 aacgctgctc aaccgcatgg agccaggcgc tattgacgcg cgtcgcgaag cggccggcaa | |
12781 gctgtactcg gttgaagaat ttggtgccga agttgccaag atggtcttcg ctgacgttga | |
12841 aaccggacac accgaacttg ttggtggggc cggagacttc ctgaagcagg ccgagcagta | |
12901 agaacctgct cgccaagtag ttttttgagg cctgtcgttc gctcccgcac cggtggtgaa | |
12961 cgacaggcct ttatgctgca ccgtaagcgc cgtttaatgc tgcgttcggc tccagcggta | |
13021 aggcgtagtg gtggagacct tcagtaggcc gtagcgctcc aaaatgggtc tggaatattc | |
13081 ggtggagtca ctatggatca gtgttttgcc cagttctagg gcggcccgtg ccctcgcagc | |
13141 ggtcagcgcc cgataaatgc cttgcccacg ataggccgca acggttgcgc caccccagat | |
13201 tcctgcaaaa tccgtgtcag gaaccggttc gagtcgaccg gcactaagta ttgttcccgt | |
13261 gctgtcctcg gccacccaca gttgcattcc atccgcggtg gccaggcgac gaagaatcgc | |
13321 ctcggcatga cgggttgata ccgcttctcc gaaggtttgg tcctgcatgg cggtcatcgc | |
13381 gcgaacatca tcttcggaga agatctgacg tagcgtgaca ccagccggta gcggcgtttc | |
13441 ggtactcaga tcggcggctc gcccgaccat gattgactcg ctagcgtccg ctacgaaacc | |
13501 gtgtgcgagt aactgctcgt gcagtcccgg cgcgtgatca tggccccggc tcttccattc | |
13561 gacgtcgctg atttctggct gctccaggta gtaagcgagc gcttcgccga ccagggctgc | |
13621 cagattggtg tcgctggtat gcgcaatgtg cgggtaggtg ataaaccctt gaccgcccgt | |
13681 aaaattgatc agacgtaggg cacctagccg ctgaaccttt acggcgctgg gagtctccgc | |
13741 atcggtacgc aattgctcat cgtaaatgtt tagatattct gcggctagaa gtgactgcac | |
13801 taaaacctcc tgcaggattg aagaacaaaa ggcgcctttt gaaagattca aaaggcgcct | |
13861 tgaaattttg agttatggct tctcgccgca cactaccttg tgccatggct ggtaggtcca | |
13921 gctcttaaca tctggcggaa gggttttgga gccatcaatc gtgctgcggt tacgcgtgat | |
13981 gtcgatgcta aagcccttct gtccaccact ttccgaaaca cacttatcgg ctgggttata | |
14041 ccgggtctca ggattagtca tgttgtactt gcctgagctc ttctggctaa ccttccagta | |
14101 cttcgtgctc cacaagcgcg tgtgtacacg atcgccgctg acccacgcct gaatcatcac | |
14161 gccgtagggg gtgttgttct tccacaccat gtcgacttgg ccctcccaga gggtggcttc | |
14221 gcgacctgct gggtagcgtt caaaccaacg agagtgtggc ttatgcgtga cgtcgtcata | |
14281 tccggcgagg aagccgacgt tgtatagctg ggtggaaatc tgagagagtc cgccgccaac | |
14341 tgcttcggtg ctaaagccgc tttcgaccac accggaactg aagtagccgt tagccacggt | |
14401 aatcgggcct agggtctgca ggagggagaa attctcccct ggcttgatca cggtcccgct | |
14461 gatgcgatct gatccggcat gcaggttctt ggtgcgtacc ttatcgtagg ttggatacgg | |
14521 ggtcgagaat tcaacgatct cttccttgat acccagcttc ttagcatccg cggtggtgaa | |
14581 gtcagcctcg gaggtcttga gaacaacctt tgcggtgcgc tctttagttt cggtggctgc | |
14641 taagactttt gcacccaatc ccttagtctc caaggccaga cccgtggtcg acttggtgat | |
14701 ggttggcttg ccgccggata gggtaatacg tgcgttcttt gcggtgctac tgaactcgga | |
14761 attcgtcgta gctgctttaa agagtttttt atcatccaag gtgatcgctg gtgcgccatc | |
14821 cttgggagtg taacttgcag cctccgcgat ggccgcagcc gaaatatcga ccttcttctt | |
14881 atccgaagtt aagctgactt tgtccttcaa cagggctttg accttgtcgt cgtagaaaga | |
14941 ctgcaaggta tcttcggaaa tttcaggctt ggcaatttcg ctaggcaatt cgatcgccgg | |
15001 tgcgcctatc cgccagtcgc tggtgaggac cttagcagcc tcatcttgtt tcaggctcac | |
15061 cccatctacg ggcttgacca gtttcgcttt gccctcagca aaggtgatat cgccttcggt | |
15121 gacctttgag tcagcctttt ttgctagcgc cgcaagctga gaattcagct tgtcttgatc | |
15181 tacgtcgatg cttgcggtcg cagtgtactt accggtcaaa cggtcgatga gttctaccgg | |
15241 gtttgcctcg tagccggtca gatcagcgac ggtgtcgtca acgttgagtg acagcccggc | |
15301 tttgacggga tccatcttat agctctgaga attgatctgc acttcgaaag gctttgcagc | |
15361 tagcggaaca actgacttgt tcagtgccgc tcgggcatca tcctggctca ttgatccaat | |
15421 gttcacccca gcgatgctgg cgttcgctgg aacttgggca ctaatgagtg cggcgccacc | |
15481 gaaatagagt gctgctgccg ccaccacgca ggaaccagtg atgatccaag gcttggcctt | |
15541 gtttcggcct tggtccttgg gccggttgct tggcgatggc gaggaggaac tgtccgggga | |
15601 gggggtctgc acttgtctgt tagctctttc gaaaagcggt tggggccggg cacgagacgc | |
15661 gaatttttac ttcgccgcgc atcggtgcac caaaagaaat actaactgtt ggaacaaccg | |
15721 atacatggcg ttgtgggggt aaacaccaaa attgttatct acttgttgga tttcacgcgt | |
15781 caaagtcgtc taaaactagg tcagcgatca catctaggcg actaaaatca atgcgcgcac | |
15841 cggcttgttc gcgcaaggct ggtttcgcat taaacgctac acccagtccg gcagcggtga | |
15901 ccatgtccag gtcgttggcg ccatcgccgg cggcaatagt tgctgacatg ctgattccgt | |
15961 gttcggcagc ccaagcgcgc agcatttttt ctttcatcgc acggtcaacg atttgtccgt | |
16021 gaactgtgcc atcaagcaat ccgtcggtaa ttcccagcgt atttgccaac gcgtgatcca | |
16081 atttcagctc ttgagccagg ggatcaagga tctgctggaa tccgccggaa acgacaccca | |
16141 ctatgtgacc agccgcgtgc atccgctgaa ctaattcgcg tgctccgtcg gagtaaatga | |
16201 ctcgtgaaat aacctcgggt aggaccgact ccggtagacc tttgagcgtt gccacgcgtt | |
16261 ggattaagga ctgggcgaag tccaattcac cgcgcatcgc cgcctcggtc acggccgcta | |
16321 cctcttgttc gcgtccggcg tgggccgcga gaagctcgat gacttcctgt ttgatcagtg | |
16381 ttgaatctac gtccatcaag agcaagatgc gcttggcatc ggtcagcgcg ctgtccagaa | |
16441 ccgtaacgca cgcttcgtcg gcggaaaaaa atcctgagtc aaccaaagtg tcaaagctag | |
16501 ctagagcttc ggtgcgcaag tctaaggcgt caatgttttc gatcctggtc ttggcgaccc | |
16561 agcgtgtagc cgactcgtgc acgctaaaaa ttgcctcggc agcggctggg agtcgattaa | |
16621 ccagctgtgc aaggagttca tcaaaacgat cacgggggag tgctgggcgg gatacgaggg | |
16681 tcaaagttga agccatgaac ctattttcgg tggtgcgagc gagtacgacc aaacatgacg | |
16741 tcgaagtaaa cgaggtgaga taaaacatca acccacttgt acaagttagt tgtagaatat | |
16801 ttagatgacc tcatcaccac cagatgccaa gcttgcagat gacctacttg acgccattta | |
16861 tccgttattc ggaatgctca ataaggttcg aagtatttcc gccgggaagc ttggcattct | |
16921 gagtttggct gaggaacaag gcaaaattac ggcggccgcc atgaaagaca agctcggggt | |
16981 aagccaacaa gcgatctcct tggctgctaa ggagctggtt gaaatggaac ttctggtgcg | |
17041 taccaaagat ccgggcgacc tgcgccgtac gtggttcgcg ttgaccgact ccggggccca | |
17101 aaaacttcac gccgaacgcc aactggcacg ggcggtactc gctgacgtga tcaacaaaaa | |
17161 tctcgctcca aaacagcaag aatcgatccg ccacgcaatc gacgcactga ctcatatttc | |
17221 acgcggtggg catgaatcga actaattcca atcttgtccc cacattaatt tttgcggcgt | |
17281 tatccaccgc gattgtcagt tccttgggga tgctcttagt tccgtctatc gcagcgacct | |
17341 accaaatttc ggtcagtgca gctcaatgga tgttgacggt aaacctccta gccggtgcgg | |
17401 tggctacccc ggtgatgggt aggctcagcg atggaccgca caagaaaaag ctcctgctat | |
17461 attcgctggt gatcattctg cttggctcca tcctcgcggc gctggcccct accttcggga | |
17521 tattcctcat aggacgtgcc atgcaggggc tgacctatgg catcgtgccg gtgactatcg | |
17581 ccttagctag gcgttactcg gatcccaaga ccgtgcacca tgcgatttct tcgttatccg | |
17641 tcaccgttgc caccggtatc ggcatcggtt atccactgac cggggtcatc gccgggatgt | |
17701 ttagctttca gtgggccttc tggtttgccg cggtttttgt attcatcgtg atctttgtgg | |
17761 tgcttcggat cgtgcccgac ggacctgatg agaatgtgcc ccgcacaaaa ttcgactttg | |
17821 ccggtgcgtt gctcttggcc gcgggccttg gcttgctctt actggggatc agtgaaggct | |
17881 cacactgggg ctggatttct gctcgtaccg tcctggtact tggagtagca atcatcttgc | |
17941 tgttcatctg ggtgaaaacc gagttgcgga tagctcaccc gctaataaac ctgcgcacac | |
18001 tacgccaagg cgaagtgctg ctagctaact tcgccgccat cggtctcggt gcagccctgt | |
18061 acatcggcat gtccgtggcc agtcttgtcg ctcaagcacc ggcaaccact aacttcgggc | |
18121 ttgcactacc gatcttgtgg gccggatttg tcatcatgcc actatcggta ggcagtttgg | |
18181 tcgctaaccg tctggtgcac cggctcgggc accgcgtggg ctaccccgca ttgttaccca | |
18241 tcggcgcgac actcttcgca gcggccgcca cgttcctctg gctagcgcac ggcgcactgt | |
18301 gggaactgct gctgggaatg ttggtctttg gtctaggcat gggtgccagc tacgcggcca | |
18361 tgccagcact tatcgcgcgg agcgtcgcgg ccgaacaatt gggtagctcg gtaagtttca | |
18421 accaggtgct gcgcaccgtg ggtagttcct tcggtactgc ggtctccgcc gcgatcatcg | |
18481 ccatgcacgc agattcttcc ggtgccacca caggtcaggg cgtcacattg tccttcgcgg | |
18541 tgagcgccat tggctgcatt ttgctcggtc tggcgctgac tgttcatttc ttttatcgca | |
18601 aacaaaagag caacgagtct taatccacat cggcaatggt gttttcaatt agtgaatcag | |
18661 gcaacgaaag tctaggctta aaaaccatga gcgaagtgct aactttcaac gatgtcagcg | |
18721 tggtgcgcgg gcgtaaagac ctgctcaagg acgtgtcctg ggaagtcaaa gaaggccagc | |
18781 ggtggatcgt gctgggcccg aatggcgccg gcaaatcaac cctgatgaac attgcagcca | |
18841 cccgtctgca ccccacccgc ggtaccgcgg gcattctggg agaaaccatg ggtaaggtcg | |
18901 acgttttcga actgcgaccg ttgatcggcc taagctcctc actggtcgcc aacgctatcc | |
18961 cggccaatga aaccgcacta aatgtggttc tcaccgccgc gtacggcatg accggacgct | |
19021 ggcgtgagaa gtacgagaaa ctcgacgaac gccgtgcgtt ctcgatgctc caccagtggg | |
19081 gcatgtccac cttcatgaac cagccttttg gcaagctctc cgaaggtgag cgcaagcgtg | |
19141 tgctgattgc tcgcgcgttg atgaccgacc cggaactgct gattcttgac gagccagctg | |
19201 ccgggctgga cctggcagga cgcgaagagc tcgttgctca gctgactgaa cttgcggcga | |
19261 atgaagaagc tccggctttg gtcttggtca cccaccacct ggaagaaatt ccaccgggct | |
19321 tcacccatat attgatgctt aacgcaggtg aagtagtcgc cgccggcgag atcgcttcca | |
19381 ccttgaccga agaaaatctc aaagcaacct acgggatgga tttgagcgtg cgcgaagtgg | |
19441 acggtcgtta tagcgccgtc gcgcgccgag tgaactaggg gcaacaccac accgtgatcg | |
19501 atttttggcg tgaagcgtta atcctgtttg gcggcctgtg ggccggaacc atcaacaccg | |
19561 tggtgggttc cggcaccctg gtgactttcc ccatcttggt ggccttaggt tttgcgccgg | |
19621 ttaacgcggt ggtatccaac gcaatgggtc tgattgccgg tggattctcc ggcgcctggg | |
19681 gctaccgtcg ggaagctgcc agcgtcaaaa aaaccttgtt aaaacttgta ccggtctccc | |
19741 tggtcggggg actgatcggt tcactgttac tgttgaacct gcccgaatcg gtgttcggcg | |
19801 tggtggctcc ggtcttgctg gtctgcgcgc tggtgctggt gatcttccaa cccaaactct | |
19861 ccgcatgggc taagacccgg caggcgcagc gcgggggaaa tgatcccgac gatgccgacc | |
19921 gggccaagat ccccactatc ctttacgtgc tggtctttgt tatcggcgtg tacggtggct | |
19981 acttcaccgc cgcccagggt gtcttgctta tggctgtctt cggggtattc ctgcaggctt | |
20041 ccttgcaaca gtccaatgcg atcaaggtca ttctttcgct gatggtcaac atcgtggcag | |
20101 ccgccatgta cctgctgatc gccccggaac gcattcactg gattgtggtg ctgctcatcg | |
20161 ccgtgggttc gttgatcggt ggatttattg gtgccaaggt agggcgcaaa ctttctcccg | |
20221 gctggcttcg agtcatcatc gttattcttg gcggtatcgc gctagtgaat atggtgtaca | |
20281 agttggtcgc tggtgcctga gatcgttaat cccgaacgca ttttgcatat tgcagacctg | |
20341 caagatgcgc gcctcgacga gtacctacga ctctccgaag cgcacctaag gatgcgcagt | |
20401 gacgtggaaa acggtctgta tattgccgag agcaccacgg tggtttcccg cgcaatcaat | |
20461 gccgggcacg ttccacgcag cttcttgcta gcggaaaagc atctggatca gctggcgcaa | |
20521 gaatttgcgc gtttcccgga cgtcccaatt tttgtcggta gtgatgagca acttcaagac | |
20581 ctggtaggtt tccacctgca ccgcggggcg atggcctcga tgaaccgtcc cgaaccgctg | |
20641 aatttgagtg aagtgcttga gcggagctcg cggatcgcta tcctcgaaga catcgccgat | |
20701 catacaaact taggcgcgat tatgcgttcg gcctcaggat tgggcgtgga cgcggtactg | |
20761 attaccccca agtgtgtgga cccctggtat cgccgaagcg cacgcgtctc aatgggcacc | |
20821 gtctttgacc ttccctgggt caggctcacc tcatggcccc aggacatcaa cattcttaag | |
20881 gctcatggct acacgatgct ggccatggag ctcaccgagg acgcagtgtc cttggccgag | |
20941 gttgaaatga ctgagggtaa aaagttcgcg atgatcctgg gcaacgaagg caggggagtg | |
21001 accgaagaaa ccctgagcct ggtggaccag gcggtgatga tcccgatgca ccgcgaggtg | |
21061 tcctcactca atgttggggc ggctagcgcc atcgccttct gggaactgtg ctcttcgaca | |
21121 cctaaatgag tttcacgcag catgcttgca tgagatagga tggaatgtct gtgtgtcggc | |
21181 cttagggtcg aaggcgcagt aaaatttccg agcaagtggt tgctggcaaa atccagtggc | |
21241 ctatcaacat aaaggtgtat agctatgaag gctgatattc atccaaagta cggtccagtt | |
21301 gtcttcaacg acctggcatc cggcgagcag ttcctgaccc gttcgacccg ttcgtcggac | |
21361 aagaccgttg agtgggcaga tggcaacacc tacccagtga tcgacgtcga aatctcggct | |
21421 gcatcgcacc cgttctacac cggtaagcag cgcatcatgg acaccgctgg ccgtgtcgag | |
21481 cgcttcaacg cccgcttcaa gggcttcggc ggcaagaagt aattcttcgc ccctcgcaag | |
21541 ctttttacgg cacgattcca gttcaactgg aatcgtgccg tttgcgttta agcacaggtg | |
21601 acaagacgat agaatcgact tatgatgcat catggcgaat acaaggtggt cggcggcaaa | |
21661 ttagtcgtcg ttgatctcga tagtgacaac ggggtgatcg ttaacgcttc acttaacggc | |
21721 gactttttcc tcgaaccgga tgaggcactc gaagacctca acgcggcatt gaacggtctg | |
21781 cctaccggcg ctagccatgg caccatccgc gacgcggtca acaacaattt gcgcgaaggc | |
21841 gcggtgatgt tcggttttga tgccgacgca gtggcgcgcg cggtccgccg aagcctgggt | |
21901 cacgccacca aatgggaaga tcaccagtgg gaaattctcg gcccagaaat cattcccgta | |
21961 gccgaacagg tagccctcga cgaggtgctc acccggcaaa tcggaaccgg tgagcgaaag | |
22021 cctacgatcc gtttttggga ctgggacgaa tccgcggtcg ttatcggctc cttccaatcc | |
22081 ttaaaaaacg aagtggacat ggaacaagcc acacaccacg gcattaaagt ggtgcgccgc | |
22141 atttcaggtg gcggggcaat gttcatggaa gccggaaact gcattaccta ttccctgtac | |
22201 gccccagatt ccttggtgga cggaatgagc tttgccgatt cctacccatt ccttgacgcg | |
22261 tgggtcatgc aggcgctgaa atcactgggc attaatgcct attacaagcc actgaacgat | |
22321 atcgccacgc cgagtggaaa gatcggggga gcggcgcaga aacgtctggc taagggcgcc | |
22381 ctgttgcacc acgtcaccat gagctacgac atcgatgcac agaagatggt gcaggtgttg | |
22441 cgtattgggc gcgagaaaat ctcggataaa ggcattacct cggccgttaa gcgagtggat | |
22501 ccgctgaaat cacagaccag cgaagatcga gcgcaaatca tttccaccat gatggatacc | |
22561 tttgcagctc gtaccaacgc caccgttgtt gagttagatg acataacgcg aaaagccgcc | |
22621 caagacctgg ctcaaactaa gtttgatacc gaggcctgga cggctcgcgt tccgtaaact | |
22681 actggctagc gcggctgtgc tgctgcgcgt tgaggcttcg ttcaagctct gcgcgctgtt | |
22741 cgatgagaat gcgtagcagt gctgccggag ccccctggtg atgttccagc cagacgtttc | |
22801 cggcctgcaa ggttggattt tcttccggtt cgccggtgag atcctgcgaa cccgggtaaa | |
22861 ggccctcgat gacgcgagtg gcaaattcca tgctcatcgt ttcaaagacc ggcaggattg | |
22921 cagcccagta acgcgactgg aaaccagcta gcaggctagc cgagcccatc gcaaaaccgt | |
22981 cggcgatagc ggaaagtgca tcgtttgata atggaccgtg ttcatcgtgg cccatcaaca | |
23041 cggtatcaaa agcagcttct ttcacgtccg tatccggacg ggcagccaac gcggtgcgga | |
23101 ccgcgttttg tgccacgctc gtaggattgc gcttcgcagc ctgatgcatc cgcgcttcgg | |
23161 cctgcgcgtc caagccgccc gcgaccgcca aagcaatgta gcttgcccag cgaagttgtt | |
23221 cgtcaactgt gacccggtaa ggattctctt cctcggcaag gaaggaatca atcacctcgc | |
23281 gcgccacacc ggagcgcgcc aagcgagcta gcgtgcgcgc ggtagtggtc tgctggtcgc | |
23341 taccagcttc gaaattcgcc agccagccgg tgagaacttc ggcagcacgt tcgcggatcg | |
23401 agactcgcag ttccggggca acatatttcg agattgaagt gaccagctga tcaagcagca | |
23461 tcgcaaagac accggaatcg gtcaccgtgt gcgcatgttc caaaatggcg ttgacatagg | |
23521 tctgagaagc tagctttgac tgacgtacgc cgtcccataa ggaggcccaa ctggtggcgc | |
23581 gtggcaaaga ttcctgcaac gatccaagat ttcccagcaa ggttttcagt gaattttcat | |
23641 caaactcaat gagcgcgtag gtttcatcgc ccacgttggg caagatcaga tcgggtagcg | |
23701 gctgaccgac gaggaaatct agtgcgacgc tatctccgga aagttcaaca cgctgtgttg | |
23761 cggtgcgcgt gagcacgcca tcggtcagcg tgtaggcgcc gacggtgagc acatggggtc | |
23821 gcacaattgc ttggccacta atcggatcta tgccgtgctg ttcaagattc gcagcggtca | |
23881 ggatcccggc gtcatccacg gtgtagttca ccgcgagttt gggcacgcca ctagtcttca | |
23941 gccaggcatc ggcccagctg cgcatatcgc gtccgctggc tttttctagt gcctgcagga | |
24001 agtcttccaa ggaggtgttg gcgtattcgt gttgacggaa gtacgcacga gccgcgtcgc | |
24061 ggaaggcttc tgccccgaca aaggcggcca actgcttgag cacgctagcg cccttggcgt | |
24121 aggtgatgcc atcgaagttc tggtctgcag ccagcagatc tggaatatcg gccacgatcg | |
24181 ggtgggtggt tggcatctga tctgccacgt aggcccacgc cttacgacgc gcggcaaagg | |
24241 tggtccatgc ggtggtgaat tctgtggctt catcgttagc aagcgttccg atatagtccg | |
24301 caaaggattc cttcaaccac agatcgtccc accaggccat ggtcaccagg tcgccaaacc | |
24361 acatgtgcgc catttcgtgc atgagcgtat tagcacgctg ctcatactgg gcttcggtgg | |
24421 cctgggaggt aaatacataa cgttcggtga aggtgacgag gccaggattt tccatggcac | |
24481 cgaggttata ttccggaaca aacgccgagt cgtatttgcc ccatgggtag gggtagtcaa | |
24541 agagctcgtg gaaatagtcc aggccttggc tggtgagctt gagaatttct tcgccgtcaa | |
24601 agtgttcggc caacgaggcg cggcaggtgg ctgccatttc aatgtctagc gattcgccat | |
24661 ctgcaagctt ttgcacgtgg gtaccgcgca ccacatggta tgggccggca aggaccgcgg | |
24721 tgatataggt ggagatcggg ccggttggtg cgcaggcgac ggttttggtg ccgtcaccat | |
24781 gattcatctc gtcgatgatc tgctggttgc tggccagatg ccagtcttcc gggccagtca | |
24841 aggtgaattg gtagctggtt ttgagatccg gctgttcaaa gcaggcaaaa acacggcgtg | |
24901 cttccgaggg ctcaaactgt gtgtagaggt aggtctggcc gtcttgtggg tccacgaagc | |
24961 ggtgcagtcc ctcgccggaa cgtgagtagc tggagcgtcc ggtaatgcgc acggtgtttg | |
25021 ccgcgtccgt gcgcaaacca tcgaggtaga tgcgggcgtc gagtaccgcg tccgcgacgg | |
25081 agatttcggc tccattaacc acgatgcttt caatcgactc atgaatgtag tcaatgaagg | |
25141 tttgcggtga ctttgaagag aaattcagtg ttgtgatcgc ggtgtaggaa gtttcctgcg | |
25201 cttgggtggc gttgctcaga tcaagctcta cggctgcata gtgccagctg atgttcgcgg | |
25261 cacgccaagc ggcctcatcg cgtcgaaggt tctcattggg tgcatagcgt tctaatgtgt | |
25321 ccacccttac agcttagctg tgaaatgaat gtttgataat gctgagctag acgaaaatta | |
25381 atttacccgg ccgcgcatta cggcgagtag ctggcggatt ccttggaaat gatctgcgag | |
25441 taacaggcgc gcggcatcga tgtctttggc gcgcaccgca tcaaaaattg cgcggtgtgc | |
25501 cgccgcggtt tcaaccagtg ctttaatgca ttattcaggc ttgcgaaaag cctggcgata | |
25561 ctccatcggg gagacacctt tgagagcacg gaatcgttgg cggaaagtca caggcgttcc | |
25621 aaaacccaca gccgccgaga cctcagcaat ggatccgtga ctttcctcaa ggagcttgca | |
25681 cgcttcatca atacgccagc tcatcgccca ttggtgtggt gtactgcccg tttcggccag | |
25741 gaagcggcgg agaaaggttc gctccgacat acacgcctca ccggcaaaat cgctaagcgt | |
25801 aagagttctt gtcgggtctt tcatcattag agtgcgaact gtcgtcatcg cttgaccatc | |
25861 accgtgcttc accgcaaccg gtgtcgtgag aaattgtgcc tgaccacccg tacgatgtgg | |
25921 ggccatcacc atggagcgag cgatagtaga ggcaaccgac gatccgcaga actgacctat | |
25981 caggtgaatg cttaaatcga ttccggccgc cacaccagcg gaagtccaga ctctgctttc | |
26041 cccaacaaat aacactgcgg ggtcgacatt gatttctagg aagcgactcg ctagctcatc | |
26101 ggttaaggcc caatgagtgg tagcggtaag accatccaat aatccggtct gggccaatac | |
26161 aaaagcgccc gaacaaagtg aggccaccac tgctccgcgt tgatgagctt cacgtatcgt | |
26221 ttccagatac tgattgggtg gtgtggctgt gaagtctcca agcccgggga tcaagaccag | |
26281 atctgcattt tgggcccatt ccagagtctc atcagccata gcctgcgacg agtcggtcag | |
26341 ttctaccatc cctttgttta tcgcacaccg gcggagatcg acgttcaagt caggcgacga | |
26401 taaacgcttt gccgcccagg tctcggtcac aattgagaca tcgaagagtc gagttcgggg | |
26461 tctgaggaag atcggtacgg aaattcacgc taacgacatc ccggtgtcga tcctggcgtg | |
26521 gatagggctc gcgaaaaagc gaaatgcccg acgcaaagct ttcgcagtgt ggggcaacgg | |
26581 atgagagccg cacgtcatct ttcggtggtg gcaggaagag gtcacggagt gattgtgccg | |
26641 gttttcttgc gttggtcgcg ttcaacggcc cggtagatgg tggatcggct gatggagaat | |
26701 agttctgcca tttcggtcat ggtgtgtttg ccggcatcgt gcagttcgag gaggtgtgtt | |
26761 tcttgtttca cggtgagttt tggctgtttt ccccggagtc ggccgttggc cttggcaacc | |
26821 ttcattcctt cgcgggtgcg catgctgatg aggtcggctt cgaactcagc gatcatcgcc | |
26881 aggacgttga acagcagttt gcccattggg tcggtggggt cgtggacgga accaccgatg | |
26941 ctgagtctga tttcgcgtct ggcgaggtcg tcggctatct cgtgggcgtc tcggacggac | |
27001 cgggccaggc ggtcgagttt ggtaacgacg aaggtatctc cggcccggca ggcggcgagg | |
27061 gcttcgtgaa gtcctgcgcg attcttgttc ctgccggtaa agccatgatc aacatagacg | |
27121 cgttcgggtt caacgccgag ggatgccagg gcatcacgct gggcggtgag gtcttgctcc | |
27181 tccgtggaca cgcgtgcgta accgaccatg atcttagaca tgtagatcag tgtgtcacat | |
27241 agggatcctt caccggacag ttcaccgtac accctatacg gacacttcat aggtcaccat | |
27301 tagcaaagca gcaggtcagc ggttggcgtg tccggtggag gaccgtctta cgggacactt | |
27361 ccatcgaagg tcacttgagc ctcttcaaca actcaaaagt attggaaaat tttctgtagc | |
27421 ccattgatct tttcggtgct agattcgaat catgttccat tcataaagtt ttctcgcaac | |
27481 tatggctctg atttttcaa | |
// | |
LOCUS BW77_ACAGTG.R1_(paired)_contig_49 2639 bp DNA linear UNK | |
DEFINITION Contig BW77_ACAGTG.R1_(paired)_contig_49 from Arthrobacter sp. | |
BW77 | |
ACCESSION unknown | |
FEATURES Location/Qualifiers | |
source 1..2639 | |
/mol_type="genomic DNA" | |
/db_xref="taxon: 6666666" | |
/genome_md5="" | |
/project="bewolfe_6666666" | |
/genome_id="6666666.134544" | |
/organism="Arthrobacter sp. BW77" | |
CDS complement(79..858) | |
/db_xref="SEED:fig|6666666.134544.peg.2808" | |
/translation="MKVFRMGVAARGLPQRLLSDNGDALNPIRRGVISELVAYANSLG | |
VATMTGKPYKPTTQGKNERFHSTLFKWLKKQPFAKDLAELQGQVEVFDQAYNTQRGHQ | |
SLEDRMTPQEAWDATPVAEPLAPGEWVKLSTKPAPGVGEAVLAVQPGEEQSPTPQDGS | |
TPEPAKLSATLRTEHMEARGSQLMRVNKNRCLRVAGVELYLGKLLRSTMVKVLWDQAD | |
LMVISMDGELITKYDYPFPDGITYLSLKHATAKFQNQPEMG" | |
/product="Mobile element protein" | |
CDS 911..1066 | |
/db_xref="SEED:fig|6666666.134544.peg.2809" | |
/translation="MEAQNPTGTGTPPVSGGVLEFSHDKERHIADASAGHHTPKYCPF | |
PLELTND" | |
/product="hypothetical protein" | |
CDS complement(1078..2514) | |
/db_xref="SEED:fig|6666666.134544.peg.2810" | |
/translation="MNNNTGLYPCVPTMTTNQALVSHAGLTTLSDLLNTLGFRKLCEN | |
RLSQFVPASAVHRPGKMIADLSLMLAAGGEQVSDTDQLRTAQGLFGPVASDPTFSRFF | |
SRISNHPGAFEYAFATMHRQVRAKLWAAAGKRNPAIRASRTNPLTIDIDASLVNVHSD | |
KEGAKGNYKGGYGYSPMIAMADYGKTNGTGEVLAVRLRPGNKAANSAKDHISILSEAL | |
EQLPDEFYDEQTTLIGEKIMVRTDSAGATREFLKHVDSLGLQFSTSYTLPVVKERFVR | |
WIDQKKYWEPALTADGEHRDNAWVIDASKVIELNDYPPGTRIYLRAEPLHPGAKASLF | |
DTDGNRVTAFLTNSPRYDPAFLDARHRARGRCENRIKSLKAAGLGKLPFTSFAANQAW | |
ANLAMFALNLTSWLQLVVLPAGHQAGSWDLKRWRYRVWSMAGKLTKSGRQPRLLINDQ | |
TPEARLVTLLKGQINGLRQRWAVGSLRT" | |
/product="Mobile element protein" | |
BASE COUNT 540 a 776 c 709 g 612 t 2 others | |
ORIGIN | |
1 tgtgatgtct caagacaccg gtaacagttc tgtaccagca catcggtgac actcggtgtc | |
61 tcaagacatc ggtaacactt accccatttc cggttggttc tggaacttcg ccgtggcatg | |
121 cttcaagctc agatacgtga tgccgtctgg gaatggataa tcgtatttcg tgattaattc | |
181 accgtccatt gagatcacca tcaaatccgc ctgatcccag aggaccttca ccatggtgct | |
241 gcggagcagt ttgcccaaat agagttccac gccagcaacc cgcaggcacc tgttcttatt | |
301 gacccgcatc agctgactgc ccctcgcctc catgtgctcg gtccgcagcg tggcactgag | |
361 cttcgccggc tccggagttg aaccatcctg cggcgttggc gattgctctt cacccggctg | |
421 tacggccagg acagcctcgc cgacgcccgg agcgggcttg gtgctgagct tcacccattc | |
481 cccaggcgcg agaggctcag caaccggcgt ggcatcccac gcttcctgcg gtgtcatccg | |
541 atcctccaag gactgatgac cacgctgcgt gttgtaggcc tggtcaaaga cctcaacctg | |
601 cccttgcaat tcggctaggt ccttggcgaa aggctgcttc ttcaaccact tgaacaacgt | |
661 cgaatgaaac cgctcgttct tcccctgagt cgtgggctta tacggcttgc cggtcatcgt | |
721 ggcaactccc agactgttgg cgtacgcgac caattcgctg atgacgcccc gacggatggg | |
781 attcaaggca tcgccattgt cactgagcaa gcgctgtggc agcccgcggg cggcgacacc | |
841 catgcggaag actttcaccg catccggacc gttctccgtc cttgcaacta annactaacc | |
901 cagatctttc atggaagcgc agaaccccac cggaaccggc accccgccag tatccggtgg | |
961 ggttcttgaa ttctcacacg acaaagagcg ccatatcgct gacgccagcg ccggccacca | |
1021 cacaccgaaa tactgcccct tcccacttga actcactaat gactagtact tgaacactca | |
1081 ggttcgcagc gaaccgactg cccaacgctg acgcaatccg ttgatttgtc ccttgagtaa | |
1141 ggtgactaag cgagcttccg gcgtttgatc attgatcagc aaccggggtt ggcgaccgct | |
1201 cttagtcagc ttcccggcca tagaccacac ccggtaccgc caccgtttca aatcccagct | |
1261 cccggcctga tgccccgcag gtagtaccac caactgcagc cacgacgtca gattcaacgc | |
1321 aaacatggcc aagttagccc acgcttgatt cgccgcgaac gaagtgaatg gcagtttgcc | |
1381 cagccctgcg gctttcagcg acttgatcct gttttcgcaa cgcccacggg cgcggtgacg | |
1441 ggcatccaag aaagcgggat cgtagcgtgg agagttcgtc agaaacgcgg tcactcgatt | |
1501 cccatcagtg tcgaacaggc ttgctttcgc ccccggatgc aacggctcag cacgaagata | |
1561 aattctggtt cctggcgggt aatcgtttag ttcaatgacc ttggaagcat caatcaccca | |
1621 cgcgttatca cggtgttcac cgtccgcggt gagcgctggc tcccaatact ttttctgatc | |
1681 gatccaccgc acgaagcgtt ccttgaccac gggcaacgta tatgaggtgg aaaattgcag | |
1741 acccaacgaa tcaacatgct tcaagaattc tcgggtggcg ccagcgctat cggtgcggac | |
1801 catgatcttc tcaccgatca acgttgtctg ttcgtcatag aactcgtctg gtagttgttc | |
1861 cagtgcttcg ctcaggatgc tgatatggtc cttcgctgag ttcgctgcct tatttcctgg | |
1921 gcgcaagcgt acggcgagga cttcgccggt gccgttggtt tttccgtagt cggccatggc | |
1981 gatcatcggt gaatagccgt acccgccttt atagttgcct ttggcacctt ctttgtctga | |
2041 atgaacgttg actagggacg cgtcgatatc gatggtcaga ggattggttc gggatgcccg | |
2101 tattgcgggg ttgcgtttgc ctgctgctgc ccatagtttg gcccgcactt gccggtgcat | |
2161 ggtcgcgaat gcgtattcaa aagccccggg atgattactg attctgctga agaaccggct | |
2221 gaacgtcggg tcagaggcaa ccggaccgaa gaggccttga gcggttcgca gctggtcggt | |
2281 atcgctgact tgctcgccac cggcggcgag catcagggac aaatctgcga tcatcttccc | |
2341 gggccggtga acggccgaag caggaacgaa ttgcgagagc ctgttttcgc agagcttgcg | |
2401 gaaacccagc gtgttgagca ggtcgctcaa ggtggtaagt cccgcgtggg agaccagggc | |
2461 ttggttcgtt gtcatggttg gtacgcaggg gtaaaggccg gtattgttgt tcactgagag | |
2521 agtgatcctt tgaactgttg agaatatggc ttagacacct ttattttccc agttcaggat | |
2581 cgctttttcc tcgttaatga cgcttaatta ctggccccgt catgaaatac ctgggctaa | |
// | |
LOCUS BW77_ACAGTG.R1_(paired)_contig_86 1277 bp DNA linear UNK | |
DEFINITION Contig BW77_ACAGTG.R1_(paired)_contig_86 from Arthrobacter sp. | |
BW77 | |
ACCESSION unknown | |
FEATURES Location/Qualifiers | |
source 1..1277 | |
/mol_type="genomic DNA" | |
/db_xref="taxon: 6666666" | |
/genome_md5="" | |
/project="bewolfe_6666666" | |
/genome_id="6666666.134544" | |
/organism="Arthrobacter sp. BW77" | |
CDS 69..386 | |
/db_xref="SEED:fig|6666666.134544.peg.3588" | |
/translation="MKKQRRSFTEEYRREAAGLVIDTGRTISAVAKELNLGEQTLGTW | |
VKKERSRRGLDGEPTGALDESEREELKRLRKEVFELREDNRFLGKAASFFASKQHRSN | |
GSN" | |
/product="Mobile element protein" | |
BASE COUNT 275 a 373 c 409 g 220 t | |
ORIGIN | |
1 attagtggac agccgaacaa gcgggatcag ccgatcccgc atttgagagg atgtcattaa | |
61 taagcaatat gaaaaagcaa cgcaggtcct tcaccgagga ataccgcagg gaagcagccg | |
121 gccttgtcat cgataccgga cgcaccatca gcgcggtcgc caaggaactg aacctcggcg | |
181 agcaaacact gggcacctgg gtgaagaaag aacgatcccg ccgaggcctg gacggcgagc | |
241 cgaccggcgc gctggacgag tccgaacgcg aagaactcaa acgcttgcgc aaggaagtct | |
301 tcgaactgcg ggaggacaac cgtttcctgg gaaaagcagc gtccttcttc gcgtcgaagc | |
361 aacatcggtc gaacggttcg aactgatgca cgcgttgaag gatgagttcg ccttgacccg | |
421 catggcgtca ttgcttcacg tttcgaaatc aggctattac gcctggaggc aacgccaaac | |
481 cgctggcccg tccccgaggg ctgccgcgca gcgggcacgg gatgtgaagg tcgccaaggt | |
541 cttcaacgat tcccatcaga cctacggggc tccgcgggcg gccgcccagc tggcccgcgt | |
601 gggatccccg gccgatccca agaccgtcgc tgcttcaatg ctgtgccagg gcatcgaagg | |
661 gatcagccca cggaagttca ctccggtgac cacgatccaa ggcgttgaca cttaccacct | |
721 gccggatcgg gtgcgccggc aatgggacca gggcaccttg gacaaggtct ggatcagcga | |
781 cattacgtat ctgcgcacca acgagggctg gctgtacttg tgcgcagtgc gtgatggctg | |
841 ctcccgcagg gtgctgggat gggcgctgga tagcgtgcag aacaccgatc tggtggaaag | |
901 ggccctgcgc atggccagga ccttgcgcgg ccaaattcca ggtcaggtgg tgttccacgc | |
961 ggaccgcggc tcgcaattca cctcagccca gttgcatgag gtggccgttg agctggattt | |
1021 gctgcagtcc gtgggccgca cgggcgtgtg ctgggacaac gccctgagcg agtcattctg | |
1081 gtcgacgctg aagaccgaat tctatgaccg ctaccggtgg gcaaccaggg cggacgccaa | |
1141 gcagaaagcg gcttggtgga ttgaggattt ctatcaccgc cgccgactgc attcaagcct | |
1201 ggggatgctc cctccggtgg agtttgagca gaagcttcgc ggccagcagg aacgcgttga | |
1261 acagcatagg accgtgc | |
// | |
LOCUS BW77_ACAGTG.R1_(paired)_contig_96 2666 bp DNA linear UNK | |
DEFINITION Contig BW77_ACAGTG.R1_(paired)_contig_96 from Arthrobacter sp. | |
BW77 | |
ACCESSION unknown | |
FEATURES Location/Qualifiers | |
source 1..2666 | |
/mol_type="genomic DNA" | |
/db_xref="taxon: 6666666" | |
/genome_md5="" | |
/project="bewolfe_6666666" | |
/genome_id="6666666.134544" | |
/organism="Arthrobacter sp. BW77" | |
CDS complement(157..927) | |
/db_xref="SEED:fig|6666666.134544.peg.3693" | |
/translation="MNIFTKQDYEAFRTLRITHMAQAFEALLAQETNELVEPENLFRQ | |
AATDALDLRRSNKIERLIKQAGFAFADATIEQLDYRTEREAINPIRIKRYAKNDWGRD | |
PVNLVITGASGSGKTYLACALGIAACHQEHTVKYWRTDQLALELLLVQDDLIAQKQLL | |
NSLSDVDLLILDDFMAVGIDPRAVAGMFHLLANRDRRLPTMILAQTGPDYWIEAIHDR | |
VTADSIVNRLANNSRRINLGSVDMRREMSLKERQGEDF" | |
/product="insertion element conserved hypothetical | |
protein" | |
CDS complement(927..2513) | |
/db_xref="SEED:fig|6666666.134544.peg.3694" | |
/translation="MADYRAIMQLLLHGHSYEQVTAAQQCSKRAVASARKAMNDHGIN | |
SIQALDALGSDALAVLFPDGRSRRSLEYAQPDYKAILERLKRDRNYTLQRAWDTYLSS | |
TITAEAKKYGYAKFCARFSDFVNTNDLSATIHHEPGKAMQVDWAGQTLRVTDILTGEQ | |
VKAYLFVAVLPYSGLVFVKASLSMNLDAWISLHVDALEHANGVPKILIPDNARTATYR | |
PTRGDKQRLITAGYAAFATHYGCAIVPARVKAPKDKAATERAVQTVNKRVIGYLQDEV | |
FSTLDELNEAIADLLEGINELKNPQGLSKRQIFDTEEAAHLGALPEHRYGQVSWKQVK | |
VGRNYHVSVDYQHYSAPYRLAGKTLKARVTDLKVALFDGEQLICEHLRKSGRKGQYST | |
LTEHTPPAHQNIMNLWSRNWFLDRARAYGPATVQVITQVLDRRVIEAQGYLDCQNILD | |
ALGKKSKTRLEAACRQLLNTHEVPTYSALKRIMAALKSDTDIPAPSRPAASMLKALNE | |
RSSPTGETYVRDSAYYQEWN" | |
/product="Mobile element protein" | |
BASE COUNT 555 a 768 c 723 g 620 t | |
ORIGIN | |
1 tgttaaatcc ccgtatcggg aactactagt ccacgtaacc ggtaccacga ttccccaaac | |
61 cgggtactgg ccctcgccaa caaaactccg tcagctggac cagcaccccg ttcaggaacg | |
121 caacggtatc gttgaaaccg aggctgctag caacagttag aagtcctcac cctggcgttc | |
181 cttcaaactc atttcacggc gcatgtcaac ggatccaagg ttgatgcgtc gagagttatt | |
241 cgccaaccga ttcacgatcg agtcggccgt gactcgatcg tgaatcgcct caatccaata | |
301 atccgggcca gtctgcgcca gaatcatcgt cggcaaccgc cgatcacgat tcgccagcaa | |
361 atgaaacatc cccgcgaccg cacgaggatc aatccccacg gccataaagt catccaggat | |
421 gagaagatct acgtcagaaa gcgaattaag cagttgcttc tgcgcgatga ggtcatcctg | |
481 aaccaagagc aactccaacg ccaactggtc agtacgccaa tacttcaccg tatgttcctg | |
541 atgacaggca gcgatgccca acgcgcacgc caaataggtt ttgccggatc cggaagcgcc | |
601 agtgatcact aggttcacgg ggtcgcgtcc ccaatcattt ttggcgtaac gcttgatcct | |
661 gatcgggttg atcgcctccc gctcggtacg gtagtccagc tgctcaatgg tcgcgtcagc | |
721 aaacgcgaag ccagcctgct tgatcagccg ttcaatcttg ttcgagcggc gcaggtccaa | |
781 cgcatcagtc gctgcctgcc ggaacaggtt ttcaggttcc accagttcgt tggtttcttg | |
841 cgcgagtagc gcctcaaatg cctgagccat atgcgtgatg cgcaaggtgc ggaacgcttc | |
901 gtagtcctgc ttggtgaaga tgttcatcag ttccactcct ggtagtaagc gctatcgcgc | |
961 acgtaagttt cacctgttgg ggaggaccgc tcattgaggg ctttgagcat gctcgctgcc | |
1021 ggacggctcg gtgctgggat gtccgtatcg cttttaagtg cggccatgat ccgtttaaga | |
1081 gccgaatacg ttggcacctc gtgcgtgttc aacagctgtc ggcatgcagc ctccaatcgg | |
1141 gtcttacttt tcttccccaa cgcatccagg atgttctggc agtcaagata gccttgggcc | |
1201 tcgatcaccc gccgatccag gacctgggtg atgacctgca ctgttgccgg accataggcc | |
1261 cgtgcccggt ccagaaacca gtttctggac catagattca tgatgttctg atgcgccggc | |
1321 ggtgtatgct ccgtcagcgt tgaatactgg cctttacgcc ccgacttccg caaatgctca | |
1381 caaatcaact gctccccgtc aaagagcgca actttcaggt cagtgaccct ggccttcaat | |
1441 gtttttccgg ccagccggta cggtgccgag taatgctgat agtcgacgct gacgtgataa | |
1501 ttccgtccga ccttcacctg cttccagctc acctgcccat agcggtgctc cggcaaagca | |
1561 cccaaatgcg cggcttcctc agtgtcgaag atttgccgct tgctcaaccc ttgaggattc | |
1621 ttcagctcgt tgatgccctc caacaggtca gcgatagctt cgttcagctc atcaagggtg | |
1681 gagaacactt catcttgcag gtacccgatg acgcgtttgt tcaccgtctg cacggcccgc | |
1741 tcggtggcag ccttgtcttt cggcgccttc actctggccg gcacgatggc gcatccgtaa | |
1801 tgcgtagcaa aagcggcata cccagcggtg atcaaccgtt gtttatcccc acgggtgggc | |
1861 cggtaggtcg cggtccgtgc attgtctgga atcaggattt tcggaacccc atttgcatgc | |
1921 tcgagcgcat caacatgcaa actaatccac gcatccaagt tcatgctcaa cgatgctttg | |
1981 acgaacacga gcccggaata cggcaggacc gcgacgaaca aataggcttt gacctgttca | |
2041 ccggtaagga tgtcagtcac tcgtagggtt tgcccggccc agtccacctg catcgccttg | |
2101 cctggttcgt gatgaatggt ggccgaaagg tcgttggtat tcacgaagtc ggagaaacgg | |
2161 gcgcagaact tcgcgtaccc gtatttcttg gcctccgcag tgatagtgga acttagatag | |
2221 gtgtcccatg cgcgttgaag cgtgtagttc cggtcgcgtt tgagccgttc aaggatcgct | |
2281 ttgtagtccg gttgagcata ttccagactg cgccgactcc gcccgtccgg gaagagcacg | |
2341 gccagtgcgt ccgagcccaa tgcgtccaac gcttggattg agttgatgcc gtggtcgttc | |
2401 atggccttgc gcgctgaggc gactgctcgt ttcgagcatt gctgggctgc ggtgacctgt | |
2461 tcatagctgt gtccgtggag cagcagctgc atgatggctc ggtaatctgc catcgtgtcc | |
2521 tcctgatgag ttcaattgcg tggcacggga gtgtgccgac gctattgatc agaggatcat | |
2581 ggacaggtta gttgcgatag tacccggtag ggagaatcgg agtaccgggt acgtggactg | |
2641 gcagtttcaa atacggggat ttaaca | |
// | |
LOCUS BW77_ACAGTG.R1_(paired)_contig_94 371 bp DNA linear UNK | |
DEFINITION Contig BW77_ACAGTG.R1_(paired)_contig_94 from Arthrobacter sp. | |
BW77 | |
ACCESSION unknown | |
FEATURES Location/Qualifiers | |
source 1..371 | |
/mol_type="genomic DNA" | |
/db_xref="taxon: 6666666" | |
/genome_md5="" | |
/project="bewolfe_6666666" | |
/genome_id="6666666.134544" | |
/organism="Arthrobacter sp. BW77" | |
BASE COUNT 78 a 103 c 120 g 70 t | |
ORIGIN | |
1 gagaccagtc agaaactcgc caaacgcgaa ccgaaagacc agacctttga cggggtccgc | |
61 accgagccga cgttgtttca tgccgatggc cggccggtcg aagaacacgc ggctaacttg | |
121 ttgtctgctg ggcagagtgt cgccgaaacg aacaagcagg tcaaagagct gatcactacc | |
181 gctagcacca ctgcgggtac tgcgacgtct tcgtcgttgc ggagggggtt cttcccgttg | |
241 ccgattaaga acgagttcac ccgcgagttt ttactgcggg tgaccacggt ggagggtgag | |
301 tattttgatt cgttggcggc gcatgcagct aacggacgca cccgcgcggg ggcgcaggct | |
361 cgggtcaacc g | |
// | |
LOCUS BW77_ACAGTG.R1_(paired)_contig_73 3382 bp DNA linear UNK | |
DEFINITION Contig BW77_ACAGTG.R1_(paired)_contig_73 from Arthrobacter sp. | |
BW77 | |
ACCESSION unknown | |
FEATURES Location/Qualifiers | |
source 1..3382 | |
/mol_type="genomic DNA" | |
/db_xref="taxon: 6666666" | |
/genome_md5="" | |
/project="bewolfe_6666666" | |
/genome_id="6666666.134544" | |
/organism="Arthrobacter sp. BW77" | |
CDS complement(112..1638) | |
/db_xref="SEED:fig|6666666.134544.peg.3473" | |
/translation="MPTLENLTPQKKRGRPRSTGNHTCCRCQQLVAKIRVRWTDGSVC | |
GVCFTQATHTYGTCPDCREHRMLPGISSATGEPICRDCAGIATELTCTRCRREAERFR | |
AGLCMQCTLTDDLTAVLKPNEDLRLHRLIKLLTETGRPESIYTYMRPGTKARHLLEKI | |
GNRNLALTHEAFDELPTSTAAEHLRALLIHHRMMPERGNENLARFEQWITARVASLPT | |
DGTSHIVELFARWRHLKRIRDKAADPETNHSTAISAAKQEITEAGKLLLWLKETHDIG | |
AEKLQQKHIDDYLSSGPSTRKHIRNFVRWLNSQPSSRTHELDTPFRKAQANPMITHMQ | |
RTELVRNCLEHQQVARSTRLAGLILLLWAHPLNKIVLLRREHLITAPDGMRLKLGATP | |
AAVPTALTELFWQQLQNPENSNTTNAGTDWLFPGTRAGQHLHPDTLAGRLKVLGIDPQ | |
RARNATLRSLTQEVDGRTLMDLLGYSPGIIAQHASRAAAPMADYIDLKRSAPQIEENP | |
" | |
/product="hypothetical protein" | |
CDS complement(1679..2020) | |
/db_xref="SEED:fig|6666666.134544.peg.3474" | |
/translation="MSRREITYNWKLREIMARRGVHTAKDLAELLHERGITLTPNAIW | |
RIVTQEPERIAFKVLVALCDALDVTPNDLITYTVTDAKTLRQRSNATGQNLPELRQYR | |
PVRARIVEDDE" | |
/product="hypothetical protein" | |
CDS complement(2017..3126) | |
/db_xref="SEED:fig|6666666.134544.peg.3475" | |
/translation="MGNNENVLFAPFGGNDPDPDAFLSMVLDGWAQQQRAKDFALATI | |
RTRRNVVMSMVDFAGSYPWEWSLGDADDFFSHARAVRNLSHGTVRAYQGHIKLFCEYV | |
CDPHYDWCEQSAKLFGQVFAQVVTELNHITHAQPSEARPAKRPFTQRELQELFDLADV | |
EVERILDSGRKGALAAWRDAIAFKSAYSWGLRANELRHLQVVDYSRNAQAPYLGEQGV | |
LRVRWGKPHRGSAKKPRSVLTIWPWSVEMIQDWIRNGLPRYGHPVNDLFPTTGGSIVG | |
ESHLLGKLHTLIDELGFPPGLDLHSFRRSYATHLITGEGFDVTFVQLQLGHEHAATTS | |
IYTMPSPDYQRLALERAHERTIQAALGLKPSRRNS" | |
/product="Mobile element protein" | |
BASE COUNT 647 a 849 c 1086 g 800 t | |
ORIGIN | |
1 tgatgggaaa gcctgttatc cgtttcctcc ggatccaggt acttttgatg gctccctgat | |
61 gagagcttct gagctgtagg tcagtgatcc gatgcttgaa gaacctcaag actaggggtt | |
121 ctcttcaatc tgaggagcag acctcttcag atcaatatag tcagccatag gtgcggctgc | |
181 tcttgacgca tgctgggcga tgattccagg actatagcca agcaagtcca tgagggtgcg | |
241 tccgtcaact tcctgggtga ggctgcgcag cgtcgcgttg cgtgctcttt gaggatcgat | |
301 gccgaggact ttgagccgtc cggcgagggt gtccgggtgt agatgctggc cagcacgagt | |
361 gccggggaag agccagtcgg tgccagcatt cgtggtgttg ctgttctcag ggttttgtaa | |
421 ttgttgccag aacagctcag tgagggctgt gggtacggcg gccggtgttg ctccgagctt | |
481 gaggcgcatg ccgtccggag cagtgatgag atgttctcgg cgaagcagga cgatcttgtt | |
541 cagcgggtgt gcccatagca aaagaatcaa accagccagg cgcgtagacc gagctacttg | |
601 ctggtgttct aaacagttcc tcacgagttc agtccgctgc atgtgggtaa tcattgggtt | |
661 ggcttgagct tttcggaagg gcgtatcaag ctcatgggtg cggctgcttg gctgactatt | |
721 gagccagcga acgaagtttc ggatgtgttt tcgggtgctg gggccactgc tcaggtagtc | |
781 atcgatgtgc ttctgttgga gcttttctgc gccgatatcg tgcgtctcct tgagccagag | |
841 gagaagtttc cctgcctcgg tgatttcctg tttcgcggcg ctgatggcgg tactgtggtt | |
901 ggtctccggg tctgcggctt tgtcgcggat tcgtttgagg tggcgccacc tggcgaagag | |
961 ttcgactata tggcttgtcc cgtcagtggg cagggaggcg actctggctg tgatccattg | |
1021 ctcgaaacga gcgaggtttt cgtttccgcg ctcgggcatc atgcgatggt gaattagcaa | |
1081 ggctcttagg tgctcagcag ctgttgaggt gggtagctcg tcgaaggcct catgggtgag | |
1141 tgcgaggttt cggtttccaa tcttttctag gagatggcgg gctttggtgc ccggacgcat | |
1201 gtaggtataa atactctcgg gtcgccctgt ctctgtgagc agctttatga ggcggtgaag | |
1261 tcgtagatct tcgttaggtt tgaggacagc agtaaggtcg tcggtgagag tgcattgcat | |
1321 gcataagcct gcgcggaatc gttctgcttc gcgtctgcag cgggtgcagg tcagctctgt | |
1381 ggcaatgccg gcgcaatcgc ggcagatcgg ttcaccggtg gcagaagaga tgccagggag | |
1441 catccggtgc tcgcggcagt ccgggcaggt accgtatgtg tgcgtggctt gagtgaagca | |
1501 tacgccgcag actgacccgt ctgtccagcg gacccgaatc ttggcgacta gctgctgaca | |
1561 acggcaacag gtgtggttgc ccgttgagcg gggacggcct ctcttcttct gtggtgtgag | |
1621 gttctcgagc gtgggcatgc gggctgatcc gttgcctccc gtggccggac ggcccgggtt | |
1681 actcatcgtc ttcaacgatt cgtgcgcgca ctggcctgta ctggcgcagt tcaggaaggt | |
1741 tctgcccagt tgcgttgcta cgctgcctga gagtcttggc atccgtcacg gtgtaggtga | |
1801 tgaggtcatt gggggtgaca tccagtgcgt cgcagagtgc aacgaggact ttgaaagcta | |
1861 ttcgttcggg ctcttgggta acgatgcgcc agatggcgtt gggggtcaag gtaataccgc | |
1921 gttcgtgaag caattcagcg aggtccttag cggtatggac accgcgtcgt gccatgattt | |
1981 cgcgtagctt ccagttgtaa gtgatctcgc ggcggctcat gagttcctcc tcgatggttt | |
2041 cagcccaagg gcggcctgga tagtgcgttc atgggcccgt tcgagcgcaa gacgttggta | |
2101 gtcgggcgaa ggcatcgtat agatcgaagt tgtcgccgcg tgctcatggc ccaactgaag | |
2161 ctgaacgaag gtgacgtcga atccttcacc ggtgatcaga tgggtggcgt aggagcgccg | |
2221 gaaagaatgg agatcaagtc cgggagggaa accgagttcg tcgatgagtg tgtgtagctt | |
2281 accgagcagg tgggactcac cgacaatgga gccccctgtg gtggggaaaa gatcatttac | |
2341 gggatgcccg tagcggggga gaccattgcg gatccaatcc tggatcattt ccactgacca | |
2401 aggccagatg gtcagtactg agcggggttt cttcgccgaa ccgcggtgtg gtttccccca | |
2461 gcgcacgcga agcaccccct gctcgccgag atagggtgcc tgcgcattgc gcgaatagtc | |
2521 cacgacctga aggtggcgca actcgttggc acgcaagccc cagctgtagg cgctcttgaa | |
2581 tgcgatcgcg tcacgccaag cggccaaagc gcctttgcgg ccggagtcca agatccgttc | |
2641 gacttcaacg tcagctaagt cgaagagctc ctgcagctcg cgctgagtga acggccgttt | |
2701 ggcagggcgt gcctcggagg gttgggcgtg ggtgatgtgg ttcagttcgg taactacctg | |
2761 agcgaagact tgcccgaaca gcttcgcgct ctgttcgcac cagtcataat gagggtcgca | |
2821 gacgtactcg cagaagagct taatatgacc ctgataggcg cgaacggtcc catgggagag | |
2881 gtttcggaca gccctggcat gcgagaaaaa gtcgtcagcg tccccgaggc tccattccca | |
2941 cggataacta ccggcgaagt ccaccatact catcaccacg ttccgtcggg tccgaatcgt | |
3001 ggctagcgcg aagtcttttg ctctttgctg ctgggcccag ccatccaaga ccatgctgag | |
3061 gaaagcgtcc gggtcgggat cgttcccacc gaacggagca aataaaacat tttcgttgtt | |
3121 gcccatcgac cgtcctcagc gctcgaaact ggattgcgat tcttgcacat tatttgcgag | |
3181 actcgcaata gctgagtcgg aaaagcacgt caacacatac attgccgctg gatctttagc | |
3241 ggcgttctag actaggaaca tcgccagcct gacggacgtc accactgata aagctcaggt | |
3301 caaaaggtag ttgggggtca atgcggttcg ttacccgaaa tgtcatcatg tgcggcagga | |
3361 gcaaatagag tcttttctac tt | |
// |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import re | |
import os | |
from Bio import SeqIO | |
def fix_genbank(some_genbank):
    """Rewrite a GenBank file so every record carries a ``source`` annotation.

    Each record parsed from *some_genbank* that lacks
    ``annotations['source']`` gets it set to a name derived from the input
    file name (extension dropped, every run of non-word characters replaced
    by ``_``).  Records that already have a source get that value printed.
    All records are then written in GenBank format to ``<derived name>.gb``
    in the same directory as the input.

    The input is read completely and closed *before* the output is opened.
    The output path can be the input file itself (e.g. the input is already
    called ``genome.gb``); opening both at once would truncate the input
    before a single record had been parsed.  It also means a parse failure
    leaves no empty output file behind.

    Args:
        some_genbank: Path of the GenBank file to read.

    Returns:
        None.  The result is the file written next to the input.
    """
    path, org_file = os.path.split(some_genbank)
    org_name = re.sub(r"\W+", "_", os.path.splitext(org_file)[0])
    out_path = os.path.join(path, "{}.gb".format(org_name))

    new_genome = []
    with open(some_genbank, 'r') as infile:
        for record in SeqIO.parse(infile, 'gb'):
            # NOTE: record names are intentionally left untruncated (an
            # earlier workaround cut them to 16 characters).
            try:
                source = record.annotations['source']
            except KeyError:
                record.annotations['source'] = org_name
            else:
                print(source)
            new_genome.append(record)

    with open(out_path, 'w') as outfile:
        # NOTE(review): ``standard`` is not a documented keyword of
        # Bio.SeqIO.write; presumably this relies on a patched Biopython.
        # Confirm, and drop the argument when running against a release.
        SeqIO.write(new_genome, outfile, 'gb', standard=False)
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment