# STOCKHOLM 1.0 #=GF ID 1.10.150.20/FF/000070 #=GF DE DNA polymerase I, putative #=GF AC 1.10.150.20/FF/000070 #=GF TP FunFam #=GF DR CATH: v4.3 #=GF DR DOPS: 92.942 #=GS O18475/1829-1972 AC O18475 #=GS O18475/1829-1972 OS Drosophila melanogaster #=GS O18475/1829-1972 DE DNA polymerase theta #=GS O18475/1829-1972 DR ORG; Eukaryota; Metazoa; Arthropoda; Hexapoda; Insecta; Pterygota; Neoptera; Holometabola; Diptera; Brachycera; Muscomorpha; Ephydroidea; Drosophilidae; Drosophilinae; Drosophilini; Drosophila; Sophophora; melanogaster group; melanogaster subgroup; Drosophila melanogaster; #=GS O18475/1829-1972 DR GO; GO:0003887; GO:0004386; GO:0006281; GO:0006289; GO:0016887; GO:0036297; GO:0051575; GO:0097681; #=GS O18475/1829-1972 DR EC; 2.7.7.7; #=GS A0FLQ6/1453-1585 AC A0FLQ6 #=GS A0FLQ6/1453-1585 OS Caenorhabditis elegans #=GS A0FLQ6/1453-1585 DE DNA polymerase theta #=GS A0FLQ6/1453-1585 DR ORG; Eukaryota; Metazoa; Nematoda; Chromadorea; Rhabditida; Rhabditina; Rhabditomorpha; Rhabditoidea; Rhabditidae; Peloderinae; Caenorhabditis; Caenorhabditis elegans; #=GS A0FLQ6/1453-1585 DR GO; GO:0006287; GO:0071479; #=GS A0FLQ6/1453-1585 DR EC; 2.7.7.7; #=GS Q583X2/726-867 AC Q583X2 #=GS Q583X2/726-867 OS Trypanosoma brucei brucei TREU927 #=GS Q583X2/726-867 DE Mitochondrial DNA polymerase I protein A, putative #=GS Q583X2/726-867 DR ORG; Eukaryota; Kinetoplastida; Trypanosomatidae; Trypanosoma; Trypanozoon; Trypanosoma brucei; Trypanosoma brucei brucei; #=GS Q583X2/726-867 DR GO; GO:0005634; GO:0005654; GO:0005737; #=GS Q86HT8/240-387 AC Q86HT8 #=GS Q86HT8/240-387 OS Dictyostelium discoideum #=GS Q86HT8/240-387 DE Uncharacterized protein #=GS Q86HT8/240-387 DR ORG; Eukaryota; Dictyosteliales; Dictyosteliaceae; Dictyostelium; Dictyostelium discoideum; #=GS Q54S42/1203-1339 AC Q54S42 #=GS Q54S42/1203-1339 OS Dictyostelium discoideum #=GS Q54S42/1203-1339 DE Uncharacterized protein #=GS Q54S42/1203-1339 DR ORG; Eukaryota; Dictyosteliales; Dictyosteliaceae; Dictyostelium; Dictyostelium discoideum; #=GS D6X4C0/1366-1509 AC D6X4C0 #=GS D6X4C0/1366-1509 OS Tribolium castaneum #=GS D6X4C0/1366-1509 DE DNA polymerase theta-like Protein #=GS D6X4C0/1366-1509 DR ORG; Eukaryota; Metazoa; Arthropoda; Hexapoda; Insecta; Pterygota; Neoptera; Holometabola; Coleoptera; Polyphaga; Cucujiformia; Tenebrionoidea; Tenebrionidae; Tribolium; Tribolium castaneum; #=GS Q5TX00/1757-1912 AC Q5TX00 #=GS Q5TX00/1757-1912 OS Anopheles gambiae #=GS Q5TX00/1757-1912 DE AGAP007533-PA #=GS Q5TX00/1757-1912 DR ORG; Eukaryota; Metazoa; Arthropoda; Hexapoda; Insecta; Pterygota; Neoptera; Holometabola; Diptera; Nematocera; Culicomorpha; Culicoidea; Culicidae; Anophelinae; Anopheles; Cellia; Anopheles gambiae; #=GS B8C4R5/262-407 AC B8C4R5 #=GS B8C4R5/262-407 OS Thalassiosira pseudonana #=GS B8C4R5/262-407 DE DNA polymerase #=GS B8C4R5/262-407 DR ORG; Eukaryota; Bacillariophyta; Coscinodiscophyceae; Thalassiosirophycidae; Thalassiosirales; Thalassiosiraceae; Thalassiosira; Thalassiosira pseudonana; #=GS C4LXM4/432-576 AC C4LXM4 #=GS C4LXM4/432-576 OS Entamoeba histolytica #=GS C4LXM4/432-576 DE DNA-directed DNA polymerase, putative #=GS C4LXM4/432-576 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba histolytica; #=GS B0EPC0/426-570 AC B0EPC0 #=GS B0EPC0/426-570 OS Entamoeba dispar SAW760 #=GS B0EPC0/426-570 DE DNA polymerase I, putative #=GS B0EPC0/426-570 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba dispar; #=GS K2HW55/432-576 AC K2HW55 #=GS K2HW55/432-576 OS Entamoeba nuttalli P19 #=GS K2HW55/432-576 DE DNA polymerase I domain containing protein #=GS K2HW55/432-576 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba nuttalli; #=GS Q8IS90/701-842 AC Q8IS90 #=GS Q8IS90/701-842 OS Leishmania major #=GS Q8IS90/701-842 DE DNA polymerase I type A #=GS Q8IS90/701-842 DR ORG; Eukaryota; Kinetoplastida; Trypanosomatidae; Leishmaniinae; Leishmania; Leishmania; Leishmania major species complex; Leishmania major; #=GS F0ZMW2/262-409 AC F0ZMW2 #=GS F0ZMW2/262-409 OS Dictyostelium purpureum #=GS F0ZMW2/262-409 DE Uncharacterized protein #=GS F0ZMW2/262-409 DR ORG; Eukaryota; Dictyosteliales; Dictyosteliaceae; Dictyostelium; Dictyostelium purpureum; #=GS E9B4V0/700-841 AC E9B4V0 #=GS E9B4V0/700-841 OS Leishmania mexicana MHOM/GT/2001/U1103 #=GS E9B4V0/700-841 DE Mitochondrial DNA polymerase I protein A,putative #=GS E9B4V0/700-841 DR ORG; Eukaryota; Kinetoplastida; Trypanosomatidae; Leishmaniinae; Leishmania; Leishmania; Leishmania mexicana species complex; Leishmania mexicana; #=GS A0A182KRG9/1698-1853 AC A0A182KRG9 #=GS A0A182KRG9/1698-1853 OS Anopheles coluzzii #=GS A0A182KRG9/1698-1853 DE Uncharacterized protein #=GS A0A182KRG9/1698-1853 DR ORG; Eukaryota; Metazoa; Arthropoda; Hexapoda; Insecta; Pterygota; Neoptera; Holometabola; Diptera; Nematocera; Culicomorpha; Culicoidea; Culicidae; Anophelinae; Anopheles; Cellia; Anopheles coluzzii; #=GS M7WDJ9/432-576 AC M7WDJ9 #=GS M7WDJ9/432-576 OS Entamoeba histolytica HM-3:IMSS #=GS M7WDJ9/432-576 DE DNA-directed DNA polymerase #=GS M7WDJ9/432-576 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba histolytica; #=GS A0A175JIJ7/432-576 AC A0A175JIJ7 #=GS A0A175JIJ7/432-576 OS Entamoeba histolytica #=GS A0A175JIJ7/432-576 DE DNA-directed DNA polymerase putative #=GS A0A175JIJ7/432-576 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba histolytica; #=GS N9V2T8/432-576 AC N9V2T8 #=GS N9V2T8/432-576 OS Entamoeba histolytica HM-1:IMSS-A #=GS N9V2T8/432-576 DE DNA-directed DNA polymerase, putative #=GS N9V2T8/432-576 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba histolytica; #=GS M3UXA6/432-576 AC M3UXA6 #=GS M3UXA6/432-576 OS Entamoeba histolytica HM-1:IMSS-B #=GS M3UXA6/432-576 DE DNA polymerase I domain containing protein #=GS M3UXA6/432-576 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba histolytica; #=GS M2Q5K1/432-576 AC M2Q5K1 #=GS M2Q5K1/432-576 OS Entamoeba histolytica KU27 #=GS M2Q5K1/432-576 DE DNA-directed DNA polymerase, putative #=GS M2Q5K1/432-576 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba histolytica; #=GS B0ER84/3-145 AC B0ER84 #=GS B0ER84/3-145 OS Entamoeba dispar SAW760 #=GS B0ER84/3-145 DE DNA polymerase I, putative #=GS B0ER84/3-145 DR ORG; Eukaryota; Entamoebidae; Entamoeba; Entamoeba dispar; #=GS B4HGF6/1777-1919 AC B4HGF6 #=GS B4HGF6/1777-1919 OS Drosophila sechellia #=GS B4HGF6/1777-1919 DE GM25985 #=GS B4HGF6/1777-1919 DR ORG; Eukaryota; Metazoa; Arthropoda; Hexapoda; Insecta; Pterygota; Neoptera; Holometabola; Diptera; Brachycera; Muscomorpha; Ephydroidea; Drosophilidae; Drosophilinae; Drosophilini; Drosophila; Sophophora; melanogaster group; melanogaster subgroup; Drosophila sechellia; #=GS B4PPE3/1813-1956 AC B4PPE3 #=GS B4PPE3/1813-1956 OS Drosophila yakuba #=GS B4PPE3/1813-1956 DE Uncharacterized protein #=GS B4PPE3/1813-1956 DR ORG; Eukaryota; Metazoa; Arthropoda; Hexapoda; Insecta; Pterygota; Neoptera; Holometabola; Diptera; Brachycera; Muscomorpha; Ephydroidea; Drosophilidae; Drosophilinae; Drosophilini; Drosophila; Sophophora; melanogaster group; melanogaster subgroup; Drosophila yakuba; #=GF SQ 23 O18475/1829-1972 LEMRILAHMSQDKALLEVM-----------KSSQDLFIAIAAHW---NKIE-ESEVTQDLRNSTKQVCYGIVYGMGMRSLAESLNCSEQEARMISDQFHQAYKGIRDYTTRVVNFARSKGFVETITGRRRYLENINS-----DVEHLKNQAERQAVNSTIQGSA A0FLQ6/1453-1585 LELRVLAHLSNDSNLVNLI-----------TSDRDLFEELSIQW---NF----------PRDAVKQLCYGLIYGMGAKSLSELTRMSIEDAEKMLKAFFAMFPGVRSYINETKEKVCKEEPISTIIGRRTIIK--AS-----GIGEERARIERVAVNYTIQGSA Q583X2/726-867 VELRVLAHLSGDSALINVL-----------TKSGDIHRSIAEII-----FR-KTSVTGEERSLAKKVVFGILYGAGPRGLAQQMGVSVEQALRVSSLFKSCFPTVDAYQRRIIDQCRSDGSVRTLSGRVRSIPDIND-----RVLTKRSHAERQAFNTVVQGSA Q86HT8/240-387 IELRIMAHYSKDKHLIEYF-----------ESGKDVINMMASRL--IDGVD-PNNVKKEIRDKVKRIVYGILYGIQKNSLHKLLGVSLDEAQEHINNFNLKFEEVSSFIK--INSQIKNGKILTIGNRIRRFQDHSSIIPSTSSSSSLSSSPIQAINSIMQGSS Q54S42/1203-1339 VELRIIAHFSRDKHLIEYF-----------ESGSDVINMMAVRLSDRDDLD-VNNVDKETRDRVKRIVYGILYGIQAFSLGKLLNIPIYKASDHIKNFYFKFDGVSNFIQITKSNAEKSHVVPTLGKRIRKLD---------------SKFKTKAVNSIIQGSS D6X4C0/1366-1509 LELRVLAHLSRDEVLGGIL-----------RRKGDIFRAIAAKW---NNIS-ENEVTEELRQRAKQIIYGIIYGMGSKALAEQLNTDEAQATRFMQTFRNAYPGVQKYISEIIETCRKTGFVETLAGRRRFLAHINH-----KNGAVKSQAERQAVNTTIQGSA Q5TX00/1757-1912 LELSILTHLSQDPQLMAALGGGGNEAPGRTEARSDVFRALAARW---NHYERESDVSDELRNRTKAIVYGVIYGMGVRAMAAELQLDEDAARTLMEQFHATYPEIRRYIERVVRLTRQLGYIETLTGRRRHLPAITS-----ENARERSEAERQAVCTTIQGSA B8C4R5/262-407 KEVRILAHMSGDKALISLF---------QMDANVDIYKQMSSLI---RNKP-VESITAQERAQFKQVTLALLYGMSPNQVAKKLNITKSQAIQMMNDFFRRFQGVKNWMEDTKEFARRNHYVVTIAGRRRYLDGIDS-----DDNGAKAQAERQAINTVIQGSA C4LXM4/432-576 IELRILADFTKDHHLIEFF-----------KSNTDVHRLIAAHW---LKKN-VNDITDDERRKAKTIVYGCIYGIGPFSLADQLHVSLDESKAFLESFLDQFPAFKKWKEETITNASTTGFVHTINNRRRRINNLTDC----NDKKTVAESKRIAVNSPIQGTA B0EPC0/426-570 IELRILANFTKDHHLIEFF-----------KSNIDIHKLIAAHW---LKKN-VNDITDGERRKAKTIVYGCIYGIGPFSLADQLHISLDESKTFLESFLDQFPSFKKWKEEIITNASTTGFVHTINNRRRRINNLTDS----SDKKTLAESKRIAVNSPIQGTA K2HW55/432-576 IELRILADFTKDHHLIEFF-----------KSNTDVHRLIAAHW---LKKN-VNDITDDERRKAKTIVYGCIYGIGPFSLADQLHVSLDESKAFLESFLDQFPAFKKWKEETITNASTTGFVHTINNRRRRINNLTDC----NDKKTIAESKRIAVNSPIQGTA Q8IS90/701-842 IELRVLAHLCGDAALVEAL-----------TTSADIHRAIAEVV-----FK-KKPVSTEERRLAKRVVFGLLYGAGPKTLATHMGVTVDRALHITSLLANAFPGIDAYQRRVIEEARTNGFVRTLSGRLRYLPDIRS-----TVLSRRSYAERQAFNSVVQGSA F0ZMW2/262-409 LELRILTHLSQDPKLMEMF---------NCNINIDIFKYVAHQV---GNIP-YDSVTDSDRQQAKHLVYGILYGMGIKSIASELHIPIEQARGKLENFKKTYNKLIEYLEMVEENVIQNGYIATLFGRVRNFSNIHSC---KIDNNEISKVKRAARNSIPQGTA E9B4V0/700-841 IELRVLAHLCGDAALVEAL-----------TTSADIHRAIAEVV-----FK-KKPVSTEERSLAKRVVFGVLYGAGPKTLATHMGVTVDRALHITSLLTNAFPGIDAYHRRVVEEARANGFVRTLSGRLRYLPDIRS-----TVLSRRSYAERQAFNSVVQGSA A0A182KRG9/1698-1853 LELSILTHLSQDPQLMAALRGGGNEAPGHTEARSDVFRALAARW---NHYERESDVSDELRNRTKAIVYGVIYGMGVRAMAAELQLDEDAARTLMEQFHATYPEIRRYIERVVRLTRQLGYIETLTGRRRHLPAITS-----ENARERSEAERQAVCTTIQGSA M7WDJ9/432-576 IELRILADFTKDHHLIEFF-----------KSNTDVHRLIAAHW---LKKN-VNDITDDERRKAKTIVYGCIYGIGPFSLADQLHVSLDESKAFLESFLDQFPAFKKWKEETITNASTTGFVHTINNRRRRINNLTDC----NDKKTVAESKRIAVNSPIQGTA A0A175JIJ7/432-576 IELRILADFTKDHHLIEFF-----------KSNTDVHRLIAAHW---LKKN-VNDITDDERRKAKTIVYGCIYGIGPFSLADQLHVSLDESKAFLESFLDQFPAFKKWKEETITNASTTGFVHTINNRRRRINNLTDC----NDKKTVAESKRIAVNSPIQGTA N9V2T8/432-576 IELRILADFTKDHHLIEFF-----------KSNTDVHRLIAAHW---LKKN-VNDITDDERRKAKTIVYGCIYGIGPFSLADQLHVSLDESKAFLESFLDQFPAFKKWKEETITNASTTGFVHTINNRRRRINNLTDC----NDKKTVAESKRIAVNSPIQGTA M3UXA6/432-576 IELRILADFTKDHHLIEFF-----------KSNTDVHRLIAAHW---LKKN-VNDITDDERRKAKTIVYGCIYGIGPFSLADQLHVSLDESKAFLESFLDQFPAFKKWKEETITNASTTGFVHTINNRRRRINNLTDC----NDKKTVAESKRIAVNSPIQGTA M2Q5K1/432-576 IELRILADFTKDHHLIEFF-----------KSNTDVHRLIAAHW---LKKN-VNDITDDERRKAKTIVYGCIYGIGPFSLADQLHVSLDESKAFLESFLDQFPAFKKWKEETITNASTTGFVHTINNRRRRINNLTDC----NDKKTVAESKRIAVNSPIQGTA B0ER84/3-145 --LRILANFTKDHHLIEFF-----------KSNIDIHKLIAAHW---LKKN-VNDITDGERRKAKTIVYGCIYGIGPFSLADQLHISLDESKTFLESFLDQFPSFKKWKEEIITNASTTGFVHTINNRRRRINNLTDS----SDKKTLAESKRIAVNSPIQGTA B4HGF6/1777-1919 LEMRILAHMSQDKALLEVM-----------NSPQDLFIAIAAHW---NKIK-ESEVTPDLRNSTKQVCYGIVYGMGMRSLAESLNCSEQEARILSDQFHEAYKGIRDYTRRVVNFARGKGFVETITGRRRYLEMINS-----DMEHLK-KAERQAVNSTIQGSA B4PPE3/1813-1956 LEMRILAHMSQDKALLEVM-----------NSPQDLFIAIAAHW---NKIE-ESEVSQDLRNSTKHVCYGIVYGMGMRSLAESLNCSEQEARMISEQFHQAYKGIREYTSRVVKFARNQGFVETITGRRRYLDNINS-----DEEQLKNQAERQAINSTIQGSA #=GC scorecons 58777876554934955350000000000045439654367444000232303446535494459465784699574357744744535563344538333754544534445435443757396459583533445000003333335455749576479967 #=GC scorecons_70 _******____*__*___________________*____**______________*____*___*_*_**__**_*___**__*______*______*___*_________________*_*_**__*_*______________________*_*_*__***** #=GC scorecons_80 _******____*__*___________________*_____*___________________*___*___**__**_____*___*_____________*___*___________________*_*___*_*______________________*_*_*___**_* #=GC scorecons_90 _*_________*__*___________________*_________________________*___*____*__**_______________________*_________________________*___*_*________________________*_____**__ //