# STOCKHOLM 1.0 #=GF ID DHFR #=GF DE DHFR only alignment using structural alignment for basis (without fungal DHFR structures; some editing in non-consensus areas); should be processed with hmmbuild --hand --nofrag #=GF AU Smith, Allen Watkins #=GF DR PROSITE; PS00075; ## Weights are from pb2 with idlevel 0.65 ## 1U72A Cluster #=GS 1U70A AC DYR_MOUSE #=GS 1U70A DR SWS; P00375; #=GS 1U70A DR PDB; 1u70 A; #=GS 1U70A OS Mus musculus #=GS 1U70A OC poss_fungi_metazoa #=GS 1U70A OC fungi_metazoa #=GS 1U70A OC metazoa #=GS 1U70A OC vertebrata #=GS 1U70A OC tetrapoda #=GS 1U70A OC mammalia #=GS 1U70A OC placentals #=GS 1U70A DE Mouse (Leu22Arg mutation removed) #=GS 1U70A WT 0.121227785945 ## 1U70A Cluster: 1U72A #=GS DYR_RAT AC Q920D2 #=GS DYR_RAT OS Rattus norvegicus #=GS DYR_RAT OC poss_fungi_metazoa #=GS DYR_RAT OC fungi_metazoa #=GS DYR_RAT OC metazoa #=GS DYR_RAT OC vertebrata #=GS DYR_RAT OC tetrapoda #=GS DYR_RAT OC mammalia #=GS DYR_RAT OC placentals #=GS DYR_RAT DE Rat DHFR (no structure; aligned to 1U70A) #=GS DYR_RAT WT 0.0986232087016 ## DYR_RAT Cluster: 1U72A #=GS DYR_MESAU AC Q2MH30_CRIGR #=GS DYR_MESAU DR EMBL; AAA36974; #=GS DYR_MESAU DR EMBL; AAA36970; #=GS DYR_MESAU DR EMBL; BAE78431; #=GS DYR_MESAU DR EMBL; FAA00073; #=GS DYR_MESAU DR TREMBL; Q78EE3; #=GS DYR_MESAU DR TREMBL; Q9JHB0; #=GS DYR_MESAU DR TREMBL; Q2MH30; #=GS DYR_MESAU OS Mesocricetus auratus #=GS DYR_MESAU OS Cricetulus griseus #=GS DYR_MESAU OC poss_fungi_metazoa #=GS DYR_MESAU OC fungi_metazoa #=GS DYR_MESAU OC metazoa #=GS DYR_MESAU OC vertebrata #=GS DYR_MESAU OC tetrapoda #=GS DYR_MESAU OC mammalia #=GS DYR_MESAU OC placentals #=GS DYR_MESAU DE Golden, Chinese hamsters (no structure; aligned to 1U70A) ## is form with L at 22, not MTX-resistant variant MQ19-97 with F (also doesn't have D->N at 95; I note an additional MTX-resistant variant also subbing F at 22, with no D->N at 95 but a T->S at 144 - http://www.jbc.org/cgi/content/abstract/265/14/8317; probable steric hinderance) #=GS DYR_MESAU WT 0.0971931740642 ## DYR_MESAU Cluster: 1U72A #=GS Q78EH1_9RODE AC Q78EH1 #=GS Q78EH1_9RODE DR EMBL; AAA36972; #=GS Q78EH1_9RODE OS Cricetulus griseus #=GS Q78EH1_9RODE OC poss_fungi_metazoa #=GS Q78EH1_9RODE OC fungi_metazoa #=GS Q78EH1_9RODE OC metazoa #=GS Q78EH1_9RODE OC vertebrata #=GS Q78EH1_9RODE OC tetrapoda #=GS Q78EH1_9RODE OC mammalia #=GS Q78EH1_9RODE OC placentals #=GS Q78EH1_9RODE DE Cricetulus sp ("Chinese hamster" - if griseus, variant 2; no structure; aligned to 1U70A) #=GS Q78EH1_9RODE WT 0.12953646481 ## Q78EH1_9RODE Cluster: 1U72A #=GS 1U72A AC P00374 #=GS 1U72A OS Homo sapiens #=GS 1U72A OC poss_fungi_metazoa #=GS 1U72A OC fungi_metazoa #=GS 1U72A OC metazoa #=GS 1U72A OC vertebrata #=GS 1U72A OC tetrapoda #=GS 1U72A OC mammalia #=GS 1U72A OC placentals #=GS 1U72A DR PDB; 1u72 A; #=GS 1U72A DR PDB; 1u71 A; #=GS 1U72A DR PDB; 1dhf A; #=GS 1U72A DR PDB; 1dhf B; #=GS 1U72A DR PDB; 2dhf A; #=GS 1U72A DR PDB; 2dhf B; #=GS 1U72A DE Human - data on binding also from [12]DHF[AB] paper #=GS 1U72A WT 0.112223669887 ## 1U72A Cluster: 1U72A #=GS 1DHFB AC P00374 #=GS 1DHFB OS Homo sapiens #=GS 1DHFB OC poss_fungi_metazoa #=GS 1DHFB OC fungi_metazoa #=GS 1DHFB OC metazoa #=GS 1DHFB OC vertebrata #=GS 1DHFB OC tetrapoda #=GS 1DHFB OC mammalia #=GS 1DHFB OC placentals #=GS 1DHFB DR PDB; 1dhf A; #=GS 1DHFB DR PDB; 1dhf B; #=GS 1DHFB DR PDB; 2dhf A; #=GS 1DHFB DR PDB; 2dhf B; #=GS 1DHFB DE Human - with folate bound; data on binding also from 1U72A #=GS 1DHFB WT 0.112223669887 ## 1DHFB Cluster: 1U72A #=GS 1PD8A AC P00374 #=GS 1PD8A OS Homo sapiens #=GS 1PD8A OC poss_fungi_metazoa #=GS 1PD8A OC fungi_metazoa #=GS 1PD8A OC metazoa #=GS 1PD8A OC vertebrata #=GS 1PD8A OC tetrapoda #=GS 1PD8A OC mammalia #=GS 1PD8A OC placentals #=GS 1PD8A DR PDB; 1pd8 A; #=GS 1PD8A DE Human #=GS 1PD8A WT 0.112223669887 ## 1PD8A Cluster: 1U72A #=GS XP_001110551 AC XP_001110551 #=GS XP_001110551 OS Macaca mulatta #=GS XP_001110551 OC poss_fungi_metazoa #=GS XP_001110551 OC fungi_metazoa #=GS XP_001110551 OC metazoa #=GS XP_001110551 OC vertebrata #=GS XP_001110551 OC tetrapoda #=GS XP_001110551 OC mammalia #=GS XP_001110551 OC placentals #=GS XP_001110551 DE Rhesus macaque (no structure; aligned to 1U72A) #=GS XP_001110551 WT 0.132289975882 ## XP_001110551 Cluster: 1U72A #=GS XP_001134992 AC XP_001134992 #=GS XP_001134992 OS Pan troglodytes #=GS XP_001134992 OC poss_fungi_metazoa #=GS XP_001134992 OC fungi_metazoa #=GS XP_001134992 OC metazoa #=GS XP_001134992 OC vertebrata #=GS XP_001134992 OC tetrapoda #=GS XP_001134992 OC mammalia #=GS XP_001134992 OC placentals #=GS XP_001134992 DE Chimpanzee (no structure; aligned to 1U72A) #=GS XP_001134992 WT 0.112223669887 ## XP_001134992 Cluster: 1U72A #=GS XP_851329 AC XP_851329 #=GS XP_851329 OS Canis lupus #=GS XP_851329 OC poss_fungi_metazoa #=GS XP_851329 OC fungi_metazoa #=GS XP_851329 OC metazoa #=GS XP_851329 OC vertebrata #=GS XP_851329 OC tetrapoda #=GS XP_851329 OC mammalia #=GS XP_851329 OC placentals #=GS XP_851329 DE Wolf/dog (variant 1; no structure; aligned to 1U72A|8DFR0 (matching results)) #=GS XP_851329 WT 0.178840309381 ## XP_851329 Cluster: 1U72A #=GS XP_536308 AC XP_536308 #=GS XP_536308 OS Canis lupus #=GS XP_536308 OC poss_fungi_metazoa #=GS XP_536308 OC fungi_metazoa #=GS XP_536308 OC metazoa #=GS XP_536308 OC vertebrata #=GS XP_536308 OC tetrapoda #=GS XP_536308 OC mammalia #=GS XP_536308 OC placentals ## trimmed tvvvgylvk at start #=GS XP_536308 DE Wolf/dog (variant 2 - incomplete; no structure; aligned to 1U70A|1U72A|8DFR0) #=GS XP_536308 WT 0.0817937925458 ## XP_536308 Cluster: 1U72A #=GS DYR_PIG AC P00377 #=GS DYR_PIG OS Sus scrofa #=GS DYR_PIG OC poss_fungi_metazoa #=GS DYR_PIG OC fungi_metazoa #=GS DYR_PIG OC metazoa #=GS DYR_PIG OC vertebrata #=GS DYR_PIG OC tetrapoda #=GS DYR_PIG OC mammalia #=GS DYR_PIG OC placentals #=GS DYR_PIG DE Pig (no structure; aligned to 1U70A|1U72A|8DFR0) #=GS DYR_PIG WT 0.115356206894 ## DYR_PIG Cluster: 1U72A #=GS DYR_BOVIN AC DYR_BOVIN ## not sure about cross-references... #=GS DYR_BOVIN DR SWS; P00376; #=GS DYR_BOVIN DR SWS; Q29RI1; #=GS DYR_BOVIN OS Bos taurus #=GS DYR_BOVIN OC poss_fungi_metazoa #=GS DYR_BOVIN OC fungi_metazoa #=GS DYR_BOVIN OC metazoa #=GS DYR_BOVIN OC vertebrata #=GS DYR_BOVIN OC tetrapoda #=GS DYR_BOVIN OC mammalia #=GS DYR_BOVIN OC placentals ## aligned to 1U70A|1U72A|8DFR0 #=GS DYR_BOVIN DE Cow (variant 1; no structure) #=GS DYR_BOVIN WT 0.114235892892 ## DYR_BOVIN Cluster: 1U72A #=GS P00376 AC P00376 ## not sure about cross-references... #=GS P00376 DR EMBL; AAI14163; #=GS P00376 DR SWS; P00376; #=GS P00376 OS Bos taurus #=GS P00376 OC poss_fungi_metazoa #=GS P00376 OC fungi_metazoa #=GS P00376 OC metazoa #=GS P00376 OC vertebrata #=GS P00376 OC tetrapoda #=GS P00376 OC mammalia #=GS P00376 OC placentals ## aligned to 1U70A|1U72A|8DFR0 #=GS P00376 DE Cow (variant 2; no structure) #=GS P00376 WT 0.115463130176 ## P00376 Cluster: 1U72A #=GS Q29RI1_BOVIN AC Q29RI1 ## not sure about cross-references... #=GS Q29RI1_BOVIN DR EMBL; AAI14163; #=GS Q29RI1_BOVIN DR TREMBL; Q29RI1; #=GS Q29RI1_BOVIN OS Bos taurus #=GS Q29RI1_BOVIN OC poss_fungi_metazoa #=GS Q29RI1_BOVIN OC fungi_metazoa #=GS Q29RI1_BOVIN OC metazoa #=GS Q29RI1_BOVIN OC vertebrata #=GS Q29RI1_BOVIN OC tetrapoda #=GS Q29RI1_BOVIN OC mammalia #=GS Q29RI1_BOVIN OC placentals ## aligned to 1U70A|1U72A|8DFR0 #=GS Q29RI1_BOVIN DE Cow (variant 3; no structure) #=GS Q29RI1_BOVIN WT 0.114886291325 ## Q29RI1_BOVIN Cluster: 1U72A #=GS PLACENT AC PLACENTAL #=GS PLACENT OS Placental ancestral #=GS PLACENT OC poss_fungi_metazoa #=GS PLACENT OC fungi_metazoa #=GS PLACENT OC metazoa #=GS PLACENT OC vertebrata #=GS PLACENT OC tetrapoda #=GS PLACENT OC mammalia #=GS PLACENT OC placentals ## Has I at 100 #=GS PLACENT DE Model of placental ancestral #=GS PLACENT WT 0.0939027890563 ## PLACENT Cluster: 1U72A #=GS XP_001363618 AC XP_001363618 #=GS XP_001363618 OS Monodelphis domestica #=GS XP_001363618 OC poss_fungi_metazoa #=GS XP_001363618 OC fungi_metazoa #=GS XP_001363618 OC metazoa #=GS XP_001363618 OC vertebrata #=GS XP_001363618 OC tetrapoda #=GS XP_001363618 OC mammalia #=GS XP_001363618 DE Opossum (no structure; aligned to 1U70A|1U72A|8DFR0) #=GS XP_001363618 WT 0.157856851816 ## XP_001363618 Cluster: 1U72A #=GS 8DFR0 AC DYR_CHICK #=GS 8DFR0 DR SWS; P00378; #=GS 8DFR0 DR PDB; 8dfr; #=GS 8DFR0 OS Gallus gallus #=GS 8DFR0 OC poss_fungi_metazoa #=GS 8DFR0 OC fungi_metazoa #=GS 8DFR0 OC metazoa #=GS 8DFR0 OC vertebrata #=GS 8DFR0 OC tetrapoda #=GS 8DFR0 DE Chicken #=GS 8DFR0 WT 0.169156074524 ## 8DFR0 Cluster: 1U72A #=GS 1DR10 AC DYR_CHICK #=GS 1DR10 DR SWS; P00378; #=GS 1DR10 DR PDB; 1dr1; #=GS 1DR10 OS Gallus gallus #=GS 1DR10 OC poss_fungi_metazoa #=GS 1DR10 OC fungi_metazoa #=GS 1DR10 OC metazoa #=GS 1DR10 OC vertebrata #=GS 1DR10 OC tetrapoda #=GS 1DR10 DE Chicken #=GS 1DR10 WT 0.169156074524 ## 1DR10 Cluster: 1U72A #=GS AGA AC AGA #=GS AGA OS Uramniota AGA #=GS AGA OC poss_fungi_metazoa #=GS AGA OC fungi_metazoa #=GS AGA OC metazoa #=GS AGA OC vertebrata #=GS AGA OC tetrapoda #=GS AGA DE Mammal/chicken ancestral model (seq with AGA) #=GS AGA WT 0.0936328917742 ## AGA Cluster: 1U72A #=GS PGV AC PGV #=GS PGV OS Uramniota PGV #=GS PGV OC poss_fungi_metazoa #=GS PGV OC fungi_metazoa #=GS PGV OC metazoa #=GS PGV OC vertebrata #=GS PGV OC tetrapoda #=GS PGV DE Mammal/chicken ancestral model (seq with PGV) #=GS PGV WT 0.0930436998606 ## PGV Cluster: 1U72A #=GS Q5U543_XENLA AC Q5U543 #=GS Q5U543_XENLA OS Xenopus laevis #=GS Q5U543_XENLA OC poss_fungi_metazoa #=GS Q5U543_XENLA OC fungi_metazoa #=GS Q5U543_XENLA OC metazoa #=GS Q5U543_XENLA OC vertebrata #=GS Q5U543_XENLA OC tetrapoda #=GS Q5U543_XENLA DE no structure; aligned to 8DFR0 (most consistent with others) #=GS Q5U543_XENLA WT 0.173069626093 ## Q5U543_XENLA Cluster: 1U72A #=GS ENSXETP49617 AC ENSXETP00000049617 #=GS ENSXETP49617 OS Xenopus tropicalis #=GS ENSXETP49617 OC poss_fungi_metazoa #=GS ENSXETP49617 OC fungi_metazoa #=GS ENSXETP49617 OC metazoa #=GS ENSXETP49617 OC vertebrata #=GS ENSXETP49617 OC tetrapoda #=GS ENSXETP49617 DE no structure; aligned to 8DFR0 (most consistent with others) #=GS ENSXETP49617 WT 0.167103275657 ## ENSXETP49617 Cluster: 1U72A #=GS AAK01951 AC AAK01951 #=GS AAK01951 OS Danio rerio #=GS AAK01951 OC poss_fungi_metazoa #=GS AAK01951 OC fungi_metazoa #=GS AAK01951 OC metazoa #=GS AAK01951 OC vertebrata #=GS AAK01951 DE Zebrafish variant 1 (no structure; aligned to 1U70A due to that being only metazoan aligning well to it) ## first 2 residues removed #=GS AAK01951 WT 0.194286435843 ## AAK01951 Cluster: 1U72A #=GS CAM14042 AC CAM14042 #=GS CAM14042 OS Danio rerio #=GS CAM14042 OC poss_fungi_metazoa #=GS CAM14042 OC fungi_metazoa #=GS CAM14042 OC metazoa #=GS CAM14042 OC vertebrata #=GS CAM14042 DE Zebrafish variant 2 (no structure; aligned to 1U70A due to that being only metazoan aligning well to it) #=GS CAM14042 WT 0.173997327685 ## CAM14042 Cluster: 1U72A #=GS NP_571850 AC NP_571850 #=GS NP_571850 OS Danio rerio #=GS NP_571850 OC poss_fungi_metazoa #=GS NP_571850 OC fungi_metazoa #=GS NP_571850 OC metazoa #=GS NP_571850 OC vertebrata #=GS NP_571850 DE Zebrafish variant 3 (no structure; aligned to 1U70A due to that being only metazoan aligning well to it) #=GS NP_571850 WT 0.178801462054 ## NP_571850 Cluster: 1U72A #=GS XP_001176553 AC XP_001176553 #=GS XP_001176553 OS Strongylocentrotus purpuratus #=GS XP_001176553 OC poss_fungi_metazoa #=GS XP_001176553 OC fungi_metazoa #=GS XP_001176553 OC metazoa #=GS XP_001176553 DE Sea urchin (no structure; aligned to 1U70A|1U72A, some 8DFR0 (consistent portion)) #=GS XP_001176553 WT 0.263832390308 ## XP_001176553 Cluster: 1U72A #=GS ES AC _E_SKFEDQ #=GS ES OS Deuterostomia ES #=GS ES OC poss_fungi_metazoa #=GS ES OC fungi_metazoa #=GS ES OC metazoa #=GS ES DE Deuterostomia ancestral model (_E_SKFEDQ seq) #=GS ES WT 0.0969611406326 ## ES Cluster: 1U72A #=GS KAG AC _KAGKFEDQ #=GS KAG OS Deuterostomia KAG #=GS KAG OC poss_fungi_metazoa #=GS KAG OC fungi_metazoa #=GS KAG OC metazoa #=GS KAG DE Deuterostomia ancestral model (_KAGKFEDQ seq) #=GS KAG WT 0.0977780967951 ## KAG Cluster: 1U72A #=GS XP_973338 AC XP_973338 #=GS XP_973338 OS Tribolium castaneum #=GS XP_973338 OC poss_fungi_metazoa #=GS XP_973338 OC fungi_metazoa #=GS XP_973338 OC metazoa #=GS XP_973338 DE Flour beetle (no structure; aligned via DHFR.metazoa.only.weighted.hmm) #=GS XP_973338 WT 0.469422280788 ## XP_973338 Cluster: 1U72A #=GS EAL28532 AC EAL28532 #=GS EAL28532 OS Drosophila pseudoobscura #=GS EAL28532 OC poss_fungi_metazoa #=GS EAL28532 OC fungi_metazoa #=GS EAL28532 OC metazoa #=GS EAL28532 DE Drosophila pseudoobscura (no structure; aligned via DHFR.metazoa.only.weighted.hmm) #=GS EAL28532 WT 0.220712319016 ## EAL28532 Cluster: 1U72A #=GS DYR_DROME AC DYR_DROME #=GS DYR_DROME DR SWS; P17719 #=GS DYR_DROME DR SWS; Q9VEU4 #=GS DYR_DROME DR EMBL; AAF55324 #=GS DYR_DROME OS Drosophila melanogaster #=GS DYR_DROME OC poss_fungi_metazoa #=GS DYR_DROME OC fungi_metazoa #=GS DYR_DROME OC metazoa #=GS DYR_DROME DE Drosophila melanogaster (no structure; aligned via DHFR.metazoa.only.weighted.hmm) #=GS DYR_DROME WT 0.207373455167 ## DYR_DROME Cluster: 1U72A #=GS AAA19051 AC AAA19051 #=GS AAA19051 DR EMBL; AAA19051; #=GS AAA19051 DR SWS; P17719 #=GS AAA19051 DR SWS; Q9VEU4 #=GS AAA19051 OS Drosophila melanogaster #=GS AAA19051 OC poss_fungi_metazoa #=GS AAA19051 OC fungi_metazoa #=GS AAA19051 OC metazoa #=GS AAA19051 DE Drosophila melanogaster (no structure; aligned via DHFR.metazoa.only.weighted.hmm; MTX-resistant variant) #=GS AAA19051 WT 0.223387271166 ## AAA19051 Cluster: 1U72A #=GS XP_393902 AC XP_393902 #=GS XP_393902 OS Apis mellifera #=GS XP_393902 OC poss_fungi_metazoa #=GS XP_393902 OC fungi_metazoa #=GS XP_393902 OC metazoa #=GS XP_393902 DE Honeybee (no structure; aligned via DHFR.metazoa.only.weighted.hmm) #=GS XP_393902 WT 0.326980292797 ## XP_393902 Cluster: 1U72A #=GS Q7Q0L5_ANOGA AC Q7Q0L5 #=GS Q7Q0L5_ANOGA OS Anopheles gambiae #=GS Q7Q0L5_ANOGA OC poss_fungi_metazoa #=GS Q7Q0L5_ANOGA OC fungi_metazoa #=GS Q7Q0L5_ANOGA OC metazoa #=GS Q7Q0L5_ANOGA DE Mosquito (no structure; aligned via DHFR.metazoa.only.weighted.hmm) #=GS Q7Q0L5_ANOGA WT 0.269749164581 ## Q7Q0L5_ANOGA Cluster: 1U72A #=GS DYR_CAEEL_1 AC Q93341 #=GS DYR_CAEEL_1 DR SWS; Q93341; #=GS DYR_CAEEL_1 DR EMBL; CAB02272; #=GS DYR_CAEEL_1 OS Caenorhabditis elegans #=GS DYR_CAEEL_1 OC poss_fungi_metazoa #=GS DYR_CAEEL_1 OC fungi_metazoa #=GS DYR_CAEEL_1 OC metazoa #=GS DYR_CAEEL_1 DE C. elegans (no structure; aligned via DHFR.caeno.weighted.hmm; alignment version 1) #=GS DYR_CAEEL_1 WT 0.266028881073 ## DYR_CAEEL_1 Cluster: 1U72A #=GS DYR_CAEEL_2 AC Q93341 #=GS DYR_CAEEL_2 DR SWS; Q93341; #=GS DYR_CAEEL_2 DR EMBL; CAB02272; #=GS DYR_CAEEL_2 OS Caenorhabditis elegans #=GS DYR_CAEEL_2 OC poss_fungi_metazoa #=GS DYR_CAEEL_2 OC fungi_metazoa #=GS DYR_CAEEL_2 OC metazoa #=GS DYR_CAEEL_2 DE C. elegans (no structure; aligned via DHFR.caeno.weighted.hmm; alignment version 2) #=GS DYR_CAEEL_2 WT 0.220306620002 ## DYR_CAEEL_2 Cluster: 1U72A #=GS Q61DT5_CAEBR_1 AC Q61DT5 #=GS Q61DT5_CAEBR_1 DR TREMBL; Q61DT5; #=GS Q61DT5_CAEBR_1 DR EMBL; CAE66962; #=GS Q61DT5_CAEBR_1 OS Caenorhabditis briggsae #=GS Q61DT5_CAEBR_1 OC poss_fungi_metazoa #=GS Q61DT5_CAEBR_1 OC fungi_metazoa #=GS Q61DT5_CAEBR_1 OC metazoa #=GS Q61DT5_CAEBR_1 DE C. briggsae (no structure; aligned via DHFR.caeno.weighted.hmm; alignment version 1) #=GS Q61DT5_CAEBR_1 WT 0.243840783834 ## Q61DT5_CAEBR_1 Cluster: 1U72A #=GS Q61DT5_CAEBR_2 AC Q61DT5 #=GS Q61DT5_CAEBR_2 DR TREMBL; Q61DT5; #=GS Q61DT5_CAEBR_2 DR EMBL; CAE66962; #=GS Q61DT5_CAEBR_2 OS Caenorhabditis briggsae #=GS Q61DT5_CAEBR_2 OC poss_fungi_metazoa #=GS Q61DT5_CAEBR_2 OC fungi_metazoa #=GS Q61DT5_CAEBR_2 OC metazoa #=GS Q61DT5_CAEBR_2 DE C. briggsae (no structure; aligned via DHFR.caeno.weighted.hmm; alignment version 2) #=GS Q61DT5_CAEBR_2 WT 0.201498270035 ## Q61DT5_CAEBR_2 Cluster: 1U72A #=GS 1111_GTF AC 1111_GTF #=GS 1111_GTF OS Fungimetazoa gtf #=GS 1111_GTF OC poss_fungi_metazoa #=GS 1111_GTF OC fungi_metazoa #=GS 1111_GTF DE fungi/metazoa ancestral sequence 1111_GTF #=GS 1111_GTF WT 0.0878647193313 ## 1111_GTF Cluster: 1U72A #=GS 1111_STF AC 1111_STF #=GS 1111_STF OS Fungimetazoa stf #=GS 1111_STF OC poss_fungi_metazoa #=GS 1111_STF OC fungi_metazoa #=GS 1111_STF DE fungi/metazoa ancestral sequence 1111_STF #=GS 1111_STF WT 0.0872488096356 ## 1111_STF Cluster: 1U72A #=GS AAQ02615_1 AC AAQ02615 #=GS AAQ02615_1 DR EMBL; AAQ02615; #=GS AAQ02615_1 DR TREMBL; Q6WEA8; #=GS AAQ02615_1 OS Hartmannella cantabrigiensis #=GS AAQ02615_1 OC poss_fungi_metazoa #=GS AAQ02615_1 DE Hartmannella cantabrigiensis (no structure; variant 1; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 1) #=GS AAQ02615_1 WT 0.172971338034 ## AAQ02615_1 Cluster: 1U72A #=GS AAQ02617_1 AC AAQ02617 #=GS AAQ02617_1 DR EMBL; AAQ02617; #=GS AAQ02617_1 DR TREMBL; Q6WEA6; #=GS AAQ02617_1 OS Hartmannella cantabrigiensis #=GS AAQ02617_1 OC poss_fungi_metazoa #=GS AAQ02617_1 DE Hartmannella cantabrigiensis (no structure; variant 2; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 1) #=GS AAQ02617_1 WT 0.154925167561 ## AAQ02617_1 Cluster: 1U72A #=GS AAQ02619_1 AC AAQ02619 #=GS AAQ02619_1 DR EMBL; AAQ02619; #=GS AAQ02619_1 DR TREMBL; Q6WEA4; #=GS AAQ02619_1 OS Hartmannella cantabrigiensis #=GS AAQ02619_1 OC poss_fungi_metazoa #=GS AAQ02619_1 DE Hartmannella cantabrigiensis (no structure; variant 3; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 1) #=GS AAQ02619_1 WT 0.17264996469 ## AAQ02619_1 Cluster: 1U72A #=GS AAQ02621_1 AC AAQ02621 #=GS AAQ02621_1 DR EMBL; AAQ02621; #=GS AAQ02621_1 DR TREMBL; Q6WEA2; #=GS AAQ02621_1 OS Hartmannella cantabrigiensis #=GS AAQ02621_1 OC poss_fungi_metazoa #=GS AAQ02621_1 DE Hartmannella cantabrigiensis (no structure; variant 4; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 1) #=GS AAQ02621_1 WT 0.173445239663 ## AAQ02621_1 Cluster: 1U72A #=GS AAQ02615_2 AC AAQ02615 #=GS AAQ02615_2 DR EMBL; AAQ02615; #=GS AAQ02615_2 DR TREMBL; Q6WEA8; #=GS AAQ02615_2 OS Hartmannella cantabrigiensis #=GS AAQ02615_2 OC poss_fungi_metazoa #=GS AAQ02615_2 DE Hartmannella cantabrigiensis (no structure; variant 1; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 2) #=GS AAQ02615_2 WT 0.179195031524 ## AAQ02615_2 Cluster: 1U72A #=GS AAQ02617_2 AC AAQ02617 #=GS AAQ02617_2 DR EMBL; AAQ02617; #=GS AAQ02617_2 DR TREMBL; Q6WEA6; #=GS AAQ02617_2 OS Hartmannella cantabrigiensis #=GS AAQ02617_2 OC poss_fungi_metazoa #=GS AAQ02617_2 DE Hartmannella cantabrigiensis (no structure; variant 2; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 2) #=GS AAQ02617_2 WT 0.161148831248 ## AAQ02617_2 Cluster: 1U72A #=GS AAQ02619_2 AC AAQ02619 #=GS AAQ02619_2 DR EMBL; AAQ02619; #=GS AAQ02619_2 DR TREMBL; Q6WEA4; #=GS AAQ02619_2 OS Hartmannella cantabrigiensis #=GS AAQ02619_2 OC poss_fungi_metazoa #=GS AAQ02619_2 DE Hartmannella cantabrigiensis (no structure; variant 3; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 2) #=GS AAQ02619_2 WT 0.184245377779 ## AAQ02619_2 Cluster: 1U72A #=GS AAQ02621_2 AC AAQ02621 #=GS AAQ02621_2 DR EMBL; AAQ02621; #=GS AAQ02621_2 DR TREMBL; Q6WEA2; #=GS AAQ02621_2 OS Hartmannella cantabrigiensis #=GS AAQ02621_2 OC poss_fungi_metazoa #=GS AAQ02621_2 DE Hartmannella cantabrigiensis (no structure; variant 4; aligned via DHFR.weighted.for.fungi.tmp3.hmm; alignment version 2) #=GS AAQ02621_2 WT 0.185040608048 ## AAQ02621_2 Cluster: 1U72A ## end of real 1U72A cluster #=GS DYR_ENCCU_1 AC O62583 #=GS DYR_ENCCU_1 DR SWS; O62583; #=GS DYR_ENCCU_1 DR EMBL; CAA06647; #=GS DYR_ENCCU_1 DR EMBL; CAD24887; #=GS DYR_ENCCU_1 DR EMBL; CAD25017; #=GS DYR_ENCCU_1 DR EMBL; CAD26313; #=GS DYR_ENCCU_1 OS Encephalitozoon cuniculi #=GS DYR_ENCCU_1 OC poss_fungi_metazoa #=GS DYR_ENCCU_1 OC fungi_metazoa #=GS DYR_ENCCU_1 OC fungi #=GS DYR_ENCCU_1 DE Encephalitozoon cuniculi (no structure; aligned via DHFR.weighted.for.enceph.hmm; alignment version 1) #=GS DYR_ENCCU_1 WT 0.389784961939 ## DYR_ENCCU_1 Cluster: 1U72A #=GS DYR_ENCCU_2 AC O62583 #=GS DYR_ENCCU_2 DR SWS; O62583; #=GS DYR_ENCCU_2 DR EMBL; CAA06647; #=GS DYR_ENCCU_2 DR EMBL; CAD24887; #=GS DYR_ENCCU_2 DR EMBL; CAD25017; #=GS DYR_ENCCU_2 DR EMBL; CAD26313; #=GS DYR_ENCCU_2 OS Encephalitozoon cuniculi #=GS DYR_ENCCU_2 OC poss_fungi_metazoa #=GS DYR_ENCCU_2 OC fungi_metazoa #=GS DYR_ENCCU_2 OC fungi #=GS DYR_ENCCU_2 DE Encephalitozoon cuniculi (no structure; aligned via DHFR.weighted.for.enceph.hmm; alignment version 2) #=GS DYR_ENCCU_2 WT 0.408116817474 ## DYR_ENCCU_2 Cluster: 1U72A ## start of real 1DYR0 cluster #=GS EAK84413 AC EAK84413 #=GS EAK84413 DR EMBL; EAK84413; #=GS EAK84413 OS Ustilago maydis #=GS EAK84413 OC poss_fungi_metazoa #=GS EAK84413 OC fungi_metazoa #=GS EAK84413 OC fungi #=GS EAK84413 DE Ustilago maydis (no structure; aligned via DHFR.weighted.for.ust.hmm) ## initial part before, including m (alternative start site?) taken off #=GS EAK84413 WT 0.423381239176 ## EAK84413 Cluster: 1U72A #=GS BAC75955 AC BAC75955 #=GS BAC75955 DR EMBL; BAC75955; #=GS BAC75955 OS Coprinus cinereus #=GS BAC75955 OC poss_fungi_metazoa #=GS BAC75955 OC fungi_metazoa #=GS BAC75955 OC fungi #=GS BAC75955 DE Coprinus cinereus (no structure; aligned via DHFR.weighted.for.fungi.tmp3.hmm) #=GS BAC75955 WT 0.244362533092 ## BAC75955 Cluster: 1U72A #=GS DYR_CRYNE AC Q07801 #=GS DYR_CRYNE DR SWS; Q07801; #=GS DYR_CRYNE DR SWS; Q5KAF0; #=GS DYR_CRYNE DR TREMBL; Q55L31; #=GS DYR_CRYNE DR EMBL; AAB26198; #=GS DYR_CRYNE DR EMBL; AAW45849; #=GS DYR_CRYNE DR EMBL; EAL18511; #=GS DYR_CRYNE OS Cryptococcus neoformans #=GS DYR_CRYNE OC poss_fungi_metazoa #=GS DYR_CRYNE OC fungi_metazoa #=GS DYR_CRYNE OC fungi #=GS DYR_CRYNE DE Cryptococcus neoformans (no structure; aligned via DHFR.weighted.for.cryptococcus.hmm) #=GS DYR_CRYNE WT 0.33968180418 ## DYR_CRYNE Cluster: 1U72A #=GS DYR_SCHPO_1 AC P36591 #=GS DYR_SCHPO_1 DR SWS; P36591; #=GS DYR_SCHPO_1 OS Schizosaccharomyces pombe #=GS DYR_SCHPO_1 OC poss_fungi_metazoa #=GS DYR_SCHPO_1 OC fungi_metazoa #=GS DYR_SCHPO_1 OC fungi #=GS DYR_SCHPO_1 OC ascomycota #=GS DYR_SCHPO_1 DE Schizosaccharomyces pombe (no structure; aligned via DHFR.weighted.for.pombe.hmm; alignment version 1) ## initial part before, including m (alternative start site, am guessing - there is evidence for the full-length transcript being present...) taken off #=GS DYR_SCHPO_1 WT 0.289526998997 ## DYR_SCHPO_1 Cluster: 1U72A #=GS DYR_SCHPO_2 AC P36591 #=GS DYR_SCHPO_2 DR SWS; P36591; #=GS DYR_SCHPO_2 OS Schizosaccharomyces pombe #=GS DYR_SCHPO_2 OC poss_fungi_metazoa #=GS DYR_SCHPO_2 OC fungi_metazoa #=GS DYR_SCHPO_2 OC fungi #=GS DYR_SCHPO_2 OC ascomycota #=GS DYR_SCHPO_2 DE Schizosaccharomyces pombe (no structure; aligned via DHFR.weighted.for.pombe.hmm; alignment version 2) ## initial part before, including m (alternative start site, am guessing - there is evidence for the full-length transcript being present...) taken off #=GS DYR_SCHPO_2 WT 0.306025266647 ## DYR_SCHPO_2 Cluster: 1U72A #=GS DYR_PNECA AC P16184 #=GS DYR_PNECA DR SWS; P16184; #=GS DYR_PNECA DR PDB; 1dyr; #=GS DYR_PNECA DR PDB; 1cd2 A; #=GS DYR_PNECA DR PDB; 1daj; #=GS DYR_PNECA DR PDB; 1e26 A; #=GS DYR_PNECA DR PDB; 1klk A; #=GS DYR_PNECA DR PDB; 1ly3 A; #=GS DYR_PNECA DR PDB; 1ly4 A; #=GS DYR_PNECA DR PDB; 1s3y A; #=GS DYR_PNECA DR PDB; 1vj3 A; #=GS DYR_PNECA DR PDB; 2cd2 A; #=GS DYR_PNECA DR PDB; 3cd2 A; #=GS DYR_PNECA DR PDB; 4cd2 A; #=GS DYR_PNECA OS Pneumocystis carinii f. sp. rattus #=GS DYR_PNECA OC poss_fungi_metazoa #=GS DYR_PNECA OC fungi_metazoa #=GS DYR_PNECA OC fungi #=GS DYR_PNECA OC ascomycota #=GS DYR_PNECA DE Pneumocystis carinii (structures not used - aligned via DHFR.weighted.for.fungi.tmp4.hmm; variant 1 (rat)) #=GS DYR_PNECA WT 0.348079890013 ## DYR_PNECA Cluster: 1U72A #=GS AAF14071 AC AAF14071 #=GS AAF14071 DR EMBL; AAF14071; #=GS AAF14071 OS Pneumocystis carinii f. sp. hominis #=GS AAF14071 OC poss_fungi_metazoa #=GS AAF14071 OC fungi_metazoa #=GS AAF14071 OC fungi #=GS AAF14071 OC ascomycota #=GS AAF14071 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp4.hmm; variant 2 (human)) #=GS AAF14071 WT 0.095573887229 ## AAF14071 Cluster: 1U72A #=GS AAL25720 AC AAL25720 #=GS AAL25720 DR EMBL; AAL25720; #=GS AAL25720 OS Pneumocystis carinii #=GS AAL25720 OC poss_fungi_metazoa #=GS AAL25720 OC fungi_metazoa #=GS AAL25720 OC fungi #=GS AAL25720 OC ascomycota #=GS AAL25720 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 3) #=GS AAL25720 WT 0.2409542799 ## AAL25720 Cluster: 1U72A #=GS AAT99406 AC AAT99406 #=GS AAT99406 DR EMBL; AAT99406; #=GS AAT99406 OS Pneumocystis carinii #=GS AAT99406 OC poss_fungi_metazoa #=GS AAT99406 OC fungi_metazoa #=GS AAT99406 OC fungi #=GS AAT99406 OC ascomycota #=GS AAT99406 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 4) #=GS AAT99406 WT 0.134850770235 ## AAT99406 Cluster: 1U72A #=GS AAT99411 AC AAT99411 #=GS AAT99411 DR EMBL; AAT99411; #=GS AAT99411 OS Pneumocystis carinii #=GS AAT99411 OC poss_fungi_metazoa #=GS AAT99411 OC fungi_metazoa #=GS AAT99411 OC fungi #=GS AAT99411 OC ascomycota #=GS AAT99411 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 5) #=GS AAT99411 WT 0.100311994553 ## AAT99411 Cluster: 1U72A #=GS AAT99412 AC AAT99412 #=GS AAT99412 DR EMBL; AAT99412; #=GS AAT99412 OS Pneumocystis carinii #=GS AAT99412 OC poss_fungi_metazoa #=GS AAT99412 OC fungi_metazoa #=GS AAT99412 OC fungi #=GS AAT99412 OC ascomycota #=GS AAT99412 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 6) #=GS AAT99412 WT 0.0986605361104 ## AAT99412 Cluster: 1U72A #=GS AAT99413 AC AAT99413 #=GS AAT99413 DR EMBL; AAT99413; #=GS AAT99413 OS Pneumocystis carinii #=GS AAT99413 OC poss_fungi_metazoa #=GS AAT99413 OC fungi_metazoa #=GS AAT99413 OC fungi #=GS AAT99413 OC ascomycota #=GS AAT99413 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 7) #=GS AAT99413 WT 0.0989902466536 ## AAT99413 Cluster: 1U72A #=GS AAT99417 AC AAT99417 #=GS AAT99417 DR EMBL; AAT99417; #=GS AAT99417 OS Pneumocystis carinii #=GS AAT99417 OC poss_fungi_metazoa #=GS AAT99417 OC fungi_metazoa #=GS AAT99417 OC fungi #=GS AAT99417 OC ascomycota #=GS AAT99417 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 8) #=GS AAT99417 WT 0.174187868834 ## AAT99417 Cluster: 1U72A #=GS ABB84704 AC ABB84704 #=GS ABB84704 DR EMBL; ABB84704; #=GS ABB84704 OS Pneumocystis carinii #=GS ABB84704 OC poss_fungi_metazoa #=GS ABB84704 OC fungi_metazoa #=GS ABB84704 OC fungi #=GS ABB84704 OC ascomycota #=GS ABB84704 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 9) #=GS ABB84704 WT 0.127951309085 ## ABB84704 Cluster: 1U72A #=GS ABB84712 AC ABB84712 #=GS ABB84712 DR EMBL; ABB84712; #=GS ABB84712 OS Pneumocystis carinii #=GS ABB84712 OC poss_fungi_metazoa #=GS ABB84712 OC fungi_metazoa #=GS ABB84712 OC fungi #=GS ABB84712 OC ascomycota #=GS ABB84712 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 10) #=GS ABB84712 WT 0.0966892316937 ## ABB84712 Cluster: 1U72A #=GS ABB84716 AC ABB84716 #=GS ABB84716 DR EMBL; ABB84716; #=GS ABB84716 OS Pneumocystis carinii #=GS ABB84716 OC poss_fungi_metazoa #=GS ABB84716 OC fungi_metazoa #=GS ABB84716 OC fungi #=GS ABB84716 OC ascomycota #=GS ABB84716 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 11) #=GS ABB84716 WT 0.0981981754303 ## ABB84716 Cluster: 1U72A #=GS ABB84718 AC ABB84718 #=GS ABB84718 DR EMBL; ABB84718; #=GS ABB84718 OS Pneumocystis carinii #=GS ABB84718 OC poss_fungi_metazoa #=GS ABB84718 OC fungi_metazoa #=GS ABB84718 OC fungi #=GS ABB84718 OC ascomycota #=GS ABB84718 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 12) #=GS ABB84718 WT 0.0955388620496 ## ABB84718 Cluster: 1U72A #=GS ABB84720 AC ABB84720 #=GS ABB84720 DR EMBL; ABB84720; #=GS ABB84720 OS Pneumocystis carinii #=GS ABB84720 OC poss_fungi_metazoa #=GS ABB84720 OC fungi_metazoa #=GS ABB84720 OC fungi #=GS ABB84720 OC ascomycota #=GS ABB84720 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 13) #=GS ABB84720 WT 0.0955388620496 ## ABB84720 Cluster: 1U72A #=GS ABB84722 AC ABB84722 #=GS ABB84722 DR EMBL; ABB84722; #=GS ABB84722 OS Pneumocystis carinii #=GS ABB84722 OC poss_fungi_metazoa #=GS ABB84722 OC fungi_metazoa #=GS ABB84722 OC fungi #=GS ABB84722 OC ascomycota #=GS ABB84722 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 14) #=GS ABB84722 WT 0.0953710973263 ## ABB84722 Cluster: 1U72A #=GS ABB84726 AC ABB84726 #=GS ABB84726 DR EMBL; ABB84726; #=GS ABB84726 OS Pneumocystis carinii #=GS ABB84726 OC poss_fungi_metazoa #=GS ABB84726 OC fungi_metazoa #=GS ABB84726 OC fungi #=GS ABB84726 OC ascomycota #=GS ABB84726 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 15) #=GS ABB84726 WT 0.0955388620496 ## ABB84726 Cluster: 1U72A #=GS ABB84744 AC ABB84744 #=GS ABB84744 DR EMBL; ABB84744; #=GS ABB84744 OS Pneumocystis carinii #=GS ABB84744 OC poss_fungi_metazoa #=GS ABB84744 OC fungi_metazoa #=GS ABB84744 OC fungi #=GS ABB84744 OC ascomycota #=GS ABB84744 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 16) #=GS ABB84744 WT 0.0955388620496 ## ABB84744 Cluster: 1U72A #=GS ABB84751 AC ABB84751 #=GS ABB84751 DR EMBL; ABB84751; #=GS ABB84751 OS Pneumocystis carinii #=GS ABB84751 OC poss_fungi_metazoa #=GS ABB84751 OC fungi_metazoa #=GS ABB84751 OC fungi #=GS ABB84751 OC ascomycota #=GS ABB84751 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 17) #=GS ABB84751 WT 0.0965188220143 ## ABB84751 Cluster: 1U72A #=GS ABF06467 AC ABF06467 #=GS ABF06467 DR EMBL; ABF06467; #=GS ABF06467 OS Pneumocystis carinii #=GS ABF06467 OC poss_fungi_metazoa #=GS ABF06467 OC fungi_metazoa #=GS ABF06467 OC fungi #=GS ABF06467 OC ascomycota #=GS ABF06467 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 18) #=GS ABF06467 WT 0.100236237049 ## ABF06467 Cluster: 1U72A #=GS ABF06468 AC ABF06468 #=GS ABF06468 DR EMBL; ABF06468; #=GS ABF06468 OS Pneumocystis carinii #=GS ABF06468 OC poss_fungi_metazoa #=GS ABF06468 OC fungi_metazoa #=GS ABF06468 OC fungi #=GS ABF06468 OC ascomycota #=GS ABF06468 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 19) #=GS ABF06468 WT 0.110260106623 ## ABF06468 Cluster: 1U72A #=GS ABF06469 AC ABF06469 #=GS ABF06469 DR EMBL; ABF06469; #=GS ABF06469 OS Pneumocystis carinii #=GS ABF06469 OC poss_fungi_metazoa #=GS ABF06469 OC fungi_metazoa #=GS ABF06469 OC fungi #=GS ABF06469 OC ascomycota #=GS ABF06469 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 20) #=GS ABF06469 WT 0.108349896967 ## ABF06469 Cluster: 1U72A #=GS ABF06470 AC ABF06470 #=GS ABF06470 DR EMBL; ABF06470; #=GS ABF06470 OS Pneumocystis carinii #=GS ABF06470 OC poss_fungi_metazoa #=GS ABF06470 OC fungi_metazoa #=GS ABF06470 OC fungi #=GS ABF06470 OC ascomycota #=GS ABF06470 DE Pneumocystis carinii (no structure for this variant; aligned via DHFR.weighted.for.fungi.tmp5.hmm; variant 21) #=GS ABF06470 WT 0.0944603905082 ## ABF06470 Cluster: 1U72A #=GS Q6CC38_YARLI_1 AC Q6CC38 #=GS Q6CC38_YARLI_1 DR TREMBL; Q6CC38; #=GS Q6CC38_YARLI_1 DR EMBL; CAG82084; #=GS Q6CC38_YARLI_1 OS Yarrowia lipolytica #=GS Q6CC38_YARLI_1 OC poss_fungi_metazoa #=GS Q6CC38_YARLI_1 OC fungi_metazoa #=GS Q6CC38_YARLI_1 OC fungi #=GS Q6CC38_YARLI_1 OC ascomycota #=GS Q6CC38_YARLI_1 DE Yarrowia lipolytica (no structure; aligned via DHFR.weighted.for.yarrowia.hmm; alignment version 1) #=GS Q6CC38_YARLI_1 WT 0.253606647253 ## Q6CC38_YARLI_1 Cluster: 1U72A #=GS Q6CC38_YARLI_2 AC Q6CC38 #=GS Q6CC38_YARLI_2 DR TREMBL; Q6CC38; #=GS Q6CC38_YARLI_2 DR EMBL; CAG82084; #=GS Q6CC38_YARLI_2 OS Yarrowia lipolytica #=GS Q6CC38_YARLI_2 OC poss_fungi_metazoa #=GS Q6CC38_YARLI_2 OC fungi_metazoa #=GS Q6CC38_YARLI_2 OC fungi #=GS Q6CC38_YARLI_2 OC ascomycota #=GS Q6CC38_YARLI_2 DE Yarrowia lipolytica (no structure; aligned via DHFR.weighted.for.yarrowia.hmm; alignment version 2) #=GS Q6CC38_YARLI_2 WT 0.27892306447 ## Q6CC38_YARLI_2 Cluster: 1U72A #=GS CAG60823_1 AC CAG60823 #=GS CAG60823_1 DR EMBL; CAG60823; #=GS CAG60823_1 DR TREMBL; Q6FPH0; #=GS CAG60823_1 OS Candida glabrata #=GS CAG60823_1 OC poss_fungi_metazoa #=GS CAG60823_1 OC fungi_metazoa #=GS CAG60823_1 OC fungi #=GS CAG60823_1 OC ascomycota #=GS CAG60823_1 DE "Candida" glabrata (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 1) #=GS CAG60823_1 WT 0.268898814917 ## CAG60823_1 Cluster: 1U72A #=GS CAG60823_2 AC CAG60823 #=GS CAG60823_2 DR EMBL; CAG60823; #=GS CAG60823_2 DR TREMBL; Q6FPH0; #=GS CAG60823_2 OS Candida glabrata #=GS CAG60823_2 OC poss_fungi_metazoa #=GS CAG60823_2 OC fungi_metazoa #=GS CAG60823_2 OC fungi #=GS CAG60823_2 OC ascomycota #=GS CAG60823_2 DE "Candida" glabrata (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 2) #=GS CAG60823_2 WT 0.212503701448 ## CAG60823_2 Cluster: 1U72A #=GS AAS51350_1 AC AAS51350 #=GS AAS51350_1 DR EMBL; AAS51350; #=GS AAS51350_1 DR TREMBL; Q75BZ5; #=GS AAS51350_1 OS Eremothecium gossypii #=GS AAS51350_1 OC poss_fungi_metazoa #=GS AAS51350_1 OC fungi_metazoa #=GS AAS51350_1 OC fungi #=GS AAS51350_1 OC ascomycota #=GS AAS51350_1 DE Eremothecium/Ashbya gossypii (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 1) #=GS AAS51350_1 WT 0.346816539764 ## AAS51350_1 Cluster: 1U72A #=GS AAS51350_2 AC AAS51350 #=GS AAS51350_2 DR EMBL; AAS51350; #=GS AAS51350_2 DR TREMBL; Q75BZ5; #=GS AAS51350_2 OS Eremothecium gossypii #=GS AAS51350_2 OC poss_fungi_metazoa #=GS AAS51350_2 OC fungi_metazoa #=GS AAS51350_2 OC fungi #=GS AAS51350_2 OC ascomycota #=GS AAS51350_2 DE Eremothecium/Ashbya gossypii (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 2) #=GS AAS51350_2 WT 0.32664513588 ## AAS51350_2 Cluster: 1U72A #=GS DYR_YEAST_1 AC P07807 #=GS DYR_YEAST_1 DR SWS; P07807; #=GS DYR_YEAST_1 OS Saccharomyces cerevisiae #=GS DYR_YEAST_1 OC poss_fungi_metazoa #=GS DYR_YEAST_1 OC fungi_metazoa #=GS DYR_YEAST_1 OC fungi #=GS DYR_YEAST_1 OC ascomycota #=GS DYR_YEAST_1 DE Saccharomyces cerevisiae (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 1; variant 1) #=GS DYR_YEAST_1 WT 0.1827275455 ## DYR_YEAST_1 Cluster: 1U72A #=GS DYR_YEAST_2 AC P07807 #=GS DYR_YEAST_2 DR SWS; P07807; #=GS DYR_YEAST_2 OS Saccharomyces cerevisiae #=GS DYR_YEAST_2 OC poss_fungi_metazoa #=GS DYR_YEAST_2 OC fungi_metazoa #=GS DYR_YEAST_2 OC fungi #=GS DYR_YEAST_2 OC ascomycota #=GS DYR_YEAST_2 DE Saccharomyces cerevisiae (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 2; variant 1) #=GS DYR_YEAST_2 WT 0.171738773584 ## DYR_YEAST_2 Cluster: 1U72A #=GS EDN63566_1 AC EDN63566 #=GS EDN63566_1 DR SWS; P07807; #=GS EDN63566_1 DR TREMBL; A6ZP76; #=GS EDN63566_1 DR EMBL; EDN63566; #=GS EDN63566_1 OS Saccharomyces cerevisiae #=GS EDN63566_1 OC poss_fungi_metazoa #=GS EDN63566_1 OC fungi_metazoa #=GS EDN63566_1 OC fungi #=GS EDN63566_1 OC ascomycota #=GS EDN63566_1 DE Saccharomyces cerevisiae (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 1; variant 2) #=GS EDN63566_1 WT 0.1827275455 ## EDN63566_1 Cluster: 1U72A #=GS EDN63566_2 AC EDN63566 #=GS EDN63566_2 DR SWS; P07807; #=GS EDN63566_2 DR TREMBL; A6ZP76; #=GS EDN63566_2 DR EMBL; EDN63566; #=GS EDN63566_2 OS Saccharomyces cerevisiae #=GS EDN63566_2 OC poss_fungi_metazoa #=GS EDN63566_2 OC fungi_metazoa #=GS EDN63566_2 OC fungi #=GS EDN63566_2 OC ascomycota #=GS EDN63566_2 DE Saccharomyces cerevisiae (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 2; variant 2) #=GS EDN63566_2 WT 0.171738773584 ## EDN63566_2 Cluster: 1U72A #=GS CAA68779_1 AC CAA63879 #=GS CAA68779_1 DR SWS; P07807; #=GS CAA68779_1 DR EMBL; CAA68779; #=GS CAA68779_1 DR EMBL; AAA34564; #=GS CAA68779_1 OS Saccharomyces cerevisiae #=GS CAA68779_1 OC poss_fungi_metazoa #=GS CAA68779_1 OC fungi_metazoa #=GS CAA68779_1 OC fungi #=GS CAA68779_1 OC ascomycota #=GS CAA68779_1 DE Saccharomyces cerevisiae (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 1; variant 3) #=GS CAA68779_1 WT 0.198279231787 ## CAA68779_1 Cluster: 1U72A #=GS CAA68779_2 AC CAA63879 #=GS CAA68779_2 DR SWS; P07807; #=GS CAA68779_2 DR EMBL; CAA68779; #=GS CAA68779_2 DR EMBL; AAA34564; #=GS CAA68779_2 OS Saccharomyces cerevisiae #=GS CAA68779_2 OC poss_fungi_metazoa #=GS CAA68779_2 OC fungi_metazoa #=GS CAA68779_2 OC fungi #=GS CAA68779_2 OC ascomycota #=GS CAA68779_2 DE Saccharomyces cerevisiae (no structure; aligned via DHFR.weighted.for.saccharomycetaceae.hmm; alignment version 2; variant 3) #=GS CAA68779_2 WT 0.187290474772 ## CAA68779_2 Cluster: 1U72A #=GS CAG86485_1 AC CAG86485 #=GS CAG86485_1 DR TREMBL; Q6BTR6; #=GS CAG86485_1 OS Debaryomyces hansenii #=GS CAG86485_1 OC poss_fungi_metazoa #=GS CAG86485_1 OC fungi_metazoa #=GS CAG86485_1 OC fungi #=GS CAG86485_1 OC ascomycota #=GS CAG86485_1 DE Debaryomyces hansenii (no structure; aligned via DHFR.weighted.for.saccharomycetales.hmm; alignment variation 1) #=GS CAG86485_1 WT 0.229588553309 ## CAG86485_1 Cluster: 1U72A #=GS CAG86485_2 AC CAG86485 #=GS CAG86485_2 DR TREMBL; Q6BTR6; #=GS CAG86485_2 OS Debaryomyces hansenii #=GS CAG86485_2 OC poss_fungi_metazoa #=GS CAG86485_2 OC fungi_metazoa #=GS CAG86485_2 OC fungi #=GS CAG86485_2 OC ascomycota #=GS CAG86485_2 DE Debaryomyces hansenii (no structure; aligned via DHFR.weighted.for.saccharomycetales.hmm; alignment variation 2) #=GS CAG86485_2 WT 0.250264644623 ## CAG86485_2 Cluster: 1U72A #=GS ABN65593_1 AC ABN65593 #=GS ABN65593_1 DR TREMBL; A3LSL9; #=GS ABN65593_1 OS Pichia stipitis #=GS ABN65593_1 OC poss_fungi_metazoa #=GS ABN65593_1 OC fungi_metazoa #=GS ABN65593_1 OC fungi #=GS ABN65593_1 OC ascomycota #=GS ABN65593_1 DE Pichia stipitis (no structure; aligned via DHFR.weighted.for.pichia.hmm; alignment variation 1) #=GS ABN65593_1 WT 0.230044811964 ## ABN65593_1 Cluster: 1U72A #=GS ABN65593_2 AC ABN65593 #=GS ABN65593_2 DR TREMBL; A3LSL9; #=GS ABN65593_2 OS Pichia stipitis #=GS ABN65593_2 OC poss_fungi_metazoa #=GS ABN65593_2 OC fungi_metazoa #=GS ABN65593_2 OC fungi #=GS ABN65593_2 OC ascomycota #=GS ABN65593_2 DE Pichia stipitis (no structure; aligned via DHFR.weighted.for.pichia.hmm; alignment variation 2) #=GS ABN65593_2 WT 0.259779661894 ## ABN65593_2 Cluster: 1U72A #=GS DYR_CANAL_1 AC P22906 #=GS DYR_CANAL_1 DR SWS; P22906; #=GS DYR_CANAL_1 DR SWS; O59840; #=GS DYR_CANAL_1 DR EMBL; AAC05610; #=GS DYR_CANAL_1 OS Candida albicans #=GS DYR_CANAL_1 OC poss_fungi_metazoa #=GS DYR_CANAL_1 OC fungi_metazoa #=GS DYR_CANAL_1 OC fungi #=GS DYR_CANAL_1 OC ascomycota #=GS DYR_CANAL_1 DE Candida albicans (structures not used - aligned via DHFR.weighted.for.saccharomycetales.2.hmm; alignment variation 1) #=GS DYR_CANAL_1 WT 0.216233953834 ## DYR_CANAL_1 Cluster: 1U72A #=GS DYR_CANAL_2 AC P22906 #=GS DYR_CANAL_2 DR SWS; P22906; #=GS DYR_CANAL_2 DR SWS; O59840; #=GS DYR_CANAL_2 DR EMBL; AAC05610; #=GS DYR_CANAL_2 OS Candida albicans #=GS DYR_CANAL_2 OC poss_fungi_metazoa #=GS DYR_CANAL_2 OC fungi_metazoa #=GS DYR_CANAL_2 OC fungi #=GS DYR_CANAL_2 OC ascomycota #=GS DYR_CANAL_2 DE Candida albicans (structures not used - aligned via DHFR.weighted.for.saccharomycetales.2.hmm; alignment variation 2) #=GS DYR_CANAL_2 WT 0.195754885674 ## DYR_CANAL_2 Cluster: 1U72A ## 1J3KA Cluster #=GS 1J3KA AC DRTS_PLAFK #=GS 1J3KA OS Plasmodium falciparum #=GS 1J3KA OC alveolata #=GS 1J3KA DR PDB; 1j3k A; #=GS 1J3KA DR SWS; P13922; #=GS 1J3KA DE Malaria DHFR section (N51I+C59R+S108N+I164L - mutations removed) - residues start at 2 #=GS 1J3KA WT 0.184230655432 ## 1J3KA Cluster: 1J3KA #=GS 1J3KB AC DRTS_PLAFK #=GS 1J3KB OS Plasmodium falciparum #=GS 1J3KB OC alveolata #=GS 1J3KB DR PDB; 1j3k B; #=GS 1J3KB DR SWS; P13922; #=GS 1J3KB DE Malaria DHFR section (N51I+C59R+S108N+I164L - mutations removed) - residues start at 2 #=GS 1J3KB WT 0.184230655432 ## 1J3KB Cluster: 1J3KA #=GS 1J3IA AC DRTS_PLAFK #=GS 1J3IA OS Plasmodium falciparum #=GS 1J3IA OC alveolata #=GS 1J3IA DR PDB; 1j3i A; #=GS 1J3IA DR SWS; P13922; #=GS 1J3IA DE Malaria DHFR section - residues start at 2 #=GS 1J3IA WT 0.184230655432 ## 1J3IA Cluster: 1J3KA #=GS 1J3IB AC DRTS_PLAFK #=GS 1J3IB OS Plasmodium falciparum #=GS 1J3IB OC alveolata #=GS 1J3IB DR PDB; 1j3i B; #=GS 1J3IB DR SWS; P13922; #=GS 1J3IB DE Malaria DHFR section - residues start at 2 #=GS 1J3IB WT 0.184230655432 ## 1J3IB Cluster: 1J3KA #=GS DRTS_PLACH AC P20712 #=GS DRTS_PLACH OS Plasmodium chabaudi #=GS DRTS_PLACH OC alveolata #=GS DRTS_PLACH DE Rodent malaria DHFR section (no structure; aligned only vs 1J3KAB, 2BL9A did not work) #=GS DRTS_PLACH WT 0.26231366396 ## DRTS_PLACH Cluster: 1J3KA #=GS Q7RGH7_PLAYO AC Q7RGH7 #=GS Q7RGH7_PLAYO OS Plasmodium berghei yoelii #=GS Q7RGH7_PLAYO OC alveolata #=GS Q7RGH7_PLAYO DE Rodent malaria DHFR section (no structure; aligned vs combo of 1J3KAB, 2BL9A (for repeat section)) ## cut off after end of 1J3KAB alignment #=GS Q7RGH7_PLAYO WT 0.301809459925 ## Q7RGH7_PLAYO Cluster: 1J3KA #=GS Q95US9_PLAGA AC Q95US9 #=GS Q95US9_PLAGA OS Plasmodium gallinaceum #=GS Q95US9_PLAGA OC alveolata #=GS Q95US9_PLAGA DE Avian malaria DHFR section (no structure; aligned vs 1J3KAB; 2BL9A did not work) ## cut off approximately after end of 1J3KAB alignment #=GS Q95US9_PLAGA WT 0.247906669974 ## Q95US9_PLAGA Cluster: 1J3KA #=GS 2BL9A AC Q9U0E8 #=GS 2BL9A OS Plasmodium vivax #=GS 2BL9A OC alveolata #=GS 2BL9A DR PDB; 2bl9 A; #=GS 2BL9A DR PDB; 2blb A; #=GS 2BL9A DE Malaria DHFR section (aligned only vs 1J3KA, 1J3KB; A24E mutation/error corrected) ## 2 other alterations; gg added onto end from DRTS_PLAVI sequence; residues start at 2 #=GS 2BL9A WT 0.185604080558 ## 2BL9A Cluster: 1J3KA #=GS DRTS_PLAVI AC O02604 #=GS DRTS_PLAVI OS Plasmodium vivax #=GS DRTS_PLAVI OC alveolata #=GS DRTS_PLAVI DE Malaria DHFR section (no structure for this variant; aligned to 2BL9A) #=GS DRTS_PLAVI WT 0.1879632622 ## DRTS_PLAVI Cluster: 1J3KA #=GS DRTS_PLAVN AC P46103 #=GS DRTS_PLAVN OS Plasmodium vinckei #=GS DRTS_PLAVN OC alveolata #=GS DRTS_PLAVN DE Rodent malaria DHFR section (no structure; incomplete - aligned to 2BL9A; 1J3KAB did not work) #=GS DRTS_PLAVN WT 0.208032950759 ## DRTS_PLAVN Cluster: 1J3KA #=GS AAV33644 AC Q5EXQ6_9APIC ## source has problems; records seem to claim is from apicoplast/plastid! #=GS AAV33644 DR EMBL; AAV33644; #=GS AAV33644 DR TREMBL; Q5EXQ6; #=GS AAV33644 OS Plasmodium inui #=GS AAV33644 OC alveolata #=GS AAV33644 DE Old World monkey malaria DHFR section (no structure; incomplete - aligned to 2BL9A; 1J3KAB did not work) #=GS AAV33644 WT 0.238653123379 ## AAV33644 Cluster: 1J3KA #=GS AAV33645 AC Q5EXQ5_9APIC ## source has problems; records seem to claim is from apicoplast/plastid! #=GS AAV33645 DR TREMBL; Q5EXQ5; #=GS AAV33645 DR EMBL; AAV33645; #=GS AAV33645 OS Plasmodium cynomolgi #=GS AAV33645 OC alveolata #=GS AAV33645 DE Rhesus macaque malaria DHFR section (no structure; incomplete - aligned to 2BL9A; 1J3KAB did not work) #=GS AAV33645 WT 0.196945384145 ## AAV33645 Cluster: 1J3KA #=GS 1SEJC AC XP_665866 #=GS 1SEJC DR EMBL; AAC47229; #=GS 1SEJC DR PDB; 1SEJ A; #=GS 1SEJC DR PDB; 1SEJ B; #=GS 1SEJC DR PDB; 1SEJ C; #=GS 1SEJC DR PDB; 1SEJ D; #=GS 1SEJC DR PDB; 1SEJ E; #=GS 1SEJC OS Cryptosporidium hominis #=GS 1SEJC OS Cryptosporidium parvum #=GS 1SEJC OC alveolata #=GS 1SEJC DE Cryptosporidium hominis, parvum (variant of latter) DHFR section ## residues start at 2 #=GS 1SEJC WT 0.29452124238 ## 1SEJC Cluster: 1SEJC #=GS 1QZFD AC XP_665866 #=GS 1QZFD DR EMBL; AAC47229; #=GS 1QZFD DR PDB; 1QZF A; #=GS 1QZFD DR PDB; 1QZF B; #=GS 1QZFD DR PDB; 1QZF C; #=GS 1QZFD DR PDB; 1QZF D; #=GS 1QZFD DR PDB; 1QZF E; #=GS 1QZFD OS Cryptosporidium hominis #=GS 1QZFD OS Cryptosporidium parvum #=GS 1QZFD OC alveolata #=GS 1QZFD DE Cryptosporidium hominis, parvum (variant of latter) DHFR section; folate bound to DHFR #=GS 1QZFD WT 0.29452124238 ## 1QZFD Cluster: 1SEJC #=GS AAC47229 AC AAC47229 ## is missing end of TS section - EAK87446 seems to be full version but with alternative start site #=GS AAC47229 DR EMBL; EAK87446; #=GS AAC47229 OS Cryptosporidium parvum #=GS AAC47229 OC alveolata #=GS AAC47229 DE Cryptosporidium parvum (variant 2) DHFR section (no structure for this variant; aligned to 1SEJC) #=GS AAC47229 WT 0.316687703133 ## AAC47229 Cluster: 1SEJC #=GS CAI76538 AC CAI76538 #=GS CAI76538 DR EMBL; CAI76538; #=GS CAI76538 OS Theileria annulata #=GS CAI76538 OC alveolata #=GS CAI76538 DE Theileria annulata DHFR section (no structure; aligned via DHFR.weighted.for.theileria.hmm) #=GS CAI76538 WT 0.444102674723 ## CAI76538 Cluster: 1SEJC #=GS EAN31856 AC EAN31856 #=GS EAN31856 DR EMBL; EAN31856; #=GS EAN31856 OS Theileria parva #=GS EAN31856 OC alveolata #=GS EAN31856 DE Theileria parva DHFR section (no structure; aligned via DHFR.weighted.for.theileria.hmm) #=GS EAN31856 WT 0.460553497076 ## EAN31856 Cluster: 1SEJC #=GS EAR85731 AC EAR85731 #=GS EAR85731 DR EMBL; EAR85731; #=GS EAR85731 OS Tetrahymena thermophila #=GS EAR85731 OC alveolata #=GS EAR85731 DE Tetrahymena thermophila DHFR section (no structure; aligned via DHFR.weighted.for.tetrahymena.hmm) #=GS EAR85731 WT 0.694769382477 ## EAR85731 Cluster: 1SEJC #=GS DRTS_TRYBB AC Q27783 #=GS DRTS_TRYBB DR SWS; Q27783; #=GS DRTS_TRYBB DR EMBL; AAA91362; #=GS DRTS_TRYBB OS Trypanosoma brucei #=GS DRTS_TRYBB OC kinetoplastida #=GS DRTS_TRYBB DE Trypanosoma brucei DHFR section (variant 1; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) ## trimmed lsltrilrkkipvhelag at start #=GS DRTS_TRYBB WT 0.265756368637 ## DRTS_TRYBB Cluster: 1SEJC #=GS AAX78868 AC AAX78868 #=GS AAX78868 DR EMBL; AAX78868; #=GS AAX78868 DR EMBL; AAZ12612; ## Also XP_846171 #=GS AAX78868 OS Trypanosoma brucei #=GS AAX78868 OC kinetoplastida #=GS AAX78868 DE Trypanosoma brucei DHFR section (variant 2; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) #=GS AAX78868 WT 0.258467018604 ## AAX78868 Cluster: 1SEJC #=GS DRTS_TRYCR AC Q27793 #=GS DRTS_TRYCR DR SWS; Q27793; #=GS DRTS_TRYCR DR TREMBL; Q95NX3; #=GS DRTS_TRYCR DR EMBL; AAB49898; #=GS DRTS_TRYCR DR EMBL; EAN93476; ## Also XP_815327 #=GS DRTS_TRYCR OS Trypanosoma cruzi #=GS DRTS_TRYCR OC kinetoplastida #=GS DRTS_TRYCR DE Trypanosoma cruzi DHFR section (variant 1; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) ## trimmed slfkirmpetvae at start #=GS DRTS_TRYCR WT 0.174868986011 ## DRTS_TRYCR Cluster: 1SEJC #=GS AAK71184 AC AAK71184 #=GS AAK71184 DR EMBL; AAK71184; #=GS AAK71184 DR TREMBL; Q95NY4; #=GS AAK71184 OS Trypanosoma cruzi #=GS AAK71184 OC kinetoplastida #=GS AAK71184 DE Trypanosoma cruzi DHFR section (variant 2; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) #=GS AAK71184 WT 0.176356047392 ## AAK71184 Cluster: 1SEJC #=GS AAK71177 AC AAK71177 #=GS AAK71177 DR EMBL; AAK71177; #=GS AAK71177 DR TREMBL; Q963S8; #=GS AAK71177 OS Trypanosoma cruzi #=GS AAK71177 OC kinetoplastida #=GS AAK71177 DE Trypanosoma cruzi DHFR section (variant 3; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) #=GS AAK71177 WT 0.18199890852 ## AAK71177 Cluster: 1SEJC #=GS Q95NI3_TRYCR AC Q95NI3 #=GS Q95NI3_TRYCR DR TREMBL; Q95NI3; #=GS Q95NI3_TRYCR DR EMBL; AAM18487; #=GS Q95NI3_TRYCR DR EMBL; AAK71159; #=GS Q95NI3_TRYCR DR EMBL; AAK71161; #=GS Q95NI3_TRYCR DR EMBL; AAK71162; #=GS Q95NI3_TRYCR DR EMBL; AAK71163; #=GS Q95NI3_TRYCR DR EMBL; AAK71164; #=GS Q95NI3_TRYCR DR EMBL; AAK71165; #=GS Q95NI3_TRYCR DR EMBL; AAK71174; #=GS Q95NI3_TRYCR DR EMBL; AAK71176; #=GS Q95NI3_TRYCR DR EMBL; AAK71178; #=GS Q95NI3_TRYCR DR EMBL; AAK71180; #=GS Q95NI3_TRYCR DR EMBL; AAK71182; #=GS Q95NI3_TRYCR OS Trypanosoma cruzi #=GS Q95NI3_TRYCR OC kinetoplastida #=GS Q95NI3_TRYCR DE Trypanosoma cruzi DHFR section (variant 4; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) #=GS Q95NI3_TRYCR WT 0.175964057446 ## Q95NI3_TRYCR Cluster: 1SEJC #=GS Q95NT2_TRYCR AC Q95NT2 #=GS Q95NT2_TRYCR DR TREMBL; Q95NT2; #=GS Q95NT2_TRYCR DR EMBL; AAK71150; #=GS Q95NT2_TRYCR DR EMBL; AAK71154; #=GS Q95NT2_TRYCR DR TREMBL; Q95NS0; #=GS Q95NT2_TRYCR DR EMBL; AAK71144; #=GS Q95NT2_TRYCR DR EMBL; AAK71145; #=GS Q95NT2_TRYCR DR EMBL; AAK71146; #=GS Q95NT2_TRYCR DR EMBL; AAK71147; #=GS Q95NT2_TRYCR DR EMBL; AAK71148; #=GS Q95NT2_TRYCR DR EMBL; AAK71149; #=GS Q95NT2_TRYCR DR EMBL; AAK71150; #=GS Q95NT2_TRYCR DR EMBL; AAK71151; #=GS Q95NT2_TRYCR DR EMBL; AAK71152; #=GS Q95NT2_TRYCR DR EMBL; AAK71153; #=GS Q95NT2_TRYCR DR EMBL; AAK71155; #=GS Q95NT2_TRYCR DR EMBL; AAK71156; #=GS Q95NT2_TRYCR DR EMBL; AAK71157; #=GS Q95NT2_TRYCR DR EMBL; AAK71158; #=GS Q95NT2_TRYCR DR EMBL; AAK71160; #=GS Q95NT2_TRYCR OS Trypanosoma cruzi #=GS Q95NT2_TRYCR OC kinetoplastida #=GS Q95NT2_TRYCR DE Trypanosoma cruzi DHFR section (variant 5; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) #=GS Q95NT2_TRYCR WT 0.175964057446 ## Q95NT2_TRYCR Cluster: 1SEJC #=GS DRTS_LEIAM AC P16126 #=GS DRTS_LEIAM DR SWS; P16126; #=GS DRTS_LEIAM DR EMBL; CAA36020; #=GS DRTS_LEIAM OS Leishmania mexicana #=GS DRTS_LEIAM OC kinetoplastida #=GS DRTS_LEIAM DE Leishmania amazonensis/mexicana DHFR section (no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) ## sraaakfkipmpvtka removed from start #=GS DRTS_LEIAM WT 0.218506187201 ## DRTS_LEIAM Cluster: 1SEJC #=GS DRTS_LEIMA AC P07382 #=GS DRTS_LEIMA DR SWS; P07382; #=GS DRTS_LEIMA DR EMBL; AAA29232; #=GS DRTS_LEIMA DR EMBL; CAA36019; #=GS DRTS_LEIMA DR EMBL; CAJ02132; #=GS DRTS_LEIMA OS Leishmania tropica major #=GS DRTS_LEIMA OC kinetoplastida #=GS DRTS_LEIMA DE Leishmania tropica major DHFR section (variant 1; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) ## sraaarfkipmpetka removed from start #=GS DRTS_LEIMA WT 0.21577231586 ## DRTS_LEIMA Cluster: 1SEJC #=GS AAA29272 AC AAA29272 #=GS AAA29272 DR EMBL; AAA29272; #=GS AAA29272 OS Leishmania tropica major #=GS AAA29272 OC kinetoplastida #=GS AAA29272 DE Leishmania tropica major DHFR section (variant 2; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) ## section removed from start #=GS AAA29272 WT 0.259000390768 ## AAA29272 Cluster: 1SEJC #=GS Q8MXB7_LEITR AC Q8MXB7 #=GS Q8MXB7_LEITR DR TREMBL; Q8MXB7; #=GS Q8MXB7_LEITR DR EMBL; AAM88660; #=GS Q8MXB7_LEITR OS Leishmania tropica major #=GS Q8MXB7_LEITR OC kinetoplastida #=GS Q8MXB7_LEITR DE Leishmania tropica major DHFR section (variant 3; no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) ## section removed from start #=GS Q8MXB7_LEITR WT 0.210551708937 ## Q8MXB7_LEITR Cluster: 1SEJC #=GS Q8MQV1_LEICH AC Q8MQV1 #=GS Q8MQV1_LEICH DR TREMBL; Q8MQV1; #=GS Q8MQV1_LEICH DR TREMBL; Q8MQV3; #=GS Q8MQV1_LEICH DR EMBL; AAM88576; #=GS Q8MQV1_LEICH OS Leishmania donovani chagasi #=GS Q8MQV1_LEICH OC kinetoplastida #=GS Q8MQV1_LEICH DE Leishmania donovani chagasi/infantum DHFR section (no structure; aligned via DHFR.weighted.for.kinetoplastids.hmm) ## section removed from start #=GS Q8MQV1_LEICH WT 0.216405808926 ## Q8MQV1_LEICH Cluster: 1SEJC #=GS DRT1_ARATH AC DRTS1_ARATH #=GS DRT1_ARATH DR SWS; Q05762; #=GS DRT1_ARATH DR SWS; Q9SIW4; #=GS DRT1_ARATH OS Arabidopsis thaliana #=GS DRT1_ARATH OC plant_algae #=GS DRT1_ARATH DE Arabidopsis thaliana DHFR section (no structure; aligned via DHFR.weighted.for.plant_algae.hmm) ## atttlndsvttt removed from start #=GS DRT1_ARATH WT 0.260127425194 ## DRT1_ARATH Cluster: 1SEJC #=GS DRTS_SOYBN AC P51820 #=GS DRTS_SOYBN DR SWS; P51820; #=GS DRTS_SOYBN OS Glycine max #=GS DRTS_SOYBN OC plant_algae #=GS DRTS_SOYBN DE Soybean (Glycine max) DHFR section (no structure; aligned via DHFR.weighted.for.plant_algae.hmm) ## psdssvisnghsngsvnp removed from start #=GS DRTS_SOYBN WT 0.312266200781 ## DRTS_SOYBN Cluster: 1SEJC #=GS Q2R481_ORYSA AC Q2R481 #=GS Q2R481_ORYSA DR TREMBL; Q2R481; #=GS Q2R481_ORYSA OS Oryza sativa #=GS Q2R481_ORYSA OC plant_algae #=GS Q2R481_ORYSA DE Rice (Oryza sativa) DHFR section (no structure; aligned via DHFR.weighted.for.plant_algae.hmm) ## attlsngv removed from start #=GS Q2R481_ORYSA WT 0.284552335739 ## Q2R481_ORYSA Cluster: 1SEJC #=GS DRTS_MAIZE AC O81395 #=GS DRTS_MAIZE DR SWS; O81395; #=GS DRTS_MAIZE OS Zea mays #=GS DRTS_MAIZE OC plant_algae #=GS DRTS_MAIZE DE Zea mays DHFR section (no structure; aligned via DHFR.weighted.for.plant_algae.hmm) ## aavlangd removed from start #=GS DRTS_MAIZE WT 0.296936362982 ## DRTS_MAIZE Cluster: 1SEJC ## Pfam seq_cons in use: o:ST; l:ILV; -:DE; requiring 4/5 consensus between ## 1U70A, 1U72A, 8DFR0, 1J3K or 2BL9A, 1SEJ ## Unless noted otherwise, SS is from PDB file in question. Phi/Psi is ## (very rough!) estimate of SS from phi/psi angles, with NP (Non-Pro) being ## residues that are distinctly not capable (from phi/psi) of being Pro ## (both that residue and the one before it are outside the range from ## the Richardsons' data for phi/psi for pro and pre-pro, respectively) and ## GR (Gly-Req) being ones with phi/psi such that the Richardsons' data says ## nothing except Gly fits. For 1J3KAB, this is a consensus of 2 out of 3 ## of 1J3KA, 1J3KB, 2BL9A. [I need to redo these for 1J3KAB et al, and ## also have in 1PD8A]. Programs: check.gly.dang.pl, check.pro.dang.pl. ## Unless noted otherwise, SA is from proportion of Dr. Kahn's surface area ## numbers that get from: ## A. running reduce -build -Density100 on the PDBfile ## B. fgrep -v HETATM on the result ## C. probe -Unformated -Density100 -NOSpike -ASurface on the result ## D. sorting the result (sort -k2n) ## E. running interpret.probe.pl ## S2 is a version of this in which fully-buried (no dots from probe, so theoretically < 0.01) ## areas are indicated as 'B' and fully-exposed (more exposure than for Kahn's numbers) ## are indicated as 'E'. ## Hydrophobic: ## http://www.proteinscience.org/cgi/content/full/15/1/102 ## hydrophobic1: Ala, Ile, Leu, Met, Phe, Pro, Trp, Tyr, Val; ## hydrophobic2: Cys, Ile, Leu, Met, Phe, and Val ## compromise: ILMVFW ## ?: AYC (to | if have + on both sides) ## hydrophilic: all others (pro counted due to frequency in turns/kinks) ## Places to further look at are marked with '!!!' ## First section (59 pos) 1U70A ............VR.PLNCIVAVS.q..n................MGIGKNGDLPWP.p #=GR 1U70A SS ............CC.CEEEEEEEE.C..C................CCCCCCCC-CCC.C ## Phi/Psi: ............XC.EEEEEEEEC.C..C................CEEEELC1EHEE.E #=GR 1U70A LI .....................*.........................*........... #=GR 1U70A NP ............X.............................................. #=GR 1U70A GR ............X...................................G..G....... #=GR 1U70A SA ............38.200000100.5..3................200127743103.6 ## Hydrophobic: ............+-.-+-?++|+-.-..-................+-+-----+-+-.- DYR_RAT ............VR.PLNCIVAVS.q..n................MGIGKNGDLPWP.l DYR_MESAU ............VR.PLNCIVAVS.q..n................MGIGKNGDLPWP.m Q78EH1_9RODE ............VR.PLNCIVAVS.q..n................MGIGKNGDFPWP.m ## 26 1U72A ............VG.SLNCIVAVS.q..n................MGIGKNGDLPWP.p #=GR 1U72A SS ............CC.CEEEEEEEE.C..C................CCCCCCCCCCCC.C ## Phi/Psi: ............XG.EEEEEEEEE.G..G................LECEECL1EGEE.E #=GR 1U72A NP ............X................................*..*.......... #=GR 1U72A GR ............X.............................................. #=GR 1U72A LI ...................**...............................**.*... #=GR 1U72A AS ........................................................... #=GR 1U72A SA ............45.310000100.6..3................201027353003.4 ## Hydrophobic: ............+-.-+-?++|+-.-..-................+-+-----+-+-.- 1PD8A ............VG.SLNCIVAVS.q..n................MGIGKNGDLPWP.p #=GR 1PD8A SS ............CC.CEEEEEEEC.C..C................CEEECCCCCCCC.C #=GR 1PD8A GR ............X.............................................. #=GR 1PD8A SA ............44.310000100.5..3................201028252003.4 ## Hydrophobic: ............+-.-+-?++|+-.-..-................+-+-----+-+-.- 1DHFB ............VG.SLNCIVAVS.q..n................MGIGKNGDLPWP.p #=GR 1DHFB LI ...................**...............................**.*... #=GR 1DHFB AS ........................................................... ## 1DHFA SA ............XX.X20000100.4..3................2X1127663103.5 #=GR 1DHFB SA ............XX.X20000100.5..3................201027453103.5 #=GR 1DHFB S2 ............XX.X20000100.5..3................2B1027453103.5 XP_001110551 ............VS.SLNCIVAVS.q..n................MGIGKNGDLPWP.p XP_001134992 ............VG.SLNCIVAVS.q..n................MGIGKNGDLPWP.p XP_851329 ...gp..qp...WC.TLNCIVAVS.q..n................LGIGRNGDLPWP.p XP_536308 ............--.---------.--.-................------------.. DYR_PIG ............VR.PLNCIVAVS.q..n................MGIGKNGDLPWP.p DYR_BOVIN ............VR.PLNCIVAVS.q..n................MGIGKNGDLPWP.p P00376 ............VR.PLNCIVAVS.q..n................MGIGKNGDLPWP.p Q29RI1_BOVIN ............VR.PLNCIVAVS.q..n................MGIGKNGNLPWP.p PLACENT ............VR.SLNCIVAVS.q..n................MGIGKNGDLPWP.p #=GR PLACENT SA ............35.100000000.5..2................100036352104.4 ## SA is compromise between nonrot.full2, mmtp.full ## POSS1: ............VR.SLNCIVAVS.Q..N................MGIGKNGDLPWP.P ##nonrot.full2 ............36.10BBB00BB.5..2................1B0037352104.4 ##mmtp.full ............35.11BBB00BB.5..2................1B0046352104.2 ##mmtp.fullSS ............XC.CEEEEEEEE.G..G................LEGECCCEEHEC.C ## POSS2: ............VR.SLNCIVAVS.Q..N................MGIGKNGDLPWP.P XP_001363618 ............VR.QLNCIAAVS.k..n................MGIGKDGDLPWP.l ## 8DFR0 ............VR.SLNSIVAVC.q..n................MGIGKDGNLPWP.p #=GR 8DFR0 SS ............CC.CEEEEEEET.T..T................TCCCCCCIIIII.I ## Phi/Psi: ............XH.EEEEEEEE1.H..G................LECEELL1EHEE.E ## I is actually left-handed polyproline helix! Possible that ## is also in 1U70A (note mutation, however), 1U72A but is not marked... ## _is_ noted as being such in 1DHF (also human) #=GR 8DFR0 NP ............X................................*..*.......... #=GR 8DFR0 GR ............X......................................G....... #=GR 8DFR0 SA ............26.200000100.5..3................201127364106.8 ## Hydrophobic: ............+-.-+--++|+?.-..-................+-+-----+-+-.- 1DR10 ............VR.SLNSIVAVC.q..n................MGIGKDGNLPWP.p #=GR 1DR10 SS ............CC.CEEEEEEET.T..T................TCCCCCCIIIII.I #=GR 1DR10 LI ............X........*.........................*...*.*.*... ## Phi/Psi: ............XH.EEEEEEEE1.H..G................LECEELL1EGEE.E #=GR 1DR10 GR ............X......................................G....... #=GR 1DR10 SA ............33.300000100.5..3................200027464106.8 ## Hydrophobic: ............+-.-+--++|+?.-..-................+-+-----+-+-.- AGA ............VR.SLNCIVAVC.q..n................MGIGKDGNLPWP.p #=GR AGA SA ............25.100000000.4..2................100147452105.4 ## AGfullSA2 ............25.100B000BB.4..2................1B0147452105.4 ## AGfull2SA2 ............25.100B000BB.4..2................1B0146452105.4 ## AG: ............VR.SLNCIVAVC.Q..N................MGIGKDGNLPWP.P ## AI: ............VR.SLNCIVAVC.Q..N................MGIGKDGNLPWP.P ## PG: ............VR.SLNCIVAVC.Q..N................MGIGKDGNLPWP.P PGV ............VR.SLNCIVAVC.q..n................MGIGKDGNLPWP.p #=GR PGV SA ............36.200000000.4..2................100027262104.5 ## PGVYSfullSA2 ............36.20BB000BB.4..2................1B0027262104.5 ## PGVYSfull2S2 ............36.200B000BB.4..2................1B0027262104.5 ## PI: ............VR.SLNCIVAVC.Q..N................MGIGKDGNLPWP.P Q5U543_XENLA r........n..-Q.FLHAVVAVCpp..n................QGIGKGGSLPWP.l ENSXETP49617 r........n..-P.FLHAVVAVCpp..n................QGIGKEGSLPWP.l AAK01951 .........s..-E.ILNCIVAVCp...d................MGIGKNGNLPWH.p CAM14042 .........s..-R.ILNCIVAVCp...d................MGIGKNGNLPWH.p NP_571850 .........s..-R.ILNCIVAVCp...d................MGIGKNGNLPWH.p XP_001176553 ........ae..-Kk-LNLIAAAC.t..sk..g.k..........MGIGINGNLPWR.. ## EED: ............-R.-LNLIVAVCte..n................MGIGKNGNLPWR.. ## EEK: ............-R.-LNLIVAVCte..n................MGIGKNGNLPWR.. ## KED: ............-R.-LNLIVAVCte..n................MGIGKNGNLPWR.. ## KEK: ............-R.-LNLIVAVCte..n................MGIGKNGNLPWR.. ## K_D: ............-R.-LNLIVAVCte..n................MGIGKNGNLPWR.. ## K_K: ............-R.-LNLIVAVCte..n................MGIGKNGNLPWR.. ## ^ have distinct doubts about this insertion! Removing, from modeling results... ## _EED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _E_SKFED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _E_GKFED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EE_D: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EAED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EASKFED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EAGKFED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _E_EDQ: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ES ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. #=GR ES SA ............-6.-00000000.5..3................100148363106.. ## S2: ............-6.-00BB0000.5..3................1B0148363106.. ## SA for ES is composite of _E_SKFEDQ.full.new.reduce3.ent, ## _E_SKFEDQ.full2.new.reduce3.ent, ## _E_SKFEDQ.loop.13-27.full.new.reduce3.ent ## _E_GKFEDQ: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EAEDQ: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EASKFEDQ: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EAGKFEDQ: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _EEK: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _KED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _KE_D: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _KAED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _KAEDQ: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _KASKFED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _KASKFEDQ: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _KAGKFED: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. KAG ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. #=GR KAG SA ............-6.-10000100.4..3................101147563106.. ## S2: .............6.-10B001BB.4..3................1B1147563106.. ## SA for KAG is composite of _KAGKFEDQ.full.new.reduce3.ent ## _KAGKFEDQ.full2.new.reduce3.ent ## _KAGKFEDQ.loop.13-27.full2.new.reduce3.ent ## _KEK: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _K_D: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. ## _K_K: ............-R.-LNLIVAVC.e..n................MGIGKNGNLPWR.. XP_973338 .....v......IK.-FDLIAAAC.e..n................MGIGKNNDLPWR.. EAL28532 ............LR.-FNLIVAVS.e..n................FGIGLKGDLPWR.. DYR_DROME ............LR.-FNLIVAVC.e..n................FGIGIRGDLPWR.. AAA19051 ............LR.-FNLIVAVC.e..n................FGIGIRGDLPWR.. XP_393902 ............--.NLHLIAATC.e......g............MGIGIKGTLPWK.. Q7Q0L5_ANOGA .........s..-Kk-FSCIVAVC.e..n................RGIGINGDLPWK.. DYR_CAEEL_1 r.....k.....M-.N--LIVAMDae......g............-GIGKNGVLPWR.. Q61DT5_CAEBR_1 r.....k.....M-.N--MIVAMDte......g............-GIGKNGVLPWR.. DYR_CAEEL_2 ............-Rk-MNLIVAMD.a..e................GGIGKNGVLPWR.. Q61DT5_CAEBR_2 ............-Rk-MNMIVAMD.t..e................GGIGKNGVLPWR.. ## ## 1100_SVFQ .........s..-R.-FTLVVAVT.K..S................MGIGKNGGLPWR.. ## 1111_GTF .........s..-R.-FTLVVAVT.k..s................MGIGKNGGLPWR.. ## 1111_GVF .........s..-R.-FTLVVAVT.K..S................MGIGKNGGLPWR.. 1111_STF .........s..-R.-FTLVVAVT.k..s................MGIGKNGGLPWR.. ## 1111_SVF .........s..-R.-FTLVVAVT.K..S................MGIGKNGGLPWR.. ## in doing models, ^ ^ was actually second of these, not first !!! ## 1111_chars2 .........s..-R.-LTLIVAVT.K..N................MGIGKNGGLPWR.. ## AAQ02615_1 .........ng.-F.--ALVVAVT.k..t................MGIGNKGGLPWS.s AAQ02617_1 .........ng.-F.--ALVVAVT.k..t................MGIGNKGGLPWS.s AAQ02619_1 .........ng.-F.--ALVVAVT.k..t................MGIGNKGGLPWS.s AAQ02621_1 .........ng.-F.--ALVVAVT.k..t................MGIGNKGGLPWS.s AAQ02615_2 .........n..-G.-FALVVAVT.k..t................MGIGNKGGLPWS.s AAQ02617_2 .........n..-G.-FALVVAVT.k..t................MGIGNKGGLPWS.s AAQ02619_2 .........n..-G.-FALVVAVT.k..t................MGIGNKGGLPWS.s AAQ02621_2 .........n..-G.-FALVVAVT.k..t................MGIGNKGGLPWS.s DYR_ENCCU_1 ............--.-LALVVALAs...h................RGIGNANALPWPrp DYR_ENCCU_2 ............--.-LALVVALA.s..h................RGIGNANALPWPrp EAK84413 ..........gkLK.-LVMVAAMS..l.t................NGIGKDGGLPWR.. BAC75955 .........s..-R.-LTIIVAAT.k..a................NGIGKGSNLPWR.. DYR_CRYNE qtta..k.ss..TP.SITAVVAAT..a.e................NGIGLNGGLPWR.. # # 10100_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # 10101_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # 10110_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # 10111_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # 11100_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # 11101_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # 11110_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # 11111_chars2 .........Sg.VPkSLTLIVAVT.kl.s................LGIGKKGGLPWR.. # ^^ I doubt both of these are present (!!!); however, might help make room for C. albicans seq # # 0010_KD .........Sgv.PksLTLIVAVT.Kl.S................LGIGLKNDLPWR.. # 0010_KP .........Sgv.PksLTLIVAVT.Kl.S................LGIGLKNDLPWR.. # 0010_QD .........Sgv.PksLTLIVAVT.Kl.S................LGIGLKNDLPWR.. # 0010_QP .........Sgv.PksLTLIVAVT.Kl.S................LGIGLKNDLPWR.. # 0011_KD .........Sgv.PksLTLIVAAT.Kl.S................LGIGKKGGLPWR.. # 0011_KP .........Sgv.PksLTLIVAAT.Kl.S................LGIGKKGGLPWR.. # 0011_QD .........Sgv.PksLTLIVAAT.Kl.S................LGIGKKGGLPWR.. # 0011_QP .........Sgv.PksLTLIVAAT.Kl.S................LGIGKKGGLPWR.. # DYR_SCHPO_1 .fsaptkept.kHPrDLTMIVAVSsp..n................LGIGKKNSMPWH.. DYR_SCHPO_2 .fsaptkept.kHPrDLTMIVAVS.s..p.....n..........LGIGKKNSMPWH.. DYR_PNECA .........n..QQkSLTLIVALT.t..s................YGIGRSNSLPWK.. AAF14071 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. AAL25720 ............--.---LIVALT..v.s................CGIGKGNALPWR.. AAT99406 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. AAT99411 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. AAT99412 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. AAT99413 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. AAT99417 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABB84704 .........d..WQkSLTLIVALT..l.s................RGIGSKNDLPWK.. ABB84712 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABB84716 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABB84718 ..........g.WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABB84720 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABB84722 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABB84726 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABB84744 .........d..WQkSLTLIVALT..l.p................RGIGLKNDLPWK.. ABB84751 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABF06467 .........d..WQkSLTLIVAST..l.s................RGIGLKNDLPWK.. ABF06468 .........d..WQkSLTLIVALT..l.s................RGIGLKSDLPWK.. ABF06469 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. ABF06470 .........d..WQkSLTLIVALT..l.s................RGIGLKNDLPWK.. Q6CC38_YARLI_1 ............-PpSTTLILAAT..v.p...............rYGIGLNGGLPWR.. Q6CC38_YARLI_2 ............PP.STTLILAAT..v.p.....r..........YGIGLNGGLPWR.. ## ^^ hrm... !!! CAG60823_1 .........s.kVP.-VVGIVAAL..l.p...............eMGIGFQGNLPWR.. CAG60823_2 .........s.kVP.-VVGIVAAL..l.p.....e..........MGIGFQGNLPWR.. AAS51350_1 .......gis.rVP.-VVSIVACL..l.p...............eYGIGYQGQLPWR.. AAS51350_2 .......gis.rVP.-VVSIVACL..l.p.....e..........YGIGYQGQLPWR.. DYR_YEAST_1 ...a...g..gkIP.-IVGIVACL.q..p.....e..........MGIGFRGGLPWR.. DYR_YEAST_2 ...a....g.gkIP.-IVGIVACL..........q.....p...eMGIGFRGGLPWR.. EDN63566_1 ...a...g..gkIP.-IVGIVACL.q..p.....e..........MGIGFRGGLPWR.. EDN63566_2 ...a....g.gkIP.-IVGIVACL..........q.....p...eMGIGFRGGLPWR.. CAA68779_1 ...a...g..gkIP.-IVGIVACL.q..p.....e..........MGIGFRGGVPWR.. CAA68779_2 ...a....g.gkIP.-IVGIVACL..........q.....p...eMGIGFRGGVPWR.. CAG86485_1 .taa...ngkvtPP.-IAMIVAAL..l.p.....e..........LGIGIKGKMPWR.. CAG86485_2 .t.a....angkVTpPIAMIVAAL..l.p...............eLGIGIKGKMPWR.. ABN65593_1 ........sei.KP.TIAIIVAAL.k..p.....d..........LAIGFQGKMPWR.. ABN65593_2 .........s.eIKpTIAIIVAAL..........k.....p...dLAIGFQGKMPWR.. ## ^ not G?!? DYR_CANAL_1 .........s..KP.NVAIIVAAL..k.p...............aLGIGYKGKMPWR.. DYR_CANAL_2 .........s..KP.NVAIIVAAL.k..p...............aLGIGYKGKMPWR.. ## 1J3KA .meq.v..cd..VF.DIYAICACC.kveskneg.kknevfnnytfRGLGNKGVLPWK.c #=GR 1J3KA SS .CCH.H..HH..HH.CEEEEEEEE.EECCCCCG.GGGGCCGGGCEEEEECCCCCCCC.C ## Phi/Psi: .ECC.C..CC..HG.CEEEEEEE1.EECCCCCC.GGCEEECGGHECCCEELL1EHEC.C ## ?Cap Ib?: ^ #=GR 1J3KA SA .844.2..03..00.000000100.21345886.39837564311100017554109.4 ## Hydrophobic: .+--..+.?-..++.-+??+????.-+------.----++--?-+--+----++-+-.? #=GR 1J3KA LI ...................***.........................*...***.*... 1J3KB .meq.v..cd..VF.DIYAICACC.kveskneg.kknevfnnytfRGLGNKGVLPWK.c #=GR 1J3KB SS .CCH.H..HH..HH.CEEEEEEEE.EECCCCCC.CCCCCCGGGCEEEEECCCCCCCC.C ## Phi/Psi: .GCC.C..GG..HG.CEEEE1EE1.EECGLLCE.1CCCEEEGGHCCCCEECG1EGEC.C ## ?Cap Ib?: ^ #=GR 1J3KB SA .943.1..03..00.000000100.21366975.88867563301200017554109.4 ## Hydrophobic: .+--.+..?-..++.-+??+????.-+------.----++--?-+--+----++-+-.? #=GR 1J3KB LI ...................***.........................*...***.*... ## Non-Pro: ...............*..............*.................*.......... ## Gly-Req: ................................G.......................... 1J3IA .meq.v..cd..VF.DIYAICACC.kveskneg.kknevfnnytfRGLGNKGVLPWK.c #=GR 1J3IA SA .735.1..04..00.000000100.21478394.78938553311200117543008.5 #=GR 1J3IA S2 .735.1..04..00.0B00001BB.21478394.789385533112B0117543008.5 1J3IB .meq.v..cd..VF.DIYAICACC.kveskneg.kknevfnnytfRGLGNKGVLPWK.c #=GR 1J3IB SA .925.2..03..00.000000100.21569784.97866554311200017543008.5 #=GR 1J3IB S2 .E25.2..03..B0.0B00001BB.21569784.978665543112B0017543008.5 DRTS_PLACH .med.i..se..IF.DIYAICACC.kvlnsne...kagcfsnktfKGLGNEGGLPWK.c Q7RGH7_PLAYO .med.l..se..IF.DIYAICACC.kvinnne...ksgsfnnktfNGLGNAGMLPWK.y Q95US9_PLAGA .mne.i..sd..IF.DIHAICACC.kvenkne.kkkneifsnntfRGIGNKGVLPWK.s ## 50 2BL9A ..en.l..sd..VF.DIYAICACC.kvaptsegtknepfsp.rtfRGLGNKGTLPWK.c #=GR 2BL9A SS ..CH.H..HH..HH.CEEEEEEEE.EECCCC-CCCCCCCCC.CCCCEEECCCCCCCC.C ## Phi/Psi: ..XE.H..HC..GG.CEEEECEE1.EEEEEGECGGECGGCG.EHCCEGEELL1EHEE.C #=GR 2BL9A LI ...................***.........................***.***..... ## Non-Pro: ..X............*...............-................*.......... ## Gly-Req: ..X.............................G.......................... #=GR 2BL9A SA ..72.2..02..00.000000100.2117596796345818.541100117655108.6 ## Hydrophobic: ..--.+..--..++.-+??+????.-+?----------+--.--+--+-----+-+-.? ## ?Cap Ib?: ^ DRTS_PLAVI ..ed.l..sd..VF.DIYAICACC.kvaptsegtknepfsp.rtfRGLGNKGTLPWK.c DRTS_PLAVN ............--.---AICACC.kvlnsne..kascfsn.ktfKGLGNAGGLPWK.c AAV33644 ............--.----ICACC.kvdppsegiknepfgp.rtfRGLGNNGTLPWK.c AAV33645 ............--.----ICACC.kvspsnegiknepfss.rtfRGLGNNGNLPWK.g ## 1SEJC ........se..-K.NVSIVVAAS..vls................SGIGINGQLPW-.s #=GR 1SEJC SS ........XC..-C.EEEEEEEEE..CCC................CEEECCCCCCC-.C ## Phi/Psi: ........XX..-E.EEEEEEEEC..CCG................LECEECEEEGC-.E #=GR 1SEJC LI ...................*.*.........................*.....*..... #=GR 1SEJC NP ........XX...................................*..*......*... #=GR 1SEJC GR ........XX................................................. #=GR 1SEJC SA ........X9..-1.200000100..144................10001766400-.5 ## Hydrophobic: ........--...-.-+-+++??-..++-................--+-+---+-+..- ## ?Cap IIb?: ^ ^ 1QZFD ........se..-K.NVSIVVAAS..vls................SGIGINGQLPW-.s #=GR 1QZFD SA ........X9..-1.200000100..144................10011766410-.5 #=GR 1QZFD S2 ........X9..-1.200B00100..144................1B011766410-.5 AAC47229 ........sk..-K.NVSIVVAAS..vls................RGIGINGQLPW-.s ## 28 CAI76538 .sed.y..sg..LP.FVKILVAITpe...................NGIGIKNGLPWP.h EAN31856 .aed.y..sg..LP.FVKLLVAITpe...................NGIGISNGLPWP.h EAR85731 .........k..TR.HFDIVLAQTlk..k................QGIGYKNSLPWR.. DRTS_TRYBB ..k..i..srppLR.PFSVVVASD.e..k................GGIGDGGTIPWE.. AAX78868 ..k..i..srppLR.PFSVVVASD.e..k................GGIGDGGTIPWE.. DRTS_TRYCR .g......trlaLR.AFSLVVAVD.e..h................GGIGDGRSIPWN.. AAK71184 .g......trlaLR.AFSLIVAVD.e..h................GGIGDGRSIPWN.. AAK71177 .g......trlaLR.AFSLVVAVD.e..h................GGIGDGRSIPWN.. Q95NI3_TRYCR .g......trlaLR.AFSLVVAVD.e..h................GGIGDGRSIPWN.. Q95NT2_TRYCR .g......trlaLR.AFSLVVAVD.e..r................GGIGDGRSIPWN.. DRTS_LEIAM df.a.f.ps...LR.AFSIVVALD.k..q................HGIGDGESIPWR.. DRTS_LEIMA df.a.f.ps...LR.AFSIVVALDmq...................HGIGDGESIPWR.. AAA29272 df.a.f.ps...LR.AFCIVVALDmq...................HGIGDGESIPWR.. Q8MXB7_LEITR df.a.f.ps...LR.AFSIVVALD.k..q................HGIGDGESIPWR.. Q8MQV1_LEICH df.a.f.ps...LR.AFSIVVALD.k..q................HGIGDGESIPWR.. DRT1_ARATH .las..ep.q..-R.TYQVVVAAT.k..e................MGIGKDGKLPWN.. DRTS_SOYBN .lpn.l...q..-R.TYQVVVAAT.q..d................WGIGKDGKLPWR.. Q2R481_ORYSA s.qng..p.q..-R.NYQVVVAAT.r..d................MGIGKDGVLPWK.. DRTS_MAIZE s..qg.rp.q..-R.NYQVVVAGT.r..d................MGIGKDGVLPWK.. #=GC RF ............XX.XXXXXXXXX.....................XXXXXXXXXXXX.. #=GC SS_cons ............CC.CEEEEEEEE.CE.C...C............----CCCIIIII.I #=GC seq_cons ............l...l..lVA...QV.N...G.............GlG..G.LPW.RP #=GC LI_cons .....................*.........................*.....*.*... ## Ala9: also from 1YHO (NMR) paper ## Note prosite pattern [LVAGC][LIF]G....[LIVMF]PW.....?[DE]...[FYIV]...[STIQ] ## (PS00075), with W in PW interacting w/substrate; from Huang et al, ## Biochemistry 1989, 28, 471-478. ## Ile-7 interacts with MTX; may not be conserved in C. albicans - see ## Biochemistry 1991, 30, 8124 - however, is H-bond, so seems unlikely ## to be altered by altering residue (unless goes to Pro!); original albicans ## paper thinks is present with alignment to rest. #=GC AS_cons .....................................................*..... ## L22 as part of active site mechanism: Faraday Discuss 1992, 93, 217-224; ## Exploring the Molecular Mechanism of Dihydrofolate Reductase; ## Brown, Kraut <- but may need to check on mutation results! #=GC SA_cons ............X8.200000100.51..................200027554106.6 ## Seq_cons2 xxxxxxxxxx..VxxXLNXIXAXCxQVxNxxxGxxxxxxxxxxxxXGIGXNGNLPWXrp ## Hydrophobic: ............+...+-.+.?...-+.-.................-+-.---+-+.-- ## Second section (26 pos; 85 total) 1U70A LR..NEFKYFQRMTT...TS.S.vE. #=GR 1U70A SS HH..HHHHHHHHHHH...HC.C.CC. ## Phi/Psi: EH..HHHHHHHHHGG...EE.G.EE. #=GR 1U70A LI .......................... #=GR 1U70A NP .......................*.. #=GR 1U70A GR .......................... #=GR 1U70A SA 06..30350143002...51.7.48. ## Hydrophobic: +-..--+-?+--+--...--.-.+-. DYR_RAT LR..NEFKYFQRMTT...TS.S.vE. DYR_MESAU LR..NEFKYFQRMTT...TS.S.vE. Q78EH1_9RODE LR..NEFKYFQRMTT...TS.S.vE. ## 44 1U72A LR..NEFRYFQRMTT...TS.S.vE. #=GR 1U72A SS HH..HHHHHHHHHHH...HC.C.TT. ## 43-46 tight turn by 1DR1 paper ## Phi/Psi: EG..GHHCCCHHHGG...EE.G.EE. #=GR 1U72A NP .......................... #=GR 1U72A GR .......................... #=GR 1U72A LI .*...**..*................ #=GR 1U72A AS .....*.................... ## Helix terminator: ^^ ^ #=GR 1U72A SA 06..40460133002...52.7.39. ## Hydrophobic: +-..--+-?+--+--...--.-.+-. 1PD8A LR..NEFRYFQRMTT...TS.S.vE. #=GR 1PD8A SS HH..HHHHHHHHHHH...HC.C.TT. #=GR 1PD8A GR .......................... #=GR 1PD8A SA 04..40360133003...52.6.49. ## Hydrophobic: +-..--+-?+--+--...--.-.+-. 1DHFB LR..NEFRYFQRMTT...TS.S.vE. #=GR 1DHFB LI .*...**..*................ #=GR 1DHFB AS .....*.................... ## 1DHFA SA X7..303302430X2...52.6.49. #=GR 1DHFB SA 06..30450143002...52.7.49. #=GR 1DHFB S2 06..304501430B2...52.7.49. XP_001110551 LR..NEFRYFQRMTT...TS.S.vE. XP_001134992 LR..NEFRYFQRMTT...TS.S.vE. XP_851329 LR..NEFKCFQRMTT...NS.S.vE. XP_536308 --..-----------...TS.-..Et DYR_PIG LR..NEYKYFQRMTT...TS.S.vE. DYR_BOVIN LR..NEFQYFQRMTT...VS.S.vE. P00376 LR..NEFQYFQRMTT...VS.S.vE. Q29RI1_BOVIN LR..NEFQYFQRMTT...VS.S.vE. PLACENT LR..NEFKYFQRMTT...TS.S.vE. #=GR PLACENT SA 06..30350133002...40.6.56. ## POSS1: LR..NEFKYFQRMTT...TS.S.VE. ##nonrot.full2 06..30350133002...40.6.56. ##mmtp.full 05..30350133002...40.6.56. ##mmtp.fullSS EH..HCCCCCCCHHH...EE.G.CC. ## POSS2: LR..NEFKYFQRMTT...TS.S.VE. XP_001363618 LR..NEFKYFQKMTT...TP.S.vE. ## 8DFR0 LR..NEYKYFQRMTS...TS.H.vE. #=GR 8DFR0 SS HH..HHHHHHHHHHH...HC.C.TT. ## Phi/Psi: EH..HHHHHHHHHHG...EE.G.EE. #=GR 8DFR0 NP .......................... #=GR 8DFR0 GR .......................... #=GR 8DFR0 SA 06..30430124102...42.6.49. ## Hydrophobic: +-..--?-?+--+--...--.-.+- 1DR10 LR..NEYKYFQRMTS...TS.H.vE. #=GR 1DR10 SS HH..HHHHHHHHHHH...HC.C.TT. #=GR 1DR10 LI ......*..*................ ## ^ in 2 conformations in 1DR10 ## Phi/Psi: EC..HHHHHHHHHHG...EE.G.EE. #=GR 1DR10 GR .......................... #=GR 1DR10 SA 05..30830124002...42.6.49. ## Hydrophobic: +-..--?-?+--+--...--.-.+-. AGA LR..NEFKYFQRMTT...TS.S.vE. #=GR AGA SA 05..30350244003...40.6.57. ## AGfullSA2 05..30350244003...40.7.57. ## AGfull2SA2 05..30350244003...40.6.57. ## AG: LR..NEFKYFQRMTT...TS.S.VE. ## AI: LR..NEFKYFQRMTT...TS.S.VE. ## PG: LR..NEFKYFQRMTT...TS.S.VE. PGV LR..NEFKYFQRMTT...TS.S.vE. #=GR PGV SA 06..30450234002...41.6.58. ## PGVYSfullSA2 06..20450234002...41.6.58. ## PGVYSfull2S2 06..30450234002...41.7.58. ## PI: LR..NEFKYFQRMTT...TS.S.VE. Q5U543_XENLA LR..NEFKHFQRLTM...T-pT.vE. ENSXETP49617 LR..NEFKHFQRLTM...T-pT.vE. AAK01951 IRlsNELKHFQKMTM...T-pS..De CAM14042 IRlsNELKHFQKMTM...T-pS..De NP_571850 IRlsNELKHFQKMTM...T-pS..De XP_001176553 LR..QEMAYFERLTK...TA.Qm.E. ## EED: LR..SELKYFERMTK...TS.S..D. ## EEK: LR..SELKYFERMTK...TS.S..D. ## KED: LR..SELKYFKRMTK...TS.S..D. ## KEK: LR..SELKYFKRMTK...TS.S..D. ## K_D: LR..SELKYFKRMTK...TS.S..D. ## K_K: LR..SELKYFKRMTK...TS.S..D. ## _EED: LR..SELKYFERMTK...TS.S..D. ## _E_SKFED: LR..SELKYFERMTK...TS.S..D. ## _E_GKFED: LR..SELKYFERMTK...TS.S..D. ## _EE_D: LR..SELKYFERMTK...TS.S..D. ## _EAED: LR..SELKYFERMTK...TS.S..D. ## _EASKFED: LR..SELKYFERMTK...TS.S..D. ## _EAGKFED: LR..SELKYFERMTK...TS.S..D. ## _E_EDQ: LR..SELKYFERMTK...TS.S..D. ES LR..SELKYFERMTK...TS.S..D. #=GR ES SA 06..20360135003...40.5..9. ## S2: 06..20360135003...40.5..9. ## _E_GKFEDQ: LR..SELKYFERMTK...TS.S..D. ## _EAEDQ: LR..SELKYFERMTK...TS.S..D. ## _EASKFEDQ: LR..SELKYFERMTK...TS.S..D. ## _EAGKFEDQ: LR..SELKYFERMTK...TS.S..D. ## _EEK: LR..SELKYFERMTK...TS.S..D. ## _KED: LR..SELKYFKRMTK...TS.S..D. ## _KE_D: LR..SELKYFKRMTK...TS.S..D. ## _KAED: LR..SELKYFKRMTK...TS.S..D. ## _KAEDQ: LR..SELKYFKRMTK...TS.S..D. ## _KASKFED: LR..SELKYFKRMTK...TS.S..D. ## _KASKFEDQ: LR..SELKYFKRMTK...TS.S..D. ## _KAGKFED: LR..SELKYFKRMTK...TS.S..D. KAG LR..SELKYFKRMTK...TS.S..D. #=GR KAG SA 06..20261145002...31.6..8. ## S2: 06..20261145002...31.6..8. ## _KEK: LR..SELKYFKRMTK...TS.S..D. ## _K_D: LR..SELKYFKRMTK...TS.S..D. ## _K_K: LR..SELKYFKRMTK...TS.S..D. XP_973338 LK..SELAFFSQMTT...QT.S..De EAL28532 LK..SELKYFSRTTK...RT.S..Dp DYR_DROME IK..SELKYFSRTTK...RT.S..Dp AAA19051 IK..SELKYFSRTTK...RT.S..Dp XP_393902 LK..SELAFFTYMTT...NT.K..Np Q7Q0L5_ANOGA LK..QELKYFSHTTK...KV.N..Da DYR_CAEEL_1 IK..KDMQYFASVTK...NV.S..D. Q61DT5_CAEBR_1 IR..KDMQYFAAVTK...KV.S..Dp DYR_CAEEL_2 IK..KDMQYFASVTK...NV.S..D. Q61DT5_CAEBR_2 IR..KDMQYFAAVTK...KV.S..Dp ## ## 1100_SVFQ LK..SDMKYFKRVTS...KT.S..Dp ## 1111_GTF LK..GDMKYFKRVTS...KT.S..Dp ## 1111_GVF LK..GDMKYFKRVTS...KT.S..Dp 1111_STF LK..SDMKYFKRVTS...KT.S..Dp ## 1111_SVF LK..SDMKYFKRVTS...KT.S..Dp ## ## 1111_chars2 LR..SDMKYFKRVTS...KT.S..Dp ## AAQ02615_1 IR..GDMNFLKKITS...ET.K..D. AAQ02617_1 IR..GDMNFFKKITS...ET.K..D. AAQ02619_1 IR..GDMNFFKKITS...ET.K..D. AAQ02621_1 IR..GDMNFFKKITS...ET.K..D. AAQ02615_2 IR..GDMNFLKKITS...ET.K..D. AAQ02617_2 IR..GDMNFFKKITS...ET.K..D. AAQ02619_2 IR..GDMNFFKKITS...ET.K..D. AAQ02621_2 IR..GDMNFFKKITS...ET.K..D. DYR_ENCCU_1 LA..ADMAWFRTLSQ...SIp-liSp DYR_ENCCU_2 LA..ADMAWFRTLSQ...SIp-liSp EAK84413 LK..GEMTYFRNVTS...HVaD..Ee BAC75955 LA..KEMKYFARATS...EAp-..E. DYR_CRYNE LP..GEMKYFARVTTg..ETpSs.Dp # # 10100_chars2 LK..XEMKYFKRVTS..lXT.Tf.Dp # 10101_chars2 LK..XEMKYFKRVTS..lXT.Tf.Dp # 10110_chars2 LK..XEMKYFKRVTS..lXT.Tf.Dp # 10111_chars2 LK..XEMKYFKRVTS..lXT.Tf.Dp # 11100_chars2 LK..XEMKYFKRVTS...XT.Tf.Dp # 11101_chars2 LK..XEMKYFKRVTS...XT.Tf.Dp # 11110_chars2 LK..XEMKYFKRVTS...XT.Tf.Dp # 11111_chars2 LK..XEMKYFKRVTS...XT.Tf.Dp # poss remove: ^ # I don't think the "l" is there in the above - that's for ones without TfDp seq. # # 0010_KD LK..SEMKYFKRVTS...KT.Tf.DS # 0010_KP LK..SEMKYFKRVTS...KT.Tf.DS # 0010_QD LK..SEMKYFKRVTS...KT.Tf.DS # 0010_QP LK..SEMKYFKRVTS...KT.Tf.DS # 0011_KD LK..KEMKYFKRVTS...KT.Tf.DP # 0011_KP LK..KEMKYFKRVTS...KT.Tf.DP # 0011_QD LK..KEMKYFKRVTS...KT.Tf.DP # 0011_QP LK..KEMKYFKRVTS...KT.Tf.DP # DYR_SCHPO_1 IK..QEMAYFANVTS...S-.T..Es DYR_SCHPO_2 IK..QEMAYFANVTS...ST.E..Ss DYR_PNECA LK..KEISYFKRVTS...FVpTf.Ds AAF14071 LK..SDMMFFSRVTSgll-V.T..Rs AAL25720 LK..SDMAYFKRVTS...DVp-.vS. AAT99406 LK..SDMMFYSRVTSgll-V.T..Rs AAT99411 LK..SDMMFFTRVTSgll-V.T..Rs AAT99412 LK..SDMMFFSRVTSgll-V.T..Rs AAT99413 LK..SDMMFFSRVTSgll-V.T..Rs AAT99417 LK..SDMMFFSRVTSgll-V.T..Rs ABB84704 LK..SDMMFFSRVTSgll-V.T..Rs ABB84712 LK..SDMMFFSRITSgll-V.T..Rs ABB84716 LK..SDMMFFCRVTSgll-V.T..Rs ABB84718 LK..SDMMFFSRVTSgll-V.T..Rs ABB84720 LK..SDMMFFSRVTSgll-V.T..Rs ABB84722 LR..SDMMFFSRVTSgll-V.T..Rs ABB84726 LK..SDMMFFSRVTSgll-V.T..Rs ABB84744 LK..SDMMFFSRVTSgll-V.T..Rs ABB84751 LK..SDMMFFSRVTSgll-V.T..Rs ABF06467 LK..SDMMFFSRVTSgll-V.T..Rs ABF06468 LK..SDMMFFSRVTSgll-V.T..Rs ABF06469 LK..FDMMFFSRVTSgll-V.T..Rs ABF06470 LK..SDMMFFSRVTSgll-V.T..Rs Q6CC38_YARLI_1 LA..KEMKFFKQVTT..aQ-.-..-. Q6CC38_YARLI_2 LA..KEMKFFKQVTT...-A.-..Q. CAG60823_1 LA..KEMKYFREVTT..lT-.N..Dn CAG60823_2 LA..KEMKYFREVTT...LT.N..Dn AAS51350_1 LA..REMKYFRQATT...AT.F..Dp AAS51350_2 LA..REMKYFRQATT...-A.Tf.Dp DYR_YEAST_1 LP..SEMKYFRQVTS..lTK.Dp.N. DYR_YEAST_2 LP..SEMKYFRQVTS...LT.K..Dp EDN63566_1 LP..SEMKYFRQVTS..lTK.Dp.N. EDN63566_2 LP..SEMKYFRQVTS...LT.K..Dp CAA68779_1 LP..SEMKYFRQVTS..lTK.Dp.N. CAA68779_2 LP..SEMKYFRQVTS...LT.K..Dp CAG86485_1 LR..QEIKYFKNVTT...TT.K..Dp CAG86485_2 LR..QEIKYFKNVTT..tTK.Dp.Ng ABN65593_1 LR..KEIRYFKDVTT..kTS.Dp.S. ABN65593_2 LR..KEIRYFKDVTT...KT.S..Dp ## DYR_CANAL_1 LR..KEIRYFKDVTT..rTT.Kp.Nt DYR_CANAL_2 LR..KEIRYFKDVTT...RT.T..Kp ## 1J3KA NS..LDMKYFCAVTT...YV.N..Es #=GR 1J3KA SS -H..HHHHHH-HHHH...HC.H..HH ## Phi/Psi: CG..HHHHHHHHHGG...EE.E..GH ## ?Cap Ib?: ^ ^^ #=GR 1J3KA LI .....*...*................ #=GR 1J3KA SA 04..20462144101...51.2..57 ## Hydrophobic: --..+-+-?+??+--...?+.-..-- 1J3KB NS..LDMKYFCAVTT...YV.N..Es #=GR 1J3KB SS -H..HHHHHH-HHHH...HC.H..HH ## Phi/Psi: CG..HHHHHCCCHGC...EE.E..GG ## ?Cap Ib?: ^ ^^ #=GR 1J3KB LI .....*...*................ #=GR 1J3KB SA 04..20462154102...51.2..58 ## Hydrophobic: --..+-+-?+??+--...?+.-..-- ## Non-Pro: .......................... ## Gly-Req: .......................... 1J3IA NS..LDMKYFCAVTT...YV.N..Es #=GR 1J3IA SA 05..20462134102...51.2..57 #=GR 1J3IA S2 05..204621341B2...51.2..57 1J3IB NS..LDMKYFCAVTT...YV.N..Es #=GR 1J3IB SA 05..20462134102...51.2..57 #=GR 1J3IB S2 05..204621341B2...51.2..57 DRTS_PLACH NS..VDMKHFSSVTS...YV.N..Et Q7RGH7_PLAYO NL..VDMNYFSSVTS...YV.N..En Q95US9_PLAGA NP..LDMKYFTTVTT...YV.N..Es ## 68 2BL9A NS..VDMKYFSSVTT...YV.D..Es #=GR 2BL9A SS HH..HHHHHHHHHHH...HC.G..GG ## Phi/Psi: EH..HHHHHCCCCGG...EE.E..GH #=GR 2BL9A LI .....*...*................ ## Non-Pro: .......................... ## Gly-Req: .......................... #=GR 2BL9A SA 05..20472124102...51.1..57 ## Hydrophobic: --..+-+-?+--+--...?+.-..-- ## ?Cap Ib?: ^ ^^ DRTS_PLAVI NS..VDMKYFSSVTT...YV.D..Es DRTS_PLAVN NS..VDMKHFVSVTS...YV.N..En AAV33644 NS..VDMKYFSSVTT...YV.D..Es AAV33645 NS..VDMKYFSSVTT...YV.D..Es ## 1SEJC IS..EDLKFFSKITN...NK.C..D. #=GR 1SEJC SS HH..HHHHHHHHHHH...HC.C..C. ## Phi/Psi: EG..GHHHHHHCHGG...CE.G..E. #=GR 1SEJC LI .....**..**............... #=GR 1SEJC NP .......................... #=GR 1SEJC GR .......................... #=GR 1SEJC SA 04..40552226102...62.9..3. ## Hydrophobic: +-..--+-++--+--...--.?..-. ## ?Cap IIb?: ^ ^^ 1QZFD IS..EDLKFFSKITN...NK.C..D. #=GR 1QZFD SA 06..40552125102...62.9..3. #=GR 1QZFD S2 06..405521251B2...62.9..3. AAC47229 IS..EDLKFFSKITS...NN.C..D. ## 45 CAI76538 IK..RDFLFMFRATT...YV.Dp.Ef EAN31856 IK..RDFLFMFRATT...YV.Dp.Ef EAR85731 LP..NELKNFKKITT...ET.K..N. DRTS_TRYBB IP..EDMQYFRRVTT...NL.Rg.Kn AAX78868 IP..EDMQYFRRVTT...NL.Rg.Kn DRTS_TRYCR VP..EDMKFFRDLTT...KL.Rg.Kn AAK71184 VP..EDMKFFRDVTT...KL.Rg.Kn AAK71177 VP..EDMKFFRDLTT...KL.Rg.Kn Q95NI3_TRYCR VP..EDMKFFRDVTT...KL.Rg.Kn Q95NT2_TRYCR VP..EDMKFFRDVTT...KL.Rg.Kn DRTS_LEIAM VP..EDMAFFKDQTT..l-L.R..N. DRTS_LEIMA VP..EDMTFFKNQTT..l-L.R..N. AAA29272 SP..EDMTFFKNQTT..l-L.R..N. Q8MXB7_LEITR VP..EDMAFFKDQTT..l-L.R..N. Q8MQV1_LEICH VP..EDMAFFKDQTT..l-L.R..N. DRT1_ARATH LP..TDLKFFKDITL...TT.S..D. DRTS_SOYBN LP..TDLKFFKEITM...KT.S..E. Q2R481_ORYSA L-l.GDLKFFKELTV...TT.A..D. DRTS_MAIZE LP..GDLKFFKELTL...TT.S..D. #=GC RF XX..XXXXXXXXXXX...XX.X..X. #=GC SS_cons HH..HHHHHHHHHHH...HC.C..T. #=GC seq_cons l....-.KYF...To.........-. #=GC LI_cons .....*...*................ ## F-34 binding: JBC 1989, 264, 34:20786-20795; Probing the Role of Two ## Hydrophobic Active Site Residues in the Human Dihydrofolate Reductase by ## Site-directed Mutagenesis; Schweitzer et al PLUS Biochemistry 1994, 33, ## 9945-9952; Critical Role of Phenylalanine 34 of Human Dihydrofolate ## Reductase in Substrate and Inhibitor Binding and in Catalysis; Nakano et al ## F|M|whatever-31 may be active in binding to MTX (or at least create problems ## w/binding to MTX if mutated to something much smaller or larger - 10.1139/G03-046) #=GC AS_cons .....*.................... ## Glu/Asp-30 activity: Biochemistry 1990, 29, 5195-5202; Kinetic Mechanism of ## Wild-Type and Mutant Mouse Dihydrofolate Reductases; ## Thillet, Adams, Benkovic; also 1YHO (NMR) article #=GC SA_cons 05..30451134102...52.6..9. ## Helix cap: .............^?........... ## Seq_cons2 LXxxXEXKYFXKMTS...XX.N.VEx ## Hydrophobic: +....-.-?+.-+--......-.+-. ## Third section (51 pos; 136 total) 1U70A ...........................................g..k.... #=GR 1U70A SS ...........................................C..C.... ## Phi/Psi: ...........................................C..E.... #=GR 1U70A LI ................................................... #=GR 1U70A NP ................................................... #=GR 1U70A GR ...........................................G....... #=GR 1U70A SA ...........................................8..2.... ## Hydrophobic: ...........................................-..-.... DYR_RAT ...........................................g..k.... DYR_MESAU ...........................................g..k.... Q78EH1_9RODE ...........................................g..k.... ## 46 1U72A ...........................................g..k.... #=GR 1U72A SS ...........................................T..T.... ## 43-46 are a tight turn by 1DHF|2DHF paper ## Phi/Psi: ...........................................L..E.... #=GR 1U72A NP ................................................... #=GR 1U72A GR ................................................... #=GR 1U72A LI ................................................... #=GR 1U72A AS ..............................................*.... ## AS by loop regions paper - see below #=GR 1U72A SA ...........................................8..2.... ## Hydrophobic: ...........................................-..-.... 1PD8A ...........................................g..k.... #=GR 1PD8A SS ...........................................T..T.... #=GR 1PD8A GR ................................................... #=GR 1PD8A SA ...........................................9..2.... 1DHFB ...........................................g..k.... #=GR 1DHFB LI ................................................... #=GR 1DHFB AS ..............................................*.... ## 1DHFA SA ...........................................9..2.... #=GR 1DHFB SA ...........................................9..2.... #=GR 1DHFB S2 ...........................................9..2.... XP_001110551 ...........................................g..k.... XP_001134992 ...........................................g..k.... XP_851329 ...........................................g..k.... XP_536308 ...........................................g..k.... DYR_PIG ...........................................g..k.... DYR_BOVIN ...........................................g..k.... P00376 ...........................................g..k.... Q29RI1_BOVIN ...........................................g..k.... PLACENT ...........................................g..k.... #=GR PLACENT SA ...........................................7..2.... ## POSS1: ...........................................G..K.... ##nonrot.full2 ...........................................7..2.... ##mmtp.full ...........................................8..2.... ##mmtp.fullSS ...........................................C..E.... ## POSS2: ...........................................G..K.... XP_001363618 ...........................................g..k.... ## 8DFR0 ...........................................g..k.... #=GR 8DFR0 SS ...........................................T..T.... ## Phi/Psi: ...........................................L..E.... #=GR 8DFR0 NP ................................................... #=GR 8DFR0 GR ...........................................G....... #=GR 8DFR0 SA ...........................................9..2.... ## Hydrophobic: ...........................................-..-.... 1DR10 ...........................................g..k.... #=GR 1DR10 SS ...........................................T..T.... #=GR 1DR10 LI ................................................... ## Phi/Psi: ...........................................L..E.... #=GR 1DR10 GR ...........................................G....... #=GR 1DR10 SA ...........................................9..2.... ## Hydrophobic: ...........................................-..-.... AGA ...........................................g..k.... #=GR AGA SA ...........................................7..2.... ## AGfullSA2 ...........................................7..2.... ## AGfull2SA2 ...........................................7..2.... ## AG: ...........................................G..K.... ## AI: ...........................................G..K.... ## PG: ...........................................G..K.... PGV ...........................................g..k.... #=GR PGV SA ...........................................9..2.... ## PGVYSfullSA2 ...........................................9..2.... ## PGVYSfull2S2 ...........................................9..2.... ## PI: ...........................................G..K.... Q5U543_XENLA ...........................................g..k.... ## Strongly suspect all of the above at the end should be pushed back 1 ## residue with "k" being considered aligned (and 1 further with g being vs s); ## Have done; confirmed that at end area is flexible in not only 1J3KAB ## but above (high B-factors). However, deletion of that area (45-46 in ## particular) can admittedly cause human DHFR to look a bit more similar to ## characteristics of C. albicans DHFR (e.g., urea, KCl not activating; MTX ## not binding as well), so will probably want to put "K" back to non-aligned ## for fungal (done). (Refs: Importance of Loop Region Residues 40-46 in Human ## Dihydrofolate Reductase as Revealed by Site-directed Mutagenesis; ## Characterization of Candida albicans Dihydrofolate Reductase.) ENSXETP49617 ...........................................d..k.... AAK01951 ...........................................g..k.... CAM14042 ...........................................g..k.... NP_571850 ...........................................g..k.... XP_001176553 ...........................................gm.k.... ## EED: ...........................................g..k.... ## EEK: ...........................................g..k.... ## KED: ...........................................g..k.... ## KEK: ...........................................g..k.... ## K_D: ...........................................g..k.... ## K_K: ...........................................g..k.... ## _EED: ...........................................g..k.... ## _E_SKFED: ...........................................g..k.... ## _E_GKFED: ...........................................g..k.... ## _EE_D: ...........................................g..k.... ## _EAED: ...........................................g..k.... ## _EASKFED: ...........................................g..k.... ## _EAGKFED: ...........................................g..k.... ## _E_EDQ: ...........................................g..k.... ES ...........................................g..k.... #=GR ES SA ...........................................7..1.... ## S2: ...........................................7..1.... ## _E_GKFEDQ: ...........................................g..k.... ## _EAEDQ: ...........................................g..k.... ## _EASKFEDQ: ...........................................g..k.... ## _EAGKFEDQ: ...........................................g..k.... ## _EEK: ...........................................g..k.... ## _KED: ...........................................g..k.... ## _KE_D: ...........................................g..k.... ## _KAED: ...........................................g..k.... ## _KAEDQ: ...........................................g..k.... ## _KASKFED: ...........................................g..k.... ## _KASKFEDQ: ...........................................g..k.... ## _KAGKFED: ...........................................g..k.... KAG ...........................................g..k.... #=GR KAG SA ...........................................7..2.... ## S2: ...........................................7..2.... ## _KEK: ...........................................g..k.... ## _K_D: ...........................................g..k.... ## _K_K: ...........................................g..k.... XP_973338 ...........................................s..k.... EAL28532 ...........................................n..k.... DYR_DROME ...........................................t..k.... AAA19051 ...........................................t..k.... XP_393902 ...........................................n..k.... Q7Q0L5_ANOGA ...........................................d..k.... DYR_CAEEL_1 ..........................................qs....... Q61DT5_CAEBR_1 ...........................................a..k.... DYR_CAEEL_2 ..........................................qs....... Q61DT5_CAEBR_2 ...........................................a..k.... ## ## 1100_SVFQ ...........................................G..K.... ## 1111_GTF ...........................................g..k.... ## 1111_GVF ...........................................G..K.... 1111_STF ...........................................g..k.... ## 1111_SVF ...........................................G..K.... ## ## 1111_chars2 ...........................................G..K.... ## AAQ02615_1 ...........................................aa.k.... AAQ02617_1 ...........................................aa.k.... AAQ02619_1 ...........................................aa.k.... AAQ02621_1 ...........................................aa.k.... AAQ02615_2 ...........................................aa.k.... AAQ02617_2 ...........................................aa.k.... AAQ02619_2 ...........................................aa.k.... AAQ02621_2 ...........................................aa.k.... DYR_ENCCU_1 ................................d.rialap...sa...... DYR_ENCCU_2 ................................d.rialap...sa...... EAK84413 ........................................qrqg.t..... BAC75955 ...........................................g.t..... DYR_CRYNE ...........................................s..e.... # # 10100_chars2 ..........................................tg..k.... # 10101_chars2 ..........................................tg..k.... # 10110_chars2 ..........................................tg..k.... # 10111_chars2 ..........................................tg..k.... # 11100_chars2 ..........................................tg..k.... # 11101_chars2 ..........................................tg..k.... # 11110_chars2 ..........................................tg..k.... # 11111_chars2 ..........................................tg..k.... # # 0010_KD ..........................................tG..K.... # 0010_KP ..........................................tG..K.... # 0010_QD ..........................................tG..K.... # 0010_QP ..........................................tG..K.... # 0011_KD ..........................................tG..K.... # 0011_KP ..........................................tG..K.... # 0011_QD ..........................................tG..K.... # 0011_QP ..........................................tG..K.... # DYR_SCHPO_1 ................s..........g.qlee..........g..k.ski DYR_SCHPO_2 ...........................g.qleegk........s..ki..m DYR_PNECA .f........................................es....... AAF14071 ..........................................tg..q.... AAL25720 ..........................................ds.tk...w AAT99406 ..........................................tg..q.... AAT99411 ...........................................g..q.... AAT99412 ..........................................tg..q.... AAT99413 ..........................................tg..q.... AAT99417 ..........................................tg..q.... ABB84704 ..........................................tg..q.... ABB84712 ..........................................tg..q.... ABB84716 ..........................................tg..q.... ABB84718 ..........................................tg..q.... ABB84720 ..........................................tg..q.... ABB84722 ..........................................tg..q.... ABB84726 ..........................................tg..q.... ABB84744 ..........................................tg..q.... ABB84751 ..........................................tg..q.... ABF06467 ..........................................tg..q.... ABF06468 ..........................................tg..q.... ABF06469 ..........................................tg..q.... ABF06470 ..........................................tg..q...l Q6CC38_YARLI_1 ................................................... Q6CC38_YARLI_2 ................................................... CAG60823_1 ...........................................s..k.... CAG60823_2 ...........................................s..k.... AAS51350_1 ...........................................t..k.... AAS51350_2 ..........................................t...k.... DYR_YEAST_1 ..............................................k.... DYR_YEAST_2 ...........................................n..k.... EDN63566_1 ..............................................k.... EDN63566_2 ...........................................n..k.... CAA68779_1 ..............................................k.... CAA68779_2 ...........................................n..k.... CAG86485_1 ...........................................n..g.... CAG86485_2 ..................................................i ABN65593_1 ..............................................k...i ABN65593_2 ...........................................s..k.... ## DYR_CANAL_1 ................................................... DYR_CANAL_2 ...........................................n..t.... ## 1J3KA kyeklkykrckylnket.........vdnvnd.....mp...ns.kk...l #=GR 1J3KA SS HHHHHHHHHHHHHHCCC.........XXXXXX.....XX...XX.CC...C ## Phi/Psi: HHGCHHHHHCGGGLE1X............................XE...C #=GR 1J3KA LI ................................................... #=GR 1J3KA SA 41750352015228689.........XXXXXX.....XX...XX.96...1 ## Hydrophobic: -?--+-?--?-?+----.........+--+--.....+-...--.--...+ 1J3KB kyeklkykrckylnket.........vdnvnd.....mp...ns.kk...l #=GR 1J3KB SS HHHHHHHHHHHHHXXXX.........XXXXXX.....XC...CC.CC...C ## B Phi/Psi: GHHHHHHHCCCCX..........................X..CE.GE...E #=GR 1J3KB LI ................................................... #=GR 1J3KB SA 5166036206726XXXX.........XXXXXX.....X9...84.75...1 ## Hydrophobic: -?--+-?--?-?+----.........+--+--.....+-...--.--...+ ## Non-Pro: ................................................... ## Gly-Req: ................................................... 1J3IA kyeklkykrckylnket.........vdnvnd.....mp...ns.kk...l #=GR 1J3IA SA 41650252015328569.........XXXXXX.....XX...XX.97...0 #=GR 1J3IA S2 41650252015328569.........XXXXXX.....XX...XX.E7...0 1J3IB kyeklkykrckylnket.........vdnvnd.....mp...ns.kk...l #=GR 1J3IB SA 50661152004328376.........3XXXX9.....66...35.75...1 #=GR 1J3IB S2 50661152004328376.........3XXXXE.....66...35.75...1 DRTS_PLACH nymrlkwkrdryme........knn.vk.lntdg...ip....svdk...l Q7RGH7_PLAYO nyirlqwkrdkym........gknnlknnaeln.ng...el..n.nn...l Q95US9_PLAGA kykklkykrekylek.t.k...dtkc...les.....iiql..s.nn...l ## 98 2BL9A kyeklkwkrerylrmeasqgggdntsggd.nthg.......gdnadk...l #=GR 2BL9A SS HHHHHHHHHHHHHHHHHXXXXXXXXXXXX.XXXX.......XXXXXC...C ## Phi/Psi: HHHHHHHGCHHCCCHHX.............................X...E #=GR 2BL9A LI ................................................... ## Non-Pro: ................................................... ## Gly-Req: ................................................... #=GR 2BL9A SA 51460352035125549XXXXXXXXXXXX.XXXX.......XXXXX8...0 ## Hydrophobic: -?--+-+----?+-+-?------------.----.......---?--...+ DRTS_PLAVI kyeklkwkrerylrmeasqgggdntsggd.nthg.......gdnadk...l DRTS_PLAVN nyirlkwkrdkyik.......ennvk...vntdg...ip....sidk...l AAV33644 kyeqlkwkreryllreasggsddtlqtgd.ntngsghtvgmgddttk...l AAV33645 kyeklkwkrerylqrevsggsgdt.hsgd.ntngsgdavgtgdnntk...l ## 1SEJC ...........................................s.nk.... #=GR 1SEJC SS ...........................................C.CC.... ## Phi/Psi: ...........................................G.G1.... #=GR 1SEJC LI ................................................... #=GR 1SEJC NP ................................................... #=GR 1SEJC GR ................................................... #=GR 1SEJC SA ...........................................7.82.... ## Hydrophobic: ...........................................-.--.... 1QZFD ...........................................s.nk.... #=GR 1QZFD SA ...........................................7.82.... #=GR 1QZFD S2 ...........................................7.82.... AAC47229 ...........................................s.nk.... ## 48 CAI76538 k............................................ekhpga EAN31856 k............................................ekhpga EAR85731 k..........................................g......l DRTS_TRYBB .............................vk..ps....p...s..k.... AAX78868 .............................vk..ps....p...s..k.... DRTS_TRYCR .............................vk..ps....p...a..k.... AAK71184 .............................vk..ps....p...a..k.... AAK71177 .............................vk..ps....p...a..k.... Q95NI3_TRYCR .............................vk..ps....p...a..k.... Q95NT2_TRYCR .............................vk..ps....p...a..k.... DRTS_LEIAM k.............................k..p.....pt..d.kk.... DRTS_LEIMA k.............................k..p.....pt..e.kk.... AAA29272 k.............................k..p.....pteeea.q.... Q8MXB7_LEITR k.............................k..p.....pt..e.kk.... Q8MQV1_LEICH k.............................k..p.....pt..e.kk.... DRT1_ARATH ........................................s..s..k.... DRTS_SOYBN .......................................p...g..k.... Q2R481_ORYSA .......................................p....v.k.... DRTS_MAIZE .......................................p....v.k.... #=GC RF ................................................... #=GC SS_cons ...........................................C.C-.... #=GC seq_cons ...........................................G.-K.... #=GC LI_cons ................................................... #=GC AS_cons ................................................... #=GC SA_cons ...........................................8.82.... ## Seq_cons2 xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxGxxKxxxx ## Hydrophobic: ...........................................-.--.... ## Fourth section (73 pos; 209 total) 1U70A QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.RG............a................. #=GR 1U70A SS EE.EEEEEHHHHHGGGGGGGSCCCEEEEEEC.CCCC...CCC.CC............C................. ## Phi/Psi: EE.EEEEEHHHHGGEEGGGeEEELEEEEEEC.CCEG...EEE.CC............E................. #=GR 1U70A LI .........*................................................................. ## ^ this one looks to be binding to one or more Ps in NADPH (esp non-pyro); other is backbone N ## h-bonding to pyro, possibly side-chain binding to other pyro #=GR 1U70A NP ........................*..............*................................... #=GR 1U70A GR ............................................G.............................. #=GR 1U70A SA 30.0000136204314773120450000000.7727...741.92............0................. ## Hydrophobic: --.++++----++-+------+---+-+++-.--+-...---.--............?................. DYR_RAT QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.QG............a................. DYR_MESAU QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.QG............a................. Q78EH1_9RODE QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.QG............a................. ## 86 1U72A QN.LVIMGKKTWFSIPEKNRPLKGRINLVLS.RELK...EPP.QG............a................. #=GR 1U72A SS EE.EEEEEHHHHHGGGGGGGSCCCEEEEEEC.CCCC...CCC.CC............C................. ## Phi/Psi: EE.EEEEEHHHGGGEECHGeECELEEEEEEC.GHEG...EEE.CC............E................. #=GR 1U72A NP ........................................................................... #=GR 1U72A GR ............................................G.............................. #=GR 1U72A LI ..............**..*..*..*.................................................. ## ^ as per 1U70A #=GR 1U72A AS ........................................................................... #=GR 1U72A SA 30.0000125204315784120740100001.7738...630.83............1................. ## Hydrophobic: --.++++----++-+------+---+-+++-.--+-...---.--............?................. 1PD8A QN.LVIMGKKTWFSIPEKNRPLKGRINLVLS.RELK...EPP.QG............a................. #=GR 1PD8A SS EE.EEEEEHHHHHHHGGGGGSCCCCEEEEEC.CCCC...CCC.CC............C................. #=GR 1PD8A GR ............................................G.............................. #=GR 1PD8A SA 40.0000035104315672120740000000.7628...630.83............1................. ## Hydrophobic: --.++++----++-+------+---+-+++-.--+-...---.--............?................. 1DHFB QN.LVIMGKKTWFSIPEKNRPLKGRINLVLS.RELK...EPP.QG............a................. #=GR 1DHFB LI ..............**..*..*..*.................................................. #=GR 1DHFB AS ........................................................................... ## 1DHFA SA 4X.0XXX1261X4415564110540000X00.6726...630.54............1................. #=GR 1DHFB SA 30.0000136104415773120740000000.8616...631.93............1................. #=GR 1DHFB S2 30.0BBB1361044157731207400B0B00.8616...631.93............1................. XP_001110551 QN.LVIMGKKTWFSIPEKNRPLKGRINLVLS.RELK...EPP.QG............a................. XP_001134992 QN.LVIMGKKTWFSIPEKNRPLKGRINLVLS.RELK...EPP.QG............a................. XP_851329 QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RDLK...EPP.QG............a................. XP_536308 QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RDLK...EPP.QG............a................. DYR_PIG QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.QG............a................. DYR_BOVIN QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.KG............a................. P00376 QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.KG............a................. Q29RI1_BOVIN QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.KG............a................. PLACENT QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.QG............a................. #=GR PLACENT SA 30.0000035104415571130450000000.6626...630.45............0................. ## POSS1: QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.QG............A................. ##nonrot.full2 3B.BBBB0351B44145811304500BBB00.6625...630.45............0................. ##mmtp.full 3B.BB0B0341044155711304500BBB00.6626...630.45............0................. ##mmtp.fullSS EE.EEEEEHHCHHHEEGGGEECCLEEEEEEC.CHEG...EEE.CC............C................. ## POSS2: QN.LVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.QG............A................. XP_001363618 QN.LVIMGKKTWFSIPEKCRPLKDRINVVLS.RELK...EPP.QG............a................. ## 8DFR0 QN.AVIMGKKTWFSIPEKNRPLKDRINIVLS.RELK...EAP.KG............a................. #=GR 8DFR0 SS EE.EEEEEHHHHHHCTTTTCSTTTTEEEEEE.CCCC...CCT.TT............T................. ## Phi/Psi: EE.EEEEEHHHCGGEEGGGeEECLEEEEEEC.GGEG...ECC.CC............E................. ## ^ is residue down as both sheet, helix #=GR 8DFR0 NP ........................*.................................................. #=GR 8DFR0 GR ............................................G.............................. #=GR 8DFR0 SA 30.0000136204316585120740000000.8729...720.82............0................. ## Hydrophobic: --.?+++----++-+------+---+-+++-.--+-...-?-.--............?................. 1DR10 QN.AVIMGKKTWFSIPEKNRPLKDRINIVLS.RELK...EAP.KG............a................. #=GR 1DR10 SS EE.EEEEEHHHHHHCTTTTCSTTTTEEEEEE.CCCC...CCT.TT............T................. ## ^ is residue down as both sheet, helix #=GR 1DR10 LI ..........*.......*.............*.......................................... ## ^ as per 1U70A ## Phi/Psi: EE.EEEEEHHHHGGEEGGGeECCLEEEEEEE.GGEG...EEE.CC............C................. #=GR 1DR10 GR ............................................G.............................. #=GR 1DR10 SA 30.0000126204316585120640000000.8726...721.82............1................. ## Hydrophobic: --.?+++----++-+------+---+-+++-.--+-...-?-.--............?................. AGA QN.AVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EAP.KG............a................. #=GR AGA SA 40.0000034104315482131650000010.7738...720.63............0................. ## AGfullSA2 4B.B0BB0341042154821316500BBB10.7738...720.63............0................. ## AGfull2SA2 4B.B0B00342043254821316400BBB10.7738...720.63............0................. ## AG: QN.AVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EAP.KG............A................. ## AI: QN.AVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EAP.KG............A................. ## PG: QN.AVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.KG............A................. PGV QN.VVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.KG............a................. #=GR PGV SA 40.0000034105315582131650000000.7738...540.63............0................. ## PGVYSfullSA2 40.B0B00341053155821315500BB000.7728...540.53............0................. ## PGVYSfull2S2 40.B0B00341053255831416500B0000.7738...540.62............0................. ## PI: QN.AVIMGRKTWFSIPEKNRPLKDRINIVLS.RELK...EPP.KG............A................. ## ^ V also used for some Q5U543_XENLA KN.VVIMGRKTWFSIPEKNRPLKERINIVLS.KELK...EPP.TG............a................. ENSXETP49617 KN.VVIMGRKTWFSIPEKNRPLKERINIVLS.KELK...EPP.TG............a................. AAK01951 KN.VVIMGRKTWFSIPAAHRPLKNRINIVLS.RELK.t.-AP.EG............a................. CAM14042 KN.VVIMGRKTWFSIPAAHRPLKNRINIVLS.RELK.t.-AP.EG............a................. NP_571850 KN.VVIMGRKTWFSIPAAHRPLKNRINIVLS.RELK.t.-AP.EG............a................. XP_001176553 -N.AVIMGRKTWDSIPEKFRPLKDRVNVVLS.NSL-.t.ECPp-G............a...........d..... ## EED: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## ^ I suspect this should probably be an A, not a deletion! ## EEK: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## KED: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## KEK: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## K_D: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## K_K: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EED: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _E_SKFED: KN.-VIMGRKTWESIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _E_GKFED: KN.-VIMGRKTWEGIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EE_D: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EAED: KN.AVIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EASKFED: KN.AVIMGRKTWESIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EAGKFED: KN.AVIMGRKTWEGIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _E_EDQ: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ES KN.-VIMGRKTWESIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............a................. #=GR ES SA 40.-000044105314774251630100000.6726.9.605.-5............1................. ## S2: 40.-000044105314774251630100000.6726.9.605.-5............1................. ## _E_GKFEDQ: KN.-VIMGRKTWEGIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EAEDQ: KN.AVIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EASKFEDQ: KN.AVIMGRKTWESIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EAGKFEDQ: KN.AVIMGRKTWEGIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _EEK: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _KED: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _KE_D: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _KAED: KN.AVIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _KAEDQ: KN.AVIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _KASKFED: KN.AVIMGRKTWESIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _KASKFEDQ: KN.AVIMGRKTWESIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _KAGKFED: KN.AVIMGRKTWEGIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............A................. KAG KN.AVIMGRKTYEGIPEKFRPLKDRINIVLS.RNLK.t.EAP.-G............a................. ## Note that the above is the correct alignment by structal._KAGKFEDQ.loop.13-27.full2.new.reduce3.ent.1J3IA.GCG.txt ## ^ This should be a Tyr if have a Gly 2 later (53,55) - probable H-bonding #=GR KAG SA 50.0000045204425675142730100000.6737.8.615.-3............1................. ## S2: 50.00B0045204425675142730100000.6737.8.615.-3............1................. ## _KEK: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _K_D: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. ## _K_K: KN.-VIMGRKTWESIPE--RPLKDRINIVLS.RNLK.t.EAP.-G............A................. XP_973338 KN.VVLMGRKTWDSIPPKFKPLHQRFNFIMS.RAG-..vE-L.EG..yk........d................. ## end area here and below has problems ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ !!! EAL28532 RN.VVIMGRKTYFGVPASKRPLPERLNIVLS.TTLK..pAELpS-............d................. DYR_DROME QN.AVVMGRKTYFGVPESKRPLPDRLNIVLS.TTLQ.e.SDLpKG.............................. AAA19051 QN.AVVMGRKTYFGVPESKRPLPDRLNIVLS.TTLQ.e.SDLpKG.............................. XP_393902 RN.VVLMGRRTWESIPKENRPLKNRINIVLT.SQ-S..l-DY.-G.........n..d................. Q7Q0L5_ANOGA RN.AVIMGRKTYFGVPESKRPLPERLNIVLT.RNAA..aYTFp--........p...d................. DYR_CAEEL_1 RN.AVLMGRKCWESIPVTRRPLAGRLNIVLS.RQLP..aQKS.D-............d................. Q61DT5_CAEBR_1 RN.AVLMGRKCWESIPESRRPLPGRLNIVLS.RQLE.k.QNT.D-............n................. DYR_CAEEL_2 RN.AVLMGRKCWESIPVTRRPLAGRLNIVLS.RQLP.a.QKS.D-............d................. Q61DT5_CAEBR_2 RN.AVLMGRKCWESIPESRRPLPGRLNIVLS.RQLE.k.QNT.D-............n................. ## ## 1100_SVFQ RN.AVIMGRKTWESIPEKFRPLPNRINIVLS.RNAK..vEEL.-G............D................. ## 1111_GTF RN.AVIMGRKTWESIPEKFRPLPNRINIVLS.RNAK.t.EEL.-G............d................. ## 1111_GVF RN.AVIMGRKTWESIPEKFRPLPNRINIVLS.RNAK..vEEL.-G............D................. 1111_STF RN.AVIMGRKTWESIPEKFRPLPNRINIVLS.RNAK.t.EEL.-G............d................. ## 1111_SVF RN.AVIMGRKTWESIPEKFRPLPNRINIVLS.RNAK..vEEL.-G............D................. ## ## 1111_chars2 RN.AVIMGRKTWESIPEKFRPLKNRINIVLS.RNLK.t.EEL.-G............N................. ## AAQ02615_1 QN.AVIMGRKTYVGIPAKFRPLSNRVNIVIS.TNAN..lRKE.E-si......p...d...........s..... AAQ02617_1 QN.AVVMGRKTYVGIPAKFRPLSNRVNIVIS.TNAN..lRKE.E-si......p...d...........s..... AAQ02619_1 QN.AVIMGRKTYVGIPAKFRPLSNRVNIVIF.TNAN..lRKE.E-si......p...d...........s..... AAQ02621_1 QN.AVTMGRKTYVGIPAKFRPLSNRVNIVIS.TNAN..lRKE.E-si......p...d...........s..... AAQ02615_2 QN.AVIMGRKTYVGIPAKFRPLSNRVNIVIS.TNAN..lRKE.ES.i......p...d...........s..... AAQ02617_2 QN.AVVMGRKTYVGIPAKFRPLSNRVNIVIS.TNAN..lRKE.ES.i......p...d...........s..... AAQ02619_2 QN.AVIMGRKTYVGIPAKFRPLSNRVNIVIF.TNAN..lRKE.ES.i......p...d...........s..... AAQ02621_2 QN.AVTMGRKTYVGIPAKFRPLSNRVNIVIS.TNAN..lRKE.ES.i......p...d...........s..... DYR_ENCCU_1 SN.AVVMGRRTWDSIPSRFRPLANRINVVLS.R-GP..aRST.E-............n................. DYR_ENCCU_2 SN.AVVMGRRTWDSIPSRFRPLANRINVVLS.R-GP.a.RST.EN.............................. EAK84413 RN.AVIMGRKTWASIPPKFRPLAGRFNVVIS.RTSS..aTDL.-G.i....r.pelia.clhcihpnsdpdsnd. BAC75955 RN.AVVMGRTTWESIPEKFRPLPNRVNVVVS.RNEN.y.ELEp-Gk........e.ps.......p........m DYR_CRYNE QN.VVIMGRKTWESIPSRFRPLKNRRNVVISgK-GV...D-L.-Gta.......e..n...........s..... # # 10100_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # 10101_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # 10110_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # 10111_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # 11100_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # 11101_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # 11110_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # 11111_chars2 RN.VVIMGRKTWESIPAKFRPLPNRINIVIS.RNAK.t.DELp-G............N................. # poss remove: ^ and/or perhaps next should be D? Yes. ## Should the initial M in the below be back one (align vs l et al) and M be a gap? !!! # # 0010_KD RN.VVIMGRKTWESIPPKFRPLKNRINIVIS.RNSK.T.DEL.DG............N................. # 0010_KP RN.VVIMGRKTWESIPPKFRPLKNRINIVIS.RNSK.T.DEL.DG............N................. # 0010_QD RN.VVIMGRKTWESIPPKFRPLKNRINIVIS.RNSK.T.DEL.DG............N................. # 0010_QP RN.VVIMGRKTWESIPPKFRPLKNRINIVIS.RNSK.T.DEL.DG............N................. # 0011_KD RN.VVIMGRKTWESIPAKFRPLPNRINIVLS.RNSK.T.DEL.EG............D................. # 0011_KP RN.VVIMGRKTWESIPAKFRPLPNRINIVLS.RNSK.T.DEL.EG............D................. # 0011_QD RN.VVIMGRKTWESIPAKFRPLPNRINIVLS.RNSK.T.DEL.EG............D................. # 0011_QP RN.VVIMGRKTWESIPAKFRPLPNRINIVLS.RNSK.T.DEL.EG............D................. # ^ D doesn't work here with L right before... I note "G" below. DYR_SCHPO_1 MN.VVIMGRSCYDSLPKKNRPLKDRINIVIT.RNSN.y.NF-.-G.ltkkekmpe..n................. DYR_SCHPO_2 -N.VVIMGRSCYDSLPKKNRPLKDRINIVIT.RNSN..yN-F.-G.ltkkekmpe..n................. DYR_PNECA MN.VVLMGRKTWESIPLQFRPLKGRINVVIT.RNES..lD-LgNG.............................. AAF14071 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. AAL25720 MN.VVLMGRKTWESLPERFRPLKGRINVVIS.RQEV..lD-LgQG.............................. AAT99406 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. AAT99411 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. AAT99412 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. AAT99413 MN.VVLMGRKTWESLPAHSRPLKNRINVIIS.RQEV..lD-LgGG.............................. AAT99417 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84704 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84712 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84716 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84718 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84720 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84722 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84726 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84744 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABB84751 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABF06467 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABF06468 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABF06469 MN.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. ABF06470 -N.VVLMGRKTWESLPAHSRPLKNRINVVIS.RQEV..lD-LgGG.............................. Q6CC38_YARLI_1 KNaVVIMGRTTWDSIPPKFRPLPDRTNIVLTsRPMT...D-ApEE.............................. Q6CC38_YARLI_2 KNaVVIMGRTTWDSIPPKFRPLPDRTNIVLTsR-PM.t.D-ApEE.............................. CAG60823_1 QN.VVIMGRKTWESIPQKFRPLPKRINVVVS.RSFDgelRKVeDG.............................. CAG60823_2 QN.VVIMGRKTWESIPQKFRPLPKRINVVVS.RSFDgelRKVeDG.............................. AAS51350_1 RN.AVVMGRKTWESIPARWRPLPGRLNVVVS.RTYTsp.-WAhDE............n.......gh........ AAS51350_2 RN.AVVMGRKTWESIPARWRPLPGRLNVVVS.RTYT.sp-WAhDE............n.......gh........ DYR_YEAST_1 KN.ALIMGRKTWESIPPKFRPLPNRMNVIIS.RSFKd..DFVhDK............e........r..s..... DYR_YEAST_2 KN.ALIMGRKTWESIPPKFRPLPNRMNVIIS.RSFK.d.DFVhDK............e........r..s..... EDN63566_1 KN.ALIMGRKTWESIPPKFRPLPNRMNVIIS.RSFKg..DFVhDK............e........r..s..... EDN63566_2 KN.ALIMGRKTWESIPPKFRPLPNRMNVIIS.RSFK.g.DFVhDK............e........r..s..... CAA68779_1 KN.ALIMGRKTWESIPPKFRPLPNRMNVIIS.RSFKd..DFVhDK............e........r..s..... CAA68779_2 KN.ALIMGRKTWESIPPKFRPLPNRMNVIIS.RSFK.d.DFVhDK............e........r..s..... CAG86485_1 IN.AVIMGRKTWESIPTKFRPLPGRLNIVLS.RSYVs..HGSnDE............d................. CAG86485_2 -N.AVIMGRKTWESIPTKFRPLPGRLNIVLS.RSYV.s.HGSnDE............d................. ABN65593_1 -N.AVVMGRKTWDSIPARFRPLPDRINIVLS.RSFQ...NETvDT............n................. ABN65593_2 IN.AVVMGRKTWDSIPARFRPLPDRINIVLS.RSFQ.n.ETV.DT............n................. ## DYR_CANAL_1 RN.AVIMGRKTWESIPQKFRPLPDRLNIILS.RSYE.n.KII.DD............n................. DYR_CANAL_2 RN.AVIMGRKTWESIPQKFRPLPDRLNIILS.RSYE...NKIiDD............n................. ## 1J3KA QN.VVVMGRTSWESIPKKFKPLSNRINVILS.RTLK.k.EDF.DE............d................. #=GR 1J3KA SS CC.EEEEEHH-HHHHGGGGGSCCCCEEEEEC.CCCG.G.GGG.CC............C................. ## ?Cap IIa?: ^^ ^ ^ ## ?Cap VIIa?: ^ ^^ ^ ## Phi/Psi: EE.EEEEEHHCGGGEEGGGeECELEEEEEEC.GHEE.G.GGE.GE............C................. #=GR 1J3KA LI ........***..................**.**......................................... #=GR 1J3KA SA 00.0000035104214774130440100010.7725.6.651.92............8................. ## Hydrophobic: --.++++----+--+---+--+---+-+++-.--+-.-.--+.--............-................. 1J3KB QN.VVVMGRTSWESIPKKFKPLSNRINVILS.RTLK.k.EDF.DE............d................. #=GR 1J3KB SS EE.EEEEEHH-HHHHCCCCCSCCCEEEEEEC.CCCC.C.CCC.CC............C................. ## Phi/Psi: EE.EEEEECCHHHHC1HGCeECCLEEEEEEE.GCEE.G.CCC.EH............G................. #=GR 1J3KB LI ........***..................**.**......................................... #=GR 1J3KB SA 10.0000035104313786240550100010.8734.6.672.59............6................. ## Hydrophobic: --.++++----+--+---+--+---+-+++-.--+-.-.--+.--............-................. ## Non-Pro: ........................*.................................................. ## Gly-Req: ........................................................................... 1J3IA QN.VVVMGRTSWESIPKKFKPLSNRINVILS.RTLK.k.EDF.DE............d................. #=GR 1J3IA SA 20.0000025105315874130550100000.7725.6.651.93............8................. #=GR 1J3IA S2 2B.BBBB02510531587413055010BB00.7725.6.651.93............8................. 1J3IB QN.VVVMGRTSWESIPKKFKPLSNRINVILS.RTLK.k.EDF.DE............d................. #=GR 1J3IB SA 10.0000035104314875230650000010.6535.5.782.58............4................. #=GR 1J3IB S2 10.BBBB035104314875230650000B10.6535.5.782.58............4................. DRTS_PLACH QN.IVVMGKASWESIPSKFKPLQNRINIILS.RTLK.k.EDLaKE..y.........d...........n..... Q7RGH7_PLAYO QN.VVVMGKRSWDSIPPKFKPLQNRINIILS.RTLK.k.EDIaNE............dnknnengt......... Q95US9_PLAGA QN.VVVMGRTSWESIPERFRPLVNRINVVLS.RSLK.k.EDI.KG............d................. ## 139 2BL9A QN.VVVMGRSSWESIPKQYKPLPNRINVVLS.KTLT.k.EDV.KE............k................. #=GR 2BL9A SS CE.EEEEEHHHHHHCGGGGGSCCCEEEEEEC.CCCC.C.CCC.CC............C................. ## Phi/Psi: EE.EEEEEHHHHHGEECGGeEEELEEEEEEC.CCEE.G.HGE.HE............E................. #=GR 2BL9A LI .......****..**..............**.**......................................... ## Non-Pro: ........................*.................................................. ## Gly-Req: ........................................................................... #=GR 2BL9A SA 10.0000035204314565020650100000.6614.7.660.71............7................. ## Hydrophobic: --.++++----+--+---?--+---+-+++-.--+-.-.--+.--............-................. DRTS_PLAVI QN.VVVMGRSSWESIPKQYKPLPNRINVVLS.KTLT.k.EDV.KE............k................. DRTS_PLAVN QN.IVVMGKTSWESIPSKFKPLENRINIILS.RTLK.k.ENLaKE..y......s..n................. AAV33644 QN.IVVMGRSSWESIPKQYKPLPNRINVVLS.KTLT.q.EEV.KE............k................. AAV33645 QN.VVVMGRSSWESIPKQYKPLPNRINVVLS.KTLT.y.EHV.KE............k................. ## 1SEJC KN.ALIMGRKTWDSIGR--RPLKNRIIVVIS.SSLP.q.DEA.DP............n................. #=GR 1SEJC SS EE.EEEEEHHHHHHHCC--CCCCCCEEEEEC.CCCC.C.CCC.CC............C................. ## Phi/Psi: EE.EEEEEHCGGGHGLC--EEECLEEEEEEE.GCCC.C.CCC.EG............G................. #=GR 1SEJC LI ......*.*.*...*..--..*..*....**.*.......................................... #=GR 1SEJC NP .................--......................*................................. #=GR 1SEJC GR .................--........................................................ #=GR 1SEJC SA 20.00000361034344--631740100000.7616.4.387.27............2................. ## Hydrophobic: --.?+++----+--+--..--+---+++++-.--+-.-.--?.--............-................. 1QZFD KN.ALIMGRKTWDSIGR--RPLKNRIIVVIS.SSLP.q.DEA.DP............n................. #=GR 1QZFD SA 20.00000261034344--631740100000.7606.4.387.27............2................. #=GR 1QZFD S2 20.0BB00261034344--6317401B0000.7606.4.387.27............2................. AAC47229 KN.ALIMGRKTWDSIGR--RPLKNRKIVVIS.SSLP.q.DEA.DP............n................. ## 87 CAI76538 EN.VIIIGRNTYDSLPESVFPLKNRINIVIS.RNLT...E-VpGG.............................. EAN31856 QN.VIIIGRKTYDSLPEGTFPLKNRINVVIS.RNLT...E-VpGG.............................. EAR85731 QN.AVIMGKNTWEALPKKQQPLKDRLNIVIS.TTMQ.e.GQI.AD.........h..s................. ## ^ ^ I suppose the first one (TRP) _could_ be doing H-bonding from N on ring... DRTS_TRYBB RN.AVVMGRKTWDSLPPKFRPLSNRLNVVLS.RSAT.k.EQLlAG.i......pdp.ikraeaan.d........ AAX78868 RN.AVVMGRKTWDSLPPKFRPLSNRLNVVLS.RSAT.k.EQLlAG.i......pdp.ikraeaan.d........ DRTS_TRYCR RN.AVVMGRKTWDSIPPKFRPLPGRLNVVLS.STLT.t.QHLlDG.l......pdee.krnlha..d..s..... AAK71184 RN.AVVMGRKTWDSIPPKFRPLPGRLNVVLS.STLT.t.QHLlDG.l......pdee.krnlya..d..s..... AAK71177 RN.AVVMGRKTWDSIPPKFRPLPGRLNVVLS.STLT.t.QHLlDG.l......pdee.krnlha..d..s..... Q95NI3_TRYCR RN.AVVMGRKTWDSIPPKFRPLPGRLNVVLS.STLT.t.QHLlDG.l......pdee.krnlha..d..s..... Q95NT2_TRYCR RN.AVVMGRKTWDSIPPKFRPLPGRLNVVLS.STLT.t.QHL