#=GF ID CBP66
#=GF AC PF19043.4
#=GF DE Nuclear cap binding complex subunit CBP66 C-terminal region
#=GF AU Bateman A;0000-0002-6982-4660
#=GF SE Bateman A
#=GF GA 27.00 27.00;
#=GF TC 87.50 86.20;
#=GF NC 21.10 19.60;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch -E 1000 --cpu 4 -Z 75585367 HMM pfamseq
#=GF TP Family
#=GF CL CL0179
#=GF RN [1]
#=GF RM 3120186
#=GF RT Trypanosome mRNAs have unusual "cap 4" structures acquired by
#=GF RT addition of a spliced leader.
#=GF RA Perry KL, Watkins KP, Agabian N;
#=GF RL Proc Natl Acad Sci U S A. 1987;84:8190-8194.
#=GF RN [2]
#=GF RM 15743819
#=GF RT Novel and essential subunits in the 300-kilodalton nuclear cap
#=GF RT binding complex of Trypanosoma brucei.
#=GF RA Li H, Tschudi C;
#=GF RL Mol Cell Biol. 2005;25:2216-2226.
#=GF DR INTERPRO; IPR043965;
#=GF DR SO; 0100021; polypeptide_conserved_region;
#=GF CC This entry represents the CBP66 component of the trypanosome
#=GF CC nuclear cap binding complex. Trypanosomes have a different cap 4
#=GF CC structure for mRNAs [1]. CBP66 is part of the complex that
#=GF CC recognises this cap. This domain adopts a beta-grasp-like
#=GF CC structure.
#=GF SQ 15
#=GS A0A061IXS3_TRYRA/187-556 AC A0A061IXS3.1
#=GS A0A422NUS2_9TRYP/185-562 AC A0A422NUS2.1
#=GS Q57XW7_TRYB2/191-579 AC Q57XW7.1
#=GS A0A422P1X4_TRYRA/187-564 AC A0A422P1X4.1
#=GS A0A0N0DV58_LEPPY/195-676 AC A0A0N0DV58.1
#=GS Q4Q9X1_LEIMA/187-605 AC Q4Q9X1.1
#=GS V5D8Y9_TRYCR/186-556 AC V5D8Y9.1
#=GS A4HE65_LEIBR/191-619 AC A4HE65.1
#=GS A0A1X0NNM1_9TRYP/207-623 AC A0A1X0NNM1.1
#=GS A0A0S4J8F6_BODSA/217-520 AC A0A0S4J8F6.1
#=GS A4I1G5_LEIIN/187-609 AC A4I1G5.1
#=GS F9WHT0_TRYCI/190-573 AC F9WHT0.1
#=GS S9TU24_9TRYP/191-619 AC S9TU24.1
#=GS K2NPM4_TRYCR/186-558 AC K2NPM4.1
#=GS Q4DTX4_TRYCC/186-556 AC Q4DTX4.1
A0A061IXS3_TRYRA/187-556 .................ls--QMTTEERALVDRVVCSTRHAEESVVPPEMRIDF..SLHVPITRDEAEAL....VDGM.TGG-----.-----TSPPATVLARVE...........AAGGG....HAGPYFVKFGFPGG......APWDWSLHDEAEGLLQLRRRVPFPANGAPTPLERDIFCQELLYHVNQMNRFDTLPAALRALAHSPKVREALQCHLKN--..........-AAGR-ECEAKGAGG...GDIATLELCIRPWLFLPTAGVEVGVLLESGGEQVRGVVQRHGALRLMTCFSFLQKHG.----.................................................LNFSRYAVPGN..GQDVDAETFLEAEMRRVETAVKRDVERLRRHL.......RQRVSL-GELPPHAPWCFQLA-VTSA...................ATPPSLMAVCE.DAAAMRCVVLSMKPYWEALEE........FAAMHPAGR-R---.-GEAGSGGATDVTWNTKRHTYVALFP----------as..................
A0A422NUS2_9TRYP/185-562 .................ls--QMAPEERALVDRITCSTRCAEENVVPPGMGMEF..SLHVPLTRDEAEAL....VGG-.--------.--ATGVPPPAAVLSRVE...........AACAG....HAGPYFVKFGFPGG......APWDWSLHDEAEGLPQLRRRVPFPANGAPTPLERDIFCQKLLYHLNQMNCFDTPAAALRALAQSPKVREALRCQLKT--..........--AAGHEGEAEEAGG...GDAAALELCVRPWIFLPTAGVEVDVLLEEGGERVRGVVQRHGSLRLMTCFSFLQKHE.----.................................................MDFSRYAVLGS..GHDVDAEAALEAEMRRVEAVVKRGVEGLRQHL.......RQRMSREGDLPAHAAWCFRLA-VTPT...................AAAPSRMAACE.DAAAMRCAVLSMRPYRAALEE........FAALHAAPA-----.RGEAGGGGVTDVAWNTRRHTYVALFPRELLARLRA-s...................
Q57XW7_TRYB2/191-579 ..................k-QPMSSEELTRLRHVTHNTKCGEEQLVPTDMKFDF..SVYVPVAYKEAVAL....VDSE.GTG-----.---GSNRLVDDVIKRVE...........AACSA....YSGPYFVKFAFCGG......APWDWSLHNTSLGLSALRKRAPFPTNGAPTPLERDIFTQQLLYHMNQMNRFDTIALAVHALAKSPKVRRALQRELEY--..........---DQSLTSCNDKGD...KDAVSLHLCVRPWLFLPTVGVEATVFLEGGGEVLRGIVQRKGAVRLMISHALLRQQE.EKQG.................................................MDFSRFAVLGS..GQDLEAESYLESEIQRMSLLVKRSAQRLQQYI.......RQQRDR---FPPGAAWCVHIA-VSPPplvpfrpq...qygsgveqQKGECKQEESE.ERVTSKCVVLSLQEYQPAYEE........HVALHGELR-----.--------AGEVMWNTRKHGYVALIPREMLERLRL-e...................
A0A422P1X4_TRYRA/187-564 .................ls--QMTTEERVLVDRVVCSTRCTEESVVPPEMRIDF..SLHVPITRDEAEAL....VDGT.T-------.---GGTSLPATVLARVE...........AARGG....HAGPYFVKFGFPGG......APWDWSLHDEAEGLSQLRRRLSFPANGAPTPLERDIFCQELLYHVNQMNRFDTLPAALRALAQSPRVGEALRHHLKN--..........--AAGRECEAEETGR...GDIGTLELCIRPWLFLPTAGVEVGVLLEGGGEQVRGVVQRHSALRLMTCFSFLQKHE.----.................................................LNFSRYAVPGS..GQDVDAETFLEAEMRRVETAVKRGVEGLRQHL.......RQRVSL-GKLPPHASWCFQLA-VTSA...................ATPPSLMAVCE.DAAAMRCVVLSMKPYWEALEE........FAAMHPAGRRG---.--EAGSSGATDVTWNTKRHTYVALFPRELMERLKA-s...................
A0A0N0DV58_LEPPY/195-676 ..................a-AHLSAEQQQTVQRLLACVKDARAALAPVSLELKG..CIYVPVTEAEMEAI....FGSQtDSTTGNHS.SSVHQETMYQTVLQRVEaam.....asaSSASS....AGVSYFPRLSCPGG......APSDWAM-ESEEGRRALQRDCPLPANGAPTPLERDLYIQKLWYHMNQLHRCRTAPEVMRRLRGSRRVRDALRRRVSDKHaaa...shflPSHPHANAALASPSE...AAAAPLYICLQPWLYLPTVGCEVSAFVERGGRRVRGVVQRYGQLRLMTSAALLATST.SSRTrtrgeeekegrkgaeagrspnaeptspqqregrgddadgdaaddsgdvdALLSRYAVLDS..GNDSLAEASLAKELRAFQRCIAAAVNELRRHL.......QQHPSSTGG--EGAAWCVHLAVL-PLppstsmss...ssslqsapVTDPAGVAASS.SPAAPSVVLLSCSAYQRALEEc.....pmYSALAPSTSSSAAAeAADAPRPGQVEVTWNTQRHPYIPLFSREVLEKLRAD....................
Q4Q9X1_LEIMA/187-605 ..................g-ARLTCEQEAVVRHLLSSAEAARAALTPASMAMKD..CTYVPVSAEEMGLLsqlaCEAL.SSAPLPAF.ETLEAHPTYQAVLQRIDdalq...aqraAAVAG....ESMTFFPRLSCPGG......APWDWSV-ESEDGRRLLRQRCPLPANGAPTPLERDVYTQRLWYHMNQLNRCHSARDVLRMLCGSHRAREALRRHSEAIDg........gDARTHASSSSLPSSSp.aTKAAGLTICLQPWLYLPTVGCEVTAYLERGGRRVRGVVQRYGQVRLMTSATLLASAS.AVVGdaa...........................................hvdALLARYAVLES..ATDAAAEEDLTGELRALQRSFASAVGDVAHHL.......QTHPDSIGG--DGAAWCVHLAAVLTP...................SVAPAAGPPPP.------VTLLSASPYQRALEEc.....smYSSLAPPIRGDDMA.ASAATAPAKVDVTWNTQRHPYISLFSRSVLEKLRAD....................
V5D8Y9_TRYCR/186-556 ..................v-HHMTPEERALVHRISCSTRRAEECVIPAEMRIDF..SLHVSLTRDEAEAL....VDD-.--------.---AAGVVPASVLQRVE...........TACAG....HDGPYFVKFDFTGG......APWDWSLHDDREGLPRLRQRLPFPENGAPTPLERDIFCQQLLYHLNQMNRFETISSALRALAHSPKVQEALRRVAQN--..........---PRVHEGKPEEGE...GDAVALGLCIRPWLFLPTVGVEVSVLLEGGGDRVQGIVQRRSALRLMTCFSFLQKHG.----.................................................MDLSRYAVIGS..GQDVYAEESLETEMRRVEKAVKRAVEGLRQHL.......RWQVSRGGQLPSNAAWCFQLA-VMP-...................STSPSSVAAGE.DAAEMRCVVLSMKPYEEAFEE........FTAMHPSLM-----.----RDEAVTDVIWNTKRHTYVALFPRELMERLKKE....................
A4HE65_LEIBR/191-619 ..................s-AHLTSEQQATVRHLLSSVEASRAALTPVPMIMKN..CTYVPVSAEEMEMLnrlaCEAP.SCTSLPAF.ESLEAHPTYQTLLQRIDdalqsqraatvVTAGG....ESTAFFPRLGCPGG......APWDWSV-ESEEGRRLLRQRCPLPANGAPTPLERDLYTQRLWYHMNQLNRCHSARDVVRMLCGSRRVREALRRCSEAINdasvpspsgtRADDKAQTNVSPSSS..tTKASGLTICLQPWLYLPTVGCEVTAYLERGGRRIRGVVQRYGQVRLMTSATLLASAF.AVVGdaa...........................................dpdALLARYAVLES..ATDAAAEEDLTRELRVFQRSFASAVGDVALHL.......QTHSNSVGG--DGAAWCVHLAVVLTP...................NSVPTAGRLPS.------VALLSASPYQRALEEc.....smYSSLAPPSRGADPT.ASTETRPTNVDVAWNTQRHPYIPLFSRDLLEKLRA-g...................
A0A1X0NNM1_9TRYP/207-623 ..................e-AEMTREEMEVVRNVTRSTRLTEELLVPAEMQLDF..SVYVSITHEEALSL....VGNT.GSTACSNT.IAATATAVRANIVKRVK...........ESCST....YKGPYFIRFAFPGG......APWDWSLHDESEGLPQLRQRAPFPENGAPTPLERDLFCQKLLYHVNQMNKFTTIDAALRAFETSPRVCEALHQYLQQEN..........DQKDKKEKNSNEDSS...GTSTMIELCIRPWLFLPTADMETVVLLEKGGEYIRGVAQRHAALRLMTSATFLQQHQ.----.................................................LDFTRYAVIGN..NEDPEAEDALEMELRRVGTVVKRGVDTLRRHV.......RQQCTR-EKIPSSSAWCIQLAVVIPDglgmeennnsgnsnvngpvSTTTVSGENST.DVGTMHTVVLSLKPYQTALEE........FTAIYGTRQDVSSA.GNDDNDRVRKEVLWNTKKHPYISLFSRELMERLKRD....................
A0A0S4J8F6_BODSA/217-520 ssssstrrllpqtlrghsw----------------------ETAMIPESYRVAR..-RFVSVGATVLREA....VTEL.RAATTSAItSSFAQQPAIQQFLATFAaa......fpsPAAPS....ESSSWFVKLENLGSatssflAPWDWALHDASVGVPLLQSVAPLPPNGIPTPLERDRFLETLLDAMNRT----SNRFVLAANAGEDAVRALGLNMLRA--..........LASSPKTFAAITSSS...SSHSECRLVLEPWVRIPSVLHESVFMFREG--KLRSVLQRRGNVRYCTRDDGKQLAQ.RILE.................................................DPLRAAASAIS..AQLKQTFHDNEAELQNVSVAV-----------.......--------------------------...................-----------.---------------------........--------------.------------------------------------rcvcvpqrhslsspsptags
A4I1G5_LEIIN/187-609 ..................g-ARLTREQQAVVRHLLSSAEAARAALTPASMAMKD..CTYVPVSAEEVELLsqlaCEAP.SSASLPAL.EKLEAHPTYQAVLQRIDdalqarraaaaAAVAG....ESMAFFPRLSCPGG......APWDWSV-ESADGRRLLRQRCPLPANGAPTPLERDVYTQRLWYHMNQLNRCHSARDVLRMLCGSHRVREALRRRSEAIDs........gEAQTHALSSPLPSSSspaTRAAELTICLQPWLYLPTVGCEVTAYLERGGRRVRGVVQRYGQVRLMTSATLLASAS.AVVGdaa...........................................ntdALLARYAVLES..ATDAAAEEDLARELRALQRSFASAVGDVALHL.......QTHSDSIGG--DGAAWCVHLAVVLTP...................SVAPAAGPPPP.------VALLSASPYQRALEEc.....smYSSLAPPIRGDDTA.ASAATAPAKVDVTWNTQRHPYIPLFSRSVLEKLRAD....................
F9WHT0_TRYCI/190-573 ..................q-HSMTAEERGLVDRITNNTRCAEEYIVPPEMKLEF..SIFVSVTREESLAL....VGTG.AP------.--DESRGVVDAVVQRVE...........AACAA....HPGPYFVKFAFPGG......APWDWSLYDEERGLRELRRRTPFPPNGAPTSLERDIFTQQLLYHMNQMNRFETIASAIHALSTSHRARQALHRQLEK--..........---GHCGNAGKDDADv.eGEEASLELCVRPWLFLPTVGVEATIFIESGGELLRGIVQRRGAVRLMTSYALLHQKAhDTLK.................................................AAFTRFAILGS..GDDVEAESCLEAEIHKLSTLLKRAAQRLQHFI.......RRQQQH-AKLAPGASWSVQVA-VSPPpdd.............vaqSEQAAARQEGV.EDPVSKCVVLSLQEYQTSLEE........HTALHGEVR-----.--------GGGIMWNTKKHGYIPLIPREVMEQLS--es..................
S9TU24_9TRYP/191-619 .................fa--QLSPTERATVTALERSLPQSIAALVPPHGALHLvpEVNVALTAEELAWL....Q---.--------.--APAAAPPADLVGRVE...........AACAAgglaAGAPRFLRLSCPGG......APWDWAL-QDPAGLARLRALCPLPANGAPTPLERDLLLQKLLYYLNQLNRFTSVAAGLAALRASAKVRRALAQHVEEAA..........GRRSAAQRHRAEAEG...EGEEVVHLCVRPWLYLPTVGCEVTVFLEQGGAVLRGAVQRRGEVRLMASAAQLVAAL.A--Gptssaapdg...............................leaaapavrQVLDRCAQLGRegGGDEDAPQQLEAELLRHDGLFGRAVQVLQRYItketsrrQQHVTDLEVLPSQASWCLQLALAQPD...................PLRPAAAGRGEgGEGQRRVVVLSCQPYQRALEEcsmynyilRSSTAASEGDGSAG.AKSGTHAAPVKVGWNTQHHPFVSLFERSVLESLRP-e...................
K2NPM4_TRYCR/186-558 ..................v-HHMTPEERALVHRIACSTRRAEECVIPAEMRIDF..SLHVSLTRDEAEAL....VDD-.--------.---AAGVLPASVLQRVE...........TACAG....HGGPYFVKFDFPGG......APWDWSLHDDREGLPQLRQRVPFPANGAPTPLERDIFCQQLLYHLNQMNRFDTISSALRALAHSPKVREALRRVVQT--..........-PTVCGGKPEEEEEE...GNAVALGLCIRPWLFLPTAGMEVSVLLEGGGDRVRGIVQRRSALRLMTCFSFLQKHG.----.................................................MNFSRYAVLGS..GQDVYAEESLEAEMRLVEKVVKRGVEGLRQHL.......RQQVSHGGQLPSNAAWCFQLA--VTP...................STSPSPVAACT.DAAEMRCVVLSMKPYEEAFEE........FTAMLPSVL-----.----RDEAVTDVIWNTKRHTYVALFPRELMVRLRE-v...................
Q4DTX4_TRYCC/186-556 ..................v-HHMTPEERALVHRISCNTRRAEECVIPAEMRIDF..SLHVSLTRDEAEAL....VDD-.--------.---AAGVVPASVLQRVE...........AACAG....HGGPYFVKFDFPGG......APWDWSLHDDREGLPRLRQRLPFPENGAPTPLERDIFCQQLLYHLNQMNRFETISSALRALAHSPKVQEALRRVAQN--..........---PRVHEGKPEEGE...GGAVALGLCIRPWLFLPTVGVEVSVLLESGGDRVRGIVQRRSALRLMTCFSFLQKHG.----.................................................MNLSRYAVIGS..GQDVYAEESLEAEMRRVEKAVKRAVEGLRQHL.......RQQVSRGGQLPSNAAWCFQLA-VMP-...................STSPSSVAAGE.DAAEMRCVVLSMKPYEEAFEE........FTAMHPSLM-----.----RDEAVTDVIWNTKRHTYVALFPRELMERLKED....................
#=GC seq_cons ..................s.tpMTsEEcAlVc+lssST+pAEEsllPscMcl-F..SlaVslTc-EuEAL....V-s..ss..........sussssssVLpRVE...........AAsuG....auGPYFVKFuFPGG......APWDWSLHD-pEGLspLRpRsPFPANGAPTPLERDlFsQcLLYHhNQMNRFcTlsuALRALupSs+VREALRRplcs..............ts+spssst-sus...ucAusLpLClRPWLFLPTVGsEVoVhLEpGG-+VRGVVQR+GulRLMTshohLpppt......................................................hshoRYAVLGS..GpDstAEpsLEuElR+lppsVKRuVpsLppHL.......RQpsop.GtlPssAAWChpLA.Vhss...................ussPuussssp.-sut.+sVVLShpPYpcALEE........aoAhtPshp........ttss.ussDVhWNT+RHsYluLFsRElhE+L+t.....................
//