#=GF ID Tox-SGS
#=GF AC PF15651.10
#=GF DE Salivary gland secreted protein domain toxin
#=GF AU Zhang D;0000-0001-8535-7620
#=GF AU de Souza RF;0000-0002-5284-4630
#=GF AU Anantharaman V;0000-0001-8395-0009
#=GF AU Iyer LM;0000-0002-4844-2022
#=GF AU Aravind L;0000-0003-0771-253X
#=GF AU Finn RD;0000-0001-8626-2148
#=GF SE [1]
#=GF GA 25.00 25.00;
#=GF TC 26.60 25.90;
#=GF NC 24.20 21.40;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch -Z 75585367 --cpu 4 -E 1000 HMM pfamseq
#=GF TP Family
#=GF RN [1]
#=GF RM 22731697
#=GF RT Polymorphic toxin systems: comprehensive characterization of
#=GF RT trafficking modes, processing, mechanisms of action, immunity
#=GF RT and ecology using comparative genomics.
#=GF RA Zhang D, de Souza RF, Anantharaman V, Iyer LM, Aravind L;
#=GF RL Biol Direct. 2012;7:18.
#=GF DR INTERPRO; IPR028901;
#=GF DR SO; 0100021; polypeptide_conserved_region;
#=GF CC An alpha+beta fold domain with four conserved cysteine residues
#=GF CC and a conserved [DE]xx[ND] motif. This domain is mainly present
#=GF CC at the C-terminus of RHS repeat-containing proteins in insects
#=GF CC and crustaceans. Although no bacterial homologs have been
#=GF CC identified, the domain architecture suggests an origin from
#=GF CC bacterial polymorphic toxin systems [1].
#=GF SQ 27
#=GS A0A6E8P844_AEDAE/3163-3258 AC A0A6E8P844.1
#=GS A0A1S4KCQ8_CULQU/3095-3189 AC A0A1S4KCQ8.1
#=GS A0A182HF67_AEDAL/3121-3217 AC A0A182HF67.1
#=GS A0A182HF68_AEDAL/3123-3220 AC A0A182HF68.1
#=GS A0A6E8P7V7_AEDAE/3070-3165 AC A0A6E8P7V7.1
#=GS A0A084W8P1_ANOSI/3082-3179 AC A0A084W8P1.1
#=GS Q5XLG6_ANOGA/3122-3215 AC Q5XLG6.1
#=GS A0A1D2MHN7_ORCCI/2050-2155 AC A0A1D2MHN7.1
#=GS A0A2Z5V6W4_9COXI/3596-3684 AC A0A2Z5V6W4.1
#=GS E9HD60_DAPPU/3956-4063 AC E9HD60.1
#=GS A0A8J2RK80_9CRUS/2934-3029 AC A0A8J2RK80.1
#=GS A0A084W8P3_ANOSI/3166-3261 AC A0A084W8P3.1
#=GS E9HNC3_DAPPU/3929-4027 AC E9HNC3.1
#=GS A0A8J2RUX2_9CRUS/3965-4077 AC A0A8J2RUX2.1
#=GS A0A8W8EU36_CULQU/2933-3030 AC A0A8W8EU36.1
#=GS A0A8W8EX59_CULQU/2776-2869 AC A0A8W8EX59.1
#=GS A0A8W8EWM2_CULQU/2865-2962 AC A0A8W8EWM2.1
#=GS A0A182HF68_AEDAL/6246-6343 AC A0A182HF68.1
#=GS Q5XLG7_ANOGA/3146-3243 AC Q5XLG7.1
#=GS A0A6E8P7U5_AEDAE/3116-3210 AC A0A6E8P7U5.1
#=GS A0A182YMR4_ANOST/344-441 AC A0A182YMR4.1
#=GS A0A164SNZ8_9CRUS/398-497 AC A0A164SNZ8.1
#=GS A0A0Q9YVT8_9COXI/686-788 AC A0A0Q9YVT8.1
#=GS A0A499FX22_ANOGA/1457-1554 AC A0A499FX22.1
#=GS A0A1S4FPC9_AEDAE/3122-3219 AC A0A1S4FPC9.1
#=GS A0A8W8EM59_CULQU/2924-3017 AC A0A8W8EM59.1
#=GS A0A084W8P2_ANOSI/3142-3239 AC A0A084W8P2.1
A0A6E8P844_AEDAE/3163-3258 ......lcyspaddn--------------.....TRLICPQRESFVNVFSKLPAFE--EN...S--F...GRDTF..S..NCMPLSWQQHPSVVCDGHETTFIYTPQQD----LRVFELVDGWLLLARIAPAAIKN---lma................
A0A1S4KCQ8_CULQU/3095-3189 .lqncyhfkqsdesi--------------.....-VTKCFSMNSQYTVFTKMYR------...---I...VEDSY..S..FCKPIEFNGNASVVCDGKQSSLVFTPKPSGLG----LDYINGCLMLAMVAPAAFSSI--kn.................
A0A182HF67_AEDAL/3121-3217 .............kl-C-YSPSDDS----.....THVICPQRESIVTVFSKRPAFE----...EINF...GRDTF..S..NCMPLSWQDRSSVTCDGQDSTLIYTPQP----DVRVFDLLDGWLLLARVTPAAIRNV--ka.................
A0A182HF68_AEDAL/3123-3220 ........klcyapd---------S--EG.....NQIICPQRESIVNVFSKSATFD---N...PEVF...GQDLF..S..KCLPLTWHDRPSVVCDGQETTFIYTPIQS----LRVFDMVDGWLLLARIAPAALRNL--ks.................
A0A6E8P7V7_AEDAE/3070-3165 ...............NC-FQLHPNND-GN.....PSIKCYGHHSQTSIHYKTYHAE----...-IT-...-QDRF..Q..SCYPIYYNGIPSVSCEGQESSLLFTSYET----PRLFDHVDGWILLARVIPTAIKNIV-s..................
A0A084W8P1_ANOSI/3082-3179 ...............NCFF-RSSDG--VF.....DRIVCYEQHGFSYVFPHEANGA---A...SFT-...-EDSY..S..RCYPIEYEGSPSVVCSGTSSSYVFTPHAK---PVNYLDHLNGALTLLLVAPAVTRTI--as.................
Q5XLG6_ANOGA/3122-3215 .....ncypvthgel--------------.....NYVNCYSDQGLVTIF---PKVE----...AILQ...SHDEY..R..NCLPLTYDGVRGISCDGEQSTLLAVQIE----PPRLFEYVDSWLLLAHVAPAAVREVK-r..................
A0A1D2MHN7_ORCCI/2050-2155 .cqngawvdrsyvmn--------------.....-GITCLSKLSKMTVFRITTDNDLTREnfgSLHQpfiGGDTFekK..SCAPVDFNGMPSVTCNGQKTNLVYTPYLQDR----LFDNLDANIL--------------lgrtlihl...........
A0A2Z5V6W4_9COXI/3596-3684 ......arhgqaylk--------------.....-GFTCYTQNMQMMIFLKDSYVK----...-LEK...AEDSY..SkkSCRPIEFNGRPSVYCEGKKTNIVYTPEIS------------------------------qrpfeqlneqlmllqvvlh
E9HD60_DAPPU/3956-4063 ...............NC-YSFSSDTDCFD.....DTIVCYGHRGQTKVFSHSPSIDTCPP...PLQQ...DQDTY..R..DCRPIEWHGQPSVTCRGDETTFIHTPYNTNSAAANFFRTVDSWLILAYVTPGIYRETVK...................
A0A8J2RK80_9CRUS/2934-3029 ..........dvsiqNC-HSISP------.....DVIVCYGSHGKTTVFTS--KVN----...----...-RDTY..N..HCRPIEWHGQPSVTCQGEQTTFIHTPYNRNSTAAHLFNAVDGWLILAQATPGIYRELIK...................
A0A084W8P3_ANOSI/3166-3261 ncyrvangdsdgyfv--------------.....---KCFSL-------DSTTSIHPKPD...AILE...AHDTY..R..RCLPLTYDGTPAISCDGERSSLLSAGV----VTPKLIDLVDGWLLLAHITPAAVREA--gr.................
E9HNC3_DAPPU/3929-4027 ...............NCYYSISPDA----.....PVVVCYGYHGKTTVFSHSPRVD----...PLR-...-QDTY..S..HCRPIEWHGQPSVTCRGEETSFIHTPYNRNSGMANLFDAVDGWLMLVQAGPAMYREISK...................
A0A8J2RUX2_9CRUS/3965-4077 ...............NC-YSFSLDVDRVDdtivhDTIVCYGHQGQTKVFSHSPSYETCPP...PIKK...IQDTY..R..DCRPIEWYGQPTVTCRGDETTFIHIPYNTNSAAAYVFGAVDSWLILAHVTPGFYRETVK...................
A0A8W8EU36_CULQU/2933-3030 .......srycyrpt-----------NFK.....NHVICSQPNSQISVYPKAKSFE----...EINF...GQDTF..S..RCMPIHWHGLPSVSCEGERSTFIYTPNDQ----VTVFNYLDGWIMLAGVAPAIFADL--kr.................
A0A8W8EX59_CULQU/2776-2869 ..nciamnpdrsfye--------------.....----CFQSTAKVLLFAQNLSLESGSI...PTG-...----I..D..RCVPLHWHGQPSVGCQGQQFGFIYTPYE----ATKMFSFLDGWLMLARVGLQ-------vvenwr.............
A0A8W8EWM2_CULQU/2865-2962 ..sfqncvptnsdis--------------.....-SYTCYQSTAKVEVFPKEPTGPRAPH...SVV-...---PM..D..GCAPFHWYGRPAIGCEGQDFAFIYTPYETP----KWFSFLDGWLLLVRVGVQI------vgdlk..............
A0A182HF68_AEDAL/6246-6343 ........klcyapd-----------SKG.....NQIICPQRESTVNVFSKSVTFD---N...PEIF...GQDLF..S..RCLPLTWKDRPSIVCDGQETTFIYTPVQS----LRVFDMVDGWLLLARIAPASMRNL--ks.................
Q5XLG7_ANOGA/3146-3243 ...............NCYKIYSEE--HLD.....GMISCFGHSSTVTII---PKFE-S-N...PRIE...NADHY..K..YCMPLTYDGHPSASCEGEWSSLVYTAKE----TARVFDFVDGWILLAQVAPIAWKEI--kl.................
A0A6E8P7U5_AEDAE/3116-3210 ........nchrfvi-------SDD--F-.....SHVECYGLNSRYKIFPK-PNHQ----...-LG-...TEDYY..A..KCFPIEYDGQPAVVCHGKSSNLLFTPEQ----SVDVLDVVNGWLMLALVIPSAMKSI--qq.................
A0A182YMR4_ANOST/344-441 .......nchamprn--------DGGVEG.....NYVNCYSHRSFVTIHPKDEA------...-VLE...AQDHY..R..HCLPLTYNGVPAISCDGQHSTLLAVVQ----EPPNMFAQVDGWLLLARVAPAAVREA--kr.................
A0A164SNZ8_9CRUS/398-497 ..............n-C-VTFSEDA----.....-AVVCYGLDGQTLLFAQSADRS---L...PLEH...AEDTF..R..QCRPIEWNGKPSVTCRGEKTTFIHTPYERTSAAVHLLNAVDGWLLLAYAAPGFYREVGK...................
A0A0Q9YVT8_9COXI/686-788 .lyafctpqlddaep--------------.....PFLFCQGDSFQSFVFPNGEHPD----...-MAG...DNYHF..N..QCRPVDYYGKPSVVCPGEKSTVVLTPKLRERPFENLGGNIALGAVLLYWAKSLYQ----aft................
A0A499FX22_ANOGA/1457-1554 ...............NCFRTNSADN---L.....NTITCYEQHGLSYVFPHNTSNI----...-IGI...TEDHY..S..SCYPIEYNGLLTTACAGTNSSYMYTPYIRP---VNYLDQLNGTLTLLLVAPTVVRNIA-s..................
A0A1S4FPC9_AEDAE/3122-3219 ...........qklc-----YSPDSD--G.....NQIICPQRESTVNIFSKGETFA----...PEAF...GQDLF..S..RCLPLTWHDRPSIACDGEQTTFIYTP-NQN---IRVFDMVDGWLMLARIAPAALRNL--ka.................
A0A8W8EM59_CULQU/2924-3017 ..nciamnpdrsfye--------------.....----CFQSTAKVLLFAQNLSLESGSI...PTG-...----I..D..RCVPLHWHGQPSVGCKGQQFGFIYTPYEA----SKMFSFLDGWLMLARVGLQ-------vvenwr.............
A0A084W8P2_ANOSI/3142-3239 ...............NC-YQLRSEQ-HPD.....GMIACYGH---STVVSILPKQDQNP-...-KIG...LADRY..K..HCLPLTYDGNPSVSCDGEWSSLLYTAQ----EAPRIFDFVDGWLLLAQIAPSVYKELKK...................
#=GC seq_cons ..................................shlhCapppupsplFs+ssshc........hh....spDpa..s..pChPlpapGpPSVsCcGppoohlaTPhpp....splFchlDGWLlLApluPuhh+ph..h..................
//