#=GF ID M1E1E6-like
#=GF AC PF21648.1
#=GF DE Integron cassette protein
#=GF AU Bateman A;0000-0002-6982-4660
#=GF AU Lazaro Pinto Beatriz;0000-0001-6837-2941
#=GF SE ECOD:EF19998
#=GF GA 27.00 27.00;
#=GF TC 27.20 27.00;
#=GF NC 26.80 26.60;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch -E 1000 -Z 75585367 --cpu 4 HMM pfamseq
#=GF TP Domain
#=GF RC Paper describing PDB structure 3fy6
#=GF RN [1]
#=GF RM 23349695
#=GF RT Integron gene cassettes: a repository of novel protein folds
#=GF RT with distinct interaction sites.
#=GF RA Sureshan V, Deshpande CN, Boucher Y, Koenig JE, Stokes HW,
#=GF RA Harrop SJ, Curmi PM, Mabbutt BC;
#=GF RL PLoS One. 2013;8:e52934.
#=GF DR SO; 0000417; polypeptide_domain;
#=GF CC This domain family is found in a group of uncharacterised
#=GF CC bacterial sequences from mobile gene cassettes, including the
#=GF CC integron cassette protein from Vibrio cholerae (M1E1E6). This
#=GF CC protein forms a dimer in which each protomer adopts a
#=GF CC two-layered alpha+beta fold with an antiparallel beta-sheet of
#=GF CC five strands that curves around a pair of antiparallel helices
#=GF CC [1]. Its specific function is unknown.
#=GF SQ 12
#=GS A0A2K4ZAW1_9FIRM/193-290 AC A0A2K4ZAW1.1
#=GS A0A073JUM9_9BACI/112-208 AC A0A073JUM9.1
#=GS K7W483_9NOST/2-105 AC K7W483.1
#=GS A0A1V4HE65_9BACL/110-205 AC A0A1V4HE65.1
#=GS A0A428J106_9BACI/187-290 AC A0A428J106.1
#=GS W4QK99_9BACI/186-289 AC W4QK99.1
#=GS A0A1M5SWY6_9FIRM/177-271 AC A0A1M5SWY6.1
#=GS A0A1Y0KM30_9PSED/3-106 AC A0A1Y0KM30.1
#=GS F3ZV42_DESAL/5-112 AC F3ZV42.1
#=GS A0A091AID3_9PROT/2-105 AC A0A091AID3.1
#=GS A0A1H0VI21_9DELT/103-200 AC A0A1H0VI21.1
#=GS A0A0B5ATE6_9BACL/186-289 AC A0A0B5ATE6.1
A0A2K4ZAW1_9FIRM/193-290 krl---MFEVYTRRWGHTDRYRIKRTIDGWDCSHIAIKGKCEKNG------EG......ALFENLHHDCVF.FPED.AVKYGMEELWEAADEGEIGLEELQRRLQQVADWISHV-e..
A0A073JUM9_9BACI/112-208 ..h-EFDFKVFSRRWGNEDVYKIKRIESGWHLSHLSYTGDCK--KDGSPF---......--LYASFTHDSI.NYPE.SLPGYFEWLWEQAQEEGLSYDDVQSSLNQLAEWVN---lce
K7W483_9NOST/2-105 ..i-TITAEIYTPRWGNNDTYTFEFGEQSMSVSMIGPKAVCTYIPGRDPVWSG......DSLEGILRNNLV.HPPV.SFQDLIEHLWNSWRDGDINEAELNKELQEVIVWLNKIT...
A0A1V4HE65_9BACL/110-205 ..h-TFEFPVFSRRWGHKDSYKVTRNEQGWSFS---------FHKNEQGDKTG.....sPALYRFLDHDSI.NYPQ.ELPGYLEWLWIQAEEQGLSHDEVQESINDLADWVS---ace
A0A428J106_9BACI/187-290 .lp--IKLRIYSSRWGHDDIYSVKRTMTGWNFKHLSYDENCS----KDGTLNGd...knDGFFRILAHDSI.QCPNdGVKYALETLWKSADSTGMSIKELEIKLQDIGNWINAV-e..
W4QK99_9BACI/186-289 .sp--LKMKIYSSRWEHNDIYFVKRTMTGWNFKHLSYDVDCSKD-GTLNSMKN......DGFYSILAHDSIqYPYD.GVKYALETLWKTADSTSMTTKELEIKLQDIGDWINAV-e..
A0A1M5SWY6_9FIRM/177-271 ..k-EIDIKIYSRRWGHKDTYSVERTLEGWTVTFHQKK---------VGDKEG......KALIETLEHDFI.NYPH.ELGVFMWHLWNKADSNEMTVEEVEQDLKQIANWINV--ce.
A0A1Y0KM30_9PSED/3-106 ..t-TVDLEIFSPRWGNEDTYTVQLNRDFMEIKMSPRVSRATWIENQDPEWSG......ESIQAIMNNDNI.YPPK.ITQDLFEHVWKEWRNGDINDQQAEAELQEIAKWINAVT...
F3ZV42_DESAL/5-112 ..t-EFQVLLFSPRWGRDDTYNLQFSREKMQID-GPKSAECTWVEDGDPVWTGyqigqgNPLVNIMKNDHI.YPPS.VFVSALEWAWSEWRNTGLNED-IVQEVKGLFEWVNQIT...
A0A091AID3_9PROT/2-105 ..r-IVELKIYSPRWGHHDIYEIELAKDKMTITHNISSAICTWRDNLDPVWSG......NNLEDILRNDAI.YPPA.ILNDLLEHVWEAWRNGYLKDESVDQELHAVEEWLNTIT...
A0A1H0VI21_9DELT/103-200 ..q-EFTFTVFSRRWGHTDTYKMKRIATGWHFSHASVHMSGNCDKDGTP----......-FLYENLNHDSI.NYPE.ELPGYFEWLWDQAAERGLTNKEVQDNLDALGEWVS---lc.
A0A0B5ATE6_9BACL/186-289 ..k-KMKMKIYTNRWGRHDYYTVQRTIEGWIISFLTFQNVKCK-VNGESLDTD......TGFYEILRHDSVqYPKD.GVRYALETLWEEADSTEMSKEVLEKKLNEIAVWISEV-e..
#=GC seq_cons ..p.phchclaSpRWG+cDhYplcRshpGWphoahshps.ssh..stss.hpG......sslhplLpcDsI..sPp.tltshhEaLWcpAcssslspc-lppcLpplucWlNtl....
//