#=GF ID Internalin_N
#=GF AC PF12354.12
#=GF DE Bacterial adhesion/invasion protein N terminal
#=GF AU Gavin OL;
#=GF SE Prosite
#=GF GA 24.10 24.10;
#=GF TC 26.50 25.70;
#=GF NC 22.60 21.60;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch --cpu 4 -E 1000 -Z 75585367 HMM pfamseq
#=GF TP Domain
#=GF CL CL0220
#=GF RN [1]
#=GF RM 12526809
#=GF RT Structure of internalin, a major invasion protein of Listeria
#=GF RT monocytogenes, in complex with its human receptor E-cadherin.
#=GF RA Schubert WD, Urbanke C, Ziehm T, Beier V, Machner MP, Domann E,
#=GF RA Wehland J, Chakraborty T, Heinz DW;
#=GF RL Cell 2002;111:825-836.
#=GF DR INTERPRO; IPR024634;
#=GF DR SO; 0000417; polypeptide_domain;
#=GF CC This domain family is found in bacteria, and is approximately 60
#=GF CC amino acids in length. The family is found in association with
#=GF CC Pfam:PF00560, Pfam:PF08191, Pfam:PF09479. There are two
#=GF CC completely conserved residues (I and F) that may be functionally
#=GF CC important. Internalin mediates bacterial adhesion and invasion
#=GF CC of epithelial cells in the human intestine through specific
#=GF CC interaction with its host cell receptor E-cadherin. This family
#=GF CC is the N-terminus of internalin, the cap domain of the protein.
#=GF CC The cap domain is conserved between different internalin types.
#=GF CC The cap domain does not interact with E-cadherin, therefore its
#=GF CC function is presumably structural: capping the hydrophobic core.
#=GF SQ 22
#=GS A0A5R8QH70_9FIRM/1-55 AC A0A5R8QH70.1
#=GS Q7AP88_LISMO/3-58 AC Q7AP88.1
#=GS A0A5R8QCR1_9FIRM/6-59 AC A0A5R8QCR1.1
#=GS Q8Y8U2_LISMO/1-57 AC Q8Y8U2.1
#=GS INLA_LISMO/3-58 AC P0DJM0.1
#=GS A0A5R8Q796_9FIRM/2-59 AC A0A5R8Q796.1
#=GS A0A1E5GQ73_9ENTE/1-53 AC A0A1E5GQ73.1
#=GS Q8Y5N0_LISMO/1-55 AC Q8Y5N0.1
#=GS Q7AP86_LISMO/2-56 AC Q7AP86.1
#=GS INLH_LISMO/3-58 AC Q7AP87.1
#=GS A0A1H9SDM3_9LACT/1-49 AC A0A1H9SDM3.1
#=GS INLB_LISMO/3-58 AC P0DQD2.1
#=GS A0A5R8QH37_9FIRM/2-59 AC A0A5R8QH37.1
#=GS Q8Y7Y3_LISMO/1-58 AC Q8Y7Y3.1
#=GS A0A5R8QAT7_9FIRM/1-50 AC A0A5R8QAT7.1
#=GS A0A5R8QCS7_9FIRM/4-59 AC A0A5R8QCS7.1
#=GS A0A191HTP3_9FIRM/3-50 AC A0A191HTP3.1
#=GS Q8Y9W0_LISMO/2-59 AC Q8Y9W0.1
#=GS Q8Y4H2_LISMO/1-55 AC Q8Y4H2.1
#=GS A0A5R8QCU0_9FIRM/2-59 AC A0A5R8QCU0.1
#=GS A0A0R2FR41_9LACO/3-57 AC A0A0R2FR41.1
#=GS Q8Y6A8_LISMO/1-56 AC Q8Y6A8.1
A0A5R8QH70_9FIRM/1-55 mkkiriims-----------CMSLIVL.FSLTIMPINH.....VVVSAE..dAVAP.PAAISAIFPDPVVAEYI-r
Q7AP88_LISMO/3-58 .........QRKTSVLHVLLVVTAILG.ISLWVNASHG.....MKAQAE...SIAQ.PAPINEIFTDPALADEVK.
A0A5R8QCR1_9FIRM/6-59 ...kilfsf----------ILLTTITG.TSIYVGESQK.....EIVQATy.eSTPP.PAAINEIFPDANFASTIA.
Q8Y8U2_LISMO/1-57 .........------MKKLCTVILFLT.LLLNGFVPNAha.ktESPSADnnlQVAP.PAAIKDLFPDPAMANEV-l
INLA_LISMO/3-58 .........KKRYVWLKSILVAILVFG.SGVWINTSNG.....TNAQAA...TITQ.DTPINQIFTDTALAEKMK.
A0A5R8Q796_9FIRM/2-59 .....ktik----SLLCITLLIGGIFA.SSLLLGTKTE.....ITTKAA..sNTTPpPAAINQIFPDANLAEII-r
A0A1E5GQ73_9ENTE/1-53 .......mi-------KKNVYLSLVFAvVAVFTFVGFG.....ESAEAY..vYLDK.PTKVNEVFPDPAFAGYM-a
Q8Y5N0_LISMO/1-55 .......mk-------KILTGLSTTLL.LTVLLLTITG.....GDLKAKaasDLYPlPAPIIDVFPDEGLAKDMA.
Q7AP86_LISMO/2-56 .........KRNKTALRILVTLAVVLA.ITFWVGMSSK.....-EVQAA...VIEH.PTPINEIFTDPVLTDNVK.
INLH_LISMO/3-58 .........KRWNSVFKLVLMVTAILG.LSLYVTTSQG.....VEVRAE...SITQ.PTAINVIFPDPALANAIK.
A0A1H9SDM3_9LACT/1-49 .....mkkl--------KLMILALVVI.IGLHSYH---.....LTTQAE...EVAF.PAAITEIFPDENVAEKIR.
INLB_LISMO/3-58 ........e-KHNPRRKYCLISGLAII.FSLWIIIGNG.....AKVQAE...TITV.PTPIKQIFSDDAFAETIK.
A0A5R8QH37_9FIRM/2-59 ....mklfk---------LLFSIALFA.FMIGSTVFIQen.rtDIVHAAs.tSTPP.PAAVNEIFPDPNLAAVIA.
Q8Y7Y3_LISMO/1-58 .........------MKKTIKITTSLL.LSFACVFSIGdftkpHTVEAEivySLTN.PKPVNEIFTDPKLAQVVA.
A0A5R8QAT7_9FIRM/1-50 .........------MKKLVTVLFAVL.MMLGGVFTNT.....-IVHAA..dQIEP.PATIAELFPDQALAEII-a
A0A5R8QCS7_9FIRM/4-59 .cklmisfs----------LVVFGVLS.SLFITATQQN.....ISVQAS..qSTTPpPAAINEIFPDPGLAQEI-q
A0A191HTP3_9FIRM/3-50 ........r------------IGLVLF.LSFMLIFNTG.....LSLLAGtqkNLPG.PTPINQVFPDSILAEKMR.
Q8Y9W0_LISMO/2-59 .........KSKNNYFKQITTIMTVVS.LLIMVLGIQG....nNDVKAA..pQVAP.PASINQIFPDADLAEGIR.
Q8Y4H2_LISMO/1-55 ........m------RKVLMFLSTALL.LAILSLSFTG.....LDLKAKaasDLYPlPAPIIDVFPDDGLAKDMA.
A0A5R8QCU0_9FIRM/2-59 .kifktics--------IVLFSAALFG.TTTLINTHDE.....TVVHATs.sSTTP.PAAINEVFPDANFAEVIR.
A0A0R2FR41_9LACO/3-57 ..kggekmv----------KKIWLALC.VVLAVVMMSTv...aSPVQAA...ILAE.PRKISEIFPDDNFAQTVA.
Q8Y6A8_LISMO/1-56 .........MKKNNWLQNAVIAMLVLI.VGLCINMGSG.....TKVQAE...SIQR.PTPINQVFPDPGLANAVK.
#=GC seq_cons ................p.hlhlshllh.hslhlhhtps.....hslpAt...slss.PssIN-IFPDssLAptlt.
//