#=GF ID FokI_D1
#=GF AC PF02981.19
#=GF DE FokI, recognition domain, subdomain 1
#=GF PI FokI_N;
#=GF AU Griffiths-Jones SR;0000-0001-6043-807X
#=GF SE Structural domain
#=GF GA 25.00 25.00;
#=GF TC 25.40 40.50;
#=GF NC 24.80 23.50;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch -E 1000 --cpu 4 -Z 75585367 HMM pfamseq
#=GF TP Domain
#=GF CL CL0123
#=GF RN [1]
#=GF RM 9724743
#=GF RT Structure of FokI has implications for DNA cleavage.
#=GF RA Wah DA, Bitinaite J, Schildkraut I, Aggarwal AK;
#=GF RL Proc Natl Acad Sci U S A. 1998;95:10564-10569.
#=GF RN [2]
#=GF RM 10508668
#=GF RT Type II restriction endonucleases: structural, functional and
#=GF RT evolutionary relationships.
#=GF RA Kovall RA, Matthews BW;
#=GF RL Curr Opin Chem Biol 1999;3:578-583.
#=GF RN [3]
#=GF RM 9214510
#=GF RT Structure of the multimodular endonuclease FokI bound to DNA.
#=GF RA Wah DA, Hirsch JA, Dorner LF, Schildkraut I, Aggarwal AK;
#=GF RL Nature. 1997;388:97-100.
#=GF DR INTERPRO; IPR004234;
#=GF DR SCOP; 2fok; fa;
#=GF DR SO; 0000417; polypeptide_domain;
#=GF CC Type IIS restriction endonuclease FokI, a member of an unusual
#=GF CC class of bipartite restriction enzymes, recognises the
#=GF CC double-stranded DNA sequence 5'-GGATG-3' and cleaves DNA
#=GF CC phosphodiester groups 9 base pairs away on this strand and 13
#=GF CC base pairs away on the complementary strand [1]. FokI contains
#=GF CC amino- and carboxy-terminal domains corresponding to the
#=GF CC DNA-recognition and cleavage functions, respectively. The
#=GF CC recognition domain is made of three smaller subdomains (D1, D2
#=GF CC and D3) which are evolutionarily related to the
#=GF CC helix-turn-helix-containing DNA-binding domain of the
#=GF CC catabolite gene activator protein CAP [3]. This entry represents
#=GF CC the subdomain D1 of FokI. Subdomain D1 of the recognition domain
#=GF CC covers the DNA major groove, recognising base pairs at the 3'
#=GF CC end of the recognition sequence (GGATG) [3].
#=GF SQ 29
#=GS A0A1Y4GKR9_9BACT/13-146 AC A0A1Y4GKR9.1
#=GS D9R4Y5_LACSW/4-140 AC D9R4Y5.1
#=GS E0NM75_9FIRM/4-141 AC E0NM75.1
#=GS A0A1Y1RMG1_9MICC/4-149 AC A0A1Y1RMG1.1
#=GS G8PBE9_PEDCP/16-169 AC G8PBE9.1
#=GS A0A1M7IV76_9FIRM/13-146 AC A0A1M7IV76.1
#=GS A0A3E2NAJ0_9CLOT/4-140 AC A0A3E2NAJ0.1
#=GS A0A0F2J3F6_9BACT/4-137 AC A0A0F2J3F6.1
#=GS A0A137SQ27_9FIRM/4-141 AC A0A137SQ27.1
#=GS A0A172Q519_9STRE/4-148 AC A0A172Q519.1
#=GS A0A6S6XGQ4_9FIRM/13-146 AC A0A6S6XGQ4.1
#=GS A0A419T8E6_9FIRM/4-140 AC A0A419T8E6.1
#=GS R9JR57_9FIRM/4-140 AC R9JR57.1
#=GS A0A0D4CKH1_LIMMU/4-149 AC A0A0D4CKH1.1
#=GS A0A174M7L2_9CLOT/4-140 AC A0A174M7L2.1
#=GS A0A1Q2MCL2_9BACT/2-137 AC A0A1Q2MCL2.1
#=GS A0A1Y4GEU6_9BACT/13-146 AC A0A1Y4GEU6.1
#=GS A0A8J6TVX0_9FIRM/3-159 AC A0A8J6TVX0.1
#=GS A0A1K1PVB9_RUMFL/5-141 AC A0A1K1PVB9.1
#=GS C6JKY8_FUSVA/4-141 AC C6JKY8.1
#=GS R6AWC6_9BACT/4-157 AC R6AWC6.1
#=GS I3DCT9_9PAST/4-148 AC I3DCT9.1
#=GS A0A1C0BUS6_9FIRM/4-149 AC A0A1C0BUS6.1
#=GS A0A1I6BRX5_9BACI/8-143 AC A0A1I6BRX5.1
#=GS A0A7Y4LB84_9BURK/4-148 AC A0A7Y4LB84.1
#=GS A0A0V8JLM2_9BACI/8-143 AC A0A0V8JLM2.1
#=GS A0A1V4I7R7_9FIRM/12-146 AC A0A1V4I7R7.1
#=GS V9H5A9_9CLOT/13-146 AC V9H5A9.1
#=GS R6MYT0_9CLOT/13-146 AC R6MYT0.1
A0A1Y4GKR9_9BACT/13-146 ....RAFGWVQDPSNLRSLCDVVAVFAPCSAKHREMVDSVIPRLVA....EQDGRGAFIEALR.....LRPLKLKYAHLVGTSfTP--...-...-...RSASRCNGIIQAAV..KGQ..................GRDFIVDWPADNFVRWAHCFGFIKYDYADDSFEITDSGLELVRA..
D9R4Y5_LACSW/4-140 ....RTFGWVQEAYTLENLKKVVSAFVPDSAINRSLRMDKIPRLIS....EKDGRDEFIQELS.....GNEISIPYPHLKGKG.TPVG...Y...T...RSNAPCSGIIQAVL..PGQ..................RKEYQSDWPADSFLRWAVSIGFLDYSRKEDVCSLSALGRLYAVA..
E0NM75_9FIRM/4-141 ....RTLGWIQNPSSFENLKNVVSVFDKNSDIYKEILNTKLPKLVK....DLDLQNKLISELE.....KDPLEMDYVLLKGHG.IKSG...Q...K...RADAECSGIVQAAI..TTQ.................gGRAYTDDWTADGFLRWGISIGLLDYDTEKDTVSITKLGEKFV--ks
A0A1Y1RMG1_9MICC/4-149 ....RTYGWVQNPSDFNKLKLVVQILDSGSAHYRRLRDSTVQGVIH....FDDVKRNLQSKLD.....LGEEIFTYKELVGTQrNALG...EvasR...RADAVADSLIQITV..MPQsy.............kttGKNFTDNWTSQGYLSWALSLGFLEHSPETDTVRITTLGREFSQ-s.
G8PBE9_PEDCP/16-169 stgl-----GQDVGSLRSMINILCVFIVNSKIQTEIKESFEWRFID....DDVLKEKLFNKLT.....TNPVTLTVDDLSAEQ.KKEP...G...K...PASWRIKSILPAIL..KGQkparnqdntlatdnkgesFKSSMRQWPIRNFIGEAVGLGLLDWDRKTGNVTITTIGKKLANA..
A0A1M7IV76_9FIRM/13-146 ....RAFGWVQDPSNLRSLCNVTAIFDESSPMHQLLVHSIIPELVE....KRDGKDELIEVLN.....KRPLRISYNKLVGTA.---F...K...P...RSASRCNGIVQATV..KGQ..................VRPFIGEWQADNFVRWAYAFHFIRYNYEDDTFEITEEGRELVRA..
A0A3E2NAJ0_9CLOT/4-140 ....RTFGWVQEAYTLDNLKNVISVFVTDSRINRLLKTDKIPRLIQ....DEDKREEFIKELD.....QEEIRIPYTHLKGKG.TPKG...Y...T...RSNAPCSGIIQAVL..PGQ..................RKEYQSDWPADSFLRWAVSIGFLDYDRETDECSLSVMGRQYAKA..
A0A0F2J3F6_9BACT/4-137 ....RTFGWVQDPGKVEHLRLVVEIFAPNSKTHEYIKNKVIPTLIL....EKDGLSRLITELN.....KKPLSLNYRDLVGTAfK---...-...P...RASARCNAIIQAAV..KGQ..................KRPFISDWPADNFLRWAVSLGFVKWNEKTDEFSITELGLSLSQ-t.
A0A137SQ27_9FIRM/4-141 ....RTLGWIQNPSSFENLKNVVSVFDKNTDIYKEILNTKLPKLVK....DLDLQNKLISEMK.....KDPLEMDYVLLKGHG.IKSG...Q...K...RSDAACSGIVQAAI..TTQ.................gGRAYTDDWTADGFLRWGISIGLLDYDTENDTVSITKLGEKFV--ks
A0A172Q519_9STRE/4-148 ....RTYGWVQNPSSFISLKKVVQIFNNKSNHYQ-LLKEKLVDTIY....FEDIRTIFLNKLQ.....EGVEEFSYLELVGTSkDRNGrlpK...K...RSDAVADALIQISI..TPQqt.............kntGKTWTDNWTADGFLRWAVSLNFVSVDRETDCFSITAKGRAFS--tt
A0A6S6XGQ4_9FIRM/13-146 ....RTFGWVQDPSNLRSLCDVVAVFDEDSEKHRELVLSSIPRLVS....EEDGRSRLLEALS.....TRPVRIRYPDLVGTAfTP--...-...-...RSASRCNGILQAAV..RGQ..................GRDFIGDWPADNFLRWAHAFGFVRYHYEDDSFEITPAGLELTK-a.
A0A419T8E6_9FIRM/4-140 ....RTFGWVQEAYTLGNLKNVVSVFVPGSEINRLLCTDKIPRLIT....KKDGRDIFISELS.....TEEICIPYTHLKGKG.TPTG...Y...T...RSNAPCSGIIQAVL..PGQ..................RKEYQSDWPADSFLRWAVSVGFLEYSRSKDVCCISALGQEYAM-s.
R9JR57_9FIRM/4-140 ....RTFGWVQEAYKISSLKRVIKLFLLNSDVNRELRFDKIPRLVS....QEYGRDAFIKELS.....EERIHIPYQHLKGKG.TPKG...Y...T...RSNAPCSGIVQAAL..PGQ..................RKEYQSDWPADSFLRWGVSVGLLDYDRQSDECSLSELGEQYA--ht
A0A0D4CKH1_LIMMU/4-149 ....RTFGWVQNPSDFKKLKKTVQVFDPSSEHYQQLRKHIVHDVVY....FAEDKNRLQDQLD.....NRVCEFSYKDLVGSNiNKDG...K...SpkkRSESVANSLLQVSI..LPQst.............ktkGKLHTDNWTADGFLRWAVSLNFVSHNRDTDTFKITDFGKKFS--ss
A0A174M7L2_9CLOT/4-140 ....RTFGWVQEAYKLENLKNVVSVFVPGSPVNRQLIEDKLVRLIS....VEDGKAEFIEELE.....ADPVIVPYAHLKGKG.TPKG...Y...T...RSNAPCSGIIQAVL..PGQ..................RKEYQSDWPADSFLRWAVSIGFLNYDRNADTCSLSDLGRSYAEA..
A0A1Q2MCL2_9BACT/2-137 ..rp--RGWIQDSGSFENLIKVVELFDKNSTTNKLLTNKFIRDKVL....NLDCQEYLVKSLLnedgyKNNPLIEYKALVGSR.TN--...-...-...--KEEVDGLIQVLI..PGQ..................SRLGIVDWACDNFIRLAYTFNYLQYSEKNDSFSITEVGLKLANA..
A0A1Y4GEU6_9BACT/13-146 ....RAFGWVQDPSNLRSLCDVVAVFDPCSAKHGEMIDKVIPRLVA....EQDGRDVFIEALR.....HKPLKLKYAHLVGTSfTP--...-...-...RSASRCNGIIQAAV..KGQ..................GRDFIGDWPADNFVRWAHCFGFIKYDYADDSLEITDSGLELVQA..
A0A8J6TVX0_9FIRM/3-159 ....RTFGWVQNPNRLETLKYITGIFQKDSDSNIDLRTNRLPKLLEyrfiTREHYDQFILELS.....KEKIEISYDLLKGKG.LNGA...K...S...RKDAICTGIVQAAI..DAHssskfivr..edgneekiKKPYVDDWTADGYLRWAVSTGLIKHSPSTDSCKITDLGVRLVHA..
A0A1K1PVB9_RUMFL/5-141 ....RTFGWVQEAYTISNLKNVVRVFVLDSAVNKKLREDKIPRLIS....DEYHKDDMIKHLS.....AAKMQIPYTLLKGKG.TPKG...Y...T...RTNAPCSGIIQAVL..PGQ..................RKEYQSDWPADSFLRWAVSIGFLNYDRDKDTCSISELGYRYA--vs
C6JKY8_FUSVA/4-141 ....RTFGWIQNPSDFSKLKNVVSVFMTDSDIYKDLLNRKIPSLIE....NEVLKKKMIEEMK.....KVPLEMDYRLLKGHG.PCNK...E...S...RSNVKCSGIIQAAI..PNQ.................kRREYSDDWTADGFLRWAISIGLLDYNIDNDTVSITELGKKYILA..
R6AWC6_9BACT/4-157 ....RTFGWIQNPSSTDTLRNILGIFVPGSDFHTFMVSERLPLLASaglfKTPGLYMDFQKIL.....RRNKSIAYDILKGQG.-AGG...E...S...RSKAKCSGLAQAAV..TGQqfkdyvv....dgkniriKKPYTDDWTADGFLRWAVSLGFLDYNYADDTCCITNSGVSLVMA..
I3DCT9_9PAST/4-148 ....RTYGWIQNPSSFQSLKKVVQIFDTASQHYQNLKDNLINSIYN....E-VIRNNLKDKLI.....NNENEFTYLELVGTSkNKQG...KppsS...RKDAVADALIQISI..EPQqi.............kstGKTWIDNWSADGFLRWAVSFNFIKVDREKDTFSITEKGLAFSQA..
A0A1C0BUS6_9FIRM/4-149 ....RTYGWVQNPSDFKKLKLVVQIFDNTSVHYENLKSNLISRYIY....FDDIKSDLLNKFT.....RKIEEFSYLDLVGTSkNKHGrspK...S...RSEAVADALIQITI..LPQss.............ktkGKFWTDNWTSDGYLRWALSLNFVKHNRETDMCSITPLGREFS--rs
A0A1I6BRX5_9BACI/8-143 ....RTFGWVQNPGKFENLKRTVQVFDKDSKVYKEVKDHKIPNLVK....DKGVRDTLVKAMN.....RSDNLYTYKELVGTG.TS--...-...I...RANAPCDAIIQATIldQGN..................KKGYIDNWSADGFVRWAHALGFIEYEHSKDAFYLTDTGKAYS--is
A0A7Y4LB84_9BURK/4-148 ....RTYGWVQNPSSFLHLKKVVQIFVPSSTHYQNLKNS-LLDLIP....FTNLRQELRDKLD.....KKKTEFTYTELVGSSkDKNGkspR...S...RSNAVANSLIQISI..PSQka.............sttGKTWTDNWTADGYLRWAISLNFIEVNTSKDTFRITPKGMAFAK-t.
A0A0V8JLM2_9BACI/8-143 ....RTFGWIQNPGKFENLKRTVQVFDENSKVYKEVRDIKIPNLVK....DKDVRTTLIAAMN.....RLENYYSYKELVGTG.TS--...-...V...RAQAPCDAIIQAAI..QDQg................nKKGYIDNWSSDGFVRWAHALGFLEYNSDKDSFYLTDIGLEYS--rs
A0A1V4I7R7_9FIRM/12-146 ....RTFGWIQNPGDFNKLKKVVQVFDHTSNTHEKLKNVIIPSLIE....ERDGRDRFIQELS.....KIPLKLKYADLVGTGfK---...-...P...RNSARCNGIIQAIV..EGQ.................gGKKFVDNWSADGYIRWAHALGFIDYEYATDTFFITQLGFDYSR-a.
V9H5A9_9CLOT/13-146 ....RTFGWVQNPSNFESLKKVVAIFDNTSKTYNELKDKKIKKLVD....ERDGQKELLNALN.....ANPLKIKYCNLVGTSfTP--...-...-...RSSARCNGIVQATV..KGQ..................RKEFIDDWSSDNFVRWAHALGFIKYNYDTDTFEITDVGRKYVQ-s.
R6MYT0_9CLOT/13-146 ....RTFGWVQDPSDFRSLCDVVAIFDETSLKHQELAGQVIPALVE....ERDGRQRLLDALN.....QRPLRISYTDLVGTSfTP--...-...-...RSAARCNGIVQAAV..RGQ..................VRPFIGDWPADNFVRWAHALGFLRYGYQGDAFELTETGKALAQA..
#=GC seq_cons ....RTFGWVQsPushcsLKpVVplFs.sSshacpLpsshIPcLlp....ccDs+sphlpcLs.....ppslclsYscLsGpu.ss.h.......p...RSsAhCsGIIQAsl...GQ..................tKtahsDWsADuFLRWAlSlGFlcYspcsDohpITchGhcau....
//