#=GF ID CoV_NSP2_N
#=GF AC PF19211.6
#=GF DE Coronavirus replicase NSP2, N-terminal
#=GF PI Corona_NS2_N;
#=GF AU Bateman A;0000-0002-6982-4660
#=GF AU Chuguransky S;0000-0002-0520-0736
#=GF SE Bateman A
#=GF GA 29.70 29.70;
#=GF TC 29.90 33.80;
#=GF NC 28.90 28.20;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch -E 1000 -Z 90746521 --cpu 8 HMM pfamseq
#=GF TP Family
#=GF RN [1]
#=GF RM 16227261
#=GF RT The nsp2 replicase proteins of murine hepatitis virus and severe
#=GF RT acute respiratory syndrome coronavirus are dispensable for viral
#=GF RT replication.
#=GF RA Graham RL, Sims AC, Brockway SM, Baric RS, Denison MR;
#=GF RL J Virol. 2005;79:13399-13411.
#=GF RN [2]
#=GF RM 34398430
#=GF RT Structure and Function of N-Terminal Zinc Finger Domain of
#=GF RT SARS-CoV-2 NSP2.
#=GF RA Ma J, Chen Y, Wu W, Chen Z;
#=GF RL Virol Sin. 2021;36:1104-1112.
#=GF RN [3]
#=GF RM 34159380
#=GF RT Nsp2 has the potential to be a drug target revealed by global
#=GF RT identification of SARS-CoV-2 Nsp2-interacting proteins.
#=GF RA Zheng YX, Wang L, Kong WS, Chen H, Wang XN, Meng Q, Zhang HN,
#=GF RA Guo SJ, Jiang HW, Tao SC;
#=GF RL Acta Biochim Biophys Sin (Shanghai). 2021;53:1134-1141.
#=GF DR INTERPRO; IPR043615;
#=GF DR SO; 0100021; polypeptide_conserved_region;
#=GF CC This entry corresponds to the N-terminal region of coronavirus
#=GF CC non-structural protein 2. NSP2 is encoded by ORF1a/1ab and
#=GF CC proteolytically released from the pp1a/1ab polyprotein.
#=GF CC Viral-host protein interaction studies in SARS-CoV and
#=GF CC SARS-CoV-2 found that this protein could interact with several
#=GF CC host proteins including prohibitin 1 (PHB1) and PHB2, which are
#=GF CC implicated in a number of cellular functions, including cellular
#=GF CC migration, differentiation and apoptosis [2,3]. The structure
#=GF CC of NSP2 from SARS-CoV-2 has recently been solved, revealing
#=GF CC three zinc fingers, covered in this entry, which may be
#=GF CC involved in binding nucleic acids and regulating intracellular
#=GF CC signalling pathways [2].
#=GF SQ 61
#=GS R1A_BCHK4/196-440 AC P0C6T4.1
#=GS A0A2P1G738_9ALPC/111-315 AC A0A2P1G738.1
#=GS A0AAE6R639_9ALPC/111-315 AC A0AAE6R639.1
#=GS A0A1B3Q5W8_9BETC/191-395 AC A0A1B3Q5W8.1
#=GS A0A3G8EWF8_9ALPC/109-313 AC A0A3G8EWF8.1
#=GS A0A120I2U3_9ALPC/110-310 AC A0A120I2U3.1
#=GS A0A4Y6GLC9_9BETC/191-395 AC A0A4Y6GLC9.1
#=GS A0A1L2KGC1_9ALPC/111-314 AC A0A1L2KGC1.1
#=GS A0A2P1G718_9ALPC/111-315 AC A0A2P1G718.1
#=GS A0AA48ZMR4_9ALPC/111-314 AC A0AA48ZMR4.1
#=GS A0A0U1WHG4_9ALPC/111-315 AC A0A0U1WHG4.1
#=GS A0A4Y6GLA1_9ALPC/99-303 AC A0A4Y6GLA1.1
#=GS R1AB_CVPPU/110-310 AC P0C6Y5.1
#=GS R1AB_CVH22/112-316 AC P0C6X1.1
#=GS R1AB_BCHK9/191-395 AC P0C6W5.1
#=GS A0AA48UFJ9_9ALPC/114-317 AC A0AA48UFJ9.1
#=GS A0AAE9NLE9_9NIDO/185-386 AC A0AAE9NLE9.1
#=GS R1A_MERS1/194-443 AC K9N638.1
#=GS R1AB_CVHNL/111-315 AC P0C6X5.1
#=GS A0A088DIE1_9BETC/176-416 AC A0A088DIE1.1
#=GS B1PHK1_9ALPC/112-316 AC B1PHK1.1
#=GS R1AB_SARS2/182-423 AC P0DTD1.1
#=GS A0A4Y5QL57_9ALPC/111-315 AC A0A4Y5QL57.1
#=GS Q6UZF5_SARS/182-423 AC Q6UZF5.1
#=GS R1AB_BCHK5/196-441 AC P0C6W4.1
#=GS A0A2R4QL11_9ALPC/111-312 AC A0A2R4QL11.1
#=GS R1A_CVHNL/111-315 AC P0C6U6.1
#=GS A0A0K1Z0N1_SARS/182-423 AC A0A0K1Z0N1.1
#=GS Q6JH39_SARS/182-423 AC Q6JH39.1
#=GS R1AB_SARS/182-423 AC P0C6X7.1
#=GS R1AB_BCHK4/196-440 AC P0C6W3.1
#=GS A0A060A8I5_9ALPC/111-316 AC A0A060A8I5.1
#=GS R1A_BCHK5/196-441 AC P0C6T5.1
#=GS Q6JH40_SARS/182-423 AC Q6JH40.1
#=GS R1AB_FIPV/110-310 AC Q98VG9.2
#=GS R1A_CVH22/112-316 AC P0C6U2.1
#=GS R1AB_MERS1/194-443 AC K9N7C7.1
#=GS R1A_CVPPU/110-310 AC P0C6V2.1
#=GS A0AAE8CC16_9NIDO/114-208 AC A0AAE8CC16.1
#=GS A0A891ZAE5_9BETC/201-450 AC A0A891ZAE5.1
#=GS A0A6B9KDC4_9ALPC/111-315 AC A0A6B9KDC4.1
#=GS R1A_SARS/182-423 AC P0C6U8.1
#=GS A0A1L2KGC3_9ALPC/111-314 AC A0A1L2KGC3.1
#=GS A0A096XNJ3_9ALPC/114-290 AC A0A096XNJ3.2
#=GS A0A0U1WHK4_SARS/182-423 AC A0A0U1WHK4.1
#=GS A0A6B9KKB5_9ALPC/113-316 AC A0A6B9KKB5.1
#=GS A0A0U1UZC3_9ALPC/112-317 AC A0A0U1UZC3.1
#=GS B1PHK0_9ALPC/112-316 AC B1PHK0.1
#=GS A0AAE8CC16_9NIDO/195-288 AC A0AAE8CC16.1
#=GS A0A240FW17_9ALPC/111-292 AC A0A240FW17.1
#=GS A0AAE9BUP5_9ALPC/112-317 AC A0AAE9BUP5.1
#=GS R1A_SARS2/182-423 AC P0DTC1.1
#=GS B0LJR0_9ALPC/110-310 AC B0LJR0.1
#=GS B0LJQ9_9ALPC/110-310 AC B0LJQ9.1
#=GS R1A_BCHK9/191-395 AC P0C6T6.1
#=GS A0A915V9U8_9BETC/196-445 AC A0A915V9U8.1
#=GS A0A2Z4EVM4_9BETC/190-394 AC A0A2Z4EVM4.1
#=GS A0A2R4QKW4_9ALPC/111-312 AC A0A2R4QKW4.1
#=GS K4KCJ9_9ALPC/111-315 AC K4KCJ9.1
#=GS A0A0K1YZY7_SARS/182-423 AC A0A0K1YZY7.1
#=GS A0A0U1UZA8_9ALPC/111-318 AC A0A0U1UZA8.1
R1A_BCHK4/196-440 ............DCIPIDQYMCGKNGKPI..ADYAKIVAKEGLTTL.ADievdvks....rmdsdrfIVL.NKKLYRVV.......WNVTRR.NVPYPKQTAFTIVSVVQCd.dkDSVPEHTftIGSQILMVSP-LKATNNKNFNLKQRLLYTFYGKDAVQQ........PGYIYHSAYVD.CNACGRGTWCTGNAIqGFACD.CGANYSaNDVDL..QSSGLVPRNALFlancpcannga....cshsaaqvyniLD..GKACVEV....gGKSFtLTFGGVVYAYMGCCDGTMYF...........
A0A2P1G738_9ALPC/111-315 ...........n-VVSVDNYMCGADGKPA..VPSEQWSFVEHFDDD.TD.................eITV.NGVTFRHV.......WNTVRA.DDPYEKQGLLSIKSIEYI....SNVPHKL..PNGSVLGVAGTPKKRKAIVLDEKYSKLYDACGVPFVTNgksisevvPKPLFLHALVK.CK-CDNESWTVGDWT.GFKTT.CCGSTG.KVTTL..-AVGDVTPGDI-..........................VF..TTLGAGK.....GTKF.--FCGLVLTFVDTLEGVSAW...........
A0AAE6R639_9ALPC/111-315 ............NTVYVDQYLCGANGYPA..LDETLWEFKDYFGEL.DE..................IVI.NGTTFVKA.......WLVVRS.PGPYNTQNLLSIQAITWC....GECPHTL..ADGTTLKNAGPIKKNKSVVIGGKFSQLYDRVGSPFVTNgkvlsevlTNPTFCHALVK.CH-CGTTSWTVGDWS.GYKSM.CCGKVC.KPSTI..-VVGEVKPGDV-..........................LV..TSSKVAT....nGVKY.--YSGMVLDFVTKVDDVCLW...........
A0A1B3Q5W8_9BETC/191-395 ...........l-AAPIKEVLGGKGAGMS..LVELTKFLGKYRTAD.G-..................YEL.PSGIVKVA.......VKVVRK.NLPVSKQSIFTVLGVTERvvdgFYYPYS-..TNSVVSYTKPRAGATVGNTVQSVMLSMYGTEA------........YNPVTPVVRLR.CSSCDFYGWVPVKDLgCVTCS.CAAVHQiTSSCIdaESAGLIKQGAVM..........................LV..DRSPSMRv..vpGNRLyVAFGGAIWSPIGKVNGVQVW...........
A0A3G8EWF8_9ALPC/109-313 ..........ae--VCVDNYMCDQSGKPV..LPESVWKFQDYFGDA.ET..................IVL.DGITYRKA.......WNVMRS.PVSYKSQSVASITYIEWC....GDVAHTL..PSGSVLDLAKPVSKSKVVVLAEPFATFYAQVGSPYLTNgtgllevvVKPCFLHGYVK.CL-CGSSQWVVGDWHaGYKSL.CCGITR.TPTCV..-AAGYVESGDV-..........................LL..TTIGAGK.....GLKY.--YKGLTLKYLGDAENVSLW...........
A0A120I2U3_9ALPC/110-310 ...........g-AIYVDQYMCGADGKPV..IEG---DFKDYFGDE.DI..................IEF.EGEEYHCA.......WTTVRD.EKPLNQQTLFTIQEIQYN....LDIPHKL..PNCATRHVAPPVKKNSKIVLSEDYKKLYDIFGSPFMGNgdclskcfDTLHFIAATLR.CP-CGSESSGVGDWT.GFKTA.CCGLSG.KVKGV..-TLGDIKPGDA-..........................VV..TSMSTGK.....GVKF.--FANCVLQYAGDVEGVSIW...........
A0A4Y6GLC9_9BETC/191-395 ...........l-VEPVKELLGAIKSDFT..LEQLLAALSAYSKDD.G-..................YDL.PGGFVKIA.......VTVIRK.PLPVVRQSIFTVQGVIEHlvegYYYPLT-..TGSVVKHTKPRPNVPLSNTVESIMLSLYGTSG------........YSPATPVVRLN.CNYCYFYGWVPLRDMgSVVCS.CKAEHQlTSSCIdaESAGVVKPGCVL..........................LL..DKSPGMRi..ipGNRTyVAFGGAIWSPIGVVNNVTVW...........
A0A1L2KGC1_9ALPC/111-314 ...........n-KIPVDQYMCGYDGKPV..IPAGSWEFKNYFEDG.NE..................ITL.NGVVYYLA.......WQVERK.PLPHANQNLLSITEILYL....SKEQHTL..LPGSILTTAAPPKRSAKVVLSDDWKSLYEECGSPFVNNgttllevvPKPVFLNAFVN.CK-CGNSCWSVGDWT.GYKSA.CCGENA.QRVCV..-VPGEVVAGDI-..........................VV..TSKAAGV.....GVKY.--YTGMTLKFVKECGNVHLW...........
A0A2P1G718_9ALPC/111-315 ...........n-VVSVDNYMCGADGKPA..VPSEQWSFVEHFDDD.TD.................eITV.NGVTFRHV.......WNTVRA.DDPYEKQGLLSIKSIEYI....SNVPHKL..PNGSVLGVAGTPKKRKAIVLDEKYSKLYDACGVPFVTNgksisevvPKPLFLHALVK.CK-CDNESWTVGDWT.GFKTT.CCGSTG.KVTTL..-AVGDVTPGDI-..........................VF..TTLGAGK.....GTKF.--FCGLVLTFVDTLEGVSAW...........
A0AA48ZMR4_9ALPC/111-314 ...........t-VVPVDNYMCGADGRPA..VGEDRWTGDDMFGDN.TE..................LVI.NDTTFVKA.......WTVVRT.AVPHAKTNVTGIESIKYN....LAIPHRL..RDGCVVTLPKPVKRSAKLVLDSKFNDLLINFGVGFVQSgetlsavvSRPVFMHALVA.CP-CGASGWTVGDWT.GFVST.CCGLRS.NVITS..-ACGFVVPGDA-..........................VI..ATANAGT.....GTKY.--YNGMTLKYVCTMEGVSIW...........
A0A0U1WHG4_9ALPC/111-315 ............NTVYVDNYMCGSNGVPV..LPEDQWEFVDYFGEL.TE..................VSI.GDTTYIKA.......WNVDRV.EGPYKSQTLLSINAISYC....GEVIHAL..ADGSTMSYATAVKKNSKTVVNKTYQKLYDNIGVPFVTNgkvlteiiPKPVFNHGLVK.CH-CGKVSWTVGDWS.CYKST.CCGTVC.KPIAI..-VNGDVNPGDV-..........................VI..TSKQVAT....nGVKY.--YNGMVLKYVDTIEDVHLW...........
A0A4Y6GLA1_9ALPC/99-303 ...........n-TVHVDNYMCDANGKPV..LPENVWECKDYFGEL.SE..................ILV.NGTTYVKA.......WIVDRS.PGPFASQSLLSIKAITWC....GTLAHTL..ADGATLSVAAPARKSKTVVLDKYYSKLYDAVGVPFVRNgktlkdviTNPVFCHALIK.CH-CGITSWTVGDWS.SYKST.CCGVAC.KPICI..-ASGVVKPGSV-..........................LV..TSNKVST....dGVKY.--YNGMVLKFIDTLDGLHLW...........
R1AB_CVPPU/110-310 ...........g-AIYVDQYMCGADGKPV..IEG---DFKDYFGDE.DI..................IEF.EGEEYHCA.......WTTVRD.EKPLNQQTLFTIQEIQYN....LDIPHKL..PNCATRHVAPPVKKNSKIVLSEDYKKLYDIFGSPFMGNgdclskcfDTLHFIAATLR.CP-CGSESSGVGDWT.GFKTA.CCGLSG.KVKGV..-TLGDIKPGDA-..........................VV..TSMSAGK.....GVKF.--FANCVLQYAGDVEGVSIW...........
R1AB_CVH22/112-316 ............NVTYTDQYLCGADGKPV..MSEDLWQFVDHFGEN.EE..................III.NGHTYVCA.......WLTKRK.PLDYKRQNNLAIEEIEYV...hGDALHTL..RNGSVLEMAKEVKTSSKVVLSDALDKLYKVFGSPVMTNgsnileafTKPVFISALVQ.CT-CGTKSWSVGDWT.GFKSS.CCNVIS.NKLCV..-VPGNVKPGDA-..........................VI..TTQQAGA.....GIKY.--FCGMTLKFVANIEGVSVW...........
R1AB_BCHK9/191-395 ...........l-VEPVMKLLGVIKSDFT..LEQLLAALGKYRTED.G-..................YDL.PDGYVKVA.......IKVGRK.AVPVLKQSIFTVVGVTEQlvpgYYYPFS-..TSSVVEHTKPTRGGPVGKTVEAVMLSLYGTNN------........YNPATPVARLK.CSYCDYYGWTPLKDIgTVNCL.CGAEFQlTSSCVdaESAGVIKPGCVM..........................LL..DKSPGMRl..ipGNRTyVSFGGAIWSPIGKVNGVTVW...........
A0AA48UFJ9_9ALPC/114-317 ...........d-VVYVDQYMCDSTGAPA..LQESEWEYTDYFGDQ.EE..................IDY.HGITFVKA.......WHVERL.AVPYQKQTITAITSIQWC....GTVPHTL..NDGVTTAVAQPPKRSKNVVLADAYAVLYDQIGSPFMTNgsklreciVKPVFLHALVQ.CK-CGNTHWTVGDWS.CFKSL.CCGLVC.KPKCT..-VSGDVVPGDV-..........................VL..TSQSVCS.....GVKY.--YNGMILKFIEKRDGVSVW...........
A0AAE9NLE9_9NIDO/185-386 ...svcelpgfs-------------ADMS..LEQ-LEGLLSPFTED.GY..................INL.PTGVLCVA.......WRVKRK.PVPVCKQSLLSVLRVEEQvipgLYYPFV-..VGADVVHTKPSHDAGEFKGWRRAVRRLYGHAQ------........VNPATPVAHISgCTECGYTGWVPLRDTaTTVCL.CGCVYSlQSPYVdmESAGRVGKGVML..........................AL..KTGEGHRtvtldRVYY.-CFGGALWARVGNNDGVDLY...........
R1A_MERS1/194-443 ...........d-VTPVDQYMCGVDGKPI..SAYAFLMAKDGITKL.ADveadvaa....raddegfITL.KNNLYRLV.......WHVERK.DVPYPKQSIFTINSVVQKdgveNTPPHYF.tLGCKILTLTPRNKWSGVSDLSLKQKLLYTFYGKESLEN........PTYIYHSAFIE.CGSCGNDSWLTGNAIqGFACG.CGASYTaNDVEV..QSSGMIKPNALLcatcpfakgdscssnckhsvaqlvsyLS..ERCNVIA....dSKSFtLIFGGVAYAYFGCEEGTMYF...........
R1AB_CVHNL/111-315 ...........s-VVFVDKYMCGFDGKPV..LPKNMWEFRDYFNNN.TD.................sIVI.GGVTYQLA.......WDVIRK.DLSYEQQNVLAIESIHYL....GTTGHTL..KSGCKLTNAKPPKYSSKVVLSGEWNAVYRAFGSPFITNgmslldiiVKPVFFNAFVK.CN-CGSESWSVGAWD.GYLSS.CCGTPA.KKLCV..-VPGNVVPGDV-..........................II..TSTSAGC.....GVKY.--YAGLVVKHITNITGVSLW...........
A0A088DIE1_9BETC/176-416 .........dfh--RYVDNYYCTGDGKPL..P-----CIVTLLEKA.GHankpld......damdylRGL.NRMGQPCRdhdhervWEVERD.NAPYPEQSLFSISAIKTL....GEIPHCVfaPDCAVKVMKPRKVKRGADGFMTKLRRVYNINGFDEV--........-KPMALCALHY.CEDCGMEMWCHSNFE.EAYCP.CGKIYT.NTPCT.lTSAGYVVEGSVVampcdacksdsd.hsngtfydsckylAE..DKAEPGN.....RENF.VYFGGCCFAYVGCRNGNAIW...........
B1PHK1_9ALPC/112-316 .........asp--VYVDNYMCGANGKPV..LPADVWVYQDYFGEE.TE..................LIV.NGVKHVKV.......WHVTRT.DIPYQFQSLGAIESIEWL....TDIPHTL..RNGSRLSAARAVKHSKNVVLSEPLKTLYQACGSPFVTNgstlreavPKPVFAHAYVA.CK-CGRKAWSVGDWS.GYKST.CCGVFG.KPQCV..-VFGEVVPGDV-..........................FI..TTSSVGS.....GTRY.--YNGLTVKHVVTVDGLACW...........
R1AB_SARS2/182-423 ..........yt--RYVDNNFCGPDGYPL..E-----CIKDLLARA.GKasctlseqldfidtkrgvYCC.REHEHEIA.......WYTERS.EKSYELQTPFEIKLAKKFdtfnGECPNFVfpLNSIIKTIQPRVEKKKLDGFMGRIRSVYPVASPNE---........CNQMCLSTLMK.CDHCGETSWQTGDFV.KATCE.FCGTENlTKEGA..TTCGYLPQNAVVkiycpachnsev..gpehslaeyhneSG..LK----Til.rkGGRT.IAFGGCVFSYVGCHNKCAYW...........
A0A4Y5QL57_9ALPC/111-315 ...........s-TTYVDNFMCGANGQPV..LSEDKWEFKDYFGEL.TE..................VLI.DGITYVKA.......WNVDRA.EGPYSSQTLVSINAITWC....GNIPHTL..PDGTTTAVAPIVRKSKTVVLDKYYNKLYETVGVPFVRNgsclkdvlTKPVFLHALVK.CH-CGTTSWTVGDWG.CYKST.CCGVVC.KPICT..-SSGNVEPGDV-..........................VV..TSNKVSP....aGVKY.--YNGMVLKFVDTLDGFHLW...........
Q6UZF5_SARS/182-423 ..........vt--RYVDNNFCGPDGYPL..D-----CIKDFLARA.GKsmctlseqldyieskrgvYCC.RDHEHEIA.......WFTERS.DKSYEHQTPFEIKSAKKFdtfkGECPKFVfpLNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CNHCDEVSWQTCDFL.KATCE.HCGTEN.LVIEG.pTTCGYLPTNAVVkmpcpacqdpeigpehsvadyhnhsnIE..TRLRKGG.....RTRC.--FGGCVFAYVGCYNKRAYW...........
R1AB_BCHK5/196-441 ..........df--TPIDQYMCGKNGKPI..AEFAALMASEGITKL.ADveaevks....rtdsdryIVF.KNKLYRIV.......WNVQRK.DVAYSKQSAFTMNSIVQLd.tmEDVPRHSftIGSEIQVIAPSTAVQANGHLNLKQRLLYAFYGKQAVSE........PNYIYHSAYVD.CTSCGKGSWLTGNAVqGFACD.CGAHYCaNDVDL..QSSGLVRKNAVLlttcpcnkdge....ckhtlpqlvsmMT..DKCDVEV....vGKTFiLTYGGVIYAYMGCSGGTMH-f..........
A0A2R4QL11_9ALPC/111-312 ...........t-VVYVDQFLCGADGKPV..RQG---EMKDYFGDL.ED..................IVI.DGITYTHA.......WDVVRDmEVPHAKQTALTIQSIMYL....MDVDHKI..VNGATRQRAAPVKISSKVCLTEPYNSLYKQFGSPYMHNgsnlnecfSKLNFIVANVK.CK-CGGESSGVGDWT.GFKSA.CCGTPG.KVIGV..-SIGDASVGEA-..........................VI..TSKGCGT.....GTKF.--YAGAVLKFVGDAEGVSVW...........
R1A_CVHNL/111-315 ...........s-VVFVDKYMCGFDGKPV..LPKNMWEFRDYFNNN.TD.................sIVI.GGVTYQLA.......WDVIRK.DLSYEQQNVLAIESIHYL....GTTGHTL..KSGCKLTNAKPPKYSSKVVLSGEWNAVYRAFGSPFITNgmslldiiVKPVFFNAFVK.CN-CGSESWSVGAWD.GYLSS.CCGTPA.KKLCV..-VPGNVVPGDV-..........................II..TSTSAGC.....GVKY.--YAGLVVKHITNITGVSLW...........
A0A0K1Z0N1_SARS/182-423 ..........vt--RYVDNNFCGPDGYPLecIKGLLARAGKSMCTL.SEqldfi.......eskrgvYCC.REHEHEIA.......WYTERS.DKSYEHQTPFDIKSAKKFdtfkEECPKFVfpLNSTVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CSHCDEVSWQTCDFL.KATCE.HCGTENlVVEGP..TTCGYLPINAVVkmpcpacqnkevgpehsvadyhnysnIE..TRLRKGG.....RTKC.--FGGCVFSYVGCYNKRAYW...........
Q6JH39_SARS/182-423 ..........vt--RYVDNNFCGPDGYPL..D-----CIKDFLARA.GKsmctlseqldyieskrgvYCC.RDHEHEIA.......WFTERS.DKSYEHQTPFEIKSAKKFdtfkGECPKFVfpLNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CNHCDEVSWQTCDFL.KATCE.HCGTEN.LVIEG.pTTCGYLPTNAVVkmpcpacqdpeigpehsvadyhnhsnIE..TRLRKGG.....RTRC.--FGGCVFAYVGCYNKRAYW...........
R1AB_SARS/182-423 ..........vt--RYVDNNFCGPDGYPL..D-----CIKDFLARA.GKsmctlseqldyieskrgvYCC.RDHEHEIA.......WFTERS.DKSYEHQTPFEIKSAKKFdtfkGECPKFVfpLNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CNHCDEVSWQTCDFL.KATCE.HCGTEN.LVIEG.pTTCGYLPTNAVVkmpcpacqdpeigpehsvadyhnhsnIE..TRLRKGG.....RTRC.--FGGCVFAYVGCYNKRAYW...........
R1AB_BCHK4/196-440 ............DCIPIDQYMCGKNGKPI..ADYAKIVAKEGLTTL.ADievdvks....rmdsdrfIVL.NKKLYRVV.......WNVTRR.NVPYPKQTAFTIVSVVQCd.dkDSVPEHTftIGSQILMVSP-LKATNNKNFNLKQRLLYTFYGKDAVQQ........PGYIYHSAYVD.CNACGRGTWCTGNAIqGFACD.CGANYSaNDVDL..QSSGLVPRNALFlancpcannga....cshsaaqvyniLD..GKACVEV....gGKSFtLTFGGVVYAYMGCCDGTMYF...........
A0A060A8I5_9ALPC/111-316 ...........n-IVPVDQYMCGADGKPV..LQESEWEYTDFFADS.EDg................qLNI.AGITYVKA.......WIVERS.DVSYASQNLTSIKSITYC....STYEHTF..PDGTAMKVARTPKIKKTVVLSEPLATIYREIGSPFVDNgsdarsiiKRPVFLHAFVK.CK-CGSYHWTVGDWT.SYVST.CCGFKC.KPVLV..-ASCSATPGSV-..........................VV..TRAGAGT.....GVKY.--YNNMFLRHVADIDGLAFW...........
R1A_BCHK5/196-441 ..........df--TPIDQYMCGKNGKPI..AEFAALMASEGITKL.ADveaevks....rtdsdryIVF.KNKLYRIV.......WNVQRK.DVAYSKQSAFTMNSIVQLd.tmEDVPRHSftIGSEIQVIAPSTAVQANGHLNLKQRLLYAFYGKQAVSE........PNYIYHSAYVD.CTSCGKGSWLTGNAVqGFACD.CGAHYCaNDVDL..QSSGLVRKNAVLlttcpcnkdge....ckhtlpqlvsmMT..DKCDVEV....vGKTFiLTYGGVIYAYMGCSGGTMH-f..........
Q6JH40_SARS/182-423 ..........vt--RYVDNNFCGPDGYPL..D-----CIKDFLARA.GKsmctlseqldyieskrgvYCC.RDHEHEIA.......WFTERS.DKSYEHQTPFEIKSAKKFdtfkGECPKFVfpLNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CNHCDEVSWQTCDFL.KATCE.HCGTEN.LVIEG.pTTCGYLPTNAVVkmpcpacqdpeigpehsvadyhnhsnIE..TRLRKGG.....RTRC.--FGGCVFAYVGCYNKRAYW...........
R1AB_FIPV/110-310 ...........g-AIYVDQYMCGADGKPV..IEG---EFKDYFGDE.DV..................IIY.EGEEYHCA.......WLTVRD.EKPLWQQTLLTIREIQYN....LDIPHKL..PNCAIREVAPPVKKNSKVVLSEEYRKLYDIFGSPFMGNgdslntcfDSLHFIAATLK.CP-CGAESSGVGDWT.GFKTA.CCGLHG.KVKGV..-TLGAVKPGDA-..........................IV..TSMSAGK.....GVKF.--FANSVLQYAGDVENVSVW...........
R1A_CVH22/112-316 ............NVTYTDQYLCGADGKPV..MSEDLWQFVDHFGEN.EE..................III.NGHTYVCA.......WLTKRK.PLDYKRQNNLAIEEIEYV...hGDALHTL..RNGSVLEMAKEVKTSSKVVLSDALDKLYKVFGSPVMTNgsnileafTKPVFISALVQ.CT-CGTKSWSVGDWT.GFKSS.CCNVIS.NKLCV..-VPGNVKPGDA-..........................VI..TTQQAGA.....GIKY.--FCGMTLKFVANIEGVSVW...........
R1AB_MERS1/194-443 ...........d-VTPVDQYMCGVDGKPI..SAYAFLMAKDGITKL.ADveadvaa....raddegfITL.KNNLYRLV.......WHVERK.DVPYPKQSIFTINSVVQKdgveNTPPHYF.tLGCKILTLTPRNKWSGVSDLSLKQKLLYTFYGKESLEN........PTYIYHSAFIE.CGSCGNDSWLTGNAIqGFACG.CGASYTaNDVEV..QSSGMIKPNALLcatcpfakgdscssnckhsvaqlvsyLS..ERCNVIA....dSKSFtLIFGGVAYAYFGCEEGTMYF...........
R1A_CVPPU/110-310 ...........g-AIYVDQYMCGADGKPV..IEG---DFKDYFGDE.DI..................IEF.EGEEYHCA.......WTTVRD.EKPLNQQTLFTIQEIQYN....LDIPHKL..PNCATRHVAPPVKKNSKIVLSEDYKKLYDIFGSPFMGNgdclskcfDTLHFIAATLR.CP-CGSESSGVGDWT.GFKTA.CCGLSG.KVKGV..-TLGDIKPGDA-..........................VV..TSMSAGK.....GVKF.--FANCVLQYAGDVEGVSIW...........
A0AAE8CC16_9NIDO/114-208 ...........n-FIYVDQYLCGADGRPI..RPG--LVFKNYFENG.DD.................vYVE.PGKTYKWA.......WDVERT.PGDF---TLDGILAIKYR....SDVPHKL..RDGTVQGVAACV--------------------------........-----------.---------------.-----.------.-----..------------..........................--..-------.....----.--------------------tpvndttqlvk
A0A891ZAE5_9BETC/201-450 ...........d-AIPVDQYMCGFDGVPI..KPYLDLANKEGLTKL.ADveadvcs....rvdkhgfLIF.KGTTYRVV.......WFTERK.DVDYGKQTLFTVNCVIQRn.gvENVPAHPftLGGQVEQLKPHVAKGNLVGLTLKAKILYTMYGEDAVEE........PSYIYHSAFVD.CGSCNEGKWCTGNAVsGFACE.CGASYSaNEVLL..QSSGLVKPNALFcatcpfakgdrcsleckhtvpqvvsyLS..EKCFVFP....sGKSFvLAFGGALYTYMGCAEGTMYF...........
A0A6B9KDC4_9ALPC/111-315 ............NVVFVDNYMCGADGKPA..VPSEQWSFVDHFDDD.TD.................eVII.DGVTFRHA.......WNTVRA.DDPYEKQGLLSIRSIEYV....SNVPHKL..PNGAALGIAGAPKKRKAVVLDEKYSKLYEACGVPFVTNgksisevvPKPLFLHALVK.CK-CGNESWTVGDWT.SFKTT.CCGFIG.KVTTL..-AVGDVIPGDI-..........................VF..TTPGAGR.....GTKF.--FCGLVLTFVDTLEGISAW...........
R1A_SARS/182-423 ..........vt--RYVDNNFCGPDGYPL..D-----CIKDFLARA.GKsmctlseqldyieskrgvYCC.RDHEHEIA.......WFTERS.DKSYEHQTPFEIKSAKKFdtfkGECPKFVfpLNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CNHCDEVSWQTCDFL.KATCE.HCGTEN.LVIEG.pTTCGYLPTNAVVkmpcpacqdpeigpehsvadyhnhsnIE..TRLRKGG.....RTRC.--FGGCVFAYVGCYNKRAYW...........
A0A1L2KGC3_9ALPC/111-314 ...........n-KIPVDQYMCGYDGKPV..IPAGSWEFKNYFEDG.NE..................ITL.NGVVYYLA.......WQVERK.PLPHANQNLLSITEILYL....SKEQHTL..LPGSILTTAAPPKRSAKVVLSDDWKSLYEECGSPFVNNgttllevvPKPVFLNAFVN.CK-CGNSCWSVGDWT.GYKSA.CCGENA.QRVCV..-VPGEVVAGDI-..........................VV..TSKAAGV.....GVKY.--YTGMTLKFVKECGNVHLW...........
A0A096XNJ3_9ALPC/114-290 ...........n-PIYVDQYLCGPDGTPV..KKG--LEFKDYFMNG.GD..................IYVePGKTYVRV.......WDVERK.QDDL---TLDGILSIKYL....SDKPHKL..RDGAIQGVADAV------------SELNDTNQ------........-MVRFIHAFVS.CP-CGKSAFTVGSWM.GFATV.CCGKIVkTPMCV..KFSGEA--GSIFa.......................lpVG..SRGFSAN.....GKRS.--YAGAEFQFCCELSGVEIW...........
A0A0U1WHK4_SARS/182-423 ..........vt--RYVDNNFCGPDGYPL..D-----CIKDFLARA.GKsmctlseqldyieskrgvYCC.RDHEHEVA.......WFTERS.DKSYEHQTPFEIKSAKKFdtfkGECPKFVfpLNSKVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CNHCDEVSWQTCDFL.KATCEhCGTENS.IAEGP..TTCGYLPTNAVVkmpcpacqdpeigpehsvadyhnhsnIE..TRLRRGG.....RTRC.--FGGCVFAYVGCYNKRAYW...........
A0A6B9KKB5_9ALPC/113-316 ..........gp--VYVDNYMCGANGKPV..LPADVWVFQDYFGEE.TE..................LIV.NGVKHVKV.......WHVTRT.DIPYQFQSLGAIESIEWL....TDIPHTL..RSGSKLSAARAVKHSKNVVLSEPLKTLYQACGSPFVTNgstlreavPKPVFAHAYVA.CK-CGRKSWSVGDWS.GYKST.CCGVFG.KPQCV..-VFGEVVPGDV-..........................FI..TTSSVGS.....GTRY.--YNGLTVKHVVTVDGLACW...........
A0A0U1UZC3_9ALPC/112-317 ..........pp--IYVDNYLCGADGTPV..VQESMWSYTDHFGED.CD.................eITL.CGITYVHA.......WNVQRA.DVPYEQQNVTSIFSIEYL....LDVDHAL..QNGAVLNVASGVKYKKSVVLSEGFKKLYDACGVPAVQNgntlvdilTKPAFFHAIVS.CS-CGLSSYTVGDWKiGFRSL.CCGKRL.EPITV..-VVGDVKPGDI-..........................VV..TSANAGD.....GVRY.--FNGLTLQYVGDWEGVSCW...........
B1PHK0_9ALPC/112-316 .........asp--VYVDNYMCGANGKPV..LPADVWVYQDYFGEE.TE..................LIV.NGVKHVKV.......WHVTRT.DIPYQFQSLGAIESIEWL....TDIPHTL..RNGSRLSAARAVKHSKNVVLSEPLKTLYQACGSPFVTNgstlreavPKPVFAHAYVA.CK-CGRKAWSVGDWS.GYKST.CCGVFG.KPQCV..-VFGEVVPGDV-..........................FI..TTSSVGS.....GTRY.--YNGLTVKHVVTVDGLACW...........
A0AAE8CC16_9NIDO/195-288 acvtpvndttql-----------------..---------------.--..................---.--------.......------.------------------....-------..--------------------------------------........--VKFIHAFVV.CP-CGKGSFTVGSWR.GYTTM.CCGVVIkQPVCV..KFSGLA--GSIF..........................ALplGSRSVG-.....SSKF.--YAGCYFEYCCDFSGVEVW...........
A0A240FW17_9ALPC/111-292 ...........k-VVYVDNYLCGNNGKPV..VPKDKWKILSK-GQQ.G-..................LLA.DNVYYKVV.......WDVKRD.DVPYEKQNMSSIVSIRYL....IDIPHFL..ADGAVREKKRPPQD---------YTTM-LVKGFPFLMA........YDWKFVNHAVK.CGKCDNHVVEAGAFE.SVITS.CCRDEI.VHQGV..-V--TAKAGEL-..........................VL..TPLS---.....NKKL.ILVGSTVLRNIGTAHNLSIW...........
A0AAE9BUP5_9ALPC/112-317 ..........pp--VYVDNYLCGSDGNPV..VAENMWSFIDHFEDGlDE..................IVV.CGITYVHA.......WNVERF.DVPYEQQNITTIKSIDYL....LDVDHKL..QNGAKYSAVQPAKYKKSVVLSEAFKPLYDACGSPFVQNgttlvdiiANPKFFHAIVE.CN-CGRSSYTVGDWTkGYSSV.CCGKRC.EPLVV..-VTGNVKPGDI-..........................VL..TSTATGT.....GVRY.--YEGLTMQFVGEFEHLNCW...........
R1A_SARS2/182-423 ..........yt--RYVDNNFCGPDGYPL..E-----CIKDLLARA.GKasctlseqldfidtkrgvYCC.REHEHEIA.......WYTERS.EKSYELQTPFEIKLAKKFdtfnGECPNFVfpLNSIIKTIQPRVEKKKLDGFMGRIRSVYPVASPNE---........CNQMCLSTLMK.CDHCGETSWQTGDFV.KATCE.FCGTENlTKEGA..TTCGYLPQNAVVkiycpachnsev..gpehslaeyhneSG..LK----Til.rkGGRT.IAFGGCVFSYVGCHNKCAYW...........
B0LJR0_9ALPC/110-310 ...........g-AIYVDQYMCGADGKPV..IDG---EFRDYFGDE.DV..................IIY.EGEEYHCA.......WLTVRD.EKPLCQQTLLTIREIQYN....LDIPHKL..PNCAIREVAPPVKKNSKVVLSEEYRKLYDIFGSPFMGNgdslnkcfDSLHFIAATLK.CP-CGAESSGVGDWT.GFKTA.CCGLLG.KVKGV..-TLGAVKPGDA-..........................VV..TSMSAGK.....GVKF.--FANSVLQYAGDVENVSVW...........
B0LJQ9_9ALPC/110-310 ...........g-AIYVDQYMCGADGKPV..IDG---EFRDYFGDE.DV..................IIY.EGEEYHCA.......WLTVRD.EKPLCQQTLLTIREIQYN....LDIPHKL..PNCAIREVAPPVKKNSKVVLSEEYRKLYDIFGSPFMGNgdslnkcfDSLHFIAATLK.CP-CGAESSGVGDWT.GFKTA.CCGLLG.KVKGV..-TLGAVKPGDA-..........................VV..TSMSAGK.....GVKF.--FANSVLQYAGDVENVSVW...........
R1A_BCHK9/191-395 ...........l-VEPVMKLLGVIKSDFT..LEQLLAALGKYRTED.G-..................YDL.PDGYVKVA.......IKVGRK.AVPVLKQSIFTVVGVTEQlvpgYYYPFS-..TSSVVEHTKPTRGGPVGKTVEAVMLSLYGTNN------........YNPATPVARLK.CSYCDYYGWTPLKDIgTVNCL.CGAEFQlTSSCVdaESAGVIKPGCVM..........................LL..DKSPGMRl..ipGNRTyVSFGGAIWSPIGKVNGVTVW...........
A0A915V9U8_9BETC/196-445 ..........df--IPIDQFMCGKDGAPV..PDYATLAASENLISL.ADvatdvsa....radsdgyIDF.KSKLYRIV.......WHVERK.NVPYAKQTIFTINSVVQRd.giEDVPPHTftLGGKVDLIVPRNKWTGKTALNLKQKILYTFYGKDALDN........HSYIYHSAYAD.CTSCGKGSWLTGNAVqGFACD.CGAQYSaNDVEL..QSSGVVNPNAIFcatcpfakgdscsssckhtlaqmvsqLS..EKCDVAP....dGKSFtLAFGGVVYAYLGCLDGTMYF...........
A0A2Z4EVM4_9BETC/190-394 ..........lv--KPIMDLLGPLKSGYT..LANLLDDLAPYKCDD.G-..................YEL.PTGTVCVA.......FEVVRK.NVPAAKQNIFTVQGVLNQlvpgIYYPYS-..SGSKVVTTKPARDSPAAKTVSSIMLSLYGTAQ------........YAPVTPVARIA.CPTCGFLGWLPLKDAgTVVCG.CNATYNmTSTAVqaESSGFIRQGAVL..........................CL..EKGEAMRli.pgGRTY.LAFGGAIWSPIGKDKDVTVW...........
A0A2R4QKW4_9ALPC/111-312 ...........t-VVYVDQFLCGADGKPV..RQG---EMKDYFGDL.ED..................IVI.DGITYTHA.......WDVVRDmEVPHAKQTALTIQSIMYL....MDVDHKI..VNGATRQRAAPVKISSKVCLTEPYNSLYKQFGSPYMHNgsnlnecfSKLNFIVANVK.CK-CGGESSGVGDWT.GFKSA.CCGTPG.KVIGV..-SIGDASVGEA-..........................VI..TSKGCGT.....GTKF.--YAGAVLKFVGDAEGVSVW...........
K4KCJ9_9ALPC/111-315 ...........t-TVFVDNFLCGANGLPA..CSEQEWEFKDHFGEL.DE..................VTI.NGTTFVKA.......WNVDRT.PGPYSTQNLLSINSISWC....GEIPHSL..ADGSIRRVAKVVKKSKSVLLGKQFQQLYDSVGSPFVTNgknlsdvlVKPIYCHALVK.CQ-CGKTSWTVGDWS.CYKSM.CCGFNC.KPLAI..-VNGEVVPGDV-..........................LV..TSDKVSA....sGTKY.--YNGMVLKFVDKIDNACLW...........
A0A0K1YZY7_SARS/182-423 ..........vt--RYVDNNFCGPDGYPLecIKGLLARAGKSMCTL.SEqldfi.......eskrgvYCC.REHEHEIA.......WYTERS.DKSYEHQTPFDIKSAKKFdtfkEECPKFVfpLNSTVKVIQPRVEKKKTEGFMGRIRSVYPVASP---QE........CNNMHLSTLMK.CSHCDEVSWQTCDFL.KATCE.HCGTENlVVEGP..TTCGYLPINAVVkmpcpacqnkevgpehsvadyhnysnIE..TRLRKGG.....RTKC.--FGGCVFSYVGCYNKRAYW...........
A0A0U1UZA8_9ALPC/111-318 ..........ts--IPVDNYMCGANGKPV..LPEDMWCFCDYFGDD.GD.................nITV.NGQAYHKA.......WNVTRS.DVPYQFQNASTILSIEYL....ADEKHVL..PDGAVAKTAKPPKFSKNIVLSEKYKALYDACGSPFVTNgtnvlevvTNPIFAHGFVQ.CK-CGSKHWTTGDWA.GFKSV.CCGIPG.RVLCT..-VFGGVAPGSV-..........................LL..TSTRVDAs..pgAARY.--YHGLTLKHICNVDGVACW...........
#=GC seq_cons ...........s..haVDpYhCGsDGcPl..h.t..hphpDahsct.s-..................lsl.sstpaphA.......WpVpRs.-hPYppQolhoIpuIphh....t-hPHpl..hsuslhplsssscpspphslstphppLYshhGsshhpp........spshahsAhlc.Cs.CGppSWssGDas.uapss.CCGhhs.pshsl...ssG.lhsGsl...........................ll..Tptssus.....Gs+a...auGhlhpalGshcGlshW...........
//