#=GF ID bCoV_NSP3_N
#=GF AC PF12379.11
#=GF DE Betacoronavirus replicase NSP3, N-terminal
#=GF PI DUF3655; Corona_NSP3a;
#=GF AU Gavin OL;
#=GF AU Chuguransky S;0000-0002-0520-0736
#=GF SE Prosite
#=GF GA 26.70 26.70;
#=GF TC 28.50 158.60;
#=GF NC 24.70 23.20;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch -Z 61295632 -E 1000 --cpu 4 HMM pfamseq
#=GF TP Family
#=GF RN [1]
#=GF RM 18367524
#=GF RT Proteomics analysis unravels the functional repertoire of
#=GF RT coronavirus nonstructural protein 3.
#=GF RA Neuman BW, Joseph JS, Saikatendu KS, Serrano P, Chatterjee A,
#=GF RA Johnson MA, Liao L, Klaus JP, Yates JR 3rd, Wuthrich K, Stevens
#=GF RA RC, Buchmeier MJ, Kuhn P;
#=GF RL J Virol. 2008;82:5279-5294.
#=GF RN [2]
#=GF RM 31776274
#=GF RT Nucleocapsid Protein Recruitment to Replication-Transcription
#=GF RT Complexes Plays a Crucial Role in Coronaviral Life Cycle.
#=GF RA Cong Y, Ulasli M, Schepers H, Mauthe M, V'kovski P, Kriegenburg
#=GF RA F, Thiel V, de Haan CAM, Reggiori F;
#=GF RL J Virol. 2020; [Epub ahead of print]
#=GF RN [3]
#=GF RM 23943763
#=GF RT Severe acute respiratory syndrome coronavirus nonstructural
#=GF RT proteins 3, 4, and 6 induce double-membrane vesicles.
#=GF RA Angelini MM, Akhlaghpour M, Neuman BW, Buchmeier MJ;
#=GF RL mBio. 2013; [Epub ahead of print]
#=GF RN [4]
#=GF RM 17728234
#=GF RT Nuclear magnetic resonance structure of the N-terminal domain of
#=GF RT nonstructural protein 3 from the severe acute respiratory
#=GF RT syndrome coronavirus.
#=GF RA Serrano P, Johnson MA, Almeida MS, Horst R, Herrmann T, Joseph
#=GF RA JS, Neuman BW, Subramanian V, Saikatendu KS, Buchmeier MJ,
#=GF RA Stevens RC, Kuhn P, Wuthrich K;
#=GF RL J Virol. 2007;81:12049-12060.
#=GF DR INTERPRO; IPR024358;
#=GF DR SO; 0100021; polypeptide_conserved_region;
#=GF CC This domain family corresponds to the N-terminal domain of NSP3
#=GF CC (non-structural protein 3, also known as nsp3) found in
#=GF CC Betacoronavirus, which is encoded on the replicase polyprotein.
#=GF CC This family includes the NSP3a domain, which has the
#=GF CC ubiquitin-like 1 (UB1) and glutamic acid-rich acidic (AC)
#=GF CC hypervariable domains [1]. NSP3a interacts with numerous other
#=GF CC proteins involved in replication and transcription and may serve
#=GF CC as a scaffolding protein for these processes. The N-terminal
#=GF CC NSP3a domain interacts with N (nucleocapsid) protein to
#=GF CC colocalise genomic RNA with the nascent replicase-transcriptase
#=GF CC complex at the earliest stages of infection, essential for the
#=GF CC virus [2,3]. The C-terminal Glu-rich subdomain is best described
#=GF CC as a flexible tail attached to the globular UB1 subdomain [4].
#=GF CC The family is found in association with Pfam:PF08716,
#=GF CC Pfam:PF01661, Pfam:PF05409, Pfam:PF06471, Pfam:PF08717,
#=GF CC Pfam:PF06478, Pfam:PF09401, Pfam:PF06460, Pfam:PF08715,
#=GF CC Pfam:PF08710.
#=GF SQ 17
#=GS Q6UZF5_SARS/881-1029 AC Q6UZF5.1
#=GS Q6UZF1_SARS/881-1029 AC Q6UZF1.1
#=GS U5WI49_SARS/881-1029 AC U5WI49.1
#=GS Q5DIC6_SARS/881-1029 AC Q5DIC6.1
#=GS A0A0K1Z0N1_SARS/881-1029 AC A0A0K1Z0N1.1
#=GS R1A_SARS/881-1029 AC P0C6U8.1
#=GS R1AB_SARS/881-1029 AC P0C6X7.1
#=GS R1AB_SARS/881-1029 DR PDB; 2ACF A; 184-211;
#=GS R1AB_SARS/881-1029 DR PDB; 2ACF C; 184-211;
#=GS R1AB_SARS/881-1029 DR PDB; 2FAV A; 2-30;
#=GS R1AB_SARS/881-1029 DR PDB; 2GRI A; 63-112;
#=GS R1AB_SARS/881-1029 DR PDB; 2FAV C; 3-30;
#=GS R1AB_SARS/881-1029 DR PDB; 2IDY A; 63-112;
#=GS R1AB_SARS/881-1029 DR PDB; 2FAV B; 3-30;
#=GS R1AB_SARS/881-1029 DR PDB; 2ACF B; 184-211;
#=GS R1AB_SARS/881-1029 DR PDB; 2ACF D; 184-211;
#=GS R9QTH2_SARS/881-1030 AC R9QTH2.1
#=GS Q5DIC7_SARS/881-1029 AC Q5DIC7.1
#=GS R1A_SARS2/880-1051 AC P0DTC1.1
#=GS R1AB_SARS2/880-1051 AC P0DTD1.1
#=GS R1AB_SARS2/880-1051 DR PDB; 5S27 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z6I D; 206-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S29 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6WOJ C; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1Q A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S28 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z5T B; 206-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1E A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1Y B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1W B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1O B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1M B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 7CZ4 B; 4-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S20 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z5T A; 206-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1Q B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S28 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S24 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6WOJ A; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S29 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S18 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1W A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1S B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6WEY A; 207-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z72 A; 206-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1U A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S27 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1I B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 7C33 D; 4-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1G A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 7C33 C; 4-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S2C B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1U B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S18 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S20 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S2C A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1E B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6WOJ B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z72 C; 206-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1G B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 7C33 B; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S24 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S2B A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1M A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1C A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1I A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6WEN A; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z6I B; 207-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1S A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 7KAG A; 62-111;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S74 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1C B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z72 B; 207-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 7C33 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6WOJ D; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S2A B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S26 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1K B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1A A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z6I A; 207-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 7KAG B; 62-111;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S26 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S73 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S74 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S22 B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1K A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S73 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1A B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1Y A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S1O A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 7CZ4 A; 4-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z6I C; 206-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S2B B; 3-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 6Z72 D; 207-233;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S22 A; 5-29;
#=GS R1AB_SARS2/880-1051 DR PDB; 5S2A A; 5-29;
#=GS R1AB_BC279/881-1027 AC P0C6V9.1
#=GS R1A_BC279/881-1027 AC P0C6F5.1
#=GS A0A0U1WJY1_SARS/881-1027 AC A0A0U1WJY1.1
#=GS A0A0K1YZY7_SARS/881-1029 AC A0A0K1YZY7.1
#=GS R9QTB2_SARS/881-1022 AC R9QTB2.1
#=GS U5WLB9_SARS/881-1029 AC U5WLB9.1
Q6UZF5_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEENFSSRMYCSFYPPDEEEEDDAECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVRVEEEEEEDWLDDTTEQ.......S............EIEP..EPEPTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
Q6UZF1_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEENFSSRMYCSFYPPDEEEEDDAECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVRVEEEEEEDWLDDTTEQ.......S............EIEP..EPEPTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
U5WI49_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEEKLSSRMYCSFYPPDDEEDCDEYDEEEEvL.EESCAHEYGTEEDYQGLSLEFGASTE-MQVEEEEEEDWLGDATEL.......S............EHEP..EPELTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQ-n
Q5DIC6_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEENFSSRMYCSFYPPDEEEEDDAECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVRVEEEEEEDWLDDTTEQ.......S............EIEP..EPEPTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
A0A0K1Z0N1_SARS/881-1029 VKTLQPVSDLLTEMGVVLDEWSVATFYLFDDAGEENLSSRMYCSFYPPDEEEEDDVECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVQVEEEEEEDWLDDTTEQ.......S............EIEP..EPESTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
R1A_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEENFSSRMYCSFYPPDEEEEDDAECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVRVEEEEEEDWLDDTTEQ.......S............EIEP..EPEPTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
R1AB_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEENFSSRMYCSFYPPDEEEEDDAECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVRVEEEEEEDWLDDTTEQ.......S............EIEP..EPEPTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
#=GR R1AB_SARS/881-1029 SS HHTTXSXHHHHHHHTXXHHHHTTSXXEEEXSSSSSXXSSBXEEESSXSXXXXXXXXXXXXXX.X.XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX.......X............XXXX..XXXXXX...XX-S----S-EESSSSEEEEES-HHHHHHH.
R9QTH2_SARS/881-1030 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDSGEENLSSRMYCSFYPPDEEEEGDAECEEEE.IaDETCEHEYGTEDDYQGLPMEFGASTETVQVEEEEEEDWLDDTTEQ.......S............EIEP..EPEPTS...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQ-n
Q5DIC7_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEENFSSRMYCSFYPPDEEEEDDAECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVRVEEEEEEDWLDDTTEQ.......S............EIEP..EPEPTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
R1A_SARS2/880-1051 IKTLQPVSELLTPLGIDLDEWSMATYYLFDESGEFKLASHMYCSFYPPDEDEE-EGDCEEEE.F.EPSTQYEYGTEDDYQGKPLEFGATSAALQPEEEQEEDWLDDDSQQtvgqqdgSednqtttiqtivEVQPqlEMELTPvvqTIEVNSFSGYLKLTDNVYIKNADIVEEAK-k
R1AB_SARS2/880-1051 IKTLQPVSELLTPLGIDLDEWSMATYYLFDESGEFKLASHMYCSFYPPDEDEE-EGDCEEEE.F.EPSTQYEYGTEDDYQGKPLEFGATSAALQPEEEQEEDWLDDDSQQtvgqqdgSednqtttiqtivEVQPqlEMELTPvvqTIEVNSFSGYLKLTDNVYIKNADIVEEAK-k
#=GR R1AB_SARS2/880-1051 SS HHHHCCCHCCCTTTTXXHHHHTTSXXEEEXTTSXSSXXSEEEEESSXSXXXXX-XXXXXXXX.X.XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXTS---S-EESSSSEEEEES-HHHHHH-H
R1AB_BC279/881-1027 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEEKLSSRMYCSFYPPDEEEDCEEYEDEEE.IpEETCEHEYGTEDDYKGLPLEFGASTEIQQVDEEEEEDWLEEAI--.......-............AAKP..EPEPLP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQ-h
R1A_BC279/881-1027 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEEKLSSRMYCSFYPPDEEEDCEEYEDEEE.IpEETCEHEYGTEDDYKGLPLEFGASTEIQQVDEEEEEDWLEEAI--.......-............AAKP..EPEPLP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQ-h
A0A0U1WJY1_SARS/881-1027 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEEKLSSRMYCSFYPPDEEEDCEEYEDEED.IpEETCEHEYGTEDDYKGLPLEFGASTEAQQVDEEEEEDWLEEAI--.......-............AAEP..EPVPLP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
A0A0K1YZY7_SARS/881-1029 VKTLQPVSDLLTEMGVVLDEWSVATFYLFDDAGEENLSSRMYCSFYPPDEEEEDDVECEEEE.I.DETCEHEYGTEDDYQGLPLEFGASAETVQVEEEEEEDWLDDTTEQ.......S............EIEP..EPESTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
R9QTB2_SARS/881-1022 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEEKLSSRMYCSFYPPDEEEECEEYEEEEE.VpEQTCEHEYGTEDDYKGLPLEFGAST--QQVDEEEEEDWLD-----.......-............EAEP..EPESLS...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQS.
U5WLB9_SARS/881-1029 VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEEKLSSRMYCSFYPPDDEEDCDEYDEEEEvL.EESCAHEYGTEEDYQGLSLEFGASTE-MQVEEEEEEDWLGDATEL.......S............EHEP..EPELTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQ-n
#=GC SS_cons HHCCCCCHCCCCCCTXXHHHHTTSXXEEEXTTSSSSXSSEEEEESSXSXXXXX-XXXXXXXX.X.XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXTS---S-EESSSSEEEEES-HHHHHHHH
#=GC seq_cons VKTLQPVSDLLTNMGIDLDEWSVATFYLFDDAGEEpLSSRMYCSFYPPDEEEEsDs-CEEEE.I.-ETCEHEYGTEDDYQGLPLEFGASsEslQVEEEEEEDWLDDsTEQ.......S............ElEP..EPEsTP...EEPVNQFTGYLKLTDNVAIKCVDIVKEAQ..
//