#=GF ID SUB1_ProdP9
#=GF AC PF18213.5
#=GF DE SUB1 protease Prodomain ProdP9
#=GF AU Smart A;0000-0002-6965-5633
#=GF SE ECOD:EUF03039
#=GF GA 25.00 25.00;
#=GF TC 25.80 25.10;
#=GF NC 24.80 23.60;
#=GF BM hmmbuild HMM.ann SEED.ann
#=GF SM hmmsearch -Z 75585367 --cpu 4 -E 1000 HMM pfamseq
#=GF TP Domain
#=GF RN [1]
#=GF RM 24785947
#=GF RT The malaria parasite egress protease SUB1 is a calcium-dependent
#=GF RT redox switch subtilisin.
#=GF RA Withers-Martinez C, Strath M, Hackett F, Haire LF, Howell SA,
#=GF RA Walker PA, Christodoulou E, Dodson GG, Blackman MJ;
#=GF RL Nat Commun. 2014;5:3726.
#=GF DR INTERPRO; IPR041089;
#=GF DR SO; 0000417; polypeptide_domain;
#=GF CC This domain is the bound prodomain fragment ProdP9 of the SUB1
#=GF CC protein present in Plasmodium falciparum. SUB1 is a serine
#=GF CC protease that processes a subset of parasite proteins that play
#=GF CC indispensable roles in egress and invasion. The C-terminal stalk
#=GF CC of ProdP9 binds in the active site groove in a substrate-like
#=GF CC manner and is truncated at the N terminus as a result of the
#=GF CC chymotrypsin digestion step used during purification. ProdP9 is
#=GF CC structural similar to MIC5 from Toxoplasma gondii, despite low
#=GF CC sequence identity [1].
#=GF SQ 27
#=GS A0A0L1IEY1_PLAFA/144-223 AC A0A0L1IEY1.1
#=GS A0A653H707_9APIC/133-212 AC A0A653H707.1
#=GS A0A1J1HAX9_PLARL/118-197 AC A0A1J1HAX9.1
#=GS A0A024XCT6_PLAFC/141-220 AC A0A024XCT6.1
#=GS A0A1D3U8X6_9APIC/121-200 AC A0A1D3U8X6.1
#=GS A0A1A8VVU6_9APIC/121-200 AC A0A1A8VVU6.1
#=GS Q7RGL7_PLAYO/116-195 AC Q7RGL7.1
#=GS SUB1_PLAF7/138-217 AC Q8I0V0.1
#=GS A0A024VIT3_PLAFA/96-175 AC A0A024VIT3.1
#=GS A0A024WBB7_PLAFA/143-222 AC A0A024WBB7.1
#=GS A0A1Y1JGV4_PLAGO/122-201 AC A0A1Y1JGV4.1
#=GS W7JH37_PLAFA/139-218 AC W7JH37.1
#=GS K6UDQ1_PLACD/123-202 AC K6UDQ1.1
#=GS A0A509AM03_PLABA/116-195 AC A0A509AM03.1
#=GS A0A0L1I7Y3_PLAFA/144-223 AC A0A0L1I7Y3.1
#=GS SUB1_PLAFO/138-217 AC W7K9M0.1
#=GS A0A4Y2L115_ARAVE/90-162 AC A0A4Y2L115.1
#=GS A0A1A8YZI9_9APIC/121-200 AC A0A1A8YZI9.1
#=GS A0A024WUI1_PLAFA/141-220 AC A0A024WUI1.1
#=GS A0A0L7K723_PLAFX/140-219 AC A0A0L7K723.1
#=GS W4IU16_PLAFP/141-220 AC W4IU16.1
#=GS A0A0L0CTV0_PLAFA/151-230 AC A0A0L0CTV0.1
#=GS A0A384KKS5_PLAKH/122-201 AC A0A384KKS5.1
#=GS A5KB03_PLAVS/123-202 AC A5KB03.1
#=GS A0A1A8W494_PLAMA/120-199 AC A0A1A8W494.1
#=GS A0A0L7M2G5_PLAF4/1-37 AC A0A0L7M2G5.1
#=GS A0A0L7LXW7_PLAF4/140-219 AC A0A0L7LXW7.1
A0A0L1IEY1_PLAFA/144-223 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A653H707_9APIC/133-212 ....LRLIVSENHATTPSFFEE.SLLQEDVI..NFIHSKGKVFHLPNMKFMLIDLNSNTNDEELELYINTLENKGAHVEPDQLVGGD.......
A0A1J1HAX9_PLARL/118-197 ....LRLIVSENHSTTPSFFEE.SLLQEDVI..SLIESKGKLSNLPSLKSAIIDLNDDTTDKELEAYITTLEKKGALVESDKLVGAD.......
A0A024XCT6_PLAFC/141-220 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A1D3U8X6_9APIC/121-200 ....LRLIVSENHSTSPSFFEE.SLLQEDVI..SFIQSKGTLSNLKNLKSVIIDLNSETTDEELESYIKMLEQKGALIESDKLVGAD.......
A0A1A8VVU6_9APIC/121-200 ....LRLIVSENHSTSPSFFEE.SLLQEDVI..SFIQSKGTLSNLKNLKSVIIDLNSETTDEELESYIKMLEQKGALIESDKLVGAD.......
Q7RGL7_PLAYO/116-195 ....LRLIVSENHATTPSFFEE.SIIQEDFM..SFIQSKGEIVNLKNIKSMIIELNSDMTDKELETYITLLKKKGAHVESDELVGAD.......
SUB1_PLAF7/138-217 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A024VIT3_PLAFA/96-175 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A024WBB7_PLAFA/143-222 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A1Y1JGV4_PLAGO/122-201 ....LRLLVSENHKTSPSFFEE.SLLQEDVL..SFIQSKGTLSNLKNIKSVIIELNTDTTDEELEEYIKTLENKGALIESDKLVGAD.......
W7JH37_PLAFA/139-218 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
K6UDQ1_PLACD/123-202 ....LRLIVSENHATSPSFFEE.SLLQEDVM..SFIQSKGKLANLKNLKSIIIDLNDDMTDEELAEYISMLERKGALIESDKLVGAD.......
A0A509AM03_PLABA/116-195 ....LRLIVSENHATSPSFFEE.SLIQEDFM..SFIQSKGEIVNLKNLKSMIIELNSDMTDKELEAYITLLKKKGAHVESDELVGAD.......
A0A0L1I7Y3_PLAFA/144-223 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
SUB1_PLAFO/138-217 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A4Y2L115_ARAVE/90-162 aass------TSTAVDPSTFHEaAILDDDIVrySKVKKKGYLQIVTNLGPLNIELHCDMTPKTCENFIKLSK---------------sgyyent
A0A1A8YZI9_9APIC/121-200 ....LRLIVSENHSTSPSFFEE.SLLQEDVI..SFIQSKGTLSNLKNLKSVIIDLNSETTDEELESYIKMLEQKGALIESDKLVGAD.......
A0A024WUI1_PLAFA/141-220 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A0L7K723_PLAFX/140-219 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
W4IU16_PLAFP/141-220 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A0L0CTV0_PLAFA/151-230 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A384KKS5_PLAKH/122-201 ....LRLIVSENHATSPSFFEE.SLLQDEVM..SFIQSKGKLSNLKNLKSIIIDLNGDMTDEELAEYINMLEKKGALIESDKLVGAD.......
A5KB03_PLAVS/123-202 ....LRLIVSENHATSPSFFEE.SLLQEDVV..SFIQSKGKLSNLKNLKSMIIDLNSDMTDEELAEYISLLERKGALIESDKLVGAD.......
A0A1A8W494_PLAMA/120-199 ....LRLIVSENHSTSPSFFEE.SLLEEEVV..SFLQSKGKLSNLKNIKSLIIDLNNDTSDEELEKYIKKLEEKGAHVESDKLVGAD.......
A0A0L7M2G5_PLAF4/1-37 ....------------------.--------..-----------------MIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
A0A0L7LXW7_PLAF4/140-219 ....LRLIVSENHATTPSFFQE.SLLEPDVL..SFLESKGNLSNLKNINSMIIELKEDTTDDELISYIKILEEKGALIESDKLVSAD.......
#=GC seq_cons ....LRLIVSENHAToPSFFpE.SLLp.DVl..SFlpSKGsLSNLKNlpSMIIELppDTTD-ELhSYIKlLEcKGALIESDKLVuAD.......
//