# STOCKHOLM 1.0 #=GF ID RP1-2 #=GF AC PF12042.9 #=GF DE Tubuliform egg casing silk strands structural domain #=GF AU Mistry J;0000-0003-2479-5322 #=GF AU Gavin OL; #=GF SE pdb_2k3n #=GF GA 21.10 21.10; #=GF TC 23.30 23.60; #=GF NC 19.90 20.90; #=GF BM hmmbuild HMM.ann SEED.ann #=GF SM hmmsearch -Z 47079205 -E 1000 --cpu 4 HMM pfamseq #=GF TP Domain #=GF RN [1] #=GF RM 19458259 #=GF RT Solution structure of eggcase silk protein and its implications #=GF RT for silk fiber formation. #=GF RA Lin Z, Huang W, Zhang J, Fan JS, Yang D; #=GF RL Proc Natl Acad Sci U S A. 2009;106:8906-8911. #=GF DR INTERPRO; IPR021915; #=GF DR SO; 0000417; polypeptide_domain; #=GF CC Spiders use fibroins to make silk strands. This family includes #=GF CC tubuliform silk fibroins which are used to protect egg cases. #=GF CC This domain is a structural domain which is found in repeats of #=GF CC up to 20 in many individuals (although this is not necessarily #=GF CC the case). RP1 makes up structural domains in the N terminal #=GF CC while RP2 makes up structural domains in the C terminal. [1] #=GF SQ 38 #=GS A0A087URD1_9ARAC/3529-3695 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/1398-1565 AC A0A087URD1.1 #=GS A0A087TBY8_9ARAC/1504-1662 AC A0A087TBY8.1 #=GS A0A087URD1_9ARAC/623-793 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/2175-2345 AC A0A087URD1.1 #=GS A0A087U004_9ARAC/192-357 AC A0A087U004.1 #=GS A0A087URD1_9ARAC/816-983 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/1013-1177 AC A0A087URD1.1 #=GS A0A087TBY8_9ARAC/899-1066 AC A0A087TBY8.1 #=GS A0A087URD1_9ARAC/2945-3114 AC A0A087URD1.1 #=GS A0A087TBY8_9ARAC/1102-1274 AC A0A087TBY8.1 #=GS A0A087TBZ4_9ARAC/231-382 AC A0A087TBZ4.1 #=GS A0A087URD1_9ARAC/1790-1953 AC A0A087URD1.1 #=GS A0A087U004_9ARAC/834-991 AC A0A087U004.1 #=GS A0A087UQ25_9ARAC/559-680 AC A0A087UQ25.1 #=GS A0A087URD1_9ARAC/235-407 AC A0A087URD1.1 #=GS A0A087U004_9ARAC/3231-3394 AC A0A087U004.1 #=GS A0A087U004_9ARAC/683-839 AC A0A087U004.1 #=GS A0A087UJV0_9ARAC/60-194 AC A0A087UJV0.1 #=GS A0A087U004_9ARAC/3895-4061 AC A0A087U004.1 #=GS A0A087URD1_9ARAC/433-595 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/3723-3886 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/2561-2752 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/1589-1758 AC A0A087URD1.1 #=GS A0A314KSL0_NICAT/10-90 AC A0A314KSL0.1 #=GS A0A087TBY8_9ARAC/696-874 AC A0A087TBY8.1 #=GS A0A087URD1_9ARAC/1979-2146 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/3336-3501 AC A0A087URD1.1 #=GS A0A087TBY8_9ARAC/1301-1462 AC A0A087TBY8.1 #=GS A0A087URD1_9ARAC/1203-1372 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/3139-3306 AC A0A087URD1.1 #=GS A0A087UPZ6_9ARAC/42-158 AC A0A087UPZ6.1 #=GS A0A087U004_9ARAC/1772-1936 AC A0A087U004.1 #=GS A0A087TBY8_9ARAC/334-498 AC A0A087TBY8.1 #=GS A0A087URD1_9ARAC/2754-2919 AC A0A087URD1.1 #=GS A0A087URD1_9ARAC/3911-4079 AC A0A087URD1.1 #=GS A0A087TBY8_9ARAC/522-695 AC A0A087TBY8.1 #=GS A0A087URD1_9ARAC/2362-2532 AC A0A087URD1.1 A0A087URD1_9ARAC/3529-3695 ...............ypapsg--------AAVPSRV.................ISEVANKLASALLRSSVFQRAFNTRVSSSVANRIASALAQSIASSLQLDyATASKCRNAIMQALSG.VRSGSDTSVYALAIASALAGQLAATGRLS..ASNAS.GIGSSLLSGVVQGSYSGARQAGV.......DLSGVDVSSDISSSLSAYGADSSAGQDIAP-s........................... A0A087URD1_9ARAC/1398-1565 ..................dyg-----APSAGAAPSV.................VSDVANTLASGLLTSNAFQRAFNSRISSSVANRIAAALAQSVASSMQLDyGTASKCRNAIMQALSS.VRSGSDTRVYALTIASSLATQLANAGVLN..ASNMS.SIGSSLLSSVVQGAYSGARQAGI.......DVSGIDVSSDISSSISAYGG-----------srtggqetgist................ A0A087TBY8_9ARAC/1504-1662 .......qdatsaastaagga--------------Qvagtss....tatdigvISKFTNTVSSSLLSSNDFTSIFGSGLPVTTAFNLASNLAQSLATQIGLDeAGINSLLSLLSQYISA.IGSSADASAYANALSLAIGNTLAKAGNLS..PILTA.SLASADAQPIANLVNSVTSSTL-.......-------------------------------iaqqpnlir................... A0A087URD1_9ARAC/623-793 ..............ygalsgg---------AVPSAV.................ISDVANNLASALLRSNIFQRSFNARISASVANRIAAALAQSIASSFQLDyATASKCRNAIMQALSS.VRSGSDTRTYATAIATTLASQLAAAGRLN..TSNAS.GIGTTLLSGVLQGAYSGARQAGV.......DVSGVDVSTDISSSVSAY-------------aggpaagqvpamsaqya........... A0A087URD1_9ARAC/2175-2345 ............gepsaavlp------------SSI.................ISDVANNLASALLRSNIFQRAFNARISSSVANRIAAALAQSISSSMQLDyATASKCRNAIMQALSG.VRSGSDTRVYALAIASALVAQLAAAGRLN..ASNAS.GIGSSVLPGVVQGAYSGARQAGV.......DVTGVDLSSDISSSISAFGGSSIGGQGI---aaapqfae.................... A0A087U004_9ARAC/192-357 ...............aastdk-----ETTSQQVTSA.................SSSFIEQLYNALINDSGFQSAFSGTVSTNIINAFATAIAGSVASASEFSsVGYSSLVKAYLQALSS.EKDGATIEDYARAIATATSNVLEQNGIFS..EGVAS.GHITAAVNAITSGISSTHITESA.......VTTTSV--GSQTTVSSDAG------------tssgvghipa.................. A0A087URD1_9ARAC/816-983 ................dygap------SSGAVPSSL.................ISDVANNIASALLRSNIFQRAFNARVSTSVANRIAVALTQSIASTFQLDyGTASKCRNAVMQALSS.VRSGSDTRVYALAIASALAAQLAAAGRLN..ASNAS.SIGSSLLSGVVQGAYSGARQAGV.......DVSGVDVSSDISSSISAYGAGSAAGQD----ivaa........................ A0A087URD1_9ARAC/1013-1177 .............apapgvap------------SGV.................ISDVANNLASALLRSNIFQRAFNARVSSSVANRISAALAQTIASSLQLDyATAVKCRNAIMQAISG.VRSGSDTRAYALAIASALAAQLGNAGRLN..ASNAS.GIGSSLLSGVVQGAYSGARQAGV.......DMSGVDVSSDISSSISAYSAG----------ptagqvpavt.................. A0A087TBY8_9ARAC/899-1066 ...................pg----QSASAAASAAAgggqgvgtsstttdidvISKFTNAITSTLLSSNDFTSLFKSGLPVTAAVNLASNLALSLANQIGLDqAGINSLLSLLSQYIST.IDSSADASAYANALSLAIVNTLANAESLS..PTLAS.YLASADTQPFANFVSSVTSRTL-.......-------------------------------naqqpkivrngrtssf............ A0A087URD1_9ARAC/2945-3114 .........adfsvasggalp------------SDV.................ISDVANNLASALLRSNVFQRSFNPRVSSSVTNRIAAALAQSICTSLQLDyRTASKCRSAIMQALSS.VRTGSDTRVYALAIASALAAQLAASGRLN..ASNAS.SIGSSLLSGVVQGAYSGARQAGV.......DVSGVDVSTDISSSISAYGAGSTAAQDISA-aa.......................... A0A087TBY8_9ARAC/1102-1274 .............qgaiaaas--------AAAGGAQvagtsn....satdidvISKFINTISSSLLSSNDFTSIFGSGLPVTSALNLASNLAHSLATQIGLDeAGINSLLSLLSQYISA.IDSSADASAYANALSLAIGSTLASAGSLS..PALAS.SLASADTQRIANFVSSVTSRTLN.......-------------------------------tqqpnlvrsgvastfrnaplaa...... A0A087TBZ4_9ARAC/231-382 ............ymstdeiqk---------------.................AKKFSETLFVALLKSNLFRETFVRTISKVRAQYLAFKMAFHAITNYGYS.EYAKETAYACAASIKL.LPKNSAPQAFGGKISKAITSIFYQKGLIQenTREQAqYLASEMLNYLSNII---------.......-------------------------------svqldsdslilnltrqssrsiddkqgd. A0A087URD1_9ARAC/1790-1953 ...........svpavptgii---------------.................-SDVANNIASALLRSNIFQRAFNARVSTSVANRIAAALAQTIASSLQLDnATAAKCRNAIMQALSG.VRSGSDTRIYALAIASALAGQLAAAGRLN..ASNAS.GIGSSLLSGVVQGAYSGARQTGI.......DVSGVDVSSDISSSISAFAAGSTAGQDVAS-aq.......................... A0A087U004_9ARAC/834-991 ............tfssfvkqs-------------GI.................ASKFASSLYNSLLSNELFQAIFSHIQNTEHLDSYGKALIKNVF-SLGN-.INVSELSDNLLKAFQT.IPLGSSLSQYAQVIVNTVAEAFIKHEVLI..PGNEE.SLAASTLNVLISGLREQSEEEAA.......QVSISK-ATAAIPVVAK--------------vetaerpysap................. A0A087UQ25_9ARAC/559-680 ..................ria---------------.................-------LENALVSSEPFLEIFNPSTTSEDAAIYATLIAREALSEYGA-.PVVEDVDTVVRDAMSN.LPPGSSSSDYASSLVNSIIATLNMYGLTT..DIQPE.FLASTMLLNLDS-----------.......-------------------------------eiqkfmasgddsftet............ A0A087URD1_9ARAC/235-407 ................ygtps-------AAVTPSGI.................ISEVTNNLASALLRSNVFQRVFNNRVPSSISTRIASELAQSIISKLQLDyTTASKCRNSIIQAVSG.IRSGSDTRVYAQAIASVLTSELATTGRLN..ASNAS.VIGSSILSGILQGAYSAARQAGLdlsgidvTSDISSSLSAYSSSSAAPQTVAET-------qqltav...................... A0A087U004_9ARAC/3231-3394 ................dvgfq-------AAAGTSSY.................AAEFGRQIYDALLSNPRFTETFAGEITLLRIRPFFTVLAENIIAIPVFSsLTLNDLVDPYISAVLR.IERGSSLRAYAQEIAGLTVEILLSRNLLT..AEAAS.LARTSVQRAISTALESTSTRTET......sTTTAVETAESES-------------------glaageeegvatgfv............. A0A087U004_9ARAC/683-839 ................vgstp--------------V.................ARNFGRLIYNSLLADEKFSSVFGIGNSFVNIRLFLTTLATSICSFPQFSsVTVSELVGKYIQAITP.IPQGSDIHQYAQAIAQATAEIMSSRKLLS..LQGVT.ALSSSLESAISSALESSSKST--.......SVTQKSSSEIITTATAESGET----------teitfssfv................... A0A087UJV0_9ARAC/60-194 .................agin-----------AQDT.................TAAFSDSLYFQLMNSMAFRNIFDGRATPDFIINVGRNIAQGIALELRL-.QDVSSVINFIVNTLSS.VYPGAGPEEYASAIADSILQIMLTNNILT..GNNPL.TFAGRLASIIDNALS--------.......-------------------------------lnlsagasldnfgs.............. A0A087U004_9ARAC/3895-4061 ................nvgfq-------AAAGTTSY.................AAEFGRQIYDALLSNPRFTETFAGEITLLRIRPFFTVLAENIIAIPVFSsLTLNDLVDPYISAVLR.IERGSSLRAYAQEIAGLTVEILLSRNLLT..AEAAS.LARTSVQRAISTALESTSTRTET......sTTTAVETAESES-------------------glaageeegvatgfvara.......... A0A087URD1_9ARAC/433-595 .............savnvpsg--------------V.................ISNVANNLVTALLRSNVFQRAFNSRVPSSVVNRIAVALAQSIASSLQLDyGTASKCRNAITQALAG.VRSGSDTRAYAVAIASAVSGQLAAVGRLN..SSNAS.SIGSSLLSSVVQGAYSAARQAGI.......DVSGVDVSSDISSSISAYGTGPAVAFDTA--it.......................... A0A087URD1_9ARAC/3723-3886 ..........ygapsggavps-------------GV.................ISDVANNLASALLRSNIFQRAFNGRVSSSVANRIGAALAQSIASTLQLDyGTAAKCRNAIMQALSG.VRSGSDTRVYALAIASAVVAQLAAAGRLN..TSNAS.GIGSSLLSGVVQGTYSGAKQAGV.......DVSGVDVSSDISSSISAYGA-----------gpmgevss.................... A0A087URD1_9ARAC/2561-2752 .........epsaavlpsgii---------------.................-SDVGNNLASALLRSNVFQRAFNARISSSVVSRIATALTQSISSSMQLDyATASKCRNAIMQALSG.VRSGSDTRTYALAIASALVAQLAAAGRLN..ASNAS.GIGSSLLSGVVQGAYSGARQAGV.......DVTGVDVSSDISSSISAFGGSSTGGQGIAA-aqqfaesisdisqgvsgvseaiagsgad A0A087URD1_9ARAC/1589-1758 .................gady----GASSTGAAQSA................vVSDVANKIASALLRSNLFQRVFNTRISSSVASRIATTLAQTTASSLQLDyGTASKCRNAIMQALSG.VRTGSDTRVYALAIASALAAQLAASGRLN..ASNAS.GIGSSVISGVVQGTYSGASQAGV.......DVSGVDVSSDISSSISAYGRGSAVGQDIA--gp.......................... A0A314KSL0_NICAT/10-90 ................mhnfq---------------.................-----------------------------EANKVAHLLAKESTKLVTL-.NKASILPSP-RPMVEAvVNAGAEGTSYSRSISEAVSNILTSMGNVN..AVNSI.-----------------------.......-------------------------------stfvsph..................... A0A087TBY8_9ARAC/696-874 .......fpgqsgasaaataa--------------AgggqgagtsstttdievISKFTNTVISSLLSSNDFTSIFGSGLPVTTALNLASNLAQSLATQIGLDeAGINSVLSLLNQYISA.IDPSADASTYANALSLAIGNTLASAGSLS..PALAS.SLASVDAQPIANFVSSVASKTLN.......-------------------------------aqqpnlvrsggtstfrnvpfkqvq.... A0A087URD1_9ARAC/1979-2146 ........dygaptsgavpsg--------------I.................ISDVANNLASALLRSNVFKRAFNVRVSSNVANRIAGALAQSIASSLQLDfGTASKCRNAITQALSG.VRSGSDTRVYALAISSALTAQLAAAGRLN..ASNAS.GIGSSLLSGVVQGTYSGAKQAGV.......DVSGVDVSSDISSSVSAYGAGPTGAQE----sdvs........................ A0A087URD1_9ARAC/3336-3501 .........gapsgsvvpsgl---------------.................ISEVASKLASALLRSNIFQLAFNARVSSSVASRIAAVLVQSIASSLQLDyGTASKCRNAIMQALSG.VRTGSETRAYALTVASALATQLAGAGRLN..ASNAS.DIGSSVLSAAVQGAYSGASQAGV.......DVSGVDVSSDISSSISAYGAGPTGGSET---glt......................... A0A087TBY8_9ARAC/1301-1462 ...................pg----QSASAATSTAAggaqgagtygtatdidvISKFTNTISSSLLSSNDFTSIFGSELPVATAFNLASNLAQSLATQIGLDeAGINSLLSLLSQYISA.IGSSGDASAYANALSLAIGNTLASAGSLS..PALAS.SLASANAQAIANFVRSVTSR---.......-------------------------------tlnvqqpilvgs................ A0A087URD1_9ARAC/1203-1372 ...............aeygap------SSGAVPSAL.................ISDLANNLASALLRSNVFQRAFNARNSSAVTNRIAAALAQSIVSSLQLDyGTASKFRNAITQALSS.VRSGSNTRVYALAIASALAAQLAAAGRLN..ASNAS.SIGSSLLSGVVQGAYSGARQAGV.......DVSGVDVSSDISSSISAYGAGSAAGQ-----dvvaaq...................... A0A087URD1_9ARAC/3139-3306 .......sdygapssggvpsg--------------L.................ISDIASNLASALVRSKIFQRAFNARVSSSIANRIASALTQSIASSLQLDnTTASKCRIAVTQALSS.VRSGSDTRAYALSIASALARQLAAVGRLN..SSNAS.SIGSSLLSGVVQGAYSGARQAGV.......DVSGVDVSSDISSSVSAYGAGRTVSSE----tdv......................... A0A087UPZ6_9ARAC/42-158 ..............aidgtve---------------.................-ESFRESLYSQIINSASFSIKFGGSVTDVDIINVGRNIATGIASELNL-.QDYDSVSNFMISALGS.VYPVGKLEDYASIIVEAVLELLSTYNILN..EYN--.-----------------------.......-------------------------------yfdlslrigniidst............. A0A087U004_9ARAC/1772-1936 .................gyqa--------AAGTSVF.................AADFGRQIYEALLSNPKFAEAFTGAITILRIRPFFTVLAENIIAIPVFSsLTLNELVDPYISAVLR.IERGSSLRAYAQEIAGLTVEILLSRNLLT..AEAAS.LARTSVQSAISTALESTSTTTET.......-STTSAVATAESEGVVA--------------agaeegvatgfvara............. A0A087TBY8_9ARAC/334-498 ................dreil-------SSSSDIDV.................ISKFTNSITSSLLSSNDFTSTFRTGLPATTAVNLASSLARSFATQMALDeTTINTLLPLVSQYVSE.ISSSADVSAYANAISRAVGDALASTGNVP..PVLTA.SLAPADTQPIANLVNSVTSTNVNe.....qQ------------------------------snlvrrgggstlrniaakqvqenrqn.. A0A087URD1_9ARAC/2754-2919 .........gapsgvvvpsgi---------------.................ISDVANNLASALLRSNVFQRAFNARISSSIANKVAAALTQTLASSLQLDySTAAKCRNAIMQALSA.VRSGSDTRVYALAIASSLVAQLAAAGRLD..ASNAS.GIGSSLLSGVVQGAYSGARQAGV.......DVSGIDVSTDISSSISTYGAGSPAGQDIAA-t........................... A0A087URD1_9ARAC/3911-4079 ...............adygap------SAAAVPSGV.................ISDVVNNLASALLRSNSFQRAFNARVSSSVANRIVVALSQSIASNLQLDyGTASKLRNAVVQALSG.VRSGSDTRVYAVTIASSLAAQLANAGLLK..ASNAS.SIGSSLLSSIVQGSYSGARQAGV.......DVSGIDIRSDISTSASAYSSSASSIQTSS--vs.......................... A0A087TBY8_9ARAC/522-695 asaaanggsggaqatditsta--------------Rni.............dvISQFTNTITSSLLSSNEFTSIFGSGLPVTTALNLASNLAQSLAAQIGLDeTGINYLLSLLRQYISA.IDLSADASAYANAVSRAIGNALASAGNLS..PALAS.SLASADTQPIANLVNSVTSSTLI.......-------------------------------aqqpkligsggastvgtkpepslsg... A0A087URD1_9ARAC/2362-2532 .........sadygaltsgav-----------PSGV.................ISDVANNLASALLRSNVFQRAFNVRVSSSVANRIAGVLAQSIASSLQLDyGTASKCRNAIMQALSG.VRSGSDTRVYALAIASALTTQLAAAGRLN..ESNAS.GIGSSLLSGVVQGTYSGAKQAGV.......DVSGVDVSSDISSSVSAYGAGPTGAQES---vvss........................ #=GC seq_cons ................sssss..............h.................ISchuNsLsSALLpSNhFpcsFsuclososAsplAssLAQSIASplpLD.sTsucspsslhQAlSu.lcoGSDs+sYA.AIAsAluspLAusGpLs..suNAS.uluSSllsulspus.Ssuppsss.......ssos.s.uss.Sss.ut..............st.......................... //