# STOCKHOLM 1.0 #=GF ID Pentapeptide #=GF AC PF00805.17 #=GF DE Pentapeptide repeats (8 copies) #=GF AU Bateman A #=GF SE Bateman A #=GF GA 20.20 20.20; #=GF TC 20.20 20.20; #=GF NC 20.10 20.10; #=GF BM hmmbuild HMM.ann SEED.ann #=GF SM hmmsearch -Z 23193494 -E 1000 --cpu 4 HMM pfamseq #=GF TP Repeat #=GF WK Pentapeptide_repeat #=GF RN [1] #=GF RM 7592418 #=GF RT The hglK gene is required for localization of #=GF RT heterocyst-specific glycolipids in the cyanobacterium Anabaena #=GF RT sp. strain PCC 7120. #=GF RA Black K, Buikema WJ, Haselkorn R; #=GF RL J Bacteriol 1995;177:6440-6448. #=GF RN [2] #=GF RM 9655353 #=GF RT Structure and distribution of pentapeptide repeats in bacteria. #=GF RA Bateman A, Murzin A, Teichmann SA; #=GF RL Protein Sci 1998;7:1477-1480. #=GF RN [3] #=GF RM 9654141 #=GF RT Characterisation of an Arabidopsis cDNA encoding a thylakoid #=GF RT lumen protein related to a novel 'pentapeptide repeat' family of #=GF RT proteins. #=GF RA Kieselbach T, Mant A, Robinson C, Schroder WP; #=GF RL FEBS Lett 1998;428:241-244. #=GF DR INTERPRO; IPR001646; #=GF DR URL; http://www.sanger.ac.uk/Users/agb/Pentapeptide/Pentapeptide.html; #=GF DC Pentapeptide repeat web page. #=GF CC These repeats are found in many cyanobacterial proteins. The #=GF CC repeats were first identified in hglK [1]. The function of these #=GF CC repeats is unknown. The structure of this repeat has been #=GF CC predicted to be a beta-helix [2]. The repeat can be #=GF CC approximately described as A(D/N)LXX, where X can be any amino #=GF CC acid. #=GF SQ 95 #=GS Y1851_SYNY3/33-72 AC P73063.1 #=GS SPKB_SYNY3/504-543 AC P74297.1 #=GS Q9Z4J6_PSEAI/167-206 AC Q9Z4J6.1 #=GS YMO3_ERWST/247-286 AC Q52118.1 #=GS Q55112_SYNY3/64-103 AC Q55112.1 #=GS P72857_SYNY3/46-85 AC P72857.1 #=GS Q55773_SYNY3/89-128 AC Q55773.1 #=GS P74725_SYNY3/57-96 AC P74725.1 #=GS P74206_SYNY3/256-295 AC P74206.1 #=GS Q55531_SYNY3/57-96 AC Q55531.1 #=GS FIP2_ARATH/166-205 AC Q9SE95.1 #=GS YMO3_ERWST/107-146 AC Q52118.1 #=GS Q44230_NOSS1/596-635 AC Q44230.1 #=GS P74206_SYNY3/100-139 AC P74206.1 #=GS Q55201_SYNY3/320-359 AC Q55201.1 #=GS Y1819_SYNY3/100-139 AC P73709.1 #=GS YJCF_ECOLI/267-306 AC P32704.1 #=GS FIP2_ARATH/126-165 AC Q9SE95.1 #=GS O85899_SPHAR/129-168 AC O85899.1 #=GS O85899_SPHAR/34-73 AC O85899.1 #=GS Y1152_SYNY3/50-89 AC P74221.1 #=GS Q9ZCY8_RICPR/479-518 AC Q9ZCY8.1 #=GS YJCF_ECOLI/307-346 AC P32704.1 #=GS YJCF_ECOLI/162-201 AC P32704.1 #=GS Q9ZCY8_RICPR/66-105 AC Q9ZCY8.1 #=GS P74206_SYNY3/60-99 AC P74206.1 #=GS Q55112_SYNY3/24-63 AC Q55112.1 #=GS YISX_BACSU/63-102 AC O06733.1 #=GS Y1152_SYNY3/90-129 AC P74221.1 #=GS TL17_ARATH/124-163 AC P81760.2 #=GS Y1819_SYNY3/271-310 AC P73709.1 #=GS P73963_SYNY3/118-157 AC P73963.1 #=GS O85899_SPHAR/84-123 AC O85899.1 #=GS Q44230_NOSS1/511-550 AC Q44230.1 #=GS P72857_SYNY3/86-125 AC P72857.1 #=GS Y1819_SYNY3/231-270 AC P73709.1 #=GS YMO3_ERWST/207-246 AC Q52118.1 #=GS P73963_SYNY3/203-242 AC P73963.1 #=GS O24772_BACME/102-141 AC O24772.1 #=GS P73013_SYNY3/196-235 AC P73013.1 #=GS Y1152_SYNY3/140-179 AC P74221.1 #=GS SPKB_SYNY3/454-493 AC P74297.1 #=GS Q9Z4J6_PSEAI/127-166 AC Q9Z4J6.1 #=GS Y1819_SYNY3/20-59 AC P73709.1 #=GS P74206_SYNY3/145-184 AC P74206.1 #=GS P73963_SYNY3/78-117 AC P73963.1 #=GS Y1819_SYNY3/191-230 AC P73709.1 #=GS Y1819_SYNY3/60-99 AC P73709.1 #=GS YYBG_BACSU/214-253 AC P37497.1 #=GS Q9RD75_STRCO/214-253 AC Q9RD75.1 #=GS Q44230_NOSS1/636-675 AC Q44230.1 #=GS Q8T0F7_DROME/310-349 AC Q8T0F7.1 #=GS O85307_SALDU/199-238 AC O85307.1 #=GS Q9Z4J6_PSEAI/77-116 AC Q9Z4J6.1 #=GS FIP2_ARATH/256-295 AC Q9SE95.1 #=GS Y1152_SYNY3/185-224 AC P74221.1 #=GS Q8T0F7_DROME/230-269 AC Q8T0F7.1 #=GS P74392_SYNY3/89-128 AC P74392.1 #=GS Q55201_SYNY3/280-319 AC Q55201.1 #=GS FIP2_ARATH/216-255 AC Q9SE95.1 #=GS Y516_SYNY3/38-77 AC Q55837.1 #=GS Q9RR64_DEIRA/209-248 AC Q9RR64.1 #=GS Q8T0F7_DROME/190-229 AC Q8T0F7.1 #=GS YMO3_ERWST/67-106 AC Q52118.1 #=GS O85307_SALDU/154-193 AC O85307.1 #=GS Y516_SYNY3/118-157 AC Q55837.1 #=GS Y1819_SYNY3/151-190 AC P73709.1 #=GS Q55773_SYNY3/49-88 AC Q55773.1 #=GS Y1851_SYNY3/73-112 AC P73063.1 #=GS Q9Z4J6_PSEAI/37-76 AC Q9Z4J6.1 #=GS Q55112_SYNY3/104-143 AC Q55112.1 #=GS YMO3_ERWST/162-201 AC Q52118.1 #=GS P73524_SYNY3/288-327 AC P73524.1 #=GS P74206_SYNY3/195-234 AC P74206.1 #=GS P74206_SYNY3/20-59 AC P74206.1 #=GS Y516_SYNY3/78-117 AC Q55837.1 #=GS P74392_SYNY3/129-168 AC P74392.1 #=GS P74725_SYNY3/102-141 AC P74725.1 #=GS MCBG_ECOLX/112-151 AC P05530.1 #=GS YISX_BACSU/143-182 AC O06733.1 #=GS Q55531_SYNY3/97-136 AC Q55531.1 #=GS TL17_ARATH/169-208 AC P81760.2 #=GS Q9ZCY8_RICPR/519-558 AC Q9ZCY8.1 #=GS Q9ZCY8_RICPR/136-175 AC Q9ZCY8.1 #=GS Q9ZCY8_RICPR/351-390 AC Q9ZCY8.1 #=GS Q9ZCY8_RICPR/206-245 AC Q9ZCY8.1 #=GS O50390_MYCTU/72-111 AC O50390.1 #=GS O50390_MYCTU/72-111 DR PDB; 2BM6 A; 72-111; #=GS O50390_MYCTU/72-111 DR PDB; 2BM7 C; 72-111; #=GS O50390_MYCTU/72-111 DR PDB; 2BM5 A; 72-111; #=GS O50390_MYCTU/72-111 DR PDB; 2BM4 A; 72-111; #=GS O50390_MYCTU/72-111 DR PDB; 2BM7 B; 72-111; #=GS O50390_MYCTU/72-111 DR PDB; 2BM7 A; 72-111; #=GS O50390_MYCTU/72-111 DR PDB; 2BM4 B; 72-111; #=GS O50390_MYCTU/72-111 DR PDB; 2BM5 B; 72-111; #=GS O85899_SPHAR/169-208 AC O85899.1 #=GS P73963_SYNY3/158-197 AC P73963.1 #=GS YYBG_BACSU/174-213 AC P37497.1 #=GS P73013_SYNY3/151-190 AC P73013.1 #=GS Q44230_NOSS1/551-590 AC Q44230.1 #=GS O50390_MYCTU/112-151 AC O50390.1 #=GS O50390_MYCTU/112-151 DR PDB; 2BM6 A; 112-151; #=GS O50390_MYCTU/112-151 DR PDB; 2BM7 C; 112-151; #=GS O50390_MYCTU/112-151 DR PDB; 2BM5 A; 112-151; #=GS O50390_MYCTU/112-151 DR PDB; 2BM4 A; 112-151; #=GS O50390_MYCTU/112-151 DR PDB; 2BM7 B; 112-151; #=GS O50390_MYCTU/112-151 DR PDB; 2BM7 A; 112-151; #=GS O50390_MYCTU/112-151 DR PDB; 2BM4 B; 112-151; #=GS O50390_MYCTU/112-151 DR PDB; 2BM5 B; 112-151; #=GS Y1152_SYNY3/230-269 AC P74221.1 #=GS Y1851_SYNY3/113-152 AC P73063.1 Y1851_SYNY3/33-72 ASLIGAQLIFVDLGGANLTRAQLDSATLKNANLALANMTE SPKB_SYNY3/504-543 ANLSDAYFGYADLRGADLRGANLNGVNFKYANLQGANFSG Q9Z4J6_PSEAI/167-206 ADLRDANLQEVKLAEANLEDADLRGSKVRFGNFQGSNMQG YMO3_ERWST/247-286 ANLSDANLTNVDLKRADLSNAILKGANLLHINVEGTNMTG Q55112_SYNY3/64-103 CYFNNADLSGANLAKADLRQASLIKTFLLKVNLQGAHLNN P72857_SYNY3/46-85 CDLSGADLSGAHLIGADLRNANLSGTNLNEANLEGADLTG Q55773_SYNY3/89-128 ANLSGANLNGAITDGTDFREAYFDRATFINTNLETAYMQG P74725_SYNY3/57-96 AQFTNVDLTSSIFEAMDLRGSVFNGANLTDANLKGVDLTN P74206_SYNY3/256-295 ANFQNANFEYALMEKALLAGAILRGANLIDACLRGADLRN Q55531_SYNY3/57-96 AVFAAADLRESNFEGSDLSFSILTDAVFLHASLRGANLSG FIP2_ARATH/166-205 TNLQCAKFRNADAEGSIFHNAILRECEFTSANLRGALLAG YMO3_ERWST/107-146 ANLAHANLTMAYLSEADLSNANLSGADLTNANLNQTDLPN Q44230_NOSS1/596-635 AQLSFANLTKTDWQSSDLSGADLERANLSNADLSATRMTG P74206_SYNY3/100-139 ANLAYAKLKQARLIRTNLEGANLAETDCQGAILEAVNFSR Q55201_SYNY3/320-359 SSLALATLIGTDLREADLRGATLQNVNFSGAKVENLSFGD Y1819_SYNY3/100-139 SDMTLATLQDTNLIGADLRGADLSGATLTGACLRGANMRQ YJCF_ECOLI/267-306 INLFRADLSFSKLDLINFEHADLSRVNLNKATLQNINLID FIP2_ARATH/126-165 IQTERVRFRGVNLSGIDLSKLDLSLVDFSYACLRNVFFSR O85899_SPHAR/129-168 IHFEEVLLVSAKLPGFSFRKETLRRVDLSGADLRKGDFRM O85899_SPHAR/34-73 CDLEEADLSGLDLTGWRFERCNLRKADCSAAKLEGSIWQG Y1152_SYNY3/50-89 ENLQNADLSGFTLISVDFERTNLIGSNLQRTFLTKARLGH Q9ZCY8_RICPR/479-518 SNLANMNLTNFNLSNLVFNGVDFSKSIFKKANLTNTVIKN YJCF_ECOLI/307-346 SKLFFTRLTNTFLEMVICTDSNMANVNFNNANLSNCHFNC YJCF_ECOLI/162-201 EDLSNSNFAGCRLQNAIFQDCNMYKTNFNFAIMEKILFDN Q9ZCY8_RICPR/66-105 SNLKGVKLIGIKLTNEDLSGIDFTSCEILRTDFMGSNLEK P74206_SYNY3/60-99 TNLSHARLMGVKFVGSDLTGIDLSYSDLSWADLTDCDLSG Q55112_SYNY3/24-63 LALRHIDLHGFTLAGADFSGSDFSEANLRGTDLQGCKLQG YISX_BACSU/63-102 VSFRHIELTDVIFEKCDLSNADFSGAVIHRTSVKQSKMVG Y1152_SYNY3/90-129 CQMNWADLTYAKLNQADLSHADLTKASLYGAFAVKTNFKG TL17_ARATH/124-163 TNLKGKTLSAALMVGAKFDGADMTEVVMSKAYAVEASFKG Y1819_SYNY3/271-310 ANLTKANLQEAELIEAFFARANLTEANFINANLVRADLMS P73963_SYNY3/118-157 CNLSEADLTESDANEALFCQAVFTEVEAHGLRLYRAKVSQ O85899_SPHAR/84-123 ANLSEAAFAGGDFNNSVWRRATLTSAKFVGTKLTGADFSE Q44230_NOSS1/511-550 ANFTDANLSRVLMTRSDLSRATLNRANLSNARLIGANLSS P72857_SYNY3/86-125 ANLQNADLRGAMVTNATLNRANLTSANFAFAKLYDVDVTG Y1819_SYNY3/231-270 AEMTAVNCQGAIMTHVNLNRTNLTGSNLSFTRMNSADLSR YMO3_ERWST/207-246 VNLSGANLAHANLTMAYLSEADLSNANLSNADLKRADLSD P73963_SYNY3/203-242 GNFRGANLTQADFTGANLKGANLRGANLVGTNLQRADLSD O24772_BACME/102-141 ANLRGANLKGALFIAADLREADLRLTDLIGADFRDADLSG P73013_SYNY3/196-235 ANLFRANLFRANLLEANLRGANLQEANLVGADLSGADLSG Y1152_SYNY3/140-179 ANLRGANLEQTNLTGANLFAANLREANFQKADFSWANLQE SPKB_SYNY3/454-493 QNLVGIVLAKAFVPGINCYQANLTNANFEQAELTRADFGK Q9Z4J6_PSEAI/127-166 ADLTAAYLEXARXSGGRLHQATLRAADLEMTWLSRADLKG Y1819_SYNY3/20-59 LKLPGINLEAADLIGIVLNEADLRGANLLFCYLNRANLGQ P74206_SYNY3/145-184 ADLTRVDLAEANFSRADLSGADFRKANFDHANLYKVNLSQ P73963_SYNY3/78-117 CDLRFANLEGADLTDANLIAASLHKSNLRRANLCRATLNR Y1819_SYNY3/191-230 ADLSYANLKGALLTDANLSGAKLNGADLQNANLMRAKISE Y1819_SYNY3/60-99 ANLVAANLSGASLNQADLAGADLRSANFHGAMLQGAILRD YYBG_BACSU/214-253 ALLIAADLRNADLRMTDFIGADMRDADLSGADLTGSIFLT Q9RD75_STRCO/214-253 AYLIAADLTGADLRGADLIGADLRDADLTDADLTGAFFLT Q44230_NOSS1/636-675 AILRSAQLENANLRNADLSLVDLRGANVAGADFKDTILTP Q8T0F7_DROME/310-349 CNLRAAVLAGADLEKCNLSGSDLQEANLRGANLKDAELTL O85307_SALDU/199-238 ANLHAVNLMGSNMTKANLTHADLTCANMSGVNLTAAILFG Q9Z4J6_PSEAI/77-116 ANLEKANLRGADLTRAXLXQANXRGAXLSGARAVAXXAWG FIP2_ARATH/256-295 AKLSNANFKGANLQRAYLRHVNLREAHMEGANLGGANMTG Y1152_SYNY3/185-224 ANLRDARLWATDLRRAFMKEMDLSALSLHGLAMDGAKLTG Q8T0F7_DROME/230-269 CCLERADLQYANLECAQLVSVRGLCANMEGANLRGCNFED P74392_SYNY3/89-128 ANLRGADFTGANLQGARFFSANMDGAILEGADARGVDFES Q55201_SYNY3/280-319 AILTDSDLSNTDLRRSNFRGADLSGAYLEGANLSQVDFRK FIP2_ARATH/216-255 ACLVGCSFCGADLRTAHLQNADLTNANLEGANLEGANLKG Y516_SYNY3/38-77 GECLDCNLAGADLREFNLENARLNRSDLSGANLSGVNLRR Q9RR64_DEIRA/209-248 TTLRGVNFRGADLTRANFENANLSGAQLQNADLSSADLSQ Q8T0F7_DROME/190-229 LRFQGVNLSGADLRKLDFRNINFKYANMSHCNLSHTNLNY YMO3_ERWST/67-106 INLKGVNLSDTDLKGAYLSDANLSDADLSDANLSDANLSG O85307_SALDU/154-193 LNLRGVNLAHKDFQGEDLSDIDASDADFRETNLSNVNLVG Y516_SYNY3/118-157 SFLRDVDLTGANLKGANLAWANLTAANLTDVDLEEAEFWE Y1819_SYNY3/151-190 AILGRADLQGANMKGVDLSRADLSYANLKEANLRDVDLRK Q55773_SYNY3/49-88 VNLTRADLTGADLSGANLSGADLTGANLSGANLTSASLNG Y1851_SYNY3/73-112 VCLIYADLSNADLSGANLVGADLTNADLSGAKLGGADLRK Q9Z4J6_PSEAI/37-76 ARCAKADLRGADLRNLDLGRIDLAGADLSGADLRHARLDL Q55112_SYNY3/104-143 ALCAGALLTRANLEDACLHGALLTGADLTGAKLSKAKYNQ YMO3_ERWST/162-201 AYLSEADLSNANLSNADLKRADLSNANLSGADLTNANLNQ P73524_SYNY3/288-327 IYLIRANLSQADLVKANLSRTVLYEANLDGADLKGTRLFY P74206_SYNY3/195-234 AFLQGADLSQANLKGANLGRALMKEVNLSLINLSEIHLKA P74206_SYNY3/20-59 IELHHADLIQSDLVGIILNRALLAYGNFSGSNLSEAQLRR Y516_SYNY3/78-117 ALLDRANLTGANLSETDLTEAALTEANLAGADLSGANLER P74392_SYNY3/129-168 ARLTHANLRNARLEGSFGTNTKFGEVDIEGADLTDIILRP P74725_SYNY3/102-141 TSFNGANLENAILAEAIMLRTSFKNAKIQGADFSLAVLDT MCBG_ECOLX/112-151 CRFRDCLFEETDLRKSDFTGSEFNNTEFRHSDLSHCDFSM YISX_BACSU/143-182 SECSDTVLQQTHFDGCELEGASFTGTSLQNMDISTCRFEQ Q55531_SYNY3/97-136 SLVDRVTLDFADLRDTIFTEAIATRTRFYDTDITGADFSD TL17_ARATH/169-208 AVIDRVNFGKSNLKGAVFRNTVLSGSTFEEANLEDVVFED Q9ZCY8_RICPR/519-558 SILKDANFSAAILTKTDFSKSILTGSIFKFAQIDQTCFSN Q9ZCY8_RICPR/136-175 SIFNNITLQNTNFVQSNFSDTAFNKSTIINVNFENSKFSN Q9ZCY8_RICPR/351-390 AIFSNNDLKEFKVINTDLNNSEIINSNFTNGQFNNVNFSQ Q9ZCY8_RICPR/206-245 SIFYGADLGKSVINNTNFTNNYFESSDLSNTKFTSVIIKD O50390_MYCTU/72-111 SVFVACRLRPLTLDDVDFTLAVLGGNDLRGLNLTGCRLRE #=GR O50390_MYCTU/72-111 SS -EEES-B--SEEEEEEE-TT-B-TT-B-TT-B-TT-B-TT O85899_SPHAR/169-208 TVFEECSLREAMVAGSRFEGSDLRGANLGGLRLVDANLFR P73963_SYNY3/158-197 AQLMGAHLHQAYAPEADFSAVAAIAVDLRWANLRKTNFRG YYBG_BACSU/174-213 SELVRAQARHPKLPKKVSRGSVLIGAKLKGLDLRGANLRG P73013_SYNY3/151-190 RDLTGADLRWANLKEKDLSGRKMVSANLSNADLSDSFLHQ Q44230_NOSS1/551-590 AQLVGADLRGTVLENASLTGADLGDAKLQEANLYGARLSR O50390_MYCTU/112-151 TSLVDTDLRKCVLRGADLSGARTTGARLDDADLRGATVDP #=GR O50390_MYCTU/112-151 SS -B-TT-B-TT-B-TT-B-TT-B-TT-B-TT-B-TT-B--H Y1152_SYNY3/230-269 TNLSHSSLRGANLRGADLTGANLTGVDLTGADLMGANLTQ Y1851_SYNY3/113-152 ANLSEASLRGADLRGVNLIEANLTNTDFSEADLTGAYISD #=GC SS_cons -EECT-B-TTEEECCEE-TT-B-TT-B-TT-B-TT-B-TC #=GC seq_cons usLpsAsLpsusLpsusLptAsLssAslpsAsLpsuslps //