At2g03360.1/MSA

>gi|15227618|ref|NP_178435.1|	  393 residues, 50 /line  unknown protein [Arabidopsis thaliana]

--MAASAKITCDRSHT-SYDLCSI---NGSCILNPK T-GTLTLMDRTLTT--SAPLVEKIRPYPRK--

SENWIMPRIRELKL-TSGPSDLTRSCDITH-- --DSPAIVFSAGG-YTGSI--YHDFIDGFIPLFITAN--S --VYPDRDFILVVV-NPKEW-WMPKYIDILGT F--S--KHK---TI---LLDKENA-SITHCFT SATVGLISHGPMT--I--DPTQ-IP--NS--- -KSLVDFHNLLDKALNPN-- -LSIIKINKPR--LILVRRYG--NIGRVILNEEEIREML-EDVG -FEVITFRPSKTTSLREAYKLIKSSHGMIGVHGAALTQLLFLRPGS-VLVQI VPVG-LG--WVSKTCFETPAKAMK--LDYTEYRV--NVEESS-- --LIEKYSRD-DLVLKDPI---AYRG-MDWNVTK--MKVYLKDQDVRLDVNR FRKHMNEAY---

KKA-KSFM--DL--NG >gi|109041288|ref|XP_001108195.1|	  470 residues, 50 /line  PREDICTED: similar to glycosyltransferase [Macaca mulatta]

---MHLSAVFNALLVSVLAAV-LWKHVRLREHAATLEEEL ALGRQA-- TEPAPALRIDYPKALQILMEGGTHMVCTGRTH-TDRICRF---KWLCYSNEA E--EFIFFHGNTSVMLPNLGSRRFQPALLD--

LSTVEDHNTQYFNF-VELPAAALRFMPK PVFVPDVALIANRFNPDNL--MHVFHDDLLPLFYTLR--Q --FPGLAH--EARLFFMEGW-GEGAHFDLYKL L--S--PKQ---PLLRAQLKTL---GRLLCFS HAFVGLSKITTWY--Q--YGFVQPQGPKA--NILVSGNEIRQFARFMTEKLNVSHT

--GAP-LGEE--YILVFSRTQNRLILNEAELLLAL-AQEF -QMKTVTVSLEDHAFADVVRLVSNASMLVSMHGAQLVTTLFLP-

---GRPGP-RKQKWTVGLYPGKVREAQCQASVHGASEARL TVSWQIPWNLKYLKVR---EVKYEVWLQEQGENTYV--PYILALQNHTFTENIKPF TTYLVWVRCIFNKILLGPFAD-VLVCST >gi|119936279|gb|ABM06100.1|	  438 residues, 50 /line  glycosyltransferase [Bos taurus]

-MPK PVFVPDVALIANRFNPDNL--MHVFHDDLLPLFYTLR--Q --FPGLAR--EARLFFMEGW-GEGAHFDLYKL L--S--PKQ---PLLRAQLKAL---GRLLCFS HAFVGLSKVTTWY--Q--YGFVQPQGPKA--NILVSGNEIRQFAHFLMEKLNVSQA

--GGP-LGEE--YILVFSRTQNRLILNEAELLLAL-AQEF -QMKTVTVSLEDHAFADVVRLVSNASMLVSMHGAQLVTALFLPRGA-AVVEL FPYAVN---PDHYTPYKTLATLPGMDLQYIAWQN--TMPENTVTHPERPWDQGGIAHLDR AEQARILQSREVPR-HLCCRNP--EWLFRIYQDTKVDIPS LIQTIRRVV-KGHPGP-RKQKWTVSLYPGKVREARCQASVQGASEARL SVSWQIPWNLKYLKVR---EVKYEVWLQEQGENTYV--PYMLALQNHTFTENIKPF TTYLVWIRCIFNKTLLGPFAD-VLVCST >gi|110637270|ref|YP_677477.1|	  366 residues, 50 /line  capsular polysaccharide biosynthesis protein [Cytophaga hutchinsonii ATCC 33406] ---MCLQRICYEKIFLKKKIIA--

--TGTIWMSNMQQINNASVRPVSAYNTKHL-- -QIPAIALLQSSPLP- EQAIRTFSRA--LLTP TNHLFVNGRYIRT--G LISGFDSRKLSFFQRIYLFLKSRFFTEN KSVKISAVWAHDS-WSNNY--FHWFNDTLPRLFLLSK--Q --IEDSVA--VLPV-ELS--KITFIVES LE--LL---KIEHQ---WIDQKKS HRFESLSVLHTATLQ-PDINPLLQKQMRDAVFSAMKID--

PQERPFR--KIYISRAH--ARYRKIINEQELLPVL-KKYG -YDIIYPE---TYSFKEQVKLFAESNALISIHGAGHTNCMFMKQDA-KVMEI RNTEWESQPLCFWGLANIFELK--WEYITATRVSEVSNF- ---NDVFIAPHI FEESLRTFEN--

--IK >gi|119484873|ref|ZP_01619355.1|	  320 residues, 50 /line  hypothetical protein L8106_15410 [Lyngbya sp. PCC 8106] ---MPLYDLSQGLKQNYY--

---VTPTVYKTHLKNVMYCPASNL

---LFSSSKKIIVDSSSTVK TKEKIANSVNIRKLYFSNPE KIEGDCTVFHTFA-NGSNY--YHTLIDHIPRLYTLHHN-- --SYQSLKEIKVLC-NSELTKVESFF--LEKL LPKNTII--TWVDQ---SKIYSLD RFIFLG-- -YLSRRFAGFLPSTYLNWFIE--K VRPNKLREKKN--RIFISRKK---ITDQSTRCILNEDEVCSVL-KKYG -FKKYVLE---SLSIEEQIDLFYNAEFVVGVHGAGLTNIIFSEK-I-KVLEL HPMQS--IFPHYYYLSKSRK--HSYLYWCA--QEKE -KNTNFEVNIGE IEQIIKSNF---

---T >gi|121915175|gb|EAY19966.1|	  434 residues, 50 /line  hypothetical protein TVAG_402200 [Trichomonas vaginalis G3]

---MPFIANYKATLKCGQERKFKISLNTTEFVQSN-

-YSRFKCHNKFY-ETRWCEG---KNIGFINKN F--TFYSKAEINFDKPFLVPGPRAPPFDKIDERWNGEPII

--MKTLYNDTIP IIRGNSYVYGTFW-NEQML--WHSIFDFIVPFLTFTK--Y --FTKDNRENRTI--FVHHY-GDLEFSEYLQT I--G--EIK---ILER-ENDFLME HCYVGIDKFEDNPYDNRP---FDDSISFS--Y NFLRSDYNNLRNQTLLLNN---VS LLGFGINNKPL--VLIIDRN---TSKRNITNQNEFYLTI-KKIF -NDCE---VININLDHMHPRDQLYYFARCSFVIGVHGSGLTNVVFMNNYCSKRKTHLLEI LPLN-YSCRNWFNVACNYSG--VRYHKIMS-NQT-- --IHEDYNT--KNCR---KYSY-KCST---SSCHDILRDQDITVPIHE FEEILNEIH---

NEI-KDSETFNEFGVVPIYRENDEIEEIDDDL >gi|123457421|ref|XP_001316438.1|	  483 residues, 50 /line  hypothetical protein TVAG_298350 [Trichomonas vaginalis G3] ---MASLILTFSFISFACAMVYSKHFIGEDNYSNKCIIKDGKCHFTIKDVDNKLTFFI--

-PVMAANASGSLRKFCNVSDKMTC ALPLFFNGSQKIYIKHENTIVRTLNAHYTHGQFECFGPDTWDRRLCRF---ANLSFAHDK FFFFPPYDIK--

WASPIMIASCRALPIAPW--EGSVYMNNYKGPPYENL--- SYRPGKYMYNHPGYLTYSL--WHGMIEQTIPLWQTWYT-- --YMNRDPDTVWLVK--RGLLQSVRYSDIAMF MSPAE---VLE---EWATYE EVFMGMTKVIDTKWHIPKEREKNPPKYQLEWFNFENITDWKVLKQLFWKRYN

-PPTFPQNKP--LVLFIRRASKRKIVNQQEAYERLVKE-FPQVN ITLIEPEWYEYEEQMGLFEAADVVIAAHGMALCQVLWMKPGK-SVIEI FPYGI-EARDWYKYLSLLNG--LHHQYYAPTFNRFEEENKKDKRLWE- CMQEEPL--KYDCLDKTLFTDAWVDIDQ LVVMTRKALID-

---AGVKL >gi|125829255|ref|XP_001338543.1|	  431 residues, 50 /line  PREDICTED: similar to glycosyltransferase [Danio rerio] MLLLVALCLLCNNKTVSATDSSRTPQLDYNSLALPQRHIPFFLHNNKPLAKLCKEDPLCP FKDALLLRKACWGYEKSCSAEHRF --SYPVCTSLDSGWANSIQAAQELFWKQADFGYVRERLNEMKTL CKPSKPADSSLKCSS---HMRFCRATNLY---LDLRSPRRGHER

F--- ---SELQTYSELDF-HPLDD---GHCDVII-- --DRPTVFMKLDA--GVNM--YHHFCD-FVNLYISQHLNN -SFSRDIN--IVMW-DTSVYGYGDLFSETWRA F--T--DYD---II---HLKNLD-

---SKRQGQVR--VTLLARS---TEYRRIINQQELINAL-KTVP LFEVKLVD---YKYKEMPFLEQIHVTHNSDIFIGMHGAGLTHLLFLPDWA-VIFEL YNC---QDESCYRDLARLRG--VQYMTWQ-KRDK-- --VFPQDKGH-HPTLGEHP--KFTNYTFDVEE FMRLVLLAA---

EHV-TRHPD-WRAKQSREEL >gi|58036800|emb|CAE45897.2|	  459 residues, 50 /line  hypothetical protein [Homo sapiens]

YKKHLEKLKYCWGYEKSCKPEFRF --GYPVCSYVDMGWTDTLESAEDIFWKQADFGYARERLEEMHVL CQPKETSDSSLVCSR---YLQYCRATNLY---LDLRNIKRNHDR FKEDFFQ-SGEIGGHCKLDIRTLTSEGQ RKSPLQSWF--- ---AELQSYTQLNF-RPIED---AKCDIVI-- --EKPTYFMKLDA--GVNM--CHHFCD-FINLYITQHVNN -SFSTDVY--IVMW-DTSSYGYGDLFSDTWNA F--T--DYD---VI---HLKTYD--SKRVCFK EAVFSLLPRMRYG--LFYNTPL-IS--G-CQNTGLFRAFAQHVLHRLNITQE

---GPKDGKIR--VTILARS---TEYRKILNQNELVNAL-KTVS TFEVQIVD---YKYRELGFLDQLRITHNTDIFIGMHGAGLTHLLFLPDWA-AVFEL YNC---EDERCYLDLARLRG--VHYITWR-RQNK-- --VFPQDKGH-HPTLGEHP--KFTNYSFDVEE FMYLVLQAA---

DHV-LQHPK-WPFKKKHDEL >gi|113476678|ref|YP_722739.1|	  386 residues, 50 /line  Capsular polysaccharide biosynthesis protein-like [Trichodesmium erythraeum IMS101] ---MLYWSDEKNTDLIINDNLKDLARQNGWLF---EVVEKSMSQIFQPSKTIEEDI

IYAIQDWGKILNNKNDKELKDIII PRENNF-- -YHLYCVTSSEIGETFRCTIPNATILEP NGLVLTSDFEIITQSVMSEKLKLDFNLEKI-- ---KEAINNSEKLL-- GTYVSLLSD-YSLNY--AHWLMDGLPKLALLES--- --LKQELK--FIIPKNSPSY-IIDSLK- LL---GIKEQ---QLIKIQH -PCLV--V--EKLILIHGAQK--NGRVCKKYILKIRNKLLQA--

--INDNNKPNK--LIYISRSN---YTRKIINESEILPII-KKYN -FEILRCE---ELSFREQINIFSQAQVLLGPHGAGIYNQIFCNRGA-IIIEI YNKQYW--NHSSRIISSFLN--HNHWHIFG-- -ENVAQDYQTYVEPLK LDKVLSYAI---

NDYI >gi|115434210|ref|NP_001041863.1|	  482 residues, 50 /line  Os01g0119000 [Oryza sativa (japonica cultivar-group)] ---MGSEVKPAKLG-- -LRRHLNAGFFAGFLLVLLTYVIVSQQFAMETPTAV ---TSRAPRIDEN--ESVTKARVETEKKREQEWQRP KD--TSGAVSAEEFSKRDSTNAK---PIENGKVVCGSNGF-YSDTCDV---DGDVRINGT A-LSVTLVPASRR--SERRREWKIQPYPRR--

TVSGIAEVTVTRQQDRAAAPACTVTH-- --GVPGVVFALGG-LTGNY--WHDFSDVLVPLFVASR--R --YGGEVQ--FLVS-NIQPW-WLGKYEAVVRR L--S--RYD---AV---DLDRD---TEVRCFR RVAVGLRMHKEFS--V--KPEL-AP--GG--Q RLTMADFAAFLRDTYALPRAAA-- AGARRPR--LVVIRRAHYRKIVNMDEVVRAA-EAAG -FEAAVMSPRFDEPVEEVARKVNAFDAMVGVHGAGLTNAVFLPAGA-VVIQV VPYGRLE--RMARADFGEPVADMG--LRYMEYSV--AADEST-- --LLEMLGPE-HQVVKDPE---AVHR-SGWDKVA---EYYLGKQDVRINVAR FAATLAAAF---

DHL-RPSH---S >gi|115442317|ref|NP_001045438.1|	  491 residues, 50 /line  Os01g0956200 [Oryza sativa (japonica cultivar-group)] ---MASKLPDL- GGGGVEDGGGKKWPGFVQFFFVLSVVLCVLLYAPRFIVLTPTYG ---LDFFPQPPPNVTTSPARVVGDHNAG EVVVLDNQLRSPCSSLAGDTICCDRSDF-NTDVCFM---AGDVRTDPS S-LSLLLFPKQPPA-ANATVEERIRPYTRK--

WEALIMSRVEEVRL-RMAPPE--EEPGHRCDVRH-- --DAPLLVMTAGG-YTGNL--FHAFSDGFVPAWLTVQ--H --LRRRVV--LGVL-SYNPW-WAGTYGEIISG L--S--DYH---VV---DLLHD---KRTHCFP GAIVGTRFHGILS--V--DPAR-LR--DN--- -KTIVDFHDLLAGVYETAGDTVV---VD DVTQPAPRRPR--LGIVSRRGTRVIENQAAVARLA-RSVG -FDVDILETANGLPLPASYASVSACDVLVGVHGADLTKLLFLRPGA-ALVQI APLG-VA--PIARGCYAEASARMG--LHYEQYDA--EGHESS-- --LSRKYGLR-DVVVSDPE---AAKRDKGWGFVA---RVYLGGQNVTLDLSR FRHTLTRLH---

ARA-LRVRS--LHPAP >gi|115444075|ref|NP_001045817.1|	  485 residues, 50 /line  Os02g0135500 [Oryza sativa (japonica cultivar-group)] ---MKQSMRS-- -RQ-EPRRVSNGVIIAAMLLSLCVLSIVKARYCSTPFVKPDDQL ---QEQMNSSIRMETDEPATM-AAGEQEEDEEEESS GGGGAEPEVSATPAVVVTAAAGGG---GGKRKPTCRMTSK-RSERCEA---RGDIRVEGN A-STIYIGGIDKEWKTKPYARY--

HDPVAMAVVREFTL-KPVTE-SSPACTRNH-- --SVPAFVFSNGG-FSGNL--YHDYTDVLVPLFLSTH--Q --FKGQVQ--FLLS-GLKPW-WVNKFNLFFRQ L--T--KYD---IL---DIDND---KDVHCFP RIVVGATFHKDMG--V--DPKR-SP--GH--- -VSVVDFKRALRRAFGLERVAAS- RGGATGNGKPR--LLIISRKNSRRFLNEREMAQAA-AAVG -FEVRIAEPDQHTDMSTFAQLVNSADVMIGVHGAGLTNMVFLPRGA-VLIQV VPFGGLE--WLTTVTFKNPAKDME--VTYMDYNV--QLEESS-- --LIDQYPRN-HQVLTDPY---AVHK-QGWDALK---TAYLDKQNIKMDMDR FKKTLQEAL---

DRL-PP-A >gi|115727689|ref|XP_791542.2|	  371 residues, 50 /line  PREDICTED: similar to glycosyltransferase, partial [Strongylocentrotus purpuratus] ---LSKFTTWYQYGFDKPQ-GPLDD---

IAVT SKEITLFTSFYKSKLNIDG- -CDSNAEIENT--FVILSRRTNRLILNEVELSLAL-AQHF -DALVVVASLEMYSLSELIGLISCSKGLVAVHGSLLSLSIFLPPCS-VLVEI FPYAVN---PDNYTPYRTLAHLKG--MNIVYRAWRNFDEINTVTYPDAEPEIGGIAHLEP ELQEQILSSAEVPS-HLCCNDP--AWLFRIYQDTIVDVDS FVEVVRDALLESQDGAIENEIGRVPYQPGAVQEVSCFTIPLPSGVVTSEDDDGDDDAVGL LLSWSPPWNIPFIQNTIKADNSITLDYEVTIQEQGKGEVYAGAFVLPMTSHLFKEGFKKG HVYFAWVRCKAGGKT-GPYAA-ITSCPYKE-D >gi|116499226|gb|EAU82121.1|	  426 residues, 50 /line  predicted protein [Coprinopsis cinerea okayama7#130] -MIDRLYLRNGTFYIVTN--DPTFPPRK ALIGK--- PVALSNGVDSEATDKEMQFLSPEEAPGVL--- GDVATLIP

--DVTVFLYDSPQ-FMHHF--YHWWGEIILGMWRVYSTL-ALDHKPSS LDPVGFPLPWPTRFVMPAVSG---AEWRDRAGIIGPTMRAAFPQ ASIEKADYWNDLIKLDTTV---VFERSMII---NRDKAHKHPLSGRWFKMVGGTMGLTGP EFFWEPLRHSLVR--N--TIGYVPVVDSK--G -RILASSLKHTLSSPSESIT--ALEDDM ESPDGRYDLPV--VTYISRQG--SGRRLVAEDHELLV--KSLKDLE---KQG -VCTVLIPQMEKLSIREQIAIIAKTTILVGVHGNGLTHQLIMPPSLR---SATFEI MDPPS--YTFDYEMLARNMG--HKHYAVH-NDTF-- --LTYPRGKT-HNKVHFTKGFHGVSIPV YGPAVADMIR--

---RRLTEPDD-AVED >gi|119500630|ref|XP_001267072.1|	  488 residues, 50 /line  conserved hypothetical protein [Neosartorya fischeri NRRL 181] ---MSWLSLSSQ --R-RVVRLSATVIGVLFVLFLLHVTLTRTRFQYSPLPSSTSG- --PRRNDSDTKGHLPNAEQAPTLP AEYSAVAEEPSYCADQFGITYLEKLRDS-RTEYCTPNSPSGLTCFHSQ S--ASGSRIDTFCFGRGA--VYDP AQRLFVMDCQLRDLGGENVP--TFGKFHNYWYETGPGIVFQKAVS--- --LQGKLDHTVP PVVSNHTILIQRE-GAGNV--WHSLMEIFSMTMTFDVLRMT--- ---AGPNPHRPLFSIGDIENTQVV---ILDEI-EDGPYFDLWKI F--A--QRP---PL---RISDLRP---TNEFE NLIVPLAGGSNPL--W--QGDWEIH--SC-EDSALVHTFSRRVLSHFHVEF-

---RRPRQGPQIVVTFIDRTGSRKLINQEDYFKTV-KKQF -PHIT---VQMIDFASIPFREQLRIAQESDILVGVHGAGLTHGIFLPSGS-VMVEI LPPGL--NHKGFRNLASLLG--HLYFSAHA--TKPAK--- --TVKR-DDW---HNDDVYLEHEK FMELMNVAI---

KAL-YNRG---ERNYD--VN >gi|121918045|gb|EAY22815.1|	  454 residues, 50 /line  hypothetical protein TVAG_075620 [Trichomonas vaginalis G3] ---MSIMTIVGFFTFNL--- TTVLEEPEINFDQLVLTVSNVNKD LYFRFEGVGASAYSRIYPFCKE--NKCEIPLI IGGDVKFSLIYR-RFPIYTKHYIIEHAKMNCTNEPW-TNRICTF---RDICYANKK Y--HLISPYNITFEEKLLC- ---LGAKTPPVDLELN RFENMIDTWHEKPLFGR--- HVVAHSFLVSIYY-NMHML--WHQYFDFLLPLYQTMVR-- --DGPFDNRSIVYLPT-YATSYPMQTNY LSLGNKVAKM---ELDGCFE QLTMGMVKITDLS--L--DKDD-PP--YS-FCNNCSSGLRNIILRKMNIN--

DTSKSPI--AVILARKGNVRFFNVDVVEKVVKKL-LPKYK -VKVEYF---ENVPIEKQMKIMSKASLFVSIHGSGLSHILWMKPGT-CVIEL KTWLH-TCNDWYQKAARATG--IHYMAYYPHETL-- --DKPSYISPY---LQHCI---DNRI-FCGS---KHCKDALRDQNITVNAER FENGIKEFV---

NNH-L--K >gi|123432397|ref|XP_001308412.1|	  295 residues, 50 /line  hypothetical protein TVAG_222780 [Trichomonas vaginalis G3] ---MKTTNTMFQDATFIPN-

QSFIIGVDR-SNRNL--WGDLYDNVVSIYLHLVKDREY-- --TQNERIFT-T-LKFEYPPMLSY LLS-NV---DIERL---QEPHCFE SFSFGIDK---IA--I--GSESY---YYN--YD-IKPNQTINLRNILLSQLDIKKS

---NE--KKVIIHQNTGTGVIRNINDVVDVIKKL-FPDYN -ISIIELN---KLSKIEQIREVSQADVLIGPTSPALSSLVFMKPSS-ILIEI NPYK-YSCLNWYQTAAKGAG--LKFIKYVA--SLESE--- -FISTD-NQILKDCW---DGIV-ECQSIIC---TNLFSMQNIIVDSTN FENVLRKEL---

NQL- >gi|123496899|ref|XP_001327065.1|	  445 residues, 50 /line  hypothetical protein TVAG_411080 [Trichomonas vaginalis G3] ---MKSNICSISSKVDKFI-DTYSMHSLTFKV---PILISSVYKICIYTKNYQQKINIYT NTVN

-CTFSLDEFPFTNYTSIVCFGKSF-NERWCVA---ENACRENLT V--VFSFPYNVKFSSPFVNPSARPSPYS

RDEFIINSNRI-KFLPELPYVE-- --NSTAILCSRYL-NHRML--WHNLVDFVIPIYRAMHT-- --TNISSDCTIHAFD--NDGKYGLFYAN A--L--CQN---II-HEN---SNIYCHK RMIIGVPKTGGSQ--S--ERKLFLN---YDIP RNELIGLRELMLKEAN---S TGCMPSREHPK--VLLIKRRTK-EEKRRLINSDEVSKAI-HEVC -PFCEVL---NTDLQDFNKMQQVSFTCSVSLLIGLHGSGLTHLMWQYPSSKEQKTAVIEI LPYL-YTCRDWYSKLASMAG--VEYFSLKT--LRKNQS-- --RWEKVSDERERSCHSGS---EMCG-KGW--CHDFLRDQSVIVDIDQ FKKLLSSIV---

ENL-TKNR---L >gi|124003265|ref|ZP_01688115.1|	  369 residues, 50 /line  hypothetical protein M23134_01118 [Microscilla marina ATCC 23134] ---MFQRITQKIAAA-LA-- KSPQGTTSLSP--DNAQDYALLYK G-KAYLSQQINAVK-- APQVTLLGSGTPSKHWQDFEATTHAMCIDSTHSGFKFC-- ---CQHLVDPHNHVLVAPGVTPEA LPILQQ-- KLPTKVEKLK-- --GT--VAYLANV-SPRHY--GRWMRETLPLLQIYQQHIGL--- ---EQIDH--FYIGD--LSRIPDF-ISECFE- TL---GISPY---KIVTNPC K---GTRTL--A--AFTVHSPLPHY--YS---QATYTYARQVVTSRLDLSDN

--CCYHP--KVYIARGN--VHRRQVRNQEAVYEVL-RPYD -FELRVLD---NLKVREQAQIFYHAEVLIAAHGSALTNLMYGKPGN-KVLEI LPHDC--ATVGYFSLAAYAA--MPYFCMYG--KATGT--- --AKGCNQDIEVDLEL LDAFCRQH

---C >gi|125539247|gb|EAY85642.1|	  456 residues, 50 /line  hypothetical protein OsI_006875 [Oryza sativa (indica cultivar-group)] ---MAKSAMK-- QGI-WRRRI-GVPFAAVLVAAVLAVVVFSGQFAKGPNDSLSKES PPQSQEGDGGTAESGAE--- --PYIKCT---AQSDIKICDLSNP-RFDICEL---CGDARTIGQ S-STVVYVPQNRA---SNGEEWIIRAQSRK--

HLPWIKKVTI-KSVNSS---EPEPICTSKH-- --HIPAIVFALGG-LTANV--WHDFSDVLVPLFLTAR--Q --FNRDVQ--LIIT-NNQPW-FIKKYSAIFSR L--T--RHE---II---DFDSD---GQIRCYP HVIVGLRSHRDLG--I--DPSS-SP--QN--- -YTMVDFRLFVREAYGLPAAEVD--IPY---K ADKDDPDKKPR--IMLIDRGKSRRFVNVAHVVQGL-DWFG -FEVVKADPKIDSNLDEFVRLVDSCDAIMGVHGAGLTNMVFLRSGG-VVVHI VPYG-IK--FMADGFYGAPARDMG--LRHVEYSI--SPEEST-- --LLEKYGWN-HTVINDPE---TIRK-GGWEKVA---EFYMSKQDIVLNMTR FGPSLLNAI---

EFI-M--- >gi|125559459|gb|EAZ04995.1|	  433 residues, 50 /line  hypothetical protein OsI_026227 [Oryza sativa (indica cultivar-group)]

---MGNDSLCCDRTST-RADICFA---RGDVRMHSA S-ASFQLVSSSSGN---ATAAAVEEERIRPYTRK--

WEANVMATIDEVRL-RRVPAGGAARCDVVH-- --DVPAVVFSTGG-YTGNV--YHEFNDGILPLFVTSN--H --LRRRVV--FVIL-EYHDW-WMTKYGDVVSR L--S--AFP---PI---DFTAD---RRVHCFP EVIAGLRIHGELT--V--DPEK-TP--EG--- -KSIRHFRTLLDDAYRGRIQYLERLERRAARSRKRRAAAAKPTTTSIALPIMAPPA---K QASPSPPDRPR--LVIVSRTGSRVIENEADVAALA-ADVG -FDVRVVRPERTTELCKIYRELNASDAMVGVHGAAMTHFLFMRPGK-VFVQV VPLG-TD--WAAGAYYGEPAARLG--LRYVGYKI--LPEESS-- --LSREYPTG-DPVLTDPA---GVGK-RGWDVTK---KVYLDRQNVRLDLPR FREVLVGAH---

RHL-VAG-KRRRRQRE--SQ >gi|125563028|gb|EAZ08408.1|	  410 residues, 50 /line  hypothetical protein OsI_029640 [Oryza sativa (indica cultivar-group)] ---MEEDLIR--QDI-DQA-

---GTKNGTNHK--PGAPRKPICDLLDP-RYDICEI---SGDARTMGT N-RTILYVPPVGER---GLADDSHEWSIRDQSRK--

YLEYINKVTV-RSLDAQAAPGCTSRH-- --AVPAVVFAMNG-LTSNP--WHDFSDVLIPLFITTR--V --YEGEVQ--FLVS-DLQPW-FVDKYRLILTN L--S--RYD---IV---DFNQD---SGVRCYP KITVGLRSHRDLG--I--DPAR-TP--RN--- -YTMLDFRLYIREVYSLPPAGVD---IP FKESSMQRRPR--AMLINRGRTRKFVNFQEIAAAV-VAAG -FEVVPVEPRRDLSIEEFSRVVDSCDVLMGAHGAGLTNFFFLRTNA-VMLQV VPWGHME--HPSMVFYGGPAREMR--LRDVEYSI--AAEEST-- --LYDKYGKD-HPAIRDPE---SIHK-QGWQFGM---KYYWIEQDIKLNVTR FAPTLQQVL---

QML-R--G >gi|125564041|gb|EAZ09421.1|	  447 residues, 50 /line  hypothetical protein OsI_030653 [Oryza sativa (indica cultivar-group)] ---MKKSREGNLKHV-KGSLCLVP---PLLLAVFFYLQFQTLGLFSPIFRCG GQSAGGGGGDD-YVDRLRASATFLPLKDTREWAETW --FISTLDDT-SEPEG

EAKNIVFPSAAS AGRLLCMS-APS RRDGTRNAYALAWRE--ALPGGAELR-- --PGLAYVSETAY-DHSNL--WHGISALIPFASWHARSG- --CRARPARWALFH---HGEVRLGMSPW-LTSLAEATTGV GMV-VE---TFNASDV---PVCFE EAVVFRRNMAGMT--R--ERLL-- --AAFDFMRCKARAQCGVVA DVSDPDSAA--VRVTILFRTGARAFKDEAAVTRVFKSE--CARVAGCA -LTTARSD---NLTFCDQVKLMSGTDVLISSHGAQMTNLVFMDRNS-SIMEF YPKGWRERAGGGQFVYRWGADRSG--MRHEG--S-- --WWDPHGEP-CPGSPDIL---SCYK-NRQIGHDEA---YFAQWAARVFAAA KERKAGGSPAST

--RRR-EA--PTCQCS >gi|125578938|gb|EAZ20084.1|	  383 residues, 50 /line  hypothetical protein OsJ_034293 [Oryza sativa (japonica cultivar-group)] ---MK--- GGGGGLW-RPRVESRGTFRRRLLTVTAGCFLFFIVFLLSSRHDAIVLLDTRRVRET VTGVETNDDG-AERGAEPAERDNAAPAAAAAISGGDQEAQPGTA-AVDAAPGHDKSLRTA AATGTSPPRHEQPGETTTRADSVDQPRHPLCDLSDH-RTDVCDL---AGDIRMDAN A-SAFVVVVDPAV--GADGPTYKVRPYPRK--

GDATSMGRVTEITV-RTTAAGATAA---

-AVHDDAR---GAGGRVLD-QRVG -FEAVASELDMAGADHDDVARVARLVNSFDAVVGVHGAGLTNMVFLPPGA-AAVQI VPWGGLR--WLARADFGEPAVAMG--LRYIQYEV--AAGEST-- --LKDKYPRD-HEIFTNPT---ALHK-KGFTFMR---HTFLNGQDIIVDIDR FKPVLLRAL---

NSL-A--R >gi|125594130|gb|EAZ34189.1|	  425 residues, 50 /line  hypothetical protein OsJ_017672 [Oryza sativa (japonica cultivar-group)] ---MQQASSH--QHH-YQHSAKPP---VSRSSSWIRRS--PPPSPPHK KLWGGGGGGGG-GRSRYVCRIVPLLVLTVYSIFTVVRIPSSSLVVSTADSERVERR ED---VEAFKTHLPSNQNNLEAREETRSPASL PCSALINGEAGGGQAAAESALCCDRSHY-RSDVCYL---RGDVRTDPS T-SSVLLYNAPRGS-APEKVRPYTRK--

FEGSIMSTIDEVTI-VPVVDAGSGSNGTTAGDTGKDSLRRRCDVRHPP --GVPAVVFSTGG-YTGNV--YHEFSDGLIPLFITAQ--R --FAGEVV--FVVL-EYHYW-WLGRYGAVLER L--T--NYK---VV---DFRYD---RRVHCFS EMIVGLRIHGELV--V--DPKL-MP--NG--- -AGEIMAQIIIRRGGWMDG- -WVSEWIGKKR--WLLQKRCGEKRVCSSQMRGCETDAGGR -IGQPIG- ---ASTTAAQRARVPRR--- ---FCACSEIRASLGT

---K >gi|126647025|ref|ZP_01719535.1|	  324 residues, 50 /line  tetratricopeptide repeat protein [Algoriphagus sp. PR1] --MEEIYV---KR--- -NPP VNLRPEDEKLFLDAYQVSFRVRPI H---

HLENVAILQDTVFSPSHMSFYATHTHVNSLGPLPLGKRVVYC-- ALKKWR-- --TIPHGIWVKDE-WSANY--FHWMTDCLPRLWLGLNTGLS--- --DRVILHDSYRHLPY-VSQSLE- LL---GIQPT-- YYQSQENIW--V--KNLVLTPRTSS--FP--- -NFHEDLTKMTRERLS --VSPKSTPSR--LIYISRKY--ANKRKTHNEIDVELLM-IRHG -FEVIYTE---KMSLKEQIDLMSETKILVSLHGAALTNMLFLPEGS-KVVEL RNNGDSDT-QCYFNLANALN--LPYYYTLN--QGDSQD-- --T--IMTDFTINLES LEETLNQLK---

---N >gi|145356110|ref|XP_001422282.1|	  306 residues, 50 /line  predicted protein [Ostreococcus lucimarinus CCE9901] MSKF---HQ---

---LPLRA---YVDVKVDPV I---

-FTHALNKNH-- --TSNLFVIAPDDKRGANP--FHFAQSAMFFFHSALRTLENSDSSSVVIIFRQRPPAQSW IDSLTQQIFGDVR--- VV---YGDELTS---PICAR RVVVAGT---MIG--LL-QGPYDAQLFRDRVYGNLKINPK

---RINRAD--LRVTLIDR-KKRRVTNVGELQEILDE---RRLW -YKTVRLD---TLSFKEQVSLMSETDLLISSHGADLTNVIFMQRES-AVIEL FPSTVW-YYELYAKIARNAG--LFHTYA LG-DQTH---AVTK-TIAECFESACLTE-LKRDFMIPPER FRTSLDHAL---

SLL-GV--ANAV >gi|147840299|emb|CAN66138.1|	  395 residues, 50 /line  hypothetical protein [Vitis vinifera] ---MNIKIKT--HQR-LED-

---VCCGRLAHSKHSRRHSSPRAPRK--

REVYVLGFADSFGE-YDGP-VA-- --EMDAKTLCSSI-ANGNI--YHEFNDGILPLYITSQ--H --LNKRVV--FVIL-EYHDW-WITKYGDVISQ L--S--DYP---PI---DFSGD---NRTHCFP EAIVGLRIHDELT--V--DSSL-VE--GN--- -ESIRDFRNLLDQAYLPRIRSLIQAKEQKVQSKMKEEPSLPPSLKPPLETGK EEQVDQLKKPK--LVVLSRTGARAITNEDLMVQMA-KEIG -FQVKVLRPNRATELAKIYRVLNSSDAMVGVHGAAMTHILFLQPGS-VFIQV IPLG-TE--WPAETYYGEPAEKLG--LKYMGYKI--LPRESS-- --LYNEYAKD-DPVLRDPE---SLAK-KGWEFTK---RVYLDRQTVTLDLRR FRKQLVCAY---

DYY-ILK--ASRHSHF--LS >gi|149119468|ref|ZP_01845941.1|	  399 residues, 50 /line  Capsular polysaccharide biosynthesis protein-like protein [Methylobacterium sp. 4-46] ---MTPPTAG---QVLAGTV---VD--- -DHAVAADYPDARRVAMRA-

LQLWPDFRWTTQELVSF--- TARDVLVTSAFVPID- TRRSRMFLNQSYSGVETIFPTRFRVEEGRYRLEG-- TPVPCP-- --GR--HIVLGGP-IDGVW--YHWLFNWCPRLLLLGQLRPD---LLACA--- -DLRIAV-HPLALREP-YRAVLD- SF---GLPAE---RFLVLDP GRDHL--L--EEACLVSFLDQ--NR-LYPEMIRAFAAHLLAAWGLDGAGDPG PGPARGPLAAIVRRFAGPNL---G ARGPAPGAAPR--GLFASRQDLPAPKRRIANFEEVAPVL-ARFG -LDVVACG---GLPAREQARLFRSARVVVGGHGSDLSNLLFCRPGT-RVLVF ESRFSVE--AFLHRGLEQLCALLG--LDYVLKIV--PTDGE--- --AGPG-AGTQARINQDYRIDPDD LARTLAALT---

---R >gi|15229594|ref|NP_188446.1|	  470 residues, 50 /line  unknown protein [Arabidopsis thaliana] ---MTKKDIL--YDT-VLARSFSK---TD--- -QKRLCCGAFIASLLLVLTLCTVVKPYLSPL- --PIVELQLSVGTGLRMLSITELTTNTTI--- --SKEEVISECNKMEKPICHCNTLGSKEFCDV---SGDVRIHGK S-ATVLAAVT---FAFSGNSTWYMRPYARK--

DQVPAMKRVREWTV-KLVQNASLSRCVRNH-- --SVPAILFSLGG-FSLNN--FHDFTDIVIPLYTTAR--R --FSGEVQ--FLVT-NKNLL-WINKFKELVRK L--S--NYE---VI---YIDEE---DETHCFS SVIVGLNRHRDYD--K--ELTT-DP--SN--S EYSMSDFRKFLRDTYSLRNSAV-- TTRRKPR--ILILSRSRSRAFVNAGEIARAA-RQIG -FKVVVAE--ANTEIASFAITVNSCDVMLGVHGAGMTNMVFLPDNA-IVIQI LPIGGFE--WLAKMDFEYPSKGMN--LRYLEYKI--TAEEST-- --LVKQYGRD-HEFVRDPL---AVAK-RGWGTFK---SVYLVQQNVSVDINR FKLVLVKAL---

ELL-HN---QSV >gi|16126091|ref|NP_420655.1|	  383 residues, 50 /line  hypothetical protein CC_1848 [Caulobacter crescentus CB15] ---MTAPISL--R--LV--- -VEAR---DLP--PMLPDVLRERF DR---G-ETGVAWAPEHDASVGAP LGVLGGPEATAWPFAISEPPPV---NVPALCA---VGPCWWYP- SFGAVIGN DGALYNATVGEARH-- --GSADLSAIPGVASGGT-RLVPPQ---DAPVLD-- --GG--AVFMPW-GAGFNY--GHFVIDALPSILALEQAG- ---LLHDT--PLLAPRLTDW-QRELI-- AM---ATPGV---RLQEVDA -PAVR--L--GRAVFATSMDH--FL--- -HHPNGLLATLAERVT -ANAPKGAGAR--RVYLSRRG--QSMRVMVGEAAFERAL-QARG -FVIVRPE---TLGARAQVALMRDAEIIVGASGAALANAVFLPRGA-RVIEI QPTNF--TSQWVRAACRQVG--VEWRGYVCASP--- -CPAHAAPLLARLR-RGFKFAFRPDLDD LLSFVDAA

---L >gi|2558980|gb|AAB81629.1|	  448 residues, 50 /line  unknown [Listonella anguillarum] ---MRDSYIF--I--MNKLK---IV--- -SI---LKVFY--YMLPKFIRVQY SD---SVTVLRNMALGDKSLHNDF---FVENKIKLVKELESLGA TFDIITHIIGRKNII---GAPAIYIDNV-RCFRPSL---EG--- --GLLDVKVIHLFHVTLIGS TDGVIYKD-KMYHQELLSMRHTNDLKQP --DIFV-SQNFVKIHNYDYLVR---SRKNVLNIE-- --GP--AISLLKE-HSSNY--YHCVTEILPKLQQILSCVPS--- --NKDSFS--ILIDDCMPIQ-VVNMINVILSA YTCF--QYE---LI---KVEKG---QKVNCNE VI-YCTPLWLSL--DNTQYLPDPKN--EF--- -FVSVDSLKKLKGHISSVL- -FAPTVSSKYR--KVYLQRQN--NRLRKISNILEVERVL-YKHG -FEFVNTG---TLSFQEQYELFSDTDVVIGVSGASFTNILFMQRNS-KAILL SPSAQCTNYYIFQPLADVSE--VELVHLLS--KPDDDS-- --NSL-HGDASVNVEE LELFLSEMSC--

DIYR >gi|46241628|gb|AAS83013.1|	  377 residues, 50 /line  hypothetical protein pRhico015 [Azospirillum brasilense] ---MGHPDGA--A--WGLRW---NS--- -ARMRP--TQIA LP---DDSVILTLTSPGFDAAYPRLVNG-DLI PDSVRQVMEWAWSTLRFP-- -ERPVRVARLADVWVAKEGLVFDR GGNLYRE--TITQHSETEIDQAH- ---DAVLASMRHWE---EMGWAADRE-- --GP--VLLCKKR-GVGNY--GHWMMEMLPKAHLVHDRLSD--- LGSR--FLVAQ-APEHLNNS-MAFSLS- ML---GIDLA---RTIVADD TPRRF--A--DLLLVDGLTEH--GG--- -YMSPLVLDTVDAM-- -ARDVASAGVE--QLFVTRRS--TGIRRIVDEDALAAQA-EARG -YRVVEPG---LLDLPQQIALFKGASRIIGVMGAAMTNIAFAPPGA-RVINL TPAGM--PDTFFWFIATLRG--LDYTEIRC--AQSGPV-- --RGI--MPWDTDLILSPDN RDSIFA--

---D >gi|53792588|dbj|BAD53603.1|	  465 residues, 50 /line  putative HGA1 [Oryza sativa (japonica cultivar-group)] ---MKAAVRS--K--KS--- -KGSFCHPPLLLLIVAIQF---LVIYS--PTLDQYM -VMLTTGKPGFPSMLIDGRRSFKQVD-- -EFIPEPHLRCDFRDN-RSDVCEM---EGAIRILGR T-SEVFLVAPSLASISGGGGGVNATGVDANATRWKIQPYTRK--

GESRVMPGITEVTV-RLVTADEAPPCDEWH-- --DVPAIVYSNGG-YCGNY--YHDFNDNIIPLFITSR--H --LAGEVQ--LLVT-QKQRW-WFGKYREIVEG L--T--KYE---PV---DLDAE---QRVRCYR RATVGLHSHKDLS--I--DPRR-AP--NN--- -YSMVDFKRFLMWRYALPREHAIR MEEEDKSKKPR--LLVINRRSRRRFVNLDEIVAAA-EGVG -FEVAAAE--LDAHIPAAASAVNSYDAMVAVHGSGLTNLVFLPMNA-VVIQV VPLGRME--GLAMDEYGVPPRDMN--MRYLQYNI--TAEEST-- --LSEVYPRA-HPVFLDPL---PIHK-QSWSLVK---DIYLGQQDVRLDVRR FRPVLLKAL---

HLLR >gi|56409864|emb|CAI30080.1|	  492 residues, 50 /line  glycosyltransferase [Zea mays] ---MKTRSSA--R--GE--- -PRRLGNAALLALMLCSVVALSLIRGRFAPI--VTTAGDAIKSE DD---AAAAALSVSKAAVNVDTGDSADEAAAEAAAEEKEKEEVQ PKPADSSGSGSGGSA---AKPVCYETSR-RSDTCEA---AGDVRVVGS T-QTVYVDSLDREWKTKPYCRK--

HDNFALAHVKEWSL-KPLPSGAAPQCTVNS-- --SATAFVLSTGG-FTGNP--FHDYTDVLIPAFITAH--P --LRGEVQ--FLVS-SYKSW-WMNRYIQIFQQ M--S--RHE---VV---DIDAD---DEVRCYR SVVVGATFHRELG--V--DASK-SP--PG--- -YSTADFRKMLRDAFGLERATATP---S GDRWDIRRRPR--LLIISRRP--SRGRAFMNERAMADMA-ASLG -FDVRIGEPDTSTDTSKFARLVNSCDVMVGVHGAGLTNMVFLPAGA-VVVQV VPYGRLE--WLARNTFAEPSAGME--VHYLEYVV--QLDETT-- --LSEQYPSD-HPVLRDPM---AIHK-QGWNALK---TTYLDKQNVRPHLGR LKNTFLQAL---

KML-PH--GRDD >gi|58265524|ref|XP_569918.1|	  461 residues, 50 /line  hypothetical protein [Cryptococcus neoformans var. neoformans JEC21] ---MRAALVL--F--- --LAVGLLPSALAASSLPS--QVLS--- -HGPTTLVSGLPGFTVLDNVWYRNRTFYVLE---DESEIPQTDR LLTLSRSNSGTQSVERVNWKEMVFYDG- --E---DGSPKEAQAKPDVEIKELHGIT

---LFFNDG-WDGKWSGYKWLYHMVAEALLGSLSVLS---SVPPLPTS IQSQGQDQGQDTRQGLVTYGGDGELPDR--LVIAWDYNWDARYGLPRAVAEALFGD DKLIEPEEWTQMTSQDTWI---YFERVLLV---DRNTA-H RHNLLARQWFKMA--V--DAYRLASSPSF--- ---FFPTRHALLSHY-GIRTYTRS--AP -GLRLSGKKPK--IVYVDRQR--TQRK--FDVEVHTQLLKQLKNIEKAKKAV -VVDAVLE---DLEKKEQFEMFSDADIILGIHGNGLAHELWMPEGG-IIIEI LPPPT--FQYDYAPVSAVLG--HMHIIWQYDK --IYPRYKWI-PENRKNETLIHD---GSPIPLDVDP FTKLVEALV---

DSM-S---FSYH >gi|87309616|ref|ZP_01091750.1|	  397 residues, 50 /line  hypothetical protein DSM3645_02353 [Blastopirellula marina DSM 3645] ---MRL-KSETI---KQ--- -LRCRLLNTWWRLFG--VPAPRGGCL-- DSPLDFCLEEPARQSFPRRT-MFG AVDQVGQDIEALIS-- --AGLLYETDR---DWNGESTIDYPPGGVTLLEQGSVISR QGILFTPKHGVLENLGGGSLA--- AVSGVGTSFT---HLPRPRRID-- --GN--VLVMTRGLAQRNY--YHWTFEMLSQLRLVEQSG- ---VSFDY--VAAP-KRHAF-ASESLQ- LL---GIERS---QILPMGH YTHIQ--A--KQLIIPSVACY--- -FPQPAGVAYLREKMQT-QA -WSHYERDDRL--KLYIARRR--FTSRYIVNEAELFAAL-KPLG -FQQVYLE---DLPLKKQIQLFQQAGVIVGPHGAGFSNLVYSRPGT-AVFEI TPTCR--PPLFFHYLAEINA--LQYAVYFG--QPVGQ--- ---RGMDANIRVDVPQ LRQQLTSFLAE-

-AAGDYS-RAAA >gi|86147246|ref|ZP_01065561.1|	  432 residues, 50 /line  Capsular polysaccharide biosynthesis protein-like [Vibrio sp. MED222] ---MLLRSLY--Y--LFPRF---IR--- -HQY---IDSIIFYRHVFF--RLISLFKSKEN KP-EENRFDVRLVGDLELLGGG-CEIIQHVSERYASVQGP

---LLYVDNQE---CKRSSLEGRLPDTKVVRLSGVQVIGS TDAVISGI-NMY HHELSLMENIHDLKRPDI-FLKYEELEGFDFQIS---FIREKLTLD-- --GL--VVSLLKE-HSTNY--YHWVTEVIPKLANMMEYIES--- --KDEKIT--ILVEEGTPQQ-SLSLIELLLSE LKNT--EYH---LC---HVKKG---QLVYCES LI-YCTPLWTSL--DNTRSLPNPKK--EF--- -FVSSDCLKKVKDKLSK-NT -LSNNYILKNK--KIYLQREN--TKLRKLSNVLDLERLL-YRKG -FDFVDPG---SLDFFEQYNLFSQAEVIVGASGAAFTNLLFMKPGS-TAISL YPSAQSTNYYVFQPLADVSN--VHLIHFLT--TPDDNS-- --NSV-HGDANVDVKE LEKLLEKLD---

---D >gi|69285556|ref|ZP_00617001.1|	  392 residues, 50 /line  similar to Capsular polysaccharide biosynthesis protein [Kineococcus radiotolerans SRS30216] ---MRSVNAG--W--- DYLVRRGADHHG RR---VRKALAHVRRAPVPLVGSLDLAAAGRAARVEVQPGQDVRMERP

--AALSPADWR---AFRHRDVSTLPPQFVLDVPDALVLGR NGWVAVED --GGARRVVSDLWQEVGL-ETGD---MVQPGLLATRPDERLP-- --GT--TVSLLLP-WMPNY--YHWTLQSVPRFDMVAGVLDP--- ---ASVDQ--WLVPPQSSPF-VREWLD- LL---GIPQD---RRVEVEP SGRV---LS--L--ERLVVASVPAR--NR--- -YVPPHVLDSVRARLD --LRRRDDLPR--RIFLDRPA--TDKRRLLNRDRVLTAV-RSGG -FEVVEAG---ALSVADQAALFASADVVAGVLGAGLTNLVYCYPGT-TVVEI LPRNL--MFPAYYKLCAAAG--LDHRLVTG--REPRLI-- --GP-L---RFPDTEADVLVDVAT LEQTLQDVL---

---T >gi|69285555|ref|ZP_00617000.1|	  398 residues, 50 /line  similar to Capsular polysaccharide biosynthesis protein [Kineococcus radiotolerans SRS30216] ---MVPRRLR--C--QSSAV---RS--- -NQR-VGWRYLLASAIGYRL SS---GRAWCRSLLARRVDMVSLEQLRE-NGATLRETLPSRKVRLTVP

--SDLRASDRS---ALRMRDVREVPAQAVVELSGATVLGR EGWVFVDG---R LVDGIWQEVGFPAR-RML-PRGR---LEKPAHLG-- --GT--TASLLMP-WLPNY--YHWTTQAVPRVQMVKDVAGD--- DVDH--WLIPADPPSY-VLEWLD- RL---DVPVE---RRVEVRG RRQV---FA--V--DRLVVSSVPGA--NR--- -WVPSWVVDHLRKQ-- --FPPPPEHGE--RVFVDRPE--TDRRRMLNREDVVAAL-RGRG -FRIVDLA---SLTVQEEAVLFGSAAVVVGVHGAGLTNLVFCRPGT-VVLEL APRGL--VFPTFAKLADAAQ--VTHHLLVG--TEPALP-- --R---PLRF-PDVLADVVVDIPA LTRLLDPVLT--

-RLG >gi|6735317|emb|CAB68144.1|	  470 residues, 50 /line  putative protein [Arabidopsis thaliana]

MVQYKRLIKKGEKHRLSVEEGGSGASA--VTVSGGAFSR- ESKGFGPYELFIAPLC SGTSN-GTICCDRTGS-RSDVCIM---KGDVRTHSA S-SSVFLFTSL---KNKTKITKKIKPYTRK--

WETSVMQTVQELNL-VYRDEENNSLVVSSVNDICDVFY-- --NVPAVFFSTGG-YTGNV--YHEFNDGIIPLFITSH--H --FNKKVV--FVIV-EYHSW-WIMKYGDIVSQ L--S--DYP---PV---DFNGD---KRTHCFK EAIVGLKIHDELT--V--ESSL-ML--GN--- -KTILDFRNVLDQAYWPRIHGLIQEEELKAAN -KTEDGFKKPI--LVILSRNGSREILNESLLVELA-EEIG -FIVHVLRPDKTTELAKIYRCLNSSDVMIGVHGAAMTHLLFLKPKT-VFIQI IPIG-TE--WAAETYYGKPAKKMR--LKYIGYKI--KPKESS-- --LYDEYGID-DPIIRDPK---SFTQ-KGWDYTK---KIYLERQNVKLDLKR FRKPLSRAY---

DFS-MKRIG-LVYISHKPDV--TN >gi|114321517|ref|YP_743200.1|	  373 residues, 50 /line  Capsular polysaccharide biosynthesis protein-like protein [Alkalilimnicola ehrlichei MLHE-1]

MSPWVRAVDR-LLGTDFNSHPACAWQP--SPVPLHAIEQA GD---GAVDQAV

NWRQTPPIAPVGVGRVRRPLILLPSPAPQLAHDPLRRRAVILTSGGRPVRYP KSAPALRHLLRGGWRYSA-RLGR---AARPAVRL-- --GTVAVLGNHDP-GCNNY--YHWWADTLADLWFLRESGVD--- --LGRVDS--FLMAYGGYPW-QQQSLA- LC---GIDQE---RVVAFA- ---DHPALT--A--EQALVPVRSRG--SW--- -VSPVWLARALRELT---GW -RPPAVTTPGR--RIYLSRRD--APRRQAANEAAVERLLVDESG -FESHQCS---GLSVPRQQALFADAEVIVAPHGAALTNLVWCRPGT-RVVEL VPEGH--RNPCFRDLAAQSG--LDYRAILC--PATGAG-- --GGL-TADIQVPLAR LREALAG-

>gi|149122431|ref|ZP_01848793.1|	  488 residues, 50 /line  Capsular polysaccharide biosynthesis protein-like protein [Methylobacterium sp. 4-46] ---MTL-RPRTG---SV--- -KAL---GGT-RPGARPAIPTKRHLSC--VAAT--RLMTA RG---ME---LDPMATSIAGSAWLYKQSLDDPGRIV KLDSSGKILGRDHSL---ECNWLYVDGR-LVFRDFS---GHDVAVFPQ PLFFDAPRRLTGWSA---SCADAPRWLLRLDDLVPLQSGSAYDL AAEVREVAHAVAFTCPGPAYGDGDAAPTGYTAGKY---NMLTLRDVDLLTTHGAIEKAGV VAEESLFHFPFHLEDRFI-RFPD---GTFARNAGDPQL-- --SIARARYACAG-INENY--YHWMMFFVGKICLHGETRA --SGEGAV--VLVP-EYRN---DV-QKRTAE- -LVAKAYG LNLVQLRRCDRVR--V--DELLLPHQHGS--YG--- IDPHPVVLRAFALIK---AA -QASAAPGAGR--RLYISRAD--SHYRRLENEREIETLL-AGRG -FDVVRLA---DRTLEQQISLLATAEVVVSPHGAGLTNLGYCEPGT-KVLEF HSPQYL--NWCMRNLSIAAG--LRYGFLMG--EATEGD-- RYRVAVAA VDAAVTAMLA--

---A >gi|52354423|gb|AAU44532.1|	  466 residues, 50 /line  hypothetical protein AT4G33590 [Arabidopsis thaliana]

MTTKASVWRR-LVTCLSSLKFYLNVLC--LVVTVFVLLQI CS---FQITQRSLSLPPALLTYLKHNHE-EVSENKTASLVEKLRESVT FLPLKDYRFSNKPLEGHTWFMSSLYDNQ-TKG EAQYQEFPSDSS KGRLLCLK-GVD EHDGSWNSYALAWPE--ALPTNAILQ-- --DGLTFVSYNQY-DYGNL--WHGLTAVVPFIAWSLRN-Q --CEKPQK--WVLYH--WGELRFGMGHW-LSEIVTATYGQ E--P--D-FL---RFVDD---DKPVCFE KAVVMRHNEGGMS-RER---R--- -MEAFDLIRCKARNYCNISSSV-- --ASKPRIGMTLLLRTGARSFRNESMVIDVFKKE--CKRVDGCE -ISVSYSN---NLSFCEQVELMKKTDVLVSPHGAQLTNLFLMDKNS-SVMEF FPKGWLKLAGVGQLVFQWGANWSG--MRHEGSWHDPVGEICX-- --FPDTDRRC-MSIYKNAM---IGYN--ETYFGE---WARRVLG -KFS

--IREMKELAE-C-NHSNSS--ILDVCS >gi|56409846|emb|CAI30071.1|	  468 residues, 50 /line  glycosyltransferase [Triticum aestivum] ---HEDTV---RD--- -PQQ-SGKKEPESR-LLGSG--GG EG---EKKGHRKVTLPTVSNYTIRDAEDGDNAKQQDSRPETENKLEMV AGKSDGSQQQDWDDAEWGSKPLCDFSNF-RANVCEM---RGNIRIHPN A-SSVMYMEPA---SSKRNELWKLKPYPRK--

GDELCLSKVTELTV-KSSK--VAPECTKYH-- --NVPVVVFALTG-YTGNL--FHDFTDALVPLFTTAS--E --FNGEVQ--FLIT-DMAIW-WTRKYHVVFKK L--S--NYP---LI---DFNKD---TDVHCAK HAIVGLHAYMEFT-IDPSKAP--HN--- -YTMVDFNRFMRRTYELPREAVSA -LGEIPKAKPR--LLIISRQRTRMFLNLPEIIAMA-EGLG -FEVVVEEANVSSDLSQFSKVVNSVDVMMGVHGAGLTNCVFLPHNA-TLIQI VPWGGIE--GVCRIDFGDPAEQMG--LRYKQYSI--AVHESS-- --LTDQYPLD-HEIFKNPL---AFHK--GFEFIK---ETFMDKQNVRLDCNR FKPVLLQTL---

DLL-N--Q >gi|58039897|ref|YP_191861.1|	  367 residues, 50 /line  hypothetical protein GOX1456 [Gluconobacter oxydans 621H]

-MPLFSRLRR-LFSP---PA GP---SGLA--EIARSTTILETCPVRPVPAPCASA-LSHPERNP F-RDWESMPVTVSQFA--LRDVVL D-QPLMTLLHA---GYPVTETAYVQD--

-PEAVRNLKL-RSAD---IVRCAPFK-- --GV--TASCVDH-WASNF--YHWVAHTVPTLHVLSQ--A --GRPVRL--GLPE-HMHPW-QFETLE- LF---GLNGD---AHIRLQQ GRQYAFQALDYI---AFVNGS--AD--- -FAVSDLSRAAYARLR--QA -AGATTPSAGR--RLYIERGS--SANRHVPNEAELAAGL-EKLG -FERVHPE---TLSLSEQIRLFSDAGMVMGMLGAGMANIAWCQPGT-LVYEL VPSHH--INPCFAAMATQGG--LKYWADVF--ETGAAR-- --ENHTDDAAIPLSVADILD RVRELVALLPD-

---A >gi|71663377|ref|XP_818682.1|	  362 residues, 50 /line  hypothetical protein Tc00.1047053509733.95 [Trypanosoma cruzi strain CL Brener]

-MGHTTKDAPHL-MTF L-MDYFAP C-STPCQRASQ---GESAAKRLRVQ---LTVL YGNVCTSY-PAP KLDEAFQKVILGWFHAVF-RGD-- ---SP-FIELM--GSWGIDFVPPAGASGS--G --ALLIKE--VSYK-MAMSY-GGFFCP---RD E--G--TVPTT---YTPASMVS---ERSTS---GLWIIT- -RWERFRWFR-TR--- -AQASLFRRCLLHYYK--VP -SRTGDH---S--LLLHRRLN-ERHFDELHWQKKLQAR--LEP-RGVS -VMLQTFI---SMEYHHQASFMHNSSIFIAAHGAGMVNIMSMSPGS-VVVEL FPHGF--RYAMYQELAELLG--LHYIAYES--PSVWPP-- --RCCIQREK-GSAAQHTPPLHGTPPRTSF--GMRSCKGCDINV LEEDMEAILFDA

--LGIVSADIC-L-HS-ASI >gi|83815193|ref|YP_444756.1|	  417 residues, 50 /line  hypothetical protein SRU_0614 [Salinibacter ruber DSM 13855] -M-EIEVI---SI--- -MESYGMFCLLWRS-IMSR---II FP---LGRTTRNLLSKTMCHLTLPMRWLPSDSKSFGPPRGYYHHARTY V-DQHDGRYQTVFPER--KRVHAE P-SSIYSSTHW---KFKNEKESTLREDYVATIPKGRIVGT PGDVVTAN-DRL LADASKQLATEAQCHHLL-RKPW---LPTLEKID-- --GN--IAVLASD-RGSEF--YHWFVDVLPRIYLVNK--S --KERIDY--YYVP-DDDSY-KKKTLQ- KI---GIDSG---KIINPS- -QDHHIEAAKVI--VPSLPRT--FG--- -NVPRWSTEFLRKRLI--PT -VDEANSKLPS--RVYIDRVN--VLRRKVANRERTINFL-KKYN -FKPVRLE---NYKWDKQVSIVRNASIIVAPHGAGLVNTIFCSDGC-NIIEI FSPNY--MNLCYWKLLQNLN--VRYHYIIG--SGKRPK-- --KGN-DPHYGWD---PIEVNIDA LENTLEAIL---

---R >gi|56756779|gb|AAW26561.1|	  369 residues, 50 /line  SJCHGC00943 protein [Schistosoma japonicum] ---MEVANQPESNELLR--- -FQHGFIRTYVET---

-NITEKLLHS--

YETNLIDFIKSMKLFQSVNSERTNYY-- --KEKVVFIVTRV-EYANL--YHTMTDWY-NAFLTMKLLS -LKPTNIH--ILIADGHPI---GNLDEV-WSKLFYNSLSR IGAYRLPYRTNLHRALPIDNKD---GLLHIAK LVLVPYGYASPLYVDRPLIK NMFIEEFRQFIFQSYNINNDEDTC QKRTSIRFLPK--IVIVSRRDYIAHPRNINGTIHRKITNELELLNEL-NQLG -FQNSKVVCFTDLTMQEQLKLIMSTDILIGMHGAALTYSLLLSNTS-CVIEL FPNYCCQTSQHFLKLTKLRH--IHYTTYYG--LAEND--- MNGDTSYIPVDI FKSLVFQTY---

RKW-KKQI--QKKHM--DCL