From d9bfdb5e19c87261e64c22fd3770d8d8ae3911a9 Mon Sep 17 00:00:00 2001 From: Ben Webb Date: Tue, 10 Sep 2024 15:21:40 -0700 Subject: [PATCH] Add UniProt accessions for all sequences --- rnapolii/data/1WCM_new.fasta.txt | 24 ++++++++++++------------ 1 file changed, 12 insertions(+), 12 deletions(-) diff --git a/rnapolii/data/1WCM_new.fasta.txt b/rnapolii/data/1WCM_new.fasta.txt index dbe4087..2bb8543 100644 --- a/rnapolii/data/1WCM_new.fasta.txt +++ b/rnapolii/data/1WCM_new.fasta.txt @@ -1,4 +1,4 @@ ->1WCM:A +>1WCM:A|P04050 MVGQQYSSAPLRTVKEVQFGLFSPEEVRAISVAKIRFPETMDETQTRAKIGGLNDPRLGSIDRNLKCQTCQEGMNECPGH FGHIDLAKPVFHVGFIAKIKKVCECVCMHCGKLLLDEHNELMRQALAIKDSKKRFAAIWTLCKTKMVCETDVPSEDDPTQ LVSRGGCGNTQPTIRKDGLKLVGSWKKDRATGDADEPELRVLSTEEILNIFKHISVKDFTSLGFNEVFSRPEWMILTCLP @@ -21,7 +21,7 @@ FDVMIDEESLVKYMPEQKITEIEDGQDGGVTPYSNESGLVNADLDVKDELMFSPLVDSGSNDAMAGGFTAYGGADYGEAT SPFGAYGEAPTSPGFGVSSPGFSPTSPTYSPTSPAYSPTSPSYSPTSPSYSPTSPSYSPTSPSYSPTSPSYSPTSPSYSP TSPSYSPTSPSYSPTSPSYSPTSPSYSPTSPSYSPTSPSYSPTSPSYSPTSPSYSPTSPAYSPTSPSYSPTSPSYSPTSP SYSPTSPSYSPTSPNYSPTSPSYSPTSPGYSPGSPAYSPKQDEQKHNENENSR ->1WCM:B +>1WCM:B|P08518 MSDLANSEKYYDEDPYGFEDESAPITAEDSWAVISAFFREKGLVSQQLDSFNQFVDYTLQDIICEDSTLILEQLAQHTTE SDNISRKYEISFGKIYVTKPMVNESDGVTHALYPQEARLRNLTYSSGLFVDVKKRTYEAIDVPGRELKYELIAEESEDDS ESGKVFIGRLPIMLRSKNCYLSEATESDLYKLKECPFDMGGYFIINGSEKVLIAQERSAGNIVQVFKKAAPSPISHVAEI @@ -38,36 +38,36 @@ LKFVKVRVRTTKIPQIGDKFASRHGQKGTIGITYRREDMPFTAEGIVPDLIINPHAIPSRMTVAHLIECLLSKVAALSGN EGDASPFTDITVEGISKLLREHGYQSRGFEVMYNGHTGKKLMAQIFFGPTYYQRLRHMVDDKIHARARGPMQVLTRQPVE GRSRDGGLRFGEMERDCMIAHGAASFLKERLMEASDAFRVHICGICGLMTVIAKLNHNQFECKGCDNKIDIYQIHIPYAA KLLFQELMAMNITPRLYTDRSRDF ->1WCM:C +>1WCM:C|P16370 MSEEGPQVKIREASKDNVDFILSNVDLAMANSLRRVMIAEIPTLAIDSVEVETNTTVLADEFIAHRLGLIPLQSMDIEQL EYSRDCFCEDHCDKCSVVLTLQAFGESESTTNVYSKDLVIVSNLMGRNIGHPIIQDKEGNGVLICKLRKGQELKLTCVAK KGIAKEHAKWGPAAAIEFEYDPWNKLKHTDYWYEQDSAKEWPQSKNCEYEDPPNEGDPFDYKAQADTFYMNVESVGSIPV DQVVVRGIDTLQKKVASILLALTQMDQDKVNFASGDNNTASNMLGSNEDVMMTGAEQDPYSNASQMGNTGSGGYDNAW ->1WCM:D +>1WCM:D|P20433 STSTFQTRRRRLKKVEEEENAATLQLGQEFQLKQINHQGEEEELIALNLSEARLVIKEALVERRRAFKRSQKKHKKKHLK HENANDETTAVEDEDDDLDEDDVNADDDDFMHSETREKELESIDVLLEQTTGGNNKDLKNTMQYLTNFSRFRDQETVGAV IQLLKSTGLHPFEVAQLGSLACDTADEAKTLIPSLNNKISDDELERILKELSNLETLY ->1WCM:E +>1WCM:E|P20434 MDQENERNISRLWRAFRTVKEMVKDRGYFITQEEVELPLEDFKAKYCDSMGRPQRKMMSFQANPTEESISKFPDMGSLWV EFCDEPSVGVKTMKTFVIHIQEKNFQTGIFVYQNNITPSAMKLVPSIPPATIETFNEAALVVNITHHELVPKHIRLSSDE KRELLKRYRLKESQLPRIQRADPVALYLGLKRGEVVKIIRKSETSGRYASYRICM ->1WCM:F +>1WCM:F|P20435 MSDYEEAFNDGNENFEDFDVEHFSDEETYEEKPQFKDGETTDANGKTIVTGGNGPEDFQQHEQIRRKTLKEKAIPKDQRA TTPYMTKYERARILGTRALQISMNAPVFVDLEGETDPLRIAMKELAEKKIPLVIRRYLPDGSFEDWSVEELIVDL ->1WCM:G +>1WCM:G|P34087 MFFIKDLSLNITLHPSFFGPRMKQYLKTKLLEEVEGSCTGKFGYILCVLDYDNIDIQRGRILPTDGSAEFNVKYRAVVFK PFKGEVVDGTVVSCSQHGFEVQVGPMKVFVTKHLMPQDLTFNAGSNPPSYQSSEDVITIKSRIRVKIEGCISQVSSIHAI GSIKEDYLGAI ->1WCM:H +>1WCM:H|P20436 MSNTLFDDIFQVSEVDPGRYNKVCRIEAASTTQDQCKLTLDINVELFPVAAQDSLTVTIASSLNLEDTPANDSSATRSWR PPQAGDRSLADDYDYVMYGTAYKFEEVSKDLIAVYYSFGGLLMRLEGNYRNLNNLKQENAYLLIRR ->1WCM:I +>1WCM:I|P27999 MTTFRFCRDCNNMLYPREDKENNRLLFECRTCSYVEEAGSPLVYRHELITNIGETAGVVQDIGSDPTLPRSDRECPKCHS RENVFFQSQQRRKDTSMVLFFVCLSCSHIFTSDQKNKRTQFS ->1WCM:J +>1WCM:J|P22139 MIVPVRCFSCGKVVGDKWESYLNLLQEDELDEGTALSRLGLKRYCCRRMILTHVDLIEKFLRYNPLEKRD ->1WCM:K +>1WCM:K|P38902 MNAPDRFELFLLGEGESKLKIDPDTKAPNAVVITFEKEDHTLGNLIRAELLNDRKVLFAAYKVEHPFFARFKLRIQTTEG YDPKDALKNACNSIINKLGALKTNFETEWNLQTLAADDAF ->1WCM:L +>1WCM:L|P40422 MSREGFQIPTNLDAAAAGTSQARTATLKYICAECSSKLSLSRTDAVRCKDCGHRILLKARTKRLVQFEAR