-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathrbd_21mers.txt
272 lines (272 loc) · 5.84 KB
/
rbd_21mers.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
NENGTITDAVDCALDPLSETK
ENGTITDAVDCALDPLSETKC
NGTITDAVDCALDPLSETKCT
GTITDAVDCALDPLSETKCTL
TITDAVDCALDPLSETKCTLK
ITDAVDCALDPLSETKCTLKS
TDAVDCALDPLSETKCTLKSF
DAVDCALDPLSETKCTLKSFT
AVDCALDPLSETKCTLKSFTV
VDCALDPLSETKCTLKSFTVE
DCALDPLSETKCTLKSFTVEK
CALDPLSETKCTLKSFTVEKG
ALDPLSETKCTLKSFTVEKGI
LDPLSETKCTLKSFTVEKGIY
DPLSETKCTLKSFTVEKGIYQ
PLSETKCTLKSFTVEKGIYQT
LSETKCTLKSFTVEKGIYQTS
SETKCTLKSFTVEKGIYQTSN
ETKCTLKSFTVEKGIYQTSNF
TKCTLKSFTVEKGIYQTSNFR
KCTLKSFTVEKGIYQTSNFRV
CTLKSFTVEKGIYQTSNFRVQ
TLKSFTVEKGIYQTSNFRVQP
LKSFTVEKGIYQTSNFRVQPT
KSFTVEKGIYQTSNFRVQPTE
SFTVEKGIYQTSNFRVQPTES
FTVEKGIYQTSNFRVQPTESI
TVEKGIYQTSNFRVQPTESIV
VEKGIYQTSNFRVQPTESIVR
EKGIYQTSNFRVQPTESIVRF
KGIYQTSNFRVQPTESIVRFP
GIYQTSNFRVQPTESIVRFPN
IYQTSNFRVQPTESIVRFPNI
YQTSNFRVQPTESIVRFPNIT
QTSNFRVQPTESIVRFPNITN
TSNFRVQPTESIVRFPNITNL
SNFRVQPTESIVRFPNITNLC
NFRVQPTESIVRFPNITNLCP
FRVQPTESIVRFPNITNLCPF
RVQPTESIVRFPNITNLCPFG
VQPTESIVRFPNITNLCPFGE
QPTESIVRFPNITNLCPFGEV
PTESIVRFPNITNLCPFGEVF
TESIVRFPNITNLCPFGEVFN
ESIVRFPNITNLCPFGEVFNA
SIVRFPNITNLCPFGEVFNAT
IVRFPNITNLCPFGEVFNATR
VRFPNITNLCPFGEVFNATRF
RFPNITNLCPFGEVFNATRFA
FPNITNLCPFGEVFNATRFAS
PNITNLCPFGEVFNATRFASV
NITNLCPFGEVFNATRFASVY
ITNLCPFGEVFNATRFASVYA
TNLCPFGEVFNATRFASVYAW
NLCPFGEVFNATRFASVYAWN
LCPFGEVFNATRFASVYAWNR
CPFGEVFNATRFASVYAWNRK
PFGEVFNATRFASVYAWNRKR
FGEVFNATRFASVYAWNRKRI
GEVFNATRFASVYAWNRKRIS
EVFNATRFASVYAWNRKRISN
VFNATRFASVYAWNRKRISNC
FNATRFASVYAWNRKRISNCV
NATRFASVYAWNRKRISNCVA
ATRFASVYAWNRKRISNCVAD
TRFASVYAWNRKRISNCVADY
RFASVYAWNRKRISNCVADYS
FASVYAWNRKRISNCVADYSV
ASVYAWNRKRISNCVADYSVL
SVYAWNRKRISNCVADYSVLY
VYAWNRKRISNCVADYSVLYN
YAWNRKRISNCVADYSVLYNS
AWNRKRISNCVADYSVLYNSA
WNRKRISNCVADYSVLYNSAS
NRKRISNCVADYSVLYNSASF
RKRISNCVADYSVLYNSASFS
KRISNCVADYSVLYNSASFST
RISNCVADYSVLYNSASFSTF
ISNCVADYSVLYNSASFSTFK
SNCVADYSVLYNSASFSTFKC
NCVADYSVLYNSASFSTFKCY
CVADYSVLYNSASFSTFKCYG
VADYSVLYNSASFSTFKCYGV
ADYSVLYNSASFSTFKCYGVS
DYSVLYNSASFSTFKCYGVSP
YSVLYNSASFSTFKCYGVSPT
SVLYNSASFSTFKCYGVSPTK
VLYNSASFSTFKCYGVSPTKL
LYNSASFSTFKCYGVSPTKLN
YNSASFSTFKCYGVSPTKLND
NSASFSTFKCYGVSPTKLNDL
SASFSTFKCYGVSPTKLNDLC
ASFSTFKCYGVSPTKLNDLCF
SFSTFKCYGVSPTKLNDLCFT
FSTFKCYGVSPTKLNDLCFTN
STFKCYGVSPTKLNDLCFTNV
TFKCYGVSPTKLNDLCFTNVY
FKCYGVSPTKLNDLCFTNVYA
KCYGVSPTKLNDLCFTNVYAD
CYGVSPTKLNDLCFTNVYADS
YGVSPTKLNDLCFTNVYADSF
GVSPTKLNDLCFTNVYADSFV
VSPTKLNDLCFTNVYADSFVI
SPTKLNDLCFTNVYADSFVIR
PTKLNDLCFTNVYADSFVIRG
TKLNDLCFTNVYADSFVIRGD
KLNDLCFTNVYADSFVIRGDE
LNDLCFTNVYADSFVIRGDEV
NDLCFTNVYADSFVIRGDEVR
DLCFTNVYADSFVIRGDEVRQ
LCFTNVYADSFVIRGDEVRQI
CFTNVYADSFVIRGDEVRQIA
FTNVYADSFVIRGDEVRQIAP
TNVYADSFVIRGDEVRQIAPG
NVYADSFVIRGDEVRQIAPGQ
VYADSFVIRGDEVRQIAPGQT
YADSFVIRGDEVRQIAPGQTG
ADSFVIRGDEVRQIAPGQTGK
DSFVIRGDEVRQIAPGQTGKI
SFVIRGDEVRQIAPGQTGKIA
FVIRGDEVRQIAPGQTGKIAD
VIRGDEVRQIAPGQTGKIADY
IRGDEVRQIAPGQTGKIADYN
RGDEVRQIAPGQTGKIADYNY
GDEVRQIAPGQTGKIADYNYK
DEVRQIAPGQTGKIADYNYKL
EVRQIAPGQTGKIADYNYKLP
VRQIAPGQTGKIADYNYKLPD
RQIAPGQTGKIADYNYKLPDD
QIAPGQTGKIADYNYKLPDDF
IAPGQTGKIADYNYKLPDDFT
APGQTGKIADYNYKLPDDFTG
PGQTGKIADYNYKLPDDFTGC
GQTGKIADYNYKLPDDFTGCV
QTGKIADYNYKLPDDFTGCVI
TGKIADYNYKLPDDFTGCVIA
GKIADYNYKLPDDFTGCVIAW
KIADYNYKLPDDFTGCVIAWN
IADYNYKLPDDFTGCVIAWNS
ADYNYKLPDDFTGCVIAWNSN
DYNYKLPDDFTGCVIAWNSNN
YNYKLPDDFTGCVIAWNSNNL
NYKLPDDFTGCVIAWNSNNLD
YKLPDDFTGCVIAWNSNNLDS
KLPDDFTGCVIAWNSNNLDSK
LPDDFTGCVIAWNSNNLDSKV
PDDFTGCVIAWNSNNLDSKVG
DDFTGCVIAWNSNNLDSKVGG
DFTGCVIAWNSNNLDSKVGGN
FTGCVIAWNSNNLDSKVGGNY
TGCVIAWNSNNLDSKVGGNYN
GCVIAWNSNNLDSKVGGNYNY
CVIAWNSNNLDSKVGGNYNYL
VIAWNSNNLDSKVGGNYNYLY
IAWNSNNLDSKVGGNYNYLYR
AWNSNNLDSKVGGNYNYLYRL
WNSNNLDSKVGGNYNYLYRLF
NSNNLDSKVGGNYNYLYRLFR
SNNLDSKVGGNYNYLYRLFRK
NNLDSKVGGNYNYLYRLFRKS
NLDSKVGGNYNYLYRLFRKSN
LDSKVGGNYNYLYRLFRKSNL
DSKVGGNYNYLYRLFRKSNLK
SKVGGNYNYLYRLFRKSNLKP
KVGGNYNYLYRLFRKSNLKPF
VGGNYNYLYRLFRKSNLKPFE
GGNYNYLYRLFRKSNLKPFER
GNYNYLYRLFRKSNLKPFERD
NYNYLYRLFRKSNLKPFERDI
YNYLYRLFRKSNLKPFERDIS
NYLYRLFRKSNLKPFERDIST
YLYRLFRKSNLKPFERDISTE
LYRLFRKSNLKPFERDISTEI
YRLFRKSNLKPFERDISTEIY
RLFRKSNLKPFERDISTEIYQ
LFRKSNLKPFERDISTEIYQA
FRKSNLKPFERDISTEIYQAG
RKSNLKPFERDISTEIYQAGS
KSNLKPFERDISTEIYQAGST
SNLKPFERDISTEIYQAGSTP
NLKPFERDISTEIYQAGSTPC
LKPFERDISTEIYQAGSTPCN
KPFERDISTEIYQAGSTPCNG
PFERDISTEIYQAGSTPCNGV
FERDISTEIYQAGSTPCNGVE
ERDISTEIYQAGSTPCNGVEG
RDISTEIYQAGSTPCNGVEGF
DISTEIYQAGSTPCNGVEGFN
ISTEIYQAGSTPCNGVEGFNC
STEIYQAGSTPCNGVEGFNCY
TEIYQAGSTPCNGVEGFNCYF
EIYQAGSTPCNGVEGFNCYFP
IYQAGSTPCNGVEGFNCYFPL
YQAGSTPCNGVEGFNCYFPLQ
QAGSTPCNGVEGFNCYFPLQS
AGSTPCNGVEGFNCYFPLQSY
GSTPCNGVEGFNCYFPLQSYG
STPCNGVEGFNCYFPLQSYGF
TPCNGVEGFNCYFPLQSYGFQ
PCNGVEGFNCYFPLQSYGFQP
CNGVEGFNCYFPLQSYGFQPT
NGVEGFNCYFPLQSYGFQPTN
GVEGFNCYFPLQSYGFQPTNG
VEGFNCYFPLQSYGFQPTNGV
EGFNCYFPLQSYGFQPTNGVG
GFNCYFPLQSYGFQPTNGVGY
FNCYFPLQSYGFQPTNGVGYQ
NCYFPLQSYGFQPTNGVGYQP
CYFPLQSYGFQPTNGVGYQPY
YFPLQSYGFQPTNGVGYQPYR
FPLQSYGFQPTNGVGYQPYRV
PLQSYGFQPTNGVGYQPYRVV
LQSYGFQPTNGVGYQPYRVVV
QSYGFQPTNGVGYQPYRVVVL
SYGFQPTNGVGYQPYRVVVLS
YGFQPTNGVGYQPYRVVVLSF
GFQPTNGVGYQPYRVVVLSFE
FQPTNGVGYQPYRVVVLSFEL
QPTNGVGYQPYRVVVLSFELL
PTNGVGYQPYRVVVLSFELLH
TNGVGYQPYRVVVLSFELLHA
NGVGYQPYRVVVLSFELLHAP
GVGYQPYRVVVLSFELLHAPA
VGYQPYRVVVLSFELLHAPAT
GYQPYRVVVLSFELLHAPATV
YQPYRVVVLSFELLHAPATVC
QPYRVVVLSFELLHAPATVCG
PYRVVVLSFELLHAPATVCGP
YRVVVLSFELLHAPATVCGPK
RVVVLSFELLHAPATVCGPKK
VVVLSFELLHAPATVCGPKKS
VVLSFELLHAPATVCGPKKST
VLSFELLHAPATVCGPKKSTN
LSFELLHAPATVCGPKKSTNL
SFELLHAPATVCGPKKSTNLV
FELLHAPATVCGPKKSTNLVK
ELLHAPATVCGPKKSTNLVKN
LLHAPATVCGPKKSTNLVKNK
LHAPATVCGPKKSTNLVKNKC
HAPATVCGPKKSTNLVKNKCV
APATVCGPKKSTNLVKNKCVN
PATVCGPKKSTNLVKNKCVNF
ATVCGPKKSTNLVKNKCVNFN
TVCGPKKSTNLVKNKCVNFNF
VCGPKKSTNLVKNKCVNFNFN
CGPKKSTNLVKNKCVNFNFNG
GPKKSTNLVKNKCVNFNFNGL
PKKSTNLVKNKCVNFNFNGLT
KKSTNLVKNKCVNFNFNGLTG
KSTNLVKNKCVNFNFNGLTGT
STNLVKNKCVNFNFNGLTGTG
TNLVKNKCVNFNFNGLTGTGV
NLVKNKCVNFNFNGLTGTGVL
LVKNKCVNFNFNGLTGTGVLT
VKNKCVNFNFNGLTGTGVLTE
KNKCVNFNFNGLTGTGVLTES
NKCVNFNFNGLTGTGVLTESN
KCVNFNFNGLTGTGVLTESNK
CVNFNFNGLTGTGVLTESNKK
VNFNFNGLTGTGVLTESNKKF
NFNFNGLTGTGVLTESNKKFL
FNFNGLTGTGVLTESNKKFLP
NFNGLTGTGVLTESNKKFLPF
FNGLTGTGVLTESNKKFLPFQ
NGLTGTGVLTESNKKFLPFQQ
GLTGTGVLTESNKKFLPFQQF
LTGTGVLTESNKKFLPFQQFG
TGTGVLTESNKKFLPFQQFGR
GTGVLTESNKKFLPFQQFGRD
TGVLTESNKKFLPFQQFGRDI
GVLTESNKKFLPFQQFGRDIA
VLTESNKKFLPFQQFGRDIAD