hugoly commited on
Commit
700ce0d
·
verified ·
1 Parent(s): 9203ad9

Upload folder using huggingface_hub

Browse files
Files changed (1) hide show
  1. data/example.json +240 -0
data/example.json ADDED
@@ -0,0 +1,240 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "name": "n_27",
4
+ "sequences": [
5
+ {
6
+ "proteinChain": {
7
+ "sequence": "ELQLVESGGGLVQPGGSLSLSCEVSGFSFDDVDNFIIAWFRQAPGKEREGVSFLRKYDMSTYYAESVKGRFTISSDNARDTVYLQMTNLKPEDTAVYYCALDREGFVFEQGMDFWGKGTQVTVSS",
8
+ "count": 1,
9
+ "msa": {
10
+ "precomputed_msa_dir": "/msa_database//40/409022d50b8e11c68dcd105ef71cb22b",
11
+ "non_pairing_msa_names": [
12
+ "mmdb_envdb_hits.a3m",
13
+ "mmdb_uniref30_hits.a3m"
14
+ ],
15
+ "pairing_db": "uniref100"
16
+ }
17
+ }
18
+ }
19
+ ]
20
+ },
21
+ {
22
+ "name": "a_19",
23
+ "sequences": [
24
+ {
25
+ "proteinChain": {
26
+ "sequence": "EVQLQQSGAELVKPGASVKLSCTASGFNIKDTYVHWVKQRPEQGLEWIGRIDPANGYTKYDPKFQGKATITADTSSNTAYLQLSSLTSEDTAVYYCVRPLYDYYAMDYWGQGTSVTVSS",
27
+ "count": 1,
28
+ "msa": {
29
+ "precomputed_msa_dir": "/msa_database//04/04f576349a6841c5148cb4f4bf2d61a0",
30
+ "non_pairing_msa_names": [
31
+ "mmdb_envdb_hits.a3m",
32
+ "mmdb_uniref30_hits.a3m"
33
+ ],
34
+ "pairing_db": "uniref100"
35
+ }
36
+ }
37
+ },
38
+ {
39
+ "proteinChain": {
40
+ "sequence": "DILMTQSPSSMSVSLGDTVSITCHASQGISSNIGWLQQKPGKSFMGLIYYGTNLVDGVPSRFSGSGSGADYSLTISSLDSEDFADYYCVQYAQLPYTFGGGTKLEIK",
41
+ "count": 1,
42
+ "msa": {
43
+ "precomputed_msa_dir": "/msa_database//98/98c4c262485cdd7e54c866d5364a40ca",
44
+ "non_pairing_msa_names": [
45
+ "mmdb_envdb_hits.a3m",
46
+ "mmdb_uniref30_hits.a3m"
47
+ ],
48
+ "pairing_db": "uniref100"
49
+ }
50
+ }
51
+ }
52
+ ]
53
+ },
54
+ {
55
+ "name": "rl_1",
56
+ "sequences": [
57
+ {
58
+ "rnaSequence": {
59
+ "sequence": "UUGGGUUCCCUCACCCCAAUCAUAAAAAGG",
60
+ "count": 1
61
+ }
62
+ },
63
+ {
64
+ "ligand": {
65
+ "ligand": "CCD_PRF",
66
+ "count": 1
67
+ }
68
+ }
69
+ ]
70
+ },
71
+ {
72
+ "name": "rna_1",
73
+ "sequences": [
74
+ {
75
+ "rnaSequence": {
76
+ "sequence": "GCCCGGAUAGCUCAGUCGGUAGAGCAGCGGCUAAAACAGCUCUGGGACCCCAGAGGCCCACGUGGCGGCUAGUACUCCGGUAUUGCGGUACCCUUGUACGCCUGUUUUAGCCGCGGGUCCAGGGUUCAAGUCCCUGUUCGGGCGCC",
77
+ "count": 1
78
+ }
79
+ }
80
+ ]
81
+ },
82
+ {
83
+ "name": "pp_5",
84
+ "sequences": [
85
+ {
86
+ "proteinChain": {
87
+ "sequence": "KDFLPLYFGWFLTKKSSETLRKAGQVFLEELGNHKAFKKELRHFIEKLELVSYFGKRPPGVLHCTTKFCDYGKAAGAEEYAQQEVVKRSYGKAFKLSISALFVTPKTAGAQVVLTDQELQLWPSSASEGLPPGSRAHVTLGCAADVQPVQTGLDLLDILQQVKGGSQGEAVGELPRGKLYSLGKGRWMLSLTKKMEVKAIFTGYYG",
88
+ "count": 1,
89
+ "msa": {
90
+ "precomputed_msa_dir": "/msa_database//44/44171e0f6f6b62d557e71259de7dd564",
91
+ "non_pairing_msa_names": [
92
+ "mmdb_envdb_hits.a3m",
93
+ "mmdb_uniref30_hits.a3m"
94
+ ],
95
+ "pairing_db": "uniref100"
96
+ }
97
+ }
98
+ },
99
+ {
100
+ "proteinChain": {
101
+ "sequence": "VQLEESGGGLVQPGGSLRLSCAASGFTFSSYVMSWVRQAPGKGLEWVSDINSGGSRTYYTDSVKGRFTISRDNAKNTLYLQMNSLKPEDTAVYYCARDSLLSTRYLHTSERGQGTQVTVSS",
102
+ "count": 1,
103
+ "msa": {
104
+ "precomputed_msa_dir": "/msa_database//95/95c0e2d90f643a4aa77b4887aca35a68",
105
+ "non_pairing_msa_names": [
106
+ "mmdb_envdb_hits.a3m",
107
+ "mmdb_uniref30_hits.a3m"
108
+ ],
109
+ "pairing_db": "uniref100"
110
+ }
111
+ }
112
+ }
113
+ ]
114
+ },
115
+ {
116
+ "name": "pl_2",
117
+ "sequences": [
118
+ {
119
+ "proteinChain": {
120
+ "sequence": "STGSATTTPIDSLDDAYITPVQIGTPAQTLNLDFDTGSSDLWVFSSETTASEVDGQTIYTPSKSTTAKLLSGATWSISYGDGSSSSGDVYTDTVSVGGLTVTGQAVESAKKVSSSFTEDSTIDGLLGLAFSTLNTVSPTQQKTFFDNAKASLDSPVFTADLGYHAPGTYNFGFIDTTAYTGSITYTAVSTKQGFWEWTSTGYAVGSGTFKSTSIDGIADTGTTLLYLPATVVSAYWAQVSGAKSSSSVGGYVFPCSATLPSFTFGVGSARIVIPGDYIDFGPISTGSSSCFGGIQSSAGIGINIFGDVALKAAFVVFNGATTPTLGFASK",
121
+ "count": 1,
122
+ "msa": {
123
+ "precomputed_msa_dir": "/msa_database//8e/8ef51c6dba3ea80243a8c7c216e9e815",
124
+ "non_pairing_msa_names": [
125
+ "mmdb_envdb_hits.a3m",
126
+ "mmdb_uniref30_hits.a3m"
127
+ ],
128
+ "pairing_db": "uniref100"
129
+ }
130
+ }
131
+ },
132
+ {
133
+ "ligand": {
134
+ "ligand": "CCD_ZRY",
135
+ "count": 1
136
+ }
137
+ }
138
+ ]
139
+ },
140
+ {
141
+ "name": "gpm_47",
142
+ "sequences": [
143
+ {
144
+ "proteinChain": {
145
+ "sequence": "KLRNVMYYGDWSIWGGQGNFYPKDIPADKLTHLNFAFMDFNSSGELIYCDKDAAIGHPLGNLGVTYGDVNGGILNAFQVLKSENPNLKIGVSLGGWSKSGDFSTIAATPSIRAKFVENVMKFIKYTNMDFVDIDWEYPGDYREPDKTDNINDEGTPNASAGDKENYILLLQDLKEALNKQGKELGKVYELSVALPAGVSKIEKGIDVDKLFNIVDFANIMTYDMAGAWSTTSGHQTALYTNPNAPEEYKGLSVDESVKYYISQGAEREKIVVGAAYYTRGWEQVSDKGTDPNNPGLFGEAAVVNKDADLSPTPGALNEAPMKNGEGGRAGGVWGYNALDKLKSKYTGLKEYWDDSAKAPYLYNSETGAFFTYDNIRSIQEKAKYVKENNLGGIIGWMASQDATTNSTKRDELTTATKESLFGKEDLPKYEIKYTENDITCTVTPVKQSWGSGGVLKMSITNNEKLDESGEVLSTVETSAKTVKNMKVYIKTDGIAITGSQYPAGPVTKEGDYYVIDFGKISDGKLMKAGITFTFDLNLDKAIEDTNNIISIEVSQRMYQTSPEFNRQTIWENT",
146
+ "count": 1,
147
+ "msa": {
148
+ "precomputed_msa_dir": "/msa_database//4a/4a6eb0005370ae9f869e53a44648cc4e",
149
+ "non_pairing_msa_names": [
150
+ "mmdb_envdb_hits.a3m",
151
+ "mmdb_uniref30_hits.a3m"
152
+ ],
153
+ "pairing_db": "uniref100"
154
+ }
155
+ }
156
+ }
157
+ ]
158
+ },
159
+ {
160
+ "name": "na_8",
161
+ "sequences": [
162
+ {
163
+ "proteinChain": {
164
+ "sequence": "QMQLVESGGGLVQAGGSLRLSCAVSGSIFSIITLAWYRQAPGKPRENVATITRGSRTSYADSVKGRFTISKDNAKSTVYLQMNKLKPEDTADYYCNAEGPAGYWGQGTPVTVS",
165
+ "count": 1,
166
+ "msa": {
167
+ "precomputed_msa_dir": "/msa_database//02/029e866cde0ee16963d85d0c7f94cf13",
168
+ "non_pairing_msa_names": [
169
+ "mmdb_envdb_hits.a3m",
170
+ "mmdb_uniref30_hits.a3m"
171
+ ],
172
+ "pairing_db": "uniref100"
173
+ }
174
+ }
175
+ },
176
+ {
177
+ "proteinChain": {
178
+ "sequence": "SGDVEFRNVTFTYPGRDVPALRNINLKIPAGKTVALVGRSGSGKSTIASLITRFYDIDEGEILMDGHDLREYTLASLRNQVALVSQNVHLFNDTVANNIAYARTEQYSREQIEEAARMAYAMDFINKMDNGLDTVIGENGVLLSGGQRQRIAIARALLRDSPILILDEATSALDTESERAIQAALDELQKNRTSLVIAHRLSTIEKADEIVVVEDGVIVERGTHNDLLEHRGVYAQLHKMQFGQA",
179
+ "count": 1,
180
+ "msa": {
181
+ "precomputed_msa_dir": "/msa_database//e0/e0fb27b225aa50cb2ce1d07db8d24ffd",
182
+ "non_pairing_msa_names": [
183
+ "mmdb_envdb_hits.a3m",
184
+ "mmdb_uniref30_hits.a3m"
185
+ ],
186
+ "pairing_db": "uniref100"
187
+ }
188
+ }
189
+ }
190
+ ]
191
+ },
192
+ {
193
+ "name": "aa_32",
194
+ "sequences": [
195
+ {
196
+ "proteinChain": {
197
+ "sequence": "EVQLVESGGGLVQPGGSLRLSCAASGFTFSTYSMNWVRQAPGKGLEWVSYISYRSRTIYYADSVKGRFTISRDNARNSLYLQMNSLRDEDTAVYYCARWGYGSGGFDYWGQGTLVTVSS",
198
+ "count": 1,
199
+ "msa": {
200
+ "precomputed_msa_dir": "/msa_database//3f/3f2f7e41c18f277c36a706d5c2cece8f",
201
+ "non_pairing_msa_names": [
202
+ "mmdb_envdb_hits.a3m",
203
+ "mmdb_uniref30_hits.a3m"
204
+ ],
205
+ "pairing_db": "uniref100"
206
+ }
207
+ }
208
+ },
209
+ {
210
+ "proteinChain": {
211
+ "sequence": "EIVLTQSPGTLSLSPGERATLSCRASQSVSSSYLAWYQQKPGQAPRLLIYGASSRATGIPDRFSGSGSGTDFTLTISRLEPEDFAVYYCQQYGSSFTFGPGTKVDIK",
212
+ "count": 1,
213
+ "msa": {
214
+ "precomputed_msa_dir": "/msa_database//fa/fae049eb9657f20032cd363cf8541608",
215
+ "non_pairing_msa_names": [
216
+ "mmdb_envdb_hits.a3m",
217
+ "mmdb_uniref30_hits.a3m"
218
+ ],
219
+ "pairing_db": "uniref100"
220
+ }
221
+ }
222
+ },
223
+ {
224
+ "proteinChain": {
225
+ "sequence": "GSTVPPMVNVTRSEASEGNITVTCRASSFYPRNIILTWRQDGVSLSHDTQQWGDVLPDGNGTYQTWVATRICRGEEQRFTCYMEHSGNHSTHPVPSGHHHHHH",
226
+ "count": 1,
227
+ "msa": {
228
+ "precomputed_msa_dir": "/msa_database//71/71a869512b985a27e9de997988d7ec98",
229
+ "non_pairing_msa_names": [
230
+ "mmdb_envdb_hits.a3m",
231
+ "mmdb_uniref30_hits.a3m"
232
+ ],
233
+ "pairing_db": "uniref100"
234
+ }
235
+ }
236
+ }
237
+ ]
238
+ }
239
+
240
+ ]