libokj commited on
Commit
6d003f4
·
verified ·
1 Parent(s): 0a1d236

Upload 17 files

Browse files
data/drug_libraries/Enamine_Discovery_Diversity_Set_10_10240cmpds_20240130.csv ADDED
The diff for this file is too large to render. See raw diff
 
data/drug_libraries/Enamine_Discovery_Diversity_Set_10_10240cmpds_20240130_origal.csv ADDED
The diff for this file is too large to render. See raw diff
 
data/drug_libraries/Enamine_Discovery_Diversity_Set_50_50240cmpds_20231031.csv ADDED
The diff for this file is too large to render. See raw diff
 
data/drug_libraries/Enamine_Phenotypic_Screening_Library_plated_5760cmds_2020_07_20.csv ADDED
The diff for this file is too large to render. See raw diff
 
data/drug_libraries/drugbank_compounds.csv CHANGED
The diff for this file is too large to render. See raw diff
 
data/examples/MAPK14.fasta CHANGED
@@ -4,5 +4,4 @@ SIIHAKRTYRELRLLKHMKHENVIGLLDVFTPARSLEEFNDVYLVTHLMGADLNNIVKCQ
4
  KLTDDHVQFLIYQILRGLKYIHSADIIHRDLKPSNLAVNEDCELKILDFGLARHTDDEMT
5
  GYVATRWYRAPEIMLNWMHYNQTVDIWSVGCIMAELLTGRTLFPGTDHIDQLKLILRLVG
6
  TPGAELLKKISSESARNYIQSLTQMPKMNFANVFIGANPLAVDLLEKMLVLDSDKRITAA
7
- QALAHAYFAQYHDPDDEPVADPYDQSFESRDLLIDEWKSLTYDEVISFVPPPLDQEEMES
8
-
 
4
  KLTDDHVQFLIYQILRGLKYIHSADIIHRDLKPSNLAVNEDCELKILDFGLARHTDDEMT
5
  GYVATRWYRAPEIMLNWMHYNQTVDIWSVGCIMAELLTGRTLFPGTDHIDQLKLILRLVG
6
  TPGAELLKKISSESARNYIQSLTQMPKMNFANVFIGANPLAVDLLEKMLVLDSDKRITAA
7
+ QALAHAYFAQYHDPDDEPVADPYDQSFESRDLLIDEWKSLTYDEVISFVPPPLDQEEMES
 
data/examples/compound_library.sdf CHANGED
@@ -1,284 +1,509 @@
1
 
2
  RDKit 2D
3
 
4
- 22 23 0 0 0 0 0 0 0 0999 V2000
5
- 7.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
6
- 6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
7
- 5.2500 -1.2990 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
8
- 3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
9
- 3.0000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
10
- 3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
11
  1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
12
  0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
13
  -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
14
- -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
 
 
 
 
15
  -3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
16
  -3.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
17
- -5.2500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
18
- -6.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
19
- -7.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
20
- -8.2500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
21
- -9.7500 1.2990 0.0000 F 0 0 0 0 0 0 0 0 0 0 0 0
22
- -7.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
23
- -6.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
 
 
24
  -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
25
  0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
26
- 1.5000 2.5981 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
27
  1 2 1 0
28
- 2 3 1 0
29
  3 4 1 0
30
- 4 5 2 0
31
- 4 6 1 0
32
  6 7 1 0
33
  7 8 2 0
34
- 8 9 1 0
35
- 9 10 2 0
36
- 10 11 1 0
37
- 11 12 1 0
38
- 12 13 1 0
39
- 13 14 2 0
40
  14 15 1 0
41
- 15 16 2 0
42
- 16 17 1 0
43
  16 18 1 0
44
- 18 19 2 0
45
- 10 20 1 0
46
- 20 21 2 0
47
- 21 22 1 0
48
- 21 7 1 0
49
- 19 13 1 0
 
 
 
 
 
 
 
 
 
 
50
  M END
51
- > <ID> (1)
52
- CHEMBL41355
53
-
54
  $$$$
55
 
56
  RDKit 2D
57
 
58
- 23 23 0 0 0 0 0 0 0 0999 V2000
59
- 7.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
60
- 6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
61
- 5.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
62
- 3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
63
- 3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
64
- 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
 
 
 
 
 
 
 
 
65
  0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
66
- -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
67
- -1.5000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
68
- -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
69
- -3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
70
- -3.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
71
- -5.2500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
72
- -6.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
73
- -6.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
74
- -5.2500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
75
- -6.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
76
- -5.2500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
77
- -6.0000 7.7942 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
78
- -3.7500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
79
- -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
80
- -1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
81
  0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
82
- 1 2 1 0
 
 
 
 
 
 
 
 
83
  2 3 1 0
84
- 3 4 1 0
85
  4 5 1 0
86
- 5 6 1 0
87
- 6 7 2 0
88
- 7 8 1 0
89
  8 9 1 0
90
- 8 10 2 0
91
  10 11 1 0
92
  11 12 1 0
93
  12 13 2 0
94
  13 14 1 0
95
- 13 15 1 0
96
  15 16 1 0
97
- 16 17 1 0
98
- 17 18 2 0
99
- 18 19 1 0
100
- 18 20 1 0
101
- 10 21 1 0
102
  21 22 1 0
103
- 21 23 2 0
104
- 23 6 1 0
 
 
 
 
 
 
 
 
 
 
105
  M END
106
- > <ID> (2)
107
- CHEMBL497318
108
-
109
  $$$$
110
 
111
  RDKit 2D
112
 
113
- 26 29 0 0 0 0 0 0 0 0999 V2000
114
- -3.7527 6.6955 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
115
- -2.6380 5.6918 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
116
- -1.2114 6.1554 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
117
- -0.0967 5.1517 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
118
- -0.4086 3.6844 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
119
- 0.7062 2.6807 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
120
- 2.1328 3.1443 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
121
- 3.2475 2.1406 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
122
- 4.6741 2.6041 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
123
- 5.7888 1.6004 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
124
- 7.2154 2.0639 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
125
- 8.3301 1.0602 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
126
- 9.7567 1.5238 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
127
- 10.8714 0.5201 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
128
- 12.2980 0.9836 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
129
- 12.6098 2.4508 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
130
- 11.4951 3.4545 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
131
- 10.0685 2.9910 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
132
- 0.3943 1.2135 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
133
- 1.2760 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
134
- 0.3943 -1.2135 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
135
- -1.0323 -0.7500 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
136
- -1.0323 0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
137
- -2.1470 1.7537 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
138
- -1.8351 3.2209 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
139
- -2.9499 4.2246 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
140
  1 2 2 0
141
  2 3 1 0
142
- 3 4 2 0
143
- 4 5 1 0
144
- 5 6 2 0
145
- 6 7 1 0
146
  7 8 1 0
147
- 8 9 1 0
148
  9 10 1 0
149
  10 11 1 0
150
- 11 12 1 0
151
  12 13 1 0
152
  13 14 2 0
153
  14 15 1 0
154
  15 16 2 0
155
  16 17 1 0
156
  17 18 2 0
157
- 6 19 1 0
158
- 19 20 1 0
159
- 20 21 2 0
160
- 21 22 1 0
161
- 22 23 1 0
162
- 23 24 1 0
163
- 24 25 2 0
164
- 25 26 1 0
165
- 26 2 1 0
166
- 25 5 1 0
167
- 18 13 1 0
168
- 23 19 2 0
169
  M END
170
- > <ID> (3)
171
- CHEMBL444449
172
-
173
  $$$$
174
 
175
  RDKit 2D
176
 
177
- 24 26 0 0 0 0 0 0 0 0999 V2000
178
- 1.5000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
179
- 0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
180
- 1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
181
- 3.0000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
182
- 0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
183
  1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
184
- 0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
 
 
 
 
 
 
185
  -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
186
  -1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
187
- -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
188
- -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
189
- -0.7500 -3.8971 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
190
- -1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
191
- -3.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
192
- -3.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
193
- -5.2500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
194
- -6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
195
- -5.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
196
- -6.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
197
- -7.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
198
- -8.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
199
- -7.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
200
- -3.0000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
201
- -1.5000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
202
  1 2 1 0
203
  2 3 1 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
204
  3 4 1 0
205
- 3 5 1 0
206
- 5 6 2 0
207
  6 7 1 0
208
- 7 8 2 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
209
  8 9 1 0
210
- 8 10 1 0
211
- 10 11 2 0
212
- 2 12 1 0
213
  12 13 1 0
214
- 13 14 1 0
215
- 14 15 1 0
216
- 15 16 1 0
217
  16 17 1 0
218
  17 18 2 0
219
  18 19 1 0
220
- 19 20 2 0
221
- 20 21 1 0
222
- 21 22 2 0
223
- 15 23 1 0
224
- 23 24 1 0
225
- 11 5 1 0
226
- 24 12 1 0
227
- 22 17 1 0
228
  M END
229
- > <ID> (4)
230
- CHEMBL305187
 
231
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
232
  $$$$
233
 
234
  RDKit 2D
235
 
236
- 21 22 0 0 0 0 0 0 0 0999 V2000
237
- 6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
238
- 5.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
239
  3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
240
  3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
241
- 1.5000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
 
242
  0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
243
  -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
244
  -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
245
  -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
246
  0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
247
- 1.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
248
- 0.7500 3.8971 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
249
- 3.0000 2.5981 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
250
- 3.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
251
- 5.2500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
252
- 6.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
253
- 6.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
254
- 5.2500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
255
- 3.7500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
256
- 3.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
257
- 1.5000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
258
- 1 2 1 0
259
- 2 3 1 0
260
  3 4 1 0
261
  4 5 1 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
262
  5 6 1 0
263
  6 7 1 0
264
  7 8 1 0
265
  8 9 1 0
266
  9 10 1 0
267
  10 11 1 0
268
- 11 12 2 0
269
- 11 13 1 0
270
- 13 14 1 0
271
- 14 15 2 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
272
  15 16 1 0
273
- 15 17 1 0
274
- 17 18 2 0
275
- 18 19 1 0
276
- 19 20 2 0
277
  20 21 1 0
278
- 10 5 1 0
279
- 20 14 1 0
 
 
 
 
280
  M END
281
- > <ID> (5)
282
- CHEMBL1098
283
-
284
  $$$$
 
1
 
2
  RDKit 2D
3
 
4
+ 31 33 0 0 0 0 0 0 0 0999 V2000
5
+ 3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
 
6
  1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
7
  0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
8
  -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
9
+ -1.5000 -2.5981 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
10
+ -3.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
11
+ -3.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
12
+ -3.0000 -5.1962 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
13
+ -5.2500 -3.8971 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
14
+ -6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
15
+ -7.5000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
16
+ -5.2500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
17
+ -3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
18
  -3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
19
  -3.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
20
+ -3.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
21
+ -1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
22
+ -3.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
23
+ -5.2500 3.8971 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
24
+ -3.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
25
+ -1.5000 5.1962 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
26
+ -3.7500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
27
+ -3.0000 7.7942 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
28
+ -3.7500 9.0933 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
29
+ -2.4510 9.8433 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
30
+ -5.0490 8.3433 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
31
+ -4.5000 10.3923 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
32
+ -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
33
  -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
34
  0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
35
+ 1.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
36
  1 2 1 0
37
+ 2 3 2 0
38
  3 4 1 0
39
+ 4 5 1 0
40
+ 5 6 2 0
41
  6 7 1 0
42
  7 8 2 0
43
+ 7 9 1 0
44
+ 9 10 1 0
45
+ 10 11 2 0
46
+ 10 12 1 0
47
+ 12 13 2 0
48
+ 13 14 1 0
49
  14 15 1 0
50
+ 15 16 1 0
51
+ 16 17 1 1
52
  16 18 1 0
53
+ 18 19 1 6
54
+ 18 20 1 0
55
+ 20 21 1 1
56
+ 20 22 1 0
57
+ 22 23 1 0
58
+ 23 24 1 0
59
+ 24 25 2 0
60
+ 24 26 1 0
61
+ 24 27 1 0
62
+ 14 28 1 0
63
+ 28 29 1 0
64
+ 29 30 2 0
65
+ 30 31 1 0
66
+ 30 2 1 0
67
+ 28 4 2 0
68
+ 13 6 1 0
69
  M END
 
 
 
70
  $$$$
71
 
72
  RDKit 2D
73
 
74
+ 29 33 0 0 0 0 0 0 0 0999 V2000
75
+ 3.8670 -13.5458 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
76
+ 4.9817 -12.5421 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
77
+ 6.4083 -13.0057 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
78
+ 4.6699 -11.0749 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
79
+ 3.2433 -10.6114 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
80
+ 2.1286 -11.6151 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
81
+ 0.7020 -11.1516 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
82
+ 0.3901 -9.6843 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
83
+ -1.0365 -9.2208 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
84
+ -2.2500 -10.1025 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
85
+ -3.4635 -9.2208 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
86
+ -3.0000 -7.7942 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
87
+ -3.7500 -6.4952 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
88
+ -3.0000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
89
+ -1.5000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
90
+ -0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
91
+ 0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
92
+ 1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
93
  0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
94
+ 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
95
  0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
96
+ -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
97
+ -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
98
+ -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
99
+ -1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
100
+ -0.7500 -6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
101
+ -1.5000 -7.7942 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
102
+ 1.5048 -8.6806 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
103
+ 2.9314 -9.1442 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
104
+ 1 2 2 0
105
  2 3 1 0
106
+ 2 4 1 0
107
  4 5 1 0
108
+ 5 6 2 0
109
+ 6 7 1 0
110
+ 7 8 2 0
111
  8 9 1 0
112
+ 9 10 2 0
113
  10 11 1 0
114
  11 12 1 0
115
  12 13 2 0
116
  13 14 1 0
117
+ 14 15 2 0
118
  15 16 1 0
119
+ 16 17 2 0
120
+ 17 18 1 0
121
+ 18 19 2 0
122
+ 19 20 1 0
123
+ 20 21 2 0
124
  21 22 1 0
125
+ 22 23 2 0
126
+ 23 24 1 0
127
+ 24 25 2 0
128
+ 15 26 1 0
129
+ 26 27 2 0
130
+ 8 28 1 0
131
+ 28 29 2 0
132
+ 29 5 1 0
133
+ 27 9 1 0
134
+ 27 12 1 0
135
+ 25 16 1 0
136
+ 24 19 1 0
137
  M END
 
 
 
138
  $$$$
139
 
140
  RDKit 2D
141
 
142
+ 24 27 0 0 0 0 0 0 0 0999 V2000
143
+ -7.2317 -6.0469 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
144
+ -6.9199 -4.5797 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
145
+ -8.0346 -3.5760 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
146
+ -5.4933 -4.1162 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
147
+ -5.1814 -2.6490 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
148
+ -3.7548 -2.1855 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
149
+ -2.6401 -3.1891 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
150
+ -1.2135 -2.7256 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
151
+ -0.0000 -3.6073 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
152
+ 1.2135 -2.7256 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
153
+ 0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
154
+ 1.5000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
155
+ 0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
156
+ -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
157
+ -1.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
158
+ -0.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
159
+ -1.5000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
160
+ -3.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
161
+ -3.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
162
+ -3.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
163
+ -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
164
+ -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
165
+ -2.9520 -4.6564 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
166
+ -4.3786 -5.1199 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
 
 
167
  1 2 2 0
168
  2 3 1 0
169
+ 2 4 1 0
170
+ 4 5 2 0
171
+ 5 6 1 0
172
+ 6 7 2 0
173
  7 8 1 0
174
+ 8 9 2 0
175
  9 10 1 0
176
  10 11 1 0
177
+ 11 12 2 0
178
  12 13 1 0
179
  13 14 2 0
180
  14 15 1 0
181
  15 16 2 0
182
  16 17 1 0
183
  17 18 2 0
184
+ 18 19 1 0
185
+ 19 20 2 0
186
+ 14 21 1 0
187
+ 21 22 2 0
188
+ 7 23 1 0
189
+ 23 24 2 0
190
+ 24 4 1 0
191
+ 22 8 1 0
192
+ 22 11 1 0
193
+ 20 15 1 0
 
 
194
  M END
 
 
 
195
  $$$$
196
 
197
  RDKit 2D
198
 
199
+ 16 17 0 0 0 0 0 0 0 0999 V2000
200
+ 3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
201
  1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
202
+ 0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
203
+ -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
204
+ -1.5000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
205
+ -3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
206
+ -3.8817 -1.2135 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
207
+ -5.3083 -0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
208
+ -6.5218 -1.6317 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
209
+ -5.3083 0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
210
+ -6.5218 1.6317 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
211
+ -6.3650 3.1235 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
212
+ -3.8817 1.2135 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
213
  -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
214
  -1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
215
+ 0.7500 1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
216
  1 2 1 0
217
  2 3 1 0
218
+ 3 4 2 0
219
+ 4 5 1 0
220
+ 6 5 1 1
221
+ 6 7 1 0
222
+ 7 8 1 0
223
+ 8 9 1 6
224
+ 8 10 1 0
225
+ 10 11 1 1
226
+ 11 12 1 0
227
+ 10 13 1 0
228
+ 5 14 1 0
229
+ 14 15 2 0
230
+ 14 16 1 0
231
+ 16 2 2 0
232
+ 13 6 1 0
233
+ M END
234
+ $$$$
235
+
236
+ RDKit 2D
237
+
238
+ 29 30 0 0 0 0 0 0 0 0999 V2000
239
+ 3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
240
+ 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
241
+ 0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
242
+ -0.7500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
243
+ -1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
244
+ -0.8899 -3.9684 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
245
+ -2.0046 -4.9721 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
246
+ -1.8478 -6.4639 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
247
+ -3.3037 -4.2221 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
248
+ -4.6740 -4.8322 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
249
+ -5.8875 -3.9505 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
250
+ -7.2578 -4.5606 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
251
+ -6.6477 -5.9309 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
252
+ -7.8679 -3.1903 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
253
+ -8.6281 -5.1707 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
254
+ -8.7849 -6.6625 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
255
+ -10.2767 -6.5057 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
256
+ -7.2931 -6.8193 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
257
+ -8.9417 -8.1543 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
258
+ -7.7282 -9.0360 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
259
+ -8.6099 -10.2495 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
260
+ -6.8465 -7.8224 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
261
+ -6.5147 -9.9176 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
262
+ -2.9918 -2.7549 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
263
+ -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
264
+ -3.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
265
+ -0.7500 1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
266
+ 0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
267
+ 1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
268
+ 1 2 1 0
269
+ 2 3 2 0
270
  3 4 1 0
271
+ 5 4 1 1
272
+ 5 6 1 0
273
  6 7 1 0
274
+ 7 8 1 6
275
+ 7 9 1 0
276
+ 9 10 1 1
277
+ 10 11 1 0
278
+ 11 12 1 0
279
+ 12 13 2 0
280
+ 12 14 1 0
281
+ 12 15 1 0
282
+ 15 16 1 0
283
+ 16 17 2 0
284
+ 16 18 1 0
285
+ 16 19 1 0
286
+ 19 20 1 0
287
+ 20 21 2 0
288
+ 20 22 1 0
289
+ 20 23 1 0
290
+ 9 24 1 0
291
+ 4 25 1 0
292
+ 25 26 2 0
293
+ 25 27 1 0
294
+ 27 28 1 0
295
+ 28 29 2 0
296
+ 28 2 1 0
297
+ 24 5 1 0
298
+ M END
299
+ $$$$
300
+
301
+ RDKit 2D
302
+
303
+ 19 20 0 0 0 0 0 0 0 0999 V2000
304
+ 3.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
305
+ 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
306
+ 0.7500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
307
+ -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
308
+ -1.5000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
309
+ -1.5000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
310
+ -3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
311
+ -3.8817 -1.2135 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
312
+ -5.3083 -0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
313
+ -6.5218 -1.6317 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
314
+ -5.3083 0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
315
+ -6.5218 1.6317 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
316
+ -6.3650 3.1235 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
317
+ -3.8817 1.2135 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
318
+ -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
319
+ 0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
320
+ 1.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
321
+ 3.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
322
+ 3.7500 3.8971 0.0000 Br 0 0 0 0 0 0 0 0 0 0 0 0
323
+ 1 2 2 0
324
+ 2 3 1 0
325
+ 3 4 1 0
326
+ 4 5 2 0
327
+ 4 6 1 0
328
+ 7 6 1 1
329
+ 7 8 1 0
330
  8 9 1 0
331
+ 9 10 1 6
332
+ 9 11 1 0
333
+ 11 12 1 1
334
  12 13 1 0
335
+ 11 14 1 0
336
+ 6 15 1 0
337
+ 15 16 2 0
338
  16 17 1 0
339
  17 18 2 0
340
  18 19 1 0
341
+ 16 2 1 0
342
+ 14 7 1 0
 
 
 
 
 
 
343
  M END
344
+ $$$$
345
+
346
+ RDKit 2D
347
 
348
+ 17 18 0 0 0 0 0 0 0 0999 V2000
349
+ 3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
350
+ 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
351
+ 0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
352
+ -0.7500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
353
+ -1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
354
+ -0.8899 -3.9684 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
355
+ -2.0046 -4.9721 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
356
+ -1.8478 -6.4639 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
357
+ -3.3037 -4.2221 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
358
+ -4.6740 -4.8322 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
359
+ -5.8875 -3.9505 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
360
+ -2.9918 -2.7549 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
361
+ -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
362
+ -3.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
363
+ -0.7500 1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
364
+ 0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
365
+ 1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
366
+ 1 2 1 0
367
+ 2 3 2 0
368
+ 3 4 1 0
369
+ 5 4 1 1
370
+ 5 6 1 0
371
+ 6 7 1 0
372
+ 7 8 1 6
373
+ 7 9 1 0
374
+ 9 10 1 1
375
+ 10 11 1 0
376
+ 9 12 1 0
377
+ 4 13 1 0
378
+ 13 14 2 0
379
+ 13 15 1 0
380
+ 15 16 1 0
381
+ 16 17 2 0
382
+ 16 2 1 0
383
+ 12 5 1 0
384
+ M END
385
  $$$$
386
 
387
  RDKit 2D
388
 
389
+ 15 15 0 0 0 0 0 0 0 0999 V2000
390
+ 6.7500 -3.8971 0.0000 N 0 0 0 0 0 2 0 0 0 0 0 0
391
+ 6.0000 -2.5981 0.0000 N 0 0 0 0 0 4 0 0 0 0 0 0
392
+ 5.2500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
393
  3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
394
  3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
395
+ 3.7500 1.2990 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
396
+ 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
397
  0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
398
  -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
399
  -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
400
+ -3.0000 0.0000 0.0000 N 0 0 0 0 0 4 0 0 0 0 0 0
401
+ -3.7500 -1.2990 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
402
+ -3.7500 1.2990 0.0000 O 0 0 0 0 0 1 0 0 0 0 0 0
403
  -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
404
  0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
405
+ 1 2 2 0
406
+ 2 3 2 0
 
 
 
 
 
 
 
 
 
 
 
407
  3 4 1 0
408
  4 5 1 0
409
+ 5 6 1 1
410
+ 5 7 1 0
411
+ 7 8 2 0
412
+ 8 9 1 0
413
+ 9 10 2 0
414
+ 10 11 1 0
415
+ 11 12 2 0
416
+ 11 13 1 0
417
+ 10 14 1 0
418
+ 14 15 2 0
419
+ 15 7 1 0
420
+ M CHG 4 1 -1 2 1 11 1 13 -1
421
+ M END
422
+ $$$$
423
+
424
+ RDKit 2D
425
+
426
+ 13 13 0 0 0 0 0 0 0 0999 V2000
427
+ 7.2990 -1.8481 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
428
+ 6.0000 -2.5981 0.0000 S 0 0 0 0 0 0 0 0 0 0 0 0
429
+ 4.7010 -3.3481 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
430
+ 6.7500 -3.8971 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
431
+ 5.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
432
+ 3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
433
+ 3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
434
+ 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
435
+ 0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
436
+ -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
437
+ -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
438
+ -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
439
+ 0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
440
+ 1 2 2 0
441
+ 2 3 2 0
442
+ 2 4 1 0
443
+ 2 5 1 0
444
  5 6 1 0
445
  6 7 1 0
446
  7 8 1 0
447
  8 9 1 0
448
  9 10 1 0
449
  10 11 1 0
450
+ 11 12 1 0
451
+ 12 13 1 0
452
+ 13 8 1 0
453
+ M END
454
+ $$$$
455
+
456
+ RDKit 2D
457
+
458
+ 23 26 0 0 0 0 0 0 0 0999 V2000
459
+ -5.2020 -8.5535 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
460
+ -4.8901 -7.0863 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
461
+ -6.0048 -6.0826 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
462
+ -3.4635 -6.6227 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
463
+ -2.2500 -7.5044 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
464
+ -1.0365 -6.6227 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
465
+ -1.5000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
466
+ -0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
467
+ 0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
468
+ 1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
469
+ 0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
470
+ 1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
471
+ 0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
472
+ 1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
473
+ -0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
474
+ -1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
475
+ -0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
476
+ -2.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
477
+ -1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
478
+ -3.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
479
+ -3.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
480
+ -3.0000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
481
+ -4.4918 -5.3529 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
482
+ 1 2 1 0
483
+ 2 3 2 0
484
+ 4 2 1 6
485
+ 4 5 1 0
486
+ 5 6 1 0
487
+ 7 6 1 6
488
+ 7 8 1 0
489
+ 8 9 1 1
490
+ 9 10 1 0
491
+ 10 11 2 0
492
+ 11 12 1 0
493
+ 12 13 1 0
494
+ 13 14 1 6
495
+ 13 15 1 0
496
  15 16 1 0
497
+ 16 17 1 0
498
+ 17 18 1 6
499
+ 17 19 1 0
500
+ 19 20 1 6
501
  20 21 1 0
502
+ 21 22 1 0
503
+ 22 23 1 6
504
+ 22 4 1 0
505
+ 22 7 1 0
506
+ 19 8 1 0
507
+ 17 11 1 0
508
  M END
 
 
 
509
  $$$$
data/examples/interaction_pair_inference.csv CHANGED
@@ -1,6 +1,7 @@
1
  ID1,X1,ID2,X2
2
  CHEMBL41355,CCOC(=O)Nc1ccc(NCc2ccc(F)cc2)cc1N,O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
3
  CHEMBL497318,CCCCCc1cc(O)c(C/C=C(\C)CCC=C(C)C)c(O)c1,Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
 
4
  CHEMBL444449,O=c1ccc2c(OCCCCOc3ccccc3)c3ccoc3cc2o1,P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
5
  CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
6
  CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
 
1
  ID1,X1,ID2,X2
2
  CHEMBL41355,CCOC(=O)Nc1ccc(NCc2ccc(F)cc2)cc1N,O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
3
  CHEMBL497318,CCCCCc1cc(O)c(C/C=C(\C)CCC=C(C)C)c(O)c1,Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
4
+ CHEMBL497318,CCCCCc1cc(O)c(C/C=C(\C)CCC=C(C)C)c(O)c1,Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
5
  CHEMBL444449,O=c1ccc2c(OCCCCOc3ccccc3)c3ccoc3cc2o1,P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
6
  CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
7
  CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
data/examples/target_library.csv CHANGED
@@ -1,6 +1,7 @@
1
  ID2,X2
2
  O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
3
  Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
 
4
  P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
5
  O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
6
  Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
 
1
  ID2,X2
2
  O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
3
  Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
4
+ Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
5
  P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
6
  O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
7
  Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
data/examples/target_library.fasta CHANGED
@@ -1,102 +1,41 @@
1
- >O88943
2
- MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTG
3
- GAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEK
4
- SSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASI
5
- AVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGF
6
- LCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLI
7
- GVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTW
8
- QYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVS
9
- LKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRI
10
- KGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKE
11
- SLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDP
12
- SMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSR
13
- DHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLV
14
- RIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELER
15
- SFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEG
16
- PFGDVAWAGPRK
17
- >Q9Y5S1
18
- MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNY
19
- RKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCL
20
- MKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVK
21
- LLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQA
22
- TDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKL
23
- AAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAF
24
- HCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAA
25
- PHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALL
26
- TVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLL
27
- IYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLEL
28
- FKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIW
29
- KLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPT
30
- LCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
31
- >P17658
32
- MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLS
33
- LFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEE
34
- IRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVS
35
- VLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITP
36
- GEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIID
37
- LVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSK
38
- GLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTM
39
- TTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHV
40
- TCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
41
- >O15399
42
- MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGP
43
- AYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDD
44
- SRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLE
45
- EYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVS
46
- AQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPL
47
- PAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESL
48
- HRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYG
49
- RFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPE
50
- KRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSL
51
- TINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVT
52
- VFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVL
53
- VWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEK
54
- NIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGS
55
- GKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKL
56
- DIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAE
57
- AAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADG
58
- FHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPP
59
- AGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAG
60
- GTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYP
61
- YAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHD
62
- GLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGW
63
- DLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDL
64
- GTRRGSAHFSSLESEV
65
- >Q14957
66
- MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPL
67
- EIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPIL
68
- SISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLE
69
- GVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEA
70
- AQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGA
71
- HSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVV
72
- IALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPD
73
- PGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTN
74
- GKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNG
75
- TVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIG
76
- KSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTV
77
- SGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKM
78
- GKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQF
79
- LGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVY
80
- WKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAA
81
- RDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGW
82
- GPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASER
83
- PLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHA
84
- SLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGA
85
- PAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRD
86
- SGGLDEISRVARGTQGFPGPCTWRRISSLESEV
87
- >O54912
88
- MKRQNVRTLALIVCTFTYLLVGAAVFDALESEPEMIERQRLELRQLELRARYNLSEGGYE
89
- ELERVVLRLKPHKAGVQWRFAGSFYFAITVITTIGYGHAAPSTDGGKVFCMFYALLGIPL
90
- TLVMFQSLGERINTFVRYLLHRAKRGLGMRHAEVSMANMVLIGFVSCISTLCIGAAAFSY
91
- YERWTFFQAYYYCFITLTTIGFGDYVALQKDQALQTQPQYVAFSFVYILTGLTVIGAFLN
92
- LVVLRFMTMNAEDEKRDAEHRALLTHNGQAGGLGGLSCLSGSLGDGVRPRDPVTCAAAAG
93
- GMGVGVGVGGSGFRNVYAEMLHFQSMCSCLWYKSREKLQYSIPMIIPRDLSTSDTCVEHS
94
- HSSPGGGGRYSDTPSHPCLCSGTQRSAISSVSTGLHSLATFRGLMKRRSSV
95
- >Q9ES08
96
- MKRQNVRTLSLIACTFTYLLVGAAVFDALESDHEMREEEKLKAEEVRLRGKYNISSDDYQ
97
- QLELVILQSEPHRAGVQWKFAGSFYFAITVITTIGYGHAAPGTDAGKAFCMFYAVLGIPL
98
- TLVMFQSLGERMNTFVRYLLKRIKKCCGMRNTEVSMENMVTVGFFSCMGTLCLGAAAFSQ
99
- CEDWSFFHAYYYCFITLTTIGFGDFVALQSKGALQRKPFYVAFSFMYILVGLTVIGAFLN
100
- LVVLRFLTMNTDEDLLEGEVAQILAGNPRRVVVRVPQSRKRHHPMYFLRKYGRTLCYLCF
101
- PGANWGDDDDDDDDAVENVVVTTPVPPAVAAAAAAATPGPSTRNVRATVHSVSCRVEEIP
102
- PDVLRNTYFRSPFGAIPPGMHTCGENHRLHIRRKSI
 
1
+ >Seq1
2
+ LYLIFGAWAGMVGTALSLLIRAELGQPGTLLGDDQIYNVIVTAHAFVMIFFMVMPIMIGGFGNWLVPLMI
3
+ GAPDMAFPRMNNMSFWLLPPSFLLLLASSTVEAGAGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGVSS
4
+ ILGAINFITTAINMKPPTLSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGD
5
+ PVLYQHLFWFFGHPEVYILIL
6
+
7
+ >Seq2
8
+ VGTALXLLIRAELXQPGALLGDDQIYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMIGAPDMAFPRMN
9
+ NMSFWLLPPSFLLLMASSTVEAGAGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISSILGAINFITTA
10
+ INMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHLFWFF
11
+ GHPEVYILIL
12
+
13
+ >Seq3
14
+ LYLIFGAWAGMVGTALSLLIRAELGQPGALLGDDQVYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMI
15
+ GAPDMAFPRMNNMSFWLLPPSFLLLLASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISS
16
+ ILGAINFITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGD
17
+ PVLYQHLFWFFGHPEVYILIL
18
+
19
+ >Seq4
20
+ WAGMVGTALSLLIRAELGQPGALLGDDQIYNVVXTAHAFVMIFFMVMPIMIGGFGNWLVPLMIGAPDMAF
21
+ PRMNNMSFWLLPPSFLLLMASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISSILGAINF
22
+ ITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHL
23
+ FWFFGHPEVYILIL
24
+
25
+ >Seq5
26
+ LYLIFGAWAGMVGTALSLLIRAELGQPGALLGDDQVYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMI
27
+ GAPDMAFPRMNNMSFWLLPPSFLLLLASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISS
28
+ ILGAINFITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGD
29
+ PVLYQHLFWFFGHPEVYILIX
30
+
31
+ >Seq6
32
+ WAGMVGTALSLLIRAELGQPGALLGDDQIYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMIGAPDMAF
33
+ PRMNNMSFWLLPPSFLLLMASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISSILGAINF
34
+ ITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHL
35
+ FWFFGHPEVYILIL
36
+
37
+ >Seq7
38
+ VGTALSLLIRAELGQPGTLLGDDQIYNVIVTAHAFVMIFFMVMPVMIGGFGNWLVPLMIGAPDMAFPRMN
39
+ NMSFWLLPPSFLLLLASSTVEAGAGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGVSSILGAINFITTA
40
+ INMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHLFWFF
41
+ GHPEVYILIL
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
data/target_libraries/ChEMBL33_all_spe_single_prot_info.csv CHANGED
The diff for this file is too large to render. See raw diff
 
data/target_libraries/ChEMBL33_human_proteins.csv CHANGED
The diff for this file is too large to render. See raw diff
 
data/target_libraries/drugbank_targets.csv CHANGED
The diff for this file is too large to render. See raw diff
 
data/target_libraries/idmapping_not_in_chembl.csv ADDED
The diff for this file is too large to render. See raw diff