Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Upload 17 files
Browse files- data/drug_libraries/Enamine_Discovery_Diversity_Set_10_10240cmpds_20240130.csv +0 -0
- data/drug_libraries/Enamine_Discovery_Diversity_Set_10_10240cmpds_20240130_origal.csv +0 -0
- data/drug_libraries/Enamine_Discovery_Diversity_Set_50_50240cmpds_20231031.csv +0 -0
- data/drug_libraries/Enamine_Phenotypic_Screening_Library_plated_5760cmds_2020_07_20.csv +0 -0
- data/drug_libraries/drugbank_compounds.csv +0 -0
- data/examples/MAPK14.fasta +1 -2
- data/examples/compound_library.sdf +419 -194
- data/examples/interaction_pair_inference.csv +1 -0
- data/examples/target_library.csv +1 -0
- data/examples/target_library.fasta +41 -102
- data/target_libraries/ChEMBL33_all_spe_single_prot_info.csv +0 -0
- data/target_libraries/ChEMBL33_human_proteins.csv +0 -0
- data/target_libraries/drugbank_targets.csv +0 -0
- data/target_libraries/idmapping_not_in_chembl.csv +0 -0
data/drug_libraries/Enamine_Discovery_Diversity_Set_10_10240cmpds_20240130.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
data/drug_libraries/Enamine_Discovery_Diversity_Set_10_10240cmpds_20240130_origal.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
data/drug_libraries/Enamine_Discovery_Diversity_Set_50_50240cmpds_20231031.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
data/drug_libraries/Enamine_Phenotypic_Screening_Library_plated_5760cmds_2020_07_20.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
data/drug_libraries/drugbank_compounds.csv
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
data/examples/MAPK14.fasta
CHANGED
@@ -4,5 +4,4 @@ SIIHAKRTYRELRLLKHMKHENVIGLLDVFTPARSLEEFNDVYLVTHLMGADLNNIVKCQ
|
|
4 |
KLTDDHVQFLIYQILRGLKYIHSADIIHRDLKPSNLAVNEDCELKILDFGLARHTDDEMT
|
5 |
GYVATRWYRAPEIMLNWMHYNQTVDIWSVGCIMAELLTGRTLFPGTDHIDQLKLILRLVG
|
6 |
TPGAELLKKISSESARNYIQSLTQMPKMNFANVFIGANPLAVDLLEKMLVLDSDKRITAA
|
7 |
-
QALAHAYFAQYHDPDDEPVADPYDQSFESRDLLIDEWKSLTYDEVISFVPPPLDQEEMES
|
8 |
-
|
|
|
4 |
KLTDDHVQFLIYQILRGLKYIHSADIIHRDLKPSNLAVNEDCELKILDFGLARHTDDEMT
|
5 |
GYVATRWYRAPEIMLNWMHYNQTVDIWSVGCIMAELLTGRTLFPGTDHIDQLKLILRLVG
|
6 |
TPGAELLKKISSESARNYIQSLTQMPKMNFANVFIGANPLAVDLLEKMLVLDSDKRITAA
|
7 |
+
QALAHAYFAQYHDPDDEPVADPYDQSFESRDLLIDEWKSLTYDEVISFVPPPLDQEEMES
|
|
data/examples/compound_library.sdf
CHANGED
@@ -1,284 +1,509 @@
|
|
1 |
|
2 |
RDKit 2D
|
3 |
|
4 |
-
|
5 |
-
|
6 |
-
6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
7 |
-
5.2500 -1.2990 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
8 |
-
3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
9 |
-
3.0000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
10 |
-
3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
11 |
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
12 |
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
13 |
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
14 |
-
-1.5000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
15 |
-3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
16 |
-3.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
17 |
-
-
|
18 |
-
-
|
19 |
-
-
|
20 |
-
-
|
21 |
-
-
|
22 |
-
-
|
23 |
-
-
|
|
|
|
|
|
|
|
|
|
|
|
|
24 |
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
25 |
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
26 |
-
1.5000 2.5981 0.0000
|
27 |
1 2 1 0
|
28 |
-
2 3
|
29 |
3 4 1 0
|
30 |
-
4 5
|
31 |
-
|
32 |
6 7 1 0
|
33 |
7 8 2 0
|
34 |
-
|
35 |
-
9 10
|
36 |
-
10 11
|
37 |
-
|
38 |
-
12 13
|
39 |
-
13 14
|
40 |
14 15 1 0
|
41 |
-
15 16
|
42 |
-
16 17 1
|
43 |
16 18 1 0
|
44 |
-
18 19
|
45 |
-
|
46 |
-
20 21
|
47 |
-
|
48 |
-
|
49 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
50 |
M END
|
51 |
-
> <ID> (1)
|
52 |
-
CHEMBL41355
|
53 |
-
|
54 |
$$$$
|
55 |
|
56 |
RDKit 2D
|
57 |
|
58 |
-
|
59 |
-
|
60 |
-
|
61 |
-
|
62 |
-
|
63 |
-
3.
|
64 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
65 |
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
66 |
-
|
67 |
-
-1.5000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
68 |
-
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
69 |
-
-3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
70 |
-
-3.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
71 |
-
-5.2500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
72 |
-
-6.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
73 |
-
-6.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
74 |
-
-5.2500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
75 |
-
-6.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
76 |
-
-5.2500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
77 |
-
-6.0000 7.7942 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
78 |
-
-3.7500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
79 |
-
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
80 |
-
-1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
81 |
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
82 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
83 |
2 3 1 0
|
84 |
-
|
85 |
4 5 1 0
|
86 |
-
5 6
|
87 |
-
6 7
|
88 |
-
7 8
|
89 |
8 9 1 0
|
90 |
-
|
91 |
10 11 1 0
|
92 |
11 12 1 0
|
93 |
12 13 2 0
|
94 |
13 14 1 0
|
95 |
-
|
96 |
15 16 1 0
|
97 |
-
16 17
|
98 |
-
17 18
|
99 |
-
18 19
|
100 |
-
|
101 |
-
|
102 |
21 22 1 0
|
103 |
-
|
104 |
-
23
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
105 |
M END
|
106 |
-
> <ID> (2)
|
107 |
-
CHEMBL497318
|
108 |
-
|
109 |
$$$$
|
110 |
|
111 |
RDKit 2D
|
112 |
|
113 |
-
|
114 |
-
-
|
115 |
-
-
|
116 |
-
-
|
117 |
-
-
|
118 |
-
-
|
119 |
-
|
120 |
-
|
121 |
-
|
122 |
-
|
123 |
-
|
124 |
-
|
125 |
-
|
126 |
-
|
127 |
-
|
128 |
-
|
129 |
-
|
130 |
-
|
131 |
-
|
132 |
-
|
133 |
-
|
134 |
-
|
135 |
-
-
|
136 |
-
-
|
137 |
-
-
|
138 |
-
-1.8351 3.2209 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
139 |
-
-2.9499 4.2246 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
140 |
1 2 2 0
|
141 |
2 3 1 0
|
142 |
-
|
143 |
-
4 5
|
144 |
-
5 6
|
145 |
-
6 7
|
146 |
7 8 1 0
|
147 |
-
8 9
|
148 |
9 10 1 0
|
149 |
10 11 1 0
|
150 |
-
11 12
|
151 |
12 13 1 0
|
152 |
13 14 2 0
|
153 |
14 15 1 0
|
154 |
15 16 2 0
|
155 |
16 17 1 0
|
156 |
17 18 2 0
|
157 |
-
|
158 |
-
19 20
|
159 |
-
|
160 |
-
21 22
|
161 |
-
|
162 |
-
23 24
|
163 |
-
24
|
164 |
-
|
165 |
-
|
166 |
-
|
167 |
-
18 13 1 0
|
168 |
-
23 19 2 0
|
169 |
M END
|
170 |
-
> <ID> (3)
|
171 |
-
CHEMBL444449
|
172 |
-
|
173 |
$$$$
|
174 |
|
175 |
RDKit 2D
|
176 |
|
177 |
-
|
178 |
-
|
179 |
-
0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
180 |
-
1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
181 |
-
3.0000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
182 |
-
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
183 |
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
184 |
-
0.7500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
185 |
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
186 |
-1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
187 |
-
|
188 |
-
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
189 |
-
-0.7500 -3.8971 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
190 |
-
-1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
191 |
-
-3.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
192 |
-
-3.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
193 |
-
-5.2500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
194 |
-
-6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
195 |
-
-5.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
196 |
-
-6.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
197 |
-
-7.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
198 |
-
-8.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
199 |
-
-7.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
200 |
-
-3.0000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
201 |
-
-1.5000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
202 |
1 2 1 0
|
203 |
2 3 1 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
204 |
3 4 1 0
|
205 |
-
|
206 |
-
5 6
|
207 |
6 7 1 0
|
208 |
-
7 8
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
209 |
8 9 1 0
|
210 |
-
|
211 |
-
|
212 |
-
|
213 |
12 13 1 0
|
214 |
-
|
215 |
-
|
216 |
-
15 16
|
217 |
16 17 1 0
|
218 |
17 18 2 0
|
219 |
18 19 1 0
|
220 |
-
|
221 |
-
|
222 |
-
21 22 2 0
|
223 |
-
15 23 1 0
|
224 |
-
23 24 1 0
|
225 |
-
11 5 1 0
|
226 |
-
24 12 1 0
|
227 |
-
22 17 1 0
|
228 |
M END
|
229 |
-
|
230 |
-
|
|
|
231 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
232 |
$$$$
|
233 |
|
234 |
RDKit 2D
|
235 |
|
236 |
-
|
237 |
-
6.
|
238 |
-
|
|
|
239 |
3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
240 |
3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
241 |
-
|
|
|
242 |
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
243 |
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
244 |
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
|
|
|
|
|
245 |
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
246 |
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
247 |
-
|
248 |
-
|
249 |
-
3.0000 2.5981 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
250 |
-
3.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
251 |
-
5.2500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
252 |
-
6.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
253 |
-
6.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
254 |
-
5.2500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
255 |
-
3.7500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
256 |
-
3.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
257 |
-
1.5000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
258 |
-
1 2 1 0
|
259 |
-
2 3 1 0
|
260 |
3 4 1 0
|
261 |
4 5 1 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
262 |
5 6 1 0
|
263 |
6 7 1 0
|
264 |
7 8 1 0
|
265 |
8 9 1 0
|
266 |
9 10 1 0
|
267 |
10 11 1 0
|
268 |
-
11 12
|
269 |
-
|
270 |
-
13
|
271 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
272 |
15 16 1 0
|
273 |
-
|
274 |
-
17 18
|
275 |
-
|
276 |
-
19 20
|
277 |
20 21 1 0
|
278 |
-
|
279 |
-
|
|
|
|
|
|
|
|
|
280 |
M END
|
281 |
-
> <ID> (5)
|
282 |
-
CHEMBL1098
|
283 |
-
|
284 |
$$$$
|
|
|
1 |
|
2 |
RDKit 2D
|
3 |
|
4 |
+
31 33 0 0 0 0 0 0 0 0999 V2000
|
5 |
+
3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
|
|
|
|
|
|
|
|
|
6 |
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
7 |
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
8 |
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
9 |
+
-1.5000 -2.5981 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
10 |
+
-3.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
11 |
+
-3.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
12 |
+
-3.0000 -5.1962 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
13 |
+
-5.2500 -3.8971 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
14 |
+
-6.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
15 |
+
-7.5000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
16 |
+
-5.2500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
17 |
+
-3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
18 |
-3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
19 |
-3.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
20 |
+
-3.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
21 |
+
-1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
22 |
+
-3.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
23 |
+
-5.2500 3.8971 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
24 |
+
-3.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
25 |
+
-1.5000 5.1962 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
26 |
+
-3.7500 6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
27 |
+
-3.0000 7.7942 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
28 |
+
-3.7500 9.0933 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
|
29 |
+
-2.4510 9.8433 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
30 |
+
-5.0490 8.3433 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
31 |
+
-4.5000 10.3923 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
32 |
+
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
33 |
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
34 |
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
35 |
+
1.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
36 |
1 2 1 0
|
37 |
+
2 3 2 0
|
38 |
3 4 1 0
|
39 |
+
4 5 1 0
|
40 |
+
5 6 2 0
|
41 |
6 7 1 0
|
42 |
7 8 2 0
|
43 |
+
7 9 1 0
|
44 |
+
9 10 1 0
|
45 |
+
10 11 2 0
|
46 |
+
10 12 1 0
|
47 |
+
12 13 2 0
|
48 |
+
13 14 1 0
|
49 |
14 15 1 0
|
50 |
+
15 16 1 0
|
51 |
+
16 17 1 1
|
52 |
16 18 1 0
|
53 |
+
18 19 1 6
|
54 |
+
18 20 1 0
|
55 |
+
20 21 1 1
|
56 |
+
20 22 1 0
|
57 |
+
22 23 1 0
|
58 |
+
23 24 1 0
|
59 |
+
24 25 2 0
|
60 |
+
24 26 1 0
|
61 |
+
24 27 1 0
|
62 |
+
14 28 1 0
|
63 |
+
28 29 1 0
|
64 |
+
29 30 2 0
|
65 |
+
30 31 1 0
|
66 |
+
30 2 1 0
|
67 |
+
28 4 2 0
|
68 |
+
13 6 1 0
|
69 |
M END
|
|
|
|
|
|
|
70 |
$$$$
|
71 |
|
72 |
RDKit 2D
|
73 |
|
74 |
+
29 33 0 0 0 0 0 0 0 0999 V2000
|
75 |
+
3.8670 -13.5458 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
76 |
+
4.9817 -12.5421 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
77 |
+
6.4083 -13.0057 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
78 |
+
4.6699 -11.0749 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
79 |
+
3.2433 -10.6114 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
80 |
+
2.1286 -11.6151 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
81 |
+
0.7020 -11.1516 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
82 |
+
0.3901 -9.6843 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
83 |
+
-1.0365 -9.2208 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
84 |
+
-2.2500 -10.1025 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
85 |
+
-3.4635 -9.2208 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
86 |
+
-3.0000 -7.7942 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
87 |
+
-3.7500 -6.4952 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
88 |
+
-3.0000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
89 |
+
-1.5000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
90 |
+
-0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
91 |
+
0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
92 |
+
1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
93 |
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
94 |
+
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
95 |
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
96 |
+
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
97 |
+
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
98 |
+
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
99 |
+
-1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
100 |
+
-0.7500 -6.4952 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
101 |
+
-1.5000 -7.7942 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
102 |
+
1.5048 -8.6806 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
103 |
+
2.9314 -9.1442 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
104 |
+
1 2 2 0
|
105 |
2 3 1 0
|
106 |
+
2 4 1 0
|
107 |
4 5 1 0
|
108 |
+
5 6 2 0
|
109 |
+
6 7 1 0
|
110 |
+
7 8 2 0
|
111 |
8 9 1 0
|
112 |
+
9 10 2 0
|
113 |
10 11 1 0
|
114 |
11 12 1 0
|
115 |
12 13 2 0
|
116 |
13 14 1 0
|
117 |
+
14 15 2 0
|
118 |
15 16 1 0
|
119 |
+
16 17 2 0
|
120 |
+
17 18 1 0
|
121 |
+
18 19 2 0
|
122 |
+
19 20 1 0
|
123 |
+
20 21 2 0
|
124 |
21 22 1 0
|
125 |
+
22 23 2 0
|
126 |
+
23 24 1 0
|
127 |
+
24 25 2 0
|
128 |
+
15 26 1 0
|
129 |
+
26 27 2 0
|
130 |
+
8 28 1 0
|
131 |
+
28 29 2 0
|
132 |
+
29 5 1 0
|
133 |
+
27 9 1 0
|
134 |
+
27 12 1 0
|
135 |
+
25 16 1 0
|
136 |
+
24 19 1 0
|
137 |
M END
|
|
|
|
|
|
|
138 |
$$$$
|
139 |
|
140 |
RDKit 2D
|
141 |
|
142 |
+
24 27 0 0 0 0 0 0 0 0999 V2000
|
143 |
+
-7.2317 -6.0469 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
144 |
+
-6.9199 -4.5797 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
145 |
+
-8.0346 -3.5760 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
146 |
+
-5.4933 -4.1162 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
147 |
+
-5.1814 -2.6490 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
148 |
+
-3.7548 -2.1855 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
149 |
+
-2.6401 -3.1891 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
150 |
+
-1.2135 -2.7256 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
151 |
+
-0.0000 -3.6073 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
152 |
+
1.2135 -2.7256 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
153 |
+
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
154 |
+
1.5000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
155 |
+
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
156 |
+
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
157 |
+
-1.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
158 |
+
-0.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
159 |
+
-1.5000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
160 |
+
-3.0000 5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
161 |
+
-3.7500 3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
162 |
+
-3.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
163 |
+
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
164 |
+
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
165 |
+
-2.9520 -4.6564 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
166 |
+
-4.3786 -5.1199 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
|
|
|
167 |
1 2 2 0
|
168 |
2 3 1 0
|
169 |
+
2 4 1 0
|
170 |
+
4 5 2 0
|
171 |
+
5 6 1 0
|
172 |
+
6 7 2 0
|
173 |
7 8 1 0
|
174 |
+
8 9 2 0
|
175 |
9 10 1 0
|
176 |
10 11 1 0
|
177 |
+
11 12 2 0
|
178 |
12 13 1 0
|
179 |
13 14 2 0
|
180 |
14 15 1 0
|
181 |
15 16 2 0
|
182 |
16 17 1 0
|
183 |
17 18 2 0
|
184 |
+
18 19 1 0
|
185 |
+
19 20 2 0
|
186 |
+
14 21 1 0
|
187 |
+
21 22 2 0
|
188 |
+
7 23 1 0
|
189 |
+
23 24 2 0
|
190 |
+
24 4 1 0
|
191 |
+
22 8 1 0
|
192 |
+
22 11 1 0
|
193 |
+
20 15 1 0
|
|
|
|
|
194 |
M END
|
|
|
|
|
|
|
195 |
$$$$
|
196 |
|
197 |
RDKit 2D
|
198 |
|
199 |
+
16 17 0 0 0 0 0 0 0 0999 V2000
|
200 |
+
3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
|
|
|
|
|
|
|
201 |
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
202 |
+
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
203 |
+
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
204 |
+
-1.5000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
205 |
+
-3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
206 |
+
-3.8817 -1.2135 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
207 |
+
-5.3083 -0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
208 |
+
-6.5218 -1.6317 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
209 |
+
-5.3083 0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
210 |
+
-6.5218 1.6317 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
211 |
+
-6.3650 3.1235 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
212 |
+
-3.8817 1.2135 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
213 |
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
214 |
-1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
215 |
+
0.7500 1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
216 |
1 2 1 0
|
217 |
2 3 1 0
|
218 |
+
3 4 2 0
|
219 |
+
4 5 1 0
|
220 |
+
6 5 1 1
|
221 |
+
6 7 1 0
|
222 |
+
7 8 1 0
|
223 |
+
8 9 1 6
|
224 |
+
8 10 1 0
|
225 |
+
10 11 1 1
|
226 |
+
11 12 1 0
|
227 |
+
10 13 1 0
|
228 |
+
5 14 1 0
|
229 |
+
14 15 2 0
|
230 |
+
14 16 1 0
|
231 |
+
16 2 2 0
|
232 |
+
13 6 1 0
|
233 |
+
M END
|
234 |
+
$$$$
|
235 |
+
|
236 |
+
RDKit 2D
|
237 |
+
|
238 |
+
29 30 0 0 0 0 0 0 0 0999 V2000
|
239 |
+
3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
240 |
+
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
241 |
+
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
242 |
+
-0.7500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
243 |
+
-1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
244 |
+
-0.8899 -3.9684 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
245 |
+
-2.0046 -4.9721 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
246 |
+
-1.8478 -6.4639 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
247 |
+
-3.3037 -4.2221 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
248 |
+
-4.6740 -4.8322 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
249 |
+
-5.8875 -3.9505 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
250 |
+
-7.2578 -4.5606 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
|
251 |
+
-6.6477 -5.9309 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
252 |
+
-7.8679 -3.1903 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
253 |
+
-8.6281 -5.1707 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
254 |
+
-8.7849 -6.6625 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
|
255 |
+
-10.2767 -6.5057 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
256 |
+
-7.2931 -6.8193 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
257 |
+
-8.9417 -8.1543 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
258 |
+
-7.7282 -9.0360 0.0000 P 0 0 0 0 0 0 0 0 0 0 0 0
|
259 |
+
-8.6099 -10.2495 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
260 |
+
-6.8465 -7.8224 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
261 |
+
-6.5147 -9.9176 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
262 |
+
-2.9918 -2.7549 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
263 |
+
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
264 |
+
-3.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
265 |
+
-0.7500 1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
266 |
+
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
267 |
+
1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
268 |
+
1 2 1 0
|
269 |
+
2 3 2 0
|
270 |
3 4 1 0
|
271 |
+
5 4 1 1
|
272 |
+
5 6 1 0
|
273 |
6 7 1 0
|
274 |
+
7 8 1 6
|
275 |
+
7 9 1 0
|
276 |
+
9 10 1 1
|
277 |
+
10 11 1 0
|
278 |
+
11 12 1 0
|
279 |
+
12 13 2 0
|
280 |
+
12 14 1 0
|
281 |
+
12 15 1 0
|
282 |
+
15 16 1 0
|
283 |
+
16 17 2 0
|
284 |
+
16 18 1 0
|
285 |
+
16 19 1 0
|
286 |
+
19 20 1 0
|
287 |
+
20 21 2 0
|
288 |
+
20 22 1 0
|
289 |
+
20 23 1 0
|
290 |
+
9 24 1 0
|
291 |
+
4 25 1 0
|
292 |
+
25 26 2 0
|
293 |
+
25 27 1 0
|
294 |
+
27 28 1 0
|
295 |
+
28 29 2 0
|
296 |
+
28 2 1 0
|
297 |
+
24 5 1 0
|
298 |
+
M END
|
299 |
+
$$$$
|
300 |
+
|
301 |
+
RDKit 2D
|
302 |
+
|
303 |
+
19 20 0 0 0 0 0 0 0 0999 V2000
|
304 |
+
3.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
305 |
+
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
306 |
+
0.7500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
307 |
+
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
308 |
+
-1.5000 -2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
309 |
+
-1.5000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
310 |
+
-3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
311 |
+
-3.8817 -1.2135 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
312 |
+
-5.3083 -0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
313 |
+
-6.5218 -1.6317 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
314 |
+
-5.3083 0.7500 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
315 |
+
-6.5218 1.6317 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
316 |
+
-6.3650 3.1235 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
317 |
+
-3.8817 1.2135 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
318 |
+
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
319 |
+
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
320 |
+
1.5000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
321 |
+
3.0000 2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
322 |
+
3.7500 3.8971 0.0000 Br 0 0 0 0 0 0 0 0 0 0 0 0
|
323 |
+
1 2 2 0
|
324 |
+
2 3 1 0
|
325 |
+
3 4 1 0
|
326 |
+
4 5 2 0
|
327 |
+
4 6 1 0
|
328 |
+
7 6 1 1
|
329 |
+
7 8 1 0
|
330 |
8 9 1 0
|
331 |
+
9 10 1 6
|
332 |
+
9 11 1 0
|
333 |
+
11 12 1 1
|
334 |
12 13 1 0
|
335 |
+
11 14 1 0
|
336 |
+
6 15 1 0
|
337 |
+
15 16 2 0
|
338 |
16 17 1 0
|
339 |
17 18 2 0
|
340 |
18 19 1 0
|
341 |
+
16 2 1 0
|
342 |
+
14 7 1 0
|
|
|
|
|
|
|
|
|
|
|
|
|
343 |
M END
|
344 |
+
$$$$
|
345 |
+
|
346 |
+
RDKit 2D
|
347 |
|
348 |
+
17 18 0 0 0 0 0 0 0 0999 V2000
|
349 |
+
3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
350 |
+
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
351 |
+
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
352 |
+
-0.7500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
353 |
+
-1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
354 |
+
-0.8899 -3.9684 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
355 |
+
-2.0046 -4.9721 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
356 |
+
-1.8478 -6.4639 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
357 |
+
-3.3037 -4.2221 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
358 |
+
-4.6740 -4.8322 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
359 |
+
-5.8875 -3.9505 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
360 |
+
-2.9918 -2.7549 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
361 |
+
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
362 |
+
-3.0000 0.0000 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
363 |
+
-0.7500 1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
364 |
+
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
365 |
+
1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
366 |
+
1 2 1 0
|
367 |
+
2 3 2 0
|
368 |
+
3 4 1 0
|
369 |
+
5 4 1 1
|
370 |
+
5 6 1 0
|
371 |
+
6 7 1 0
|
372 |
+
7 8 1 6
|
373 |
+
7 9 1 0
|
374 |
+
9 10 1 1
|
375 |
+
10 11 1 0
|
376 |
+
9 12 1 0
|
377 |
+
4 13 1 0
|
378 |
+
13 14 2 0
|
379 |
+
13 15 1 0
|
380 |
+
15 16 1 0
|
381 |
+
16 17 2 0
|
382 |
+
16 2 1 0
|
383 |
+
12 5 1 0
|
384 |
+
M END
|
385 |
$$$$
|
386 |
|
387 |
RDKit 2D
|
388 |
|
389 |
+
15 15 0 0 0 0 0 0 0 0999 V2000
|
390 |
+
6.7500 -3.8971 0.0000 N 0 0 0 0 0 2 0 0 0 0 0 0
|
391 |
+
6.0000 -2.5981 0.0000 N 0 0 0 0 0 4 0 0 0 0 0 0
|
392 |
+
5.2500 -1.2990 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
393 |
3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
394 |
3.0000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
395 |
+
3.7500 1.2990 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
396 |
+
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
397 |
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
398 |
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
399 |
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
400 |
+
-3.0000 0.0000 0.0000 N 0 0 0 0 0 4 0 0 0 0 0 0
|
401 |
+
-3.7500 -1.2990 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
402 |
+
-3.7500 1.2990 0.0000 O 0 0 0 0 0 1 0 0 0 0 0 0
|
403 |
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
404 |
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
405 |
+
1 2 2 0
|
406 |
+
2 3 2 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
407 |
3 4 1 0
|
408 |
4 5 1 0
|
409 |
+
5 6 1 1
|
410 |
+
5 7 1 0
|
411 |
+
7 8 2 0
|
412 |
+
8 9 1 0
|
413 |
+
9 10 2 0
|
414 |
+
10 11 1 0
|
415 |
+
11 12 2 0
|
416 |
+
11 13 1 0
|
417 |
+
10 14 1 0
|
418 |
+
14 15 2 0
|
419 |
+
15 7 1 0
|
420 |
+
M CHG 4 1 -1 2 1 11 1 13 -1
|
421 |
+
M END
|
422 |
+
$$$$
|
423 |
+
|
424 |
+
RDKit 2D
|
425 |
+
|
426 |
+
13 13 0 0 0 0 0 0 0 0999 V2000
|
427 |
+
7.2990 -1.8481 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
428 |
+
6.0000 -2.5981 0.0000 S 0 0 0 0 0 0 0 0 0 0 0 0
|
429 |
+
4.7010 -3.3481 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
430 |
+
6.7500 -3.8971 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
431 |
+
5.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
432 |
+
3.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
433 |
+
3.0000 0.0000 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
434 |
+
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
435 |
+
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
436 |
+
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
437 |
+
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
438 |
+
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
439 |
+
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
440 |
+
1 2 2 0
|
441 |
+
2 3 2 0
|
442 |
+
2 4 1 0
|
443 |
+
2 5 1 0
|
444 |
5 6 1 0
|
445 |
6 7 1 0
|
446 |
7 8 1 0
|
447 |
8 9 1 0
|
448 |
9 10 1 0
|
449 |
10 11 1 0
|
450 |
+
11 12 1 0
|
451 |
+
12 13 1 0
|
452 |
+
13 8 1 0
|
453 |
+
M END
|
454 |
+
$$$$
|
455 |
+
|
456 |
+
RDKit 2D
|
457 |
+
|
458 |
+
23 26 0 0 0 0 0 0 0 0999 V2000
|
459 |
+
-5.2020 -8.5535 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
460 |
+
-4.8901 -7.0863 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
461 |
+
-6.0048 -6.0826 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
462 |
+
-3.4635 -6.6227 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
463 |
+
-2.2500 -7.5044 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
464 |
+
-1.0365 -6.6227 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
465 |
+
-1.5000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
466 |
+
-0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
467 |
+
0.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
468 |
+
1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
469 |
+
0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
470 |
+
1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
471 |
+
0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
472 |
+
1.5000 2.5981 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
473 |
+
-0.7500 1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
474 |
+
-1.5000 0.0000 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
475 |
+
-0.7500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
476 |
+
-2.2500 -1.2990 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
477 |
+
-1.5000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
478 |
+
-3.0000 -2.5981 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
479 |
+
-3.7500 -3.8971 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
480 |
+
-3.0000 -5.1962 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
481 |
+
-4.4918 -5.3529 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
482 |
+
1 2 1 0
|
483 |
+
2 3 2 0
|
484 |
+
4 2 1 6
|
485 |
+
4 5 1 0
|
486 |
+
5 6 1 0
|
487 |
+
7 6 1 6
|
488 |
+
7 8 1 0
|
489 |
+
8 9 1 1
|
490 |
+
9 10 1 0
|
491 |
+
10 11 2 0
|
492 |
+
11 12 1 0
|
493 |
+
12 13 1 0
|
494 |
+
13 14 1 6
|
495 |
+
13 15 1 0
|
496 |
15 16 1 0
|
497 |
+
16 17 1 0
|
498 |
+
17 18 1 6
|
499 |
+
17 19 1 0
|
500 |
+
19 20 1 6
|
501 |
20 21 1 0
|
502 |
+
21 22 1 0
|
503 |
+
22 23 1 6
|
504 |
+
22 4 1 0
|
505 |
+
22 7 1 0
|
506 |
+
19 8 1 0
|
507 |
+
17 11 1 0
|
508 |
M END
|
|
|
|
|
|
|
509 |
$$$$
|
data/examples/interaction_pair_inference.csv
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
ID1,X1,ID2,X2
|
2 |
CHEMBL41355,CCOC(=O)Nc1ccc(NCc2ccc(F)cc2)cc1N,O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
|
3 |
CHEMBL497318,CCCCCc1cc(O)c(C/C=C(\C)CCC=C(C)C)c(O)c1,Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
|
|
|
4 |
CHEMBL444449,O=c1ccc2c(OCCCCOc3ccccc3)c3ccoc3cc2o1,P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
|
5 |
CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
|
6 |
CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
|
|
|
1 |
ID1,X1,ID2,X2
|
2 |
CHEMBL41355,CCOC(=O)Nc1ccc(NCc2ccc(F)cc2)cc1N,O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
|
3 |
CHEMBL497318,CCCCCc1cc(O)c(C/C=C(\C)CCC=C(C)C)c(O)c1,Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
|
4 |
+
CHEMBL497318,CCCCCc1cc(O)c(C/C=C(\C)CCC=C(C)C)c(O)c1,Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
|
5 |
CHEMBL444449,O=c1ccc2c(OCCCCOc3ccccc3)c3ccoc3cc2o1,P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
|
6 |
CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
|
7 |
CHEMBL305187,CC(C(O)c1ccc(O)cc1)N1CCC(Cc2ccccc2)CC1,Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
|
data/examples/target_library.csv
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
ID2,X2
|
2 |
O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
|
3 |
Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
|
|
|
4 |
P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
|
5 |
O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
|
6 |
Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
|
|
|
1 |
ID2,X2
|
2 |
O88943,MVQKSRNGGVYPGTSGEKKLKVGFVGLDPGAPDSTRDGALLIAGSEAPKRGSVLSKPRTGGAGAGKPPKRNAFYRKLQNFLYNVLERPRGWAFIYHAYVFLLVFSCLVLSVFSTIKEYEKSSEGALYILEIVTIVVFGVEYFVRIWAAGCCCRYRGWRGRLKFARKPFCVIDIMVLIASIAVLAAGSQGNVFATSALRSLRFLQILRMIRMDRRGGTWKLLGSVVYAHSKELVTAWYIGFLCLILASFLVYLAEKGENDHFDTYADALWWGLITLTTIGYGDKYPQTWNGRLLAATFTLIGVSFFALPAGILGSGFALKVQEQHRQKHFEKRRNPAAGLIQSAWRFYATNLSRTDLHSTWQYYERTVTVPMISSQTQTYGASRLIPPLNQLEMLRNLKSKSGLTFRKEPQPEPSPSQKVSLKDRVFSSPRGVAAKGKGSPQAQTVRRSPSADQSLDDSPSKVPKSWSFGDRSRARQAFRIKGAASRQNSEEASLPGEDIVEDNKSCNCEFVTEDLTPGLKVSIRAVCVMRFLVSKRKFKESLRPYDVMDVIEQYSAGHLDMLSRIKSLQSRVDQIVGRGPTITDKDRTKGPAETELPEDPSMMGRLGKVEKQVLSMEKKLDFLVSIYTQRMGIPPAETEAYFGAKEPEPAPPYHSPEDSRDHADKHGCIIKIVRSTSSTGQRKYAAPPVMPPAECPPSTSWQQSHQRHGTSPVGDHGSLVRIPPPPAHERSLSAYSGGNRASTEFLRLEGTPACRPSEAALRDSDTSISIPSVDHEELERSFSGFSISQSKENLNALASCYAAVAPCAKVRPYIAEGESDTDSDLCTPCGPPPRSATGEGPFGDVAWAGPRK
|
3 |
Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
|
4 |
+
Q9Y5S1,MTSPSSSPVFRLETLDGGQEDGSEADRGKLDFGSGLPPMESQFQGEDRKFAPQIRVNLNYRKGTGASQPDPNRFDRDRLFNAVSRGVPEDLAGLPEYLSKTSKYLTDSEYTEGSTGKTCLMKAVLNLKDGVNACILPLLQIDRDSGNPQPLVNAQCTDDYYRGHSALHIAIEKRSLQCVKLLVENGANVHARACGRFFQKGQGTCFYFGELPLSLAACTKQWDVVSYLLENPHQPASLQATDSQGNTVLHALVMISDNSAENIALVTSMYDGLLQAGARLCPTVQLEDIRNLQDLTPLKLAAKEGKIEIFRHILQREFSGLSHLSRKFTEWCYGPVRVSLYDLASVDSCEENSVLEIIAFHCKSPHRHRMVVLEPLNKLLQAKWDLLIPKFFLNFLCNLIYMFIFTAVAYHQPTLKKQAAPHLKAEVGNSMLLTGHILILLGGIYLLVGQLWYFWRRHVFIWISFIDSYFEILFLFQALLTVVSQVLCFLAIEWYLPLLVSALVLGWLNLLYYTRGFQHTGIYSVMIQKVILRDLLRFLLIYLVFLFGFAVALVSLSQEAWRPEAPTGPNATESVQPMEGQEDEGNGAQYRGILEASLELFKFTIGMGELAFQEQLHFRGMVLLLLLAYVLLTYILLLNMLIALMSETVNSVATDSWSIWKLQKAISVLEMENGYWWCRKKQRAGVMLTVGTKPDGSPDERWCFRVEEVNWASWEQTLPTLCEDPSGAGVPRTLENPVLASPPKEDEDGASEENYVPVQLLQSN
|
5 |
P17658,MRSEKSLTLAAPGEVRGPEGEQQDAGDFPEAGGGGGCCSSERLVINISGLRFETQLRTLSLFPDTLLGDPGRRVRFFDPLRNEYFFDRNRPSFDAILYYYQSGGRLRRPVNVPLDIFLEEIRFYQLGDEALAAFREDEGCLPEGGEDEKPLPSQPFQRQVWLLFEYPESSGPARGIAIVSVLVILISIVIFCLETLPQFRVDGRGGNNGGVSRVSPVSRGSQEEEEDEDDSYTFHHGITPGEMGTGGSSSLSTLGGSFFTDPFFLVETLCIVWFTFELLVRFSACPSKPAFFRNIMNIIDLVAIFPYFITLGTELVQQQEQQPASGGGGQNGQQAMSLAILRVIRLVRVFRIFKLSRHSKGLQILGKTLQASMRELGLLIFFLFIGVILFSSAVYFAEADDDDSLFPSIPDAFWWAVVTMTTVGYGDMYPMTVGGKIVGSLCAIAGVLTIALPVPVIVSNFNYFYHRETEQEEQGQYTHVTCGQPAPDLRATDNGLGKPDFPEANRERRPSYLPTPHRAYAEKRMLTEV
|
6 |
O15399,MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGPAYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDDSRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLEEYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVSAQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPLPAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESLHRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYGRFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPEKRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVTVFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEKNIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGSGKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKLDIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAEAAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADGFHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPPAGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAGGTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYPYAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHDGLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGWDLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDLGTRRGSAHFSSLESEV
|
7 |
Q14957,MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPLEIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPILSISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLEGVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEAAQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGAHSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVVIALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPDPGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTNGKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIGKSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTVSGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKMGKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQFLGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVYWKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAARDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGWGPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASERPLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHASLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGAPAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRDSGGLDEISRVARGTQGFPGPCTWRRISSLESEV
|
data/examples/target_library.fasta
CHANGED
@@ -1,102 +1,41 @@
|
|
1 |
-
>
|
2 |
-
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
|
25 |
-
|
26 |
-
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
|
31 |
-
>
|
32 |
-
|
33 |
-
|
34 |
-
|
35 |
-
|
36 |
-
|
37 |
-
|
38 |
-
|
39 |
-
|
40 |
-
|
41 |
-
|
42 |
-
MRGAGGPRGPRGPAKMLLLLALACASPFPEEAPGPGGAGGPGGGLGGARPLNVALVFSGP
|
43 |
-
AYAAEAARLGPAVAAAVRSPGLDVRPVALVLNGSDPRSLVLQLCDLLSGLRVHGVVFEDD
|
44 |
-
SRAPAVAPILDFLSAQTSLPIVAVHGGAALVLTPKEKGSTFLQLGSSTEQQLQVIFEVLE
|
45 |
-
EYDWTSFVAVTTRAPGHRAFLSYIEVLTDGSLVGWEHRGALTLDPGAGEAVLSAQLRSVS
|
46 |
-
AQIRLLFCAREEAEPVFRAAEEAGLTGSGYVWFMVGPQLAGGGGSGAPGEPPLLPGGAPL
|
47 |
-
PAGLFAVRSAGWRDDLARRVAAGVAVVARGAQALLRDYGFLPELGHDCRAQNRTHRGESL
|
48 |
-
HRYFMNITWDNRDYSFNEDGFLVNPSLVVISLTRDRTWEVVGSWEQQTLRLKYPLWSRYG
|
49 |
-
RFLQPVDDTQHLTVATLEERPFVIVEPADPISGTCIRDSVPCRSQLNRTHSPPPDAPRPE
|
50 |
-
KRCCKGFCIDILKRLAHTIGFSYDLYLVTNGKHGKKIDGVWNGMIGEVFYQRADMAIGSL
|
51 |
-
TINEERSEIVDFSVPFVETGISVMVARSNGTVSPSAFLEPYSPAVWVMMFVMCLTVVAVT
|
52 |
-
VFIFEYLSPVGYNRSLATGKRPGGSTFTIGKSIWLLWALVFNNSVPVENPRGTTSKIMVL
|
53 |
-
VWAFFAVIFLASYTANLAAFMIQEEYVDTVSGLSDRKFQRPQEQYPPLKFGTVPNGSTEK
|
54 |
-
NIRSNYPDMHSYMVRYNQPRVEEALTQLKAGKLDAFIYDAAVLNYMARKDEGCKLVTIGS
|
55 |
-
GKVFATTGYGIALHKGSRWKRPIDLALLQFLGDDEIEMLERLWLSGICHNDKIEVMSSKL
|
56 |
-
DIDNMAGVFYMLLVAMGLSLLVFAWEHLVYWRLRHCLGPTHRMDFLLAFSRGMYSCCSAE
|
57 |
-
AAPPPAKPPPPPQPLPSPAYPAPRPAPGPAPFVPRERASVDRWRRTKGAGPPGGAGLADG
|
58 |
-
FHRYYGPIEPQGLGLGLGEARAAPRGAAGRPLSPPAAQPPQKPPPSYFAIVRDKEPAEPP
|
59 |
-
AGAFPGFPSPPAPPAAAATAVGPPLCRLAFEDESPPAPARWPRSDPESQPLLGPGAGGAG
|
60 |
-
GTGGAGGGAPAAPPPCRAAPPPCPYLDLEPSPSDSEDSESLGGASLGGLEPWWFADFPYP
|
61 |
-
YAERLGPPPGRYWSVDKLGGWRAGSWDYLPPRSGPAAWHCRHCASLELLPPPRHLSCSHD
|
62 |
-
GLDGGWWAPPPPPWAAGPLPRRRARCGCPRSHPHRPRASHRTPAAAAPHHHRHRRAAGGW
|
63 |
-
DLPPPAPTSRSLEDLSSCPRAAPARRLTGPSRHARRCPHAAHWGPPLPTASHRRHRGGDL
|
64 |
-
GTRRGSAHFSSLESEV
|
65 |
-
>Q14957
|
66 |
-
MGGALGPALLLTSLFGAWAGLGPGQGEQGMTVAVVFSSSGPPQAQFRARLTPQSFLDLPL
|
67 |
-
EIQPLTVGVNTTNPSSLLTQICGLLGAAHVHGIVFEDNVDTEAVAQILDFISSQTHVPIL
|
68 |
-
SISGGSAVVLTPKEPGSAFLQLGVSLEQQLQVLFKVLEEYDWSAFAVITSLHPGHALFLE
|
69 |
-
GVRAVADASHVSWRLLDVVTLELGPGGPRARTQRLLRQLDAPVFVAYCSREEAEVLFAEA
|
70 |
-
AQAGLVGPGHVWLVPNLALGSTDAPPATFPVGLISVVTESWRLSLRQKVRDGVAILALGA
|
71 |
-
HSYWRQHGTLPAPAGDCRVHPGPVSPAREAFYRHLLNVTWEGRDFSFSPGGYLVQPTMVV
|
72 |
-
IALNRHRLWEMVGRWEHGVLYMKYPVWPRYSASLQPVVDSRHLTVATLEERPFVIVESPD
|
73 |
-
PGTGGCVPNTVPCRRQSNHTFSSGDVAPYTKLCCKGFCIDILKKLARVVKFSYDLYLVTN
|
74 |
-
GKHGKRVRGVWNGMIGEVYYKRADMAIGSLTINEERSEIVDFSVPFVETGISVMVARSNG
|
75 |
-
TVSPSAFLEPYSPAVWVMMFVMCLTVVAITVFMFEYFSPVSYNQNLTRGKKSGGPAFTIG
|
76 |
-
KSVWLLWALVFNNSVPIENPRGTTSKIMVLVWAFFAVIFLASYTANLAAFMIQEQYIDTV
|
77 |
-
SGLSDKKFQRPQDQYPPFRFGTVPNGSTERNIRSNYRDMHTHMVKFNQRSVEDALTSLKM
|
78 |
-
GKLDAFIYDAAVLNYMAGKDEGCKLVTIGSGKVFATTGYGIAMQKDSHWKRAIDLALLQF
|
79 |
-
LGDGETQKLETVWLSGICQNEKNEVMSSKLDIDNMAGVFYMLLVAMGLALLVFAWEHLVY
|
80 |
-
WKLRHSVPNSSQLDFLLAFSRGIYSCFSGVQSLASPPRQASPDLTASSAQASVLKMLQAA
|
81 |
-
RDMVTTAGVSSSLDRATRTIENWGGGRRAPPPSPCPTPRSGPSPCLPTPDPPPEPSPTGW
|
82 |
-
GPPDGGRAALVRRAPQPPGRPPTPGPPLSDVSRVSRRPAWEARWPVRTGHCGRHLSASER
|
83 |
-
PLSPARCHYSSFPRADRSGRPFLPLFPELEDLPLLGPEQLARREALLHAAWARGSRPRHA
|
84 |
-
SLPSSVAEAFARPSSLPAGCTGPACARPDGHSACRRLAQAQSMCLPIYREACQEGEQAGA
|
85 |
-
PAWQHRQHVCLHAHAHLPFCWGAVCPHLPPCASHGSWLSGAWGPLGHRGRTLGLGTGYRD
|
86 |
-
SGGLDEISRVARGTQGFPGPCTWRRISSLESEV
|
87 |
-
>O54912
|
88 |
-
MKRQNVRTLALIVCTFTYLLVGAAVFDALESEPEMIERQRLELRQLELRARYNLSEGGYE
|
89 |
-
ELERVVLRLKPHKAGVQWRFAGSFYFAITVITTIGYGHAAPSTDGGKVFCMFYALLGIPL
|
90 |
-
TLVMFQSLGERINTFVRYLLHRAKRGLGMRHAEVSMANMVLIGFVSCISTLCIGAAAFSY
|
91 |
-
YERWTFFQAYYYCFITLTTIGFGDYVALQKDQALQTQPQYVAFSFVYILTGLTVIGAFLN
|
92 |
-
LVVLRFMTMNAEDEKRDAEHRALLTHNGQAGGLGGLSCLSGSLGDGVRPRDPVTCAAAAG
|
93 |
-
GMGVGVGVGGSGFRNVYAEMLHFQSMCSCLWYKSREKLQYSIPMIIPRDLSTSDTCVEHS
|
94 |
-
HSSPGGGGRYSDTPSHPCLCSGTQRSAISSVSTGLHSLATFRGLMKRRSSV
|
95 |
-
>Q9ES08
|
96 |
-
MKRQNVRTLSLIACTFTYLLVGAAVFDALESDHEMREEEKLKAEEVRLRGKYNISSDDYQ
|
97 |
-
QLELVILQSEPHRAGVQWKFAGSFYFAITVITTIGYGHAAPGTDAGKAFCMFYAVLGIPL
|
98 |
-
TLVMFQSLGERMNTFVRYLLKRIKKCCGMRNTEVSMENMVTVGFFSCMGTLCLGAAAFSQ
|
99 |
-
CEDWSFFHAYYYCFITLTTIGFGDFVALQSKGALQRKPFYVAFSFMYILVGLTVIGAFLN
|
100 |
-
LVVLRFLTMNTDEDLLEGEVAQILAGNPRRVVVRVPQSRKRHHPMYFLRKYGRTLCYLCF
|
101 |
-
PGANWGDDDDDDDDAVENVVVTTPVPPAVAAAAAAATPGPSTRNVRATVHSVSCRVEEIP
|
102 |
-
PDVLRNTYFRSPFGAIPPGMHTCGENHRLHIRRKSI
|
|
|
1 |
+
>Seq1
|
2 |
+
LYLIFGAWAGMVGTALSLLIRAELGQPGTLLGDDQIYNVIVTAHAFVMIFFMVMPIMIGGFGNWLVPLMI
|
3 |
+
GAPDMAFPRMNNMSFWLLPPSFLLLLASSTVEAGAGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGVSS
|
4 |
+
ILGAINFITTAINMKPPTLSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGD
|
5 |
+
PVLYQHLFWFFGHPEVYILIL
|
6 |
+
|
7 |
+
>Seq2
|
8 |
+
VGTALXLLIRAELXQPGALLGDDQIYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMIGAPDMAFPRMN
|
9 |
+
NMSFWLLPPSFLLLMASSTVEAGAGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISSILGAINFITTA
|
10 |
+
INMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHLFWFF
|
11 |
+
GHPEVYILIL
|
12 |
+
|
13 |
+
>Seq3
|
14 |
+
LYLIFGAWAGMVGTALSLLIRAELGQPGALLGDDQVYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMI
|
15 |
+
GAPDMAFPRMNNMSFWLLPPSFLLLLASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISS
|
16 |
+
ILGAINFITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGD
|
17 |
+
PVLYQHLFWFFGHPEVYILIL
|
18 |
+
|
19 |
+
>Seq4
|
20 |
+
WAGMVGTALSLLIRAELGQPGALLGDDQIYNVVXTAHAFVMIFFMVMPIMIGGFGNWLVPLMIGAPDMAF
|
21 |
+
PRMNNMSFWLLPPSFLLLMASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISSILGAINF
|
22 |
+
ITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHL
|
23 |
+
FWFFGHPEVYILIL
|
24 |
+
|
25 |
+
>Seq5
|
26 |
+
LYLIFGAWAGMVGTALSLLIRAELGQPGALLGDDQVYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMI
|
27 |
+
GAPDMAFPRMNNMSFWLLPPSFLLLLASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISS
|
28 |
+
ILGAINFITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGD
|
29 |
+
PVLYQHLFWFFGHPEVYILIX
|
30 |
+
|
31 |
+
>Seq6
|
32 |
+
WAGMVGTALSLLIRAELGQPGALLGDDQIYNVVVTAHAFVMIFFMVMPIMIGGFGNWLVPLMIGAPDMAF
|
33 |
+
PRMNNMSFWLLPPSFLLLMASSTVEAGVGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGISSILGAINF
|
34 |
+
ITTAINMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHL
|
35 |
+
FWFFGHPEVYILIL
|
36 |
+
|
37 |
+
>Seq7
|
38 |
+
VGTALSLLIRAELGQPGTLLGDDQIYNVIVTAHAFVMIFFMVMPVMIGGFGNWLVPLMIGAPDMAFPRMN
|
39 |
+
NMSFWLLPPSFLLLLASSTVEAGAGTGWTVYPPLAGNLAHAGASVDLAIFSLHLAGVSSILGAINFITTA
|
40 |
+
INMKPPALSQYQTPLFVWSVLITAVLLLLSLPVLAAGITMLLTDRNLNTTFFDPAGGGDPVLYQHLFWFF
|
41 |
+
GHPEVYILIL
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
data/target_libraries/ChEMBL33_all_spe_single_prot_info.csv
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
data/target_libraries/ChEMBL33_human_proteins.csv
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
data/target_libraries/drugbank_targets.csv
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
data/target_libraries/idmapping_not_in_chembl.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|