0
|
1 <tool id="sdf2fps" name="SDF to Fingerprint" version="0.1.1">
|
|
2 <description>extract fingerprints from sdf files metadata</description>
|
|
3 <parallelism method="multi" split_inputs="infile" split_mode="to_size" split_size="10000" shared_inputs="" merge_outputs="outfile"></parallelism> <!-- Parallel execution: the "infile" input is split and the per-chunk "outfile" results are merged. NOTE(review): split_size=10000 is presumably the number of SDF records per chunk; confirm against the Galaxy parallelism documentation. -->
|
|
4 <requirements> <!-- External packages this tool depends on. -->
|
|
5 <requirement type="package" version="1.1p1">chemfp</requirement>
|
|
6 </requirements>
|
|
7 <command>
|
|
8 sdf2fps --pubchem "${infile}" > "${outfile}"
|
|
9 </command> <!-- The command above runs sdf2fps with the pubchem option on the input dataset and redirects standard output to the output dataset. -->
|
|
10 <inputs> <!-- A single SDF dataset; its label states that the fingerprints are expected as metadata in the file. -->
|
|
11 <param name="infile" type='data' format="sdf" label="SDF file with fingerprints as metadata"/>
|
|
12 </inputs>
|
|
13 <outputs> <!-- A single output dataset in fps format, filled from the command's standard output. -->
|
|
14 <data name="outfile" format="fps"/>
|
|
15 </outputs>
|
|
16 <tests> <!-- NOTE(review): no test cases are defined for this tool. -->
|
|
17 </tests>
|
|
18 <help>
|
|
19
|
|
20
|
|
21 **What it does**
|
|
22
|
|
23 Reads an SDF file, extracts the fingerprints stored in its metadata, and writes them to an FPS file.
|
|
24 TODO: currently this only works for SDF files from PubChem (sdf2fps is always run with the --pubchem option).
|
|
25
|
|
26 -----
|
|
27
|
|
28 **Example**
|
|
29 * input::
|
|
30
|
|
31 SDF File
|
|
32
|
|
33 28434379
|
|
34 -OEChem-02031205132D
|
|
35
|
|
36 37 39 0 0 0 0 0 0 0999 V2000
|
|
37 8.1648 -1.8842 0.0000 O 0 0 0 0 0 0 0 0 0 0 0 0
|
|
38 6.0812 -0.2134 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
39 6.0812 -1.8229 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
40 2.5369 -2.0182 0.0000 N 0 0 0 0 0 0 0 0 0 0 0 0
|
|
41 6.3919 0.7371 0.0000 C 0 0 0 0 0 0 0 0 0 0 0 0
|
|
42 7.3704 0.9433 0.0000 C 0 0 0 0
|
|
43 ......
|
|
44 1 15 1 0 0 0 0
|
|
45 1 35 1 0 0 0 0
|
|
46 2 5 1 0 0 0 0
|
|
47 2 11 1 0 0 0 0
|
|
48 2 12 1 0 0 0 0
|
|
49 3 12 2 0 0 0 0
|
|
50 3 13 1 0 0 0 0
|
|
51 4 18 1 0 0 0 0
|
|
52 ......
|
|
53
|
|
54 > <PUBCHEM_COMPOUND_CID>
|
|
55 28434379
|
|
56
|
|
57 > <PUBCHEM_COMPOUND_CANONICALIZED>
|
|
58 1
|
|
59
|
|
60 > <PUBCHEM_CACTVS_COMPLEXITY>
|
|
61 280
|
|
62
|
|
63 > <PUBCHEM_CACTVS_HBOND_ACCEPTOR>
|
|
64 2
|
|
65
|
|
66 > <PUBCHEM_CACTVS_HBOND_DONOR>
|
|
67 2
|
|
68
|
|
69 > <PUBCHEM_CACTVS_ROTATABLE_BOND>
|
|
70 2
|
|
71
|
|
72 > <PUBCHEM_CACTVS_SUBSKEYS>
|
|
73 AAADceBzIAAAAAAAAAAAAAAAAAAAAWAAAAAwYAAAAAAAAFgB8AAAHgAQCAAACCjhlwYx0LdMEgCgASZiZASCgC0hEqAJ2CA4dJiKeKLA2dGUJAhokALYyCcQAAAAAACAAAQAACAAAQAACAAAQAAAAAAAAA==
|
|
74
|
|
75 >
|
|
76
|
|
77 * output::
|
|
78
|
|
79 #FPS1
|
|
80 #num_bits=881
|
|
81 #type=CACTVS-E_SCREEN/1.0 extended=2
|
|
82 #software=CACTVS/unknown
|
|
83 #source=/home/mohammed/galaxy-central/database/files/000/dataset_409.dat
|
|
84 #date=2012-02-03T10:44:12
|
|
85 07ce04000000000000000000000000000080060000000c0600
|
|
86 00000000001a800f0000780008100000101487e9608c0bed32
|
|
87 48000580644626204101b4844805901b041c2e19511e45039b
|
|
88 8b2924101609401b13e4080000000000010020000004008000
|
|
89 0010000002000000000000 28434379
|
|
90
|
|
91
|
|
92 </help>
|
|
93 </tool>
|