comparison readme @ 0:efd9c309b8f7

Uploaded
author bgruening
date Tue, 26 Mar 2013 14:50:53 -0400
parents
children edff5c162649
comparison
equal deleted inserted replaced
-1:000000000000 0:efd9c309b8f7
1 OSRA: Optical Structure Recognition Application
2
3 OSRA is a utility designed to convert graphical representations of chemical
4 structures, as they appear in journal articles, patent documents, textbooks,
5 trade magazines etc., into SMILES (Simplified Molecular Input Line Entry
6 Specification - see http://en.wikipedia.org/wiki/SMILES) or
7 SD files - a computer recognizable molecular structure format.
8 OSRA can read a document in any of the over 90 graphical formats parseable by
9 ImageMagick - including GIF, JPEG, PNG, TIFF, PDF, PS etc., and generate
10 the SMILES or SDF representation of the molecular structure images encountered
11 within that document.
12
13 Note that any software designed for optical recognition is unlikely to be
14 perfect, and the output produced might, and probably will, contain errors,
15 so curation by a human knowledgeable in chemical structures is highly recommended.
16
17 http://cactus.nci.nih.gov/osra/
18
19
20 The wrapper comes with an automatic installation of all dependencies through the
21 Galaxy Tool Shed. If you do not want to use that feature, you can compile OSRA
22 manually with the following instructions.
23
24
25 ########################################
26 # #
27 # OSRA Setup #
28 # currently a small patch is required #
29 # #
30 ########################################
31
32 Save the following patch as 'osra-1.4.0-configure.patch' and store it next
33 to the installation script below.
34
35 -------------------------------------------------------
36 --- configure 2013-03-18 18:14:00.888605219 +0100
37 +++ configure_ori 2013-03-18 18:13:48.396605759 +0100
38 @@ -4178,7 +4178,8 @@
39
40 # Check whether --with-tclap-include was given.
41 if test "${with_tclap_include+set}" = set; then :
42 - withval=$with_tclap_include;
43 + withval=$with_tclap_include;
44 + CPPFLAGS="-I${withval} ${CPPFLAGS}"
45 else
46 with_tclap_include="auto"
47 fi
48 -------------------------------------------------------
49
50 #!/usr/bin/env bash
51 # OSRA installation: fetches and builds OSRA 1.4.0 plus its dependencies below the current directory.
52 # Run it from the directory that holds osra-1.4.0-configure.patch; dependency paths are derived from $cdir.
53 cdir=$(pwd)
54 # GraphicsMagick, installed into its own build/ directory with shared libraries enabled
55 wget http://sourceforge.net/projects/graphicsmagick/files/graphicsmagick/1.3.18/GraphicsMagick-1.3.18.tar.gz
56 tar xfvz GraphicsMagick-1.3.18.tar.gz
57 cd GraphicsMagick-1.3.18 || exit 1
58 ./configure --prefix="$(pwd)/build" --enable-shared=yes
59 make
60 make install
61 cd ..
62 # Put the freshly built GraphicsMagick tools on PATH; located via $cdir so the script works from any directory
63 export PATH="$PATH:$cdir/GraphicsMagick-1.3.18/build/bin/"
64 # potrace, configured with --with-libpotrace
65 wget http://potrace.sourceforge.net/download/potrace-1.11.tar.gz
66 tar xfvz potrace-1.11.tar.gz
67 cd potrace-1.11 || exit 1
68 ./configure --with-libpotrace --prefix="$(pwd)/build"
69 make
70 make install
71 cd ..
72 # patched gocr from the OSRA download area; 'make libs' runs before the regular build
73 wget http://downloads.sourceforge.net/project/osra/gocr-patched/gocr-0.50pre-patched.tgz
74 tar xfvz gocr-0.50pre-patched.tgz
75 cd gocr-0.50pre-patched || exit 1
76 ./configure --prefix="$(pwd)/build"
77 make libs
78 make all install
79 cd ..
80 # tclap (its include directory is handed to OSRA's configure further down)
81 wget http://downloads.sourceforge.net/project/tclap/tclap-1.2.1.tar.gz
82 tar xfvz tclap-1.2.1.tar.gz
83 cd tclap-1.2.1 || exit 1
84 ./configure --prefix="$(pwd)/build"
85 make
86 make install
87 cd ..
88 # ocrad
89 wget http://mirror.checkdomain.de/gnu/ocrad/ocrad-0.21.tar.gz
90 tar xfvz ocrad-0.21.tar.gz
91 cd ocrad-0.21 || exit 1
92 ./configure --prefix="$(pwd)/build"
93 make
94 make install
95 cd ..
96 # Open Babel, out-of-source cmake build installed into build/install/
97 wget http://downloads.sourceforge.net/project/openbabel/openbabel/2.3.2/openbabel-2.3.2.tar.gz
98 tar xfvz openbabel-2.3.2.tar.gz
99 cd openbabel-2.3.2 || exit 1
100 mkdir build
101 cd build || exit 1
102 cmake .. -DCMAKE_INSTALL_PREFIX="$(pwd)/install/"
103 make
104 make install
105 cd ../..
106 # Tesseract build, currently disabled
107 #wget http://tesseract-ocr.googlecode.com/files/tesseract-ocr-3.02.02.tar.gz
108 #tar xfvz tesseract-ocr-3.02.02.tar.gz
109 #cd tesseract-ocr
110 #./configure --prefix=`pwd`/build
111 #make
112 #make install
113 #cd ..
114
115 # Cuneiform, out-of-source cmake build installed into build/install/
116 wget https://launchpad.net/cuneiform-linux/1.1/1.1/+download/cuneiform-linux-1.1.0.tar.bz2
117 tar xfvj cuneiform-linux-1.1.0.tar.bz2
118 cd cuneiform-linux-1.1.0 || exit 1
119 mkdir build
120 cd build || exit 1
121 cmake .. -DCMAKE_INSTALL_PREFIX="$(pwd)/install/"
122 make
123 make install
124 cd ../..
125
126 # OSRA itself; its configure script is patched before use, and a failed patch aborts the build
127 wget http://downloads.sourceforge.net/project/osra/osra/1.4.0/osra-1.4.0.tgz
128 tar xfvz osra-1.4.0.tgz
129 patch osra-1.4.0/configure < osra-1.4.0-configure.patch || exit 1
130 cd osra-1.4.0 || exit 1
131 # Point configure at every locally built dependency
132 ./configure --with-tclap-include="$cdir/tclap-1.2.1/build/include/" \
133 --with-potrace-include="$cdir/potrace-1.11/build/include/" \
134 --with-potrace-lib="$cdir/potrace-1.11/build/lib/" \
135 --with-gocr-include="$cdir/gocr-0.50pre-patched/build/include/gocr/" \
136 --with-gocr-lib="$cdir/gocr-0.50pre-patched/build/lib/" \
137 --with-ocrad-include="$cdir/ocrad-0.21/build/include/" \
138 --with-ocrad-lib="$cdir/ocrad-0.21/build/lib/" \
139 --with-cuneiform-include="$cdir/cuneiform-linux-1.1.0/build/install/include/" \
140 --with-cuneiform \
141 --with-cuneiform-lib="$cdir/cuneiform-linux-1.1.0/build/install/lib/" \
142 --with-openbabel-include="$cdir/openbabel-2.3.2/build/install/include/openbabel-2.0/" \
143 --with-openbabel-lib="$cdir/openbabel-2.3.2/build/install/lib/" \
144 --with-graphicsmagick-lib="$cdir/GraphicsMagick-1.3.18/build/lib/" \
145 --with-graphicsmagick-include="$cdir/GraphicsMagick-1.3.18/build/include/GraphicsMagick/" \
146 --prefix="$(pwd)/bin/"
147 #--enable-static-linking --disable-graphicsmagick-config
148 make
149 make install
150 # Run the installed binary; the locally built shared libraries must be on the loader path
151 export LD_LIBRARY_PATH="$cdir/GraphicsMagick-1.3.18/build/lib/:$cdir/potrace-1.11/build/lib/"
152 ./bin/bin/osra
153
154
155 #--with-tesseract-include=$cdir/tclap-1.2.1/build/include/
156 #--with-tesseract
157 #--with-tesseract-lib
158
159
160
161
162
163
164
165