$ cd ./O2-tools-2.00
$ ./configure --prefix=/usr/local/ ; make ; sudo make install
$ cd ../nhocr-0.16
$ ./configure --prefix=/usr/local/ --with-O2tools=/usr/local ; make ; sudo make install
$ setenv NHOCR_DICDIR /usr/local/share
$ convert input.jpg input.pgm
$ nhocr -line -o output.txt test/hello.pgm
$ cd ../iulib-0.3
$ ./configure ; make ; sudo make install
$ cd ..
$ svn checkout http://tesseract-ocr.googlecode.com/svn/trunk/ tesseract-ocr
$ cd tesseract-ocr
$ ./configure ; make ; sudo make install
$ cd ../ocropus-0.3
$ ./configure --without-fst --without-leptonica; make ; sudo make install
$ cd ../nhocr-0.16/
$ vi ocropus/rec-nhocr-0.3.lua
/opt/nhocr -> /usr/local
$ sudo cp ocropus/rec-nhocr-0.3.lua /usr/local/share/ocropus/scripts/rec-nhocr.lua
$ setenv OCROSCRIPTS /usr/local/share/ocropus/scripts
// $ ocroscript recognize data/pages/alice_1.png
$ ocroscript rec-nhocr ~/Desktop/Screenshot.png
$ gs -dSAFER -dBATCH -dNOPAUSE -sDEVICE=jpeg -r300 -sOutputFile=kuwabara_01.%02d.pdf.jpg kuwabara_01.pdf
// ここまでは完璧.
// 後は、レイアウト。でも、MySQLに登録して、マッチングをかけるだけなら、もうできるはず。
$ cd ../weocr-toolkit-0.13
$ ./configure --prefix=/usr/local/ --with-O2tools=/usr/local ; make ; sudo make install
$ vi bin/execocr_tesseract.tmpl html/* cgi-bin/*
/opt/weocr -> /usr/local
/cgi-bin -> /weocr
$ sudo cp bin/execocr_tesseract.tmpl /usr/local/bin/execocr_tesseract
$ cd bin/; sudo cp filenorm run_xalan wo_cleandir /usr/local/bin ; cd -
$ mkdir /var/www/html/weocr/; cp html/* cgi-bin/* /var/www/html/weocr
$ sudo vi /etc/httpd/conf/httpd.conf
AddHandler cgi-script .cgi
Options FollowSymLinks ExecCGI
AllowOverride None
$ cd /var/www/html/weocr/; make ; cd -
(Location of error unknown)XSLT Error (javax.xml.transform.TransformerConfigurationException): getAssociatedStylesheets failed
make: *** [srvspec.html] Error 255
あれ?
// $ java -cp /usr/share/java/xalan-j2.jar org.apache.xalan.xslt.Process -HTML -IN srvspec.xml -OUT srvspec.html
// javaが悪い。OSをupdateしたらなおるかも。
// ということでpending
nhocrを使って、ocrと全文検索を組み合わせてみた
$ sudo yum install freeglut-devel freeglut
$ ./Configure
1 y n n
http://mxhaard.free.fr/download.html
$ make && sudo make install
'owner'でこけるので、一部コメントアウト
# sudo yum install libtool-ltdl-devel [riken]
http://www.gphoto.org/proj/libgphoto2/
# tar zxvf libgphoto2-2.4.5.tar.gz && cd libgphoto2-2.4.5 && ./configure --prefix=/usr && make && sudo make install
# sudo yum install python-ctypes
http://www.freedesktop.org/wiki/Software/dbus#head-ed92e8f84ae0374ae3a2e3f714c2eb0037a84868
# ./configure --prefix=/usr && make && sudo make install
http://dbus.freedesktop.org/releases/dbus-glib/
# ./configure --prefix=/usr && make && sudo make install
http://dbus.freedesktop.org/releases/dbus-python/
# ./configure && make && sudo make install
/*
https://answers.launchpad.net/hplip/+question/35150
# install SIP.tar.gz
# install PyQT3
# sh hplip-3.9.2.run
// not finished
// we have to upgrade the Linux OS.
list
http://lists.debian.or.jp/debian-users/200706/msg00048.html
The BOLD style cannot be applied to the font.
http://inkscape.paix.jp/faq/troubleshoot.html#troubleshoot-14
you can use the following fonts.
http://ossipedia.ipa.go.jp/ipafont/
http://www.masuseki.com/index.php?u=be/konatu.htm
Use fonts that look bold.
$ sudo cp *.ttf /usr/share/fonts/japanese/TrueType
# yum install qt4 qt4-x11
# rpm -Uhv skype-2.0.0.72-fc5.i586.rpm
$ lame --decode a.mp3 a.wav