From: Daniel Axtens
Date: Wed, 17 Aug 2011 04:18:23 +0000 (+0800)
Subject: Don't try full ocr, it's useless.
X-Git-Url: https://git.ucc.asn.au/?p=dja%2Fscandal.git;a=commitdiff_plain;h=d3130f66fba75ba0fefa6bf6a85c11f6c0c3a96b

Don't try full ocr, it's useless.
---

diff --git a/scan2pages.sh b/scan2pages.sh
index e878bfe..5fbdab5 100755
--- a/scan2pages.sh
+++ b/scan2pages.sh
@@ -233,13 +233,13 @@ for scanpgnum in `$my_seq 1 $pages`; do
 
 done
 
-#try full ocr
-rm -rf $outdir/logpgs
-ocropus book2pages $outdir/logpgs $outdir/logpg-*.png
-ocropus pages2lines $outdir/logpgs
-ocropus lines2fsts $outdir/logpgs
-ocropus fsts2bestpaths $outdir/logpgs
-ocropus buildhtml $outdir/logpgs > $outdir/out.html
+#don't try full ocr, it's a waste of time.
+#rm -rf $outdir/logpgs
+#ocropus book2pages $outdir/logpgs $outdir/logpg-*.png
+#ocropus pages2lines $outdir/logpgs
+#ocropus lines2fsts $outdir/logpgs
+#ocropus fsts2bestpaths $outdir/logpgs
+#ocropus buildhtml $outdir/logpgs > $outdir/out.html
 
 mkdir -p $outdir/pages
 mv $outdir/final-*.${extension} $outdir/pages