X-Git-Url: https://git.ucc.asn.au/?p=dja%2Fscandal.git;a=blobdiff_plain;f=scan2pages.sh;h=5fbdab5ffdeba68b5684bdad7a60c59fb525574d;hp=3013efeeede6d21d3259c8a76d9e62ffbe17b94f;hb=d3130f66fba75ba0fefa6bf6a85c11f6c0c3a96b;hpb=9d7a737f447a6708ebea3cb0e1513b03b2edc82d diff --git a/scan2pages.sh b/scan2pages.sh index 3013efe..5fbdab5 100755 --- a/scan2pages.sh +++ b/scan2pages.sh @@ -223,8 +223,8 @@ for scanpgnum in `$my_seq 1 $pages`; do convert $convertflags $outdir/logpg-${scanpgnum}-${physpgnum}-?.pnm $outdir/logpg-${scanpgnum}-${physpgnum}-%01d.png || exit 1 #final convert and clean w/ bebook optimisation - if [[ $bebook ]]; then - convert $convertflags $outdir/logpg-${scanpgnum}-${physpgnum}-?.pnm -trim -fuzz 80% -resize 1200x1600 $outdir/final-${scanpgnum}-${physpgnum}-%01d.${extension} || exit 1 + if [[ $bebook ]]; then #1200x1600 + convert $convertflags $outdir/logpg-${scanpgnum}-${physpgnum}-?.pnm -trim $outdir/final-${scanpgnum}-${physpgnum}-%01d.${extension} || exit 1 else convert $convertflags $outdir/logpg-${scanpgnum}-${physpgnum}-?.pnm $outdir/final-${scanpgnum}-${physpgnum}-%01d.${extension} || exit 1 fi @@ -233,13 +233,13 @@ for scanpgnum in `$my_seq 1 $pages`; do done -#try full ocr -rm -rf $outdir/logpgs -ocropus book2pages $outdir/logpgs $outdir/logpg-*.png -ocropus pages2lines $outdir/logpgs -ocropus lines2fsts $outdir/logpgs -ocropus fsts2bestpaths $outdir/logpgs -ocropus buildhtml $outdir/logpgs > $outdir/out.html +#don't try full ocr, it's a waste of time. +#rm -rf $outdir/logpgs +#ocropus book2pages $outdir/logpgs $outdir/logpg-*.png +#ocropus pages2lines $outdir/logpgs +#ocropus lines2fsts $outdir/logpgs +#ocropus fsts2bestpaths $outdir/logpgs +#ocropus buildhtml $outdir/logpgs > $outdir/out.html mkdir -p $outdir/pages mv $outdir/final-*.${extension} $outdir/pages