From 1527ef1b775132aa8f3b89b4728e6f59c1c983b5 Mon Sep 17 00:00:00 2001 From: Toke Eskildsen <te@ekot.dk> Date: Wed, 4 Dec 2013 13:22:37 +0100 Subject: [PATCH] Closes #19 (Add OCR quality statistics): The reported accuracy is shown on the image page --- image_template.html | 3 ++- quack.sh | 3 ++- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/image_template.html b/image_template.html index 61258e2..1f747aa 100644 --- a/image_template.html +++ b/image_template.html @@ -26,7 +26,8 @@ ${ALTERNATIVES} <p class="greystats"> ${GREY_FIRST}: ${GREY_PERCENT_FIRST}%<br/> ${GREY_LAST}: ${GREY_PERCENT_LAST}%<br/> -Unique greyscale values: ${GREY_UNIQUE} +Unique greyscale values: ${GREY_UNIQUE}<br/> +ALTO-accuracy: ${ACCURACY}% <p><input type="checkbox" id="toggle_grid" onClick="toggleGrid();">Grid</input></p> <p><input type="checkbox" id="toggle_textblock" checked="checked" onClick="toggleTextBlock();">TextBlocks</input></p> <p><input type="checkbox" id="toggle_blown" onClick="toggleBlown();">Black/white</input></p> diff --git a/quack.sh b/quack.sh index 198963d..77913c4 100755 --- a/quack.sh +++ b/quack.sh @@ -467,7 +467,7 @@ function blackWhite() { # Generates overlayscase # src dest altofile width height -# Output: ELEMENTS_HTML OVERLAYS OCR_CONTENT IDNEXT_CONTENT FULL_RELATIVE_HEIGHT +# Output: ELEMENTS_HTML OVERLAYS OCR_CONTENT IDNEXT_CONTENT FULL_RELATIVE_HEIGHT ACCURACY function processALTO() { local SRC="$1" local DEST="$2" @@ -499,6 +499,7 @@ function processALTO() { local PTAG=`echo "$ALTO_COMPACT" | grep -o "<Page[^>]\\+>"` local PHEIGHT=`echo $PTAG | sed 's/.*HEIGHT=\"\([^"]\+\)".*/\\1/g'` local PWIDTH=`echo $PTAG | sed 's/.*WIDTH=\"\([^"]\+\)".*/\\1/g'` + ACCURACY=`echo $PTAG | sed 's/.*ACCURACY=\"\([^"]\+\)".*/\\1/g'` FULL_RELATIVE_HEIGHT=`echo "scale=6;$PHEIGHT/$PWIDTH" | bc | sed 's/^\./0./'` # TODO: Ponder how relative positioning works and why this hack is necessary -- GitLab