From 9e7bd54b1f252e95ae1d3b3f87f794a3a53a5cc4 Mon Sep 17 00:00:00 2001 From: Shihaam Abdul Rahman Date: Sat, 3 Aug 2024 01:50:43 +0500 Subject: [PATCH] added status, better date and time and some processing --- ocr.sh | 15 +++++++++------ 1 file changed, 9 insertions(+), 6 deletions(-) diff --git a/ocr.sh b/ocr.sh index 344b837..647f4b2 100755 --- a/ocr.sh +++ b/ocr.sh @@ -1,18 +1,20 @@ #!/bin/bash - INPUT_IMAGE=$1 -raw_text=$(tesseract $INPUT_IMAGE stdout) +raw_text=$(tesseract $INPUT_IMAGE stdout --psm 6) referece=$(echo "$raw_text" | grep -o 'BLAZ[0-9]*') to_number=$(echo "$raw_text" | grep -oE '\b9[0-9]{16}\b|\b7[0-9]{12}\b') -date=$(echo "$raw_text" | grep -oE '\b[0-3][0-9]/[0-1][0-9]/[0-9]{4}\b') -time=$(echo "$raw_text" | grep -oE '\b[0-2][0-9]:[0-5][0-9]\b') +#date=$(echo "$raw_text" | grep -oE '\b[0-3][0-9]/[0-1][0-9]/[0-9]{4}\b') +#time=$(echo "$raw_text" | grep -oE '\b[0-2][0-9]:[0-5][0-9]\b') +date=$(echo "$raw_text" | grep -oE '[0-3][0-9]/[0-1][0-9]/[0-9]{4}') +time=$(echo "$raw_text" | grep -oE '[0-2][0-9]:[0-5][0-9]') currency=$(echo "$raw_text" | grep -oP '(?<=Amount\s)[A-Z]{3}') amount=$(echo "$raw_text" | grep -oP '(?<=Amount\s[A-Z]{3}\s)[0-9]{1,3}(?:,[0-9]{3})*(?:\.[0-9]{2})') +status=$(echo "$raw_text" | grep -oP '(?<=Status\s)[A-Z]+') -json_output=$(cat <