Spaces:
Sleeping
Sleeping
maslionok
committed on
Commit
·
8d5fa5e
1
Parent(s):
abc6868
fix
Browse files
app.py
CHANGED
|
@@ -41,7 +41,7 @@ def process_ocr_qa(text, lang_choice):
|
|
| 41 |
if 'score' in result:
|
| 42 |
score = result['score']
|
| 43 |
score_emoji = "🟢" if score >= 0.8 else "🟡" if score >= 0.5 else "🔴"
|
| 44 |
-
output_lines.append(f"{score_emoji} **Quality Score:** {score:.
|
| 45 |
|
| 46 |
# Diagnostics section
|
| 47 |
if 'diagnostics' in result and result['diagnostics']:
|
|
@@ -54,13 +54,16 @@ def process_ocr_qa(text, lang_choice):
|
|
| 54 |
|
| 55 |
# Known tokens
|
| 56 |
if 'known_tokens' in diagnostics and diagnostics['known_tokens']:
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
|
|
|
|
|
|
| 60 |
|
| 61 |
# Unknown tokens (potential OCR errors)
|
| 62 |
if 'unknown_tokens' in diagnostics and diagnostics['unknown_tokens']:
|
| 63 |
-
|
|
|
|
| 64 |
elif 'unknown_tokens' in diagnostics:
|
| 65 |
output_lines.append(" ✨ No potential OCR errors detected!")
|
| 66 |
|
|
|
|
| 41 |
if 'score' in result:
|
| 42 |
score = result['score']
|
| 43 |
score_emoji = "🟢" if score >= 0.8 else "🟡" if score >= 0.5 else "🔴"
|
| 44 |
+
output_lines.append(f"{score_emoji} **Quality Score:** {score:.1f}")
|
| 45 |
|
| 46 |
# Diagnostics section
|
| 47 |
if 'diagnostics' in result and result['diagnostics']:
|
|
|
|
| 54 |
|
| 55 |
# Known tokens
|
| 56 |
if 'known_tokens' in diagnostics and diagnostics['known_tokens']:
|
| 57 |
+
known_tokens = diagnostics['known_tokens']
|
| 58 |
+
displayed_tokens = ', '.join(known_tokens[:10])
|
| 59 |
+
output_lines.append(f" ✅ Known tokens ({len(known_tokens)}): {displayed_tokens}")
|
| 60 |
+
if len(known_tokens) > 10:
|
| 61 |
+
output_lines.append(f" ... and {len(known_tokens) - 10} more")
|
| 62 |
|
| 63 |
# Unknown tokens (potential OCR errors)
|
| 64 |
if 'unknown_tokens' in diagnostics and diagnostics['unknown_tokens']:
|
| 65 |
+
unknown_tokens = diagnostics['unknown_tokens']
|
| 66 |
+
output_lines.append(f" ❌ Potential OCR errors ({len(unknown_tokens)}): {', '.join(unknown_tokens)}")
|
| 67 |
elif 'unknown_tokens' in diagnostics:
|
| 68 |
output_lines.append(" ✨ No potential OCR errors detected!")
|
| 69 |
|