maslionok committed on
Commit
8d5fa5e
·
1 Parent(s): abc6868
Files changed (1) hide show
  1. app.py +8 -5
app.py CHANGED
@@ -41,7 +41,7 @@ def process_ocr_qa(text, lang_choice):
41
  if 'score' in result:
42
  score = result['score']
43
  score_emoji = "🟢" if score >= 0.8 else "🟡" if score >= 0.5 else "🔴"
44
- output_lines.append(f"{score_emoji} **Quality Score:** {score:.2f}")
45
 
46
  # Diagnostics section
47
  if 'diagnostics' in result and result['diagnostics']:
@@ -54,13 +54,16 @@ def process_ocr_qa(text, lang_choice):
54
 
55
  # Known tokens
56
  if 'known_tokens' in diagnostics and diagnostics['known_tokens']:
57
- output_lines.append(f" ✅ Known tokens ({len(diagnostics['known_tokens'])}): {', '.join(diagnostics['known_tokens'][:10])}")
58
- if len(diagnostics['known_tokens']) > 10:
59
- output_lines.append(f" ... and {len(diagnostics['known_tokens']) - 10} more")
 
 
60
 
61
  # Unknown tokens (potential OCR errors)
62
  if 'unknown_tokens' in diagnostics and diagnostics['unknown_tokens']:
63
- output_lines.append(f" ❌ Potential OCR errors ({len(diagnostics['unknown_tokens'])}): {', '.join(diagnostics['unknown_tokens'])}")
 
64
  elif 'unknown_tokens' in diagnostics:
65
  output_lines.append(" ✨ No potential OCR errors detected!")
66
 
 
41
  if 'score' in result:
42
  score = result['score']
43
  score_emoji = "🟢" if score >= 0.8 else "🟡" if score >= 0.5 else "🔴"
44
+ output_lines.append(f"{score_emoji} **Quality Score:** {score:.1f}")
45
 
46
  # Diagnostics section
47
  if 'diagnostics' in result and result['diagnostics']:
 
54
 
55
  # Known tokens
56
  if 'known_tokens' in diagnostics and diagnostics['known_tokens']:
57
+ known_tokens = diagnostics['known_tokens']
58
+ displayed_tokens = ', '.join(known_tokens[:10])
59
+ output_lines.append(f" ✅ Known tokens ({len(known_tokens)}): {displayed_tokens}")
60
+ if len(known_tokens) > 10:
61
+ output_lines.append(f" ... and {len(known_tokens) - 10} more")
62
 
63
  # Unknown tokens (potential OCR errors)
64
  if 'unknown_tokens' in diagnostics and diagnostics['unknown_tokens']:
65
+ unknown_tokens = diagnostics['unknown_tokens']
66
+ output_lines.append(f" ❌ Potential OCR errors ({len(unknown_tokens)}): {', '.join(unknown_tokens)}")
67
  elif 'unknown_tokens' in diagnostics:
68
  output_lines.append(" ✨ No potential OCR errors detected!")
69