import os
import streamlit as st
import json
import sys
from pathlib import Path
import tempfile
from datetime import datetime
import io
import base64
from io import BytesIO
from enum import Enum
import inspect

# Add parent directory to path so we can import the OCR modules
parent_dir = Path(__file__).parent.absolute()
sys.path.append(str(parent_dir))

# Import the StructuredOCR class and process_file utility
from structured_ocr import StructuredOCR

# Add API endpoint support for the React app
from streamlit.web.server.server import Server
from streamlit.runtime.scriptrunner import get_script_run_ctx
# Custom JSON encoder to handle Enum types and other non-serializable objects
class EnhancedJSONEncoder(json.JSONEncoder):
    def default(self, obj):
        if isinstance(obj, Enum):
            return obj.value
        elif hasattr(obj, 'model_dump'):
            # For Pydantic models
            return obj.model_dump()
        elif hasattr(obj, 'to_dict'):
            # For objects with a to_dict method
            return obj.to_dict()
        elif hasattr(obj, '__dict__'):
            # Generic fallback for objects that have a __dict__ but aren't directly
            # serializable; checked last so it doesn't shadow the more specific
            # serializers above
            return {key: value for key, value in obj.__dict__.items()
                    if not key.startswith('_')}
        # Let the base class handle other types or raise TypeError
        return super().default(obj)
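
# Minimal illustrative use of the encoder (the Lang enum here is hypothetical,
# shown only to make the behavior concrete):
#   class Lang(Enum):
#       EN = "en"
#   json.dumps({"language": Lang.EN}, cls=EnhancedJSONEncoder)  # -> '{"language": "en"}'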
# Helper function to convert any result to JSON-serializable
def make_serializable(obj):
    """Convert any object to a JSON-serializable form"""
    if isinstance(obj, dict):
        return {k: make_serializable(v) for k, v in obj.items()}
    elif isinstance(obj, list):
        return [make_serializable(item) for item in obj]
    elif isinstance(obj, Enum):
        return obj.value
    elif hasattr(obj, 'pages'):
        # Special case for OCRResponse objects, which have a pages attribute
        if hasattr(obj, '__dict__'):
            result = {k: make_serializable(v) for k, v in obj.__dict__.items()
                      if not k.startswith('_')}
            # Explicitly handle the pages attribute
            result['pages'] = [make_serializable(page) for page in obj.pages]
            return result
    elif hasattr(obj, 'model_dump'):
        # For Pydantic models (checked before the generic __dict__ fallback,
        # which would otherwise shadow it)
        return make_serializable(obj.model_dump())
    elif hasattr(obj, 'to_dict'):
        # For objects with a to_dict method
        return make_serializable(obj.to_dict())
    elif hasattr(obj, '__dict__'):
        # Generic fallback for objects with a __dict__ attribute
        return {k: make_serializable(v) for k, v in obj.__dict__.items()
                if not k.startswith('_')}
    # Basic types will be returned as is
    return obj
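
# Illustrative round trip (values hypothetical, reusing the Lang enum from the
# note above): nested containers are walked recursively, so
#   make_serializable({"langs": [Lang.EN], "meta": {"n": 1}})
# yields plain JSON-ready data: {"langs": ["en"], "meta": {"n": 1}}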
# API response handler
def process_api_request():
    """Handle API requests from the React frontend"""
    # Get the current Streamlit session
    ctx = get_script_run_ctx()
    if ctx is None:
        return

    session_id = ctx.session_id
    session_info = Server.get_current()._get_session_info(session_id)
    if session_info is None:
        return

    request = session_info.uploaded_file_mgr._uploaded_files.get('file')
    if not request:
        return

    # Extract file and parameters
    uploaded_file = request[0]
    use_vision = session_info.query_string.get('use_vision', ['true'])[0].lower() == 'true'

    try:
        # Process file
        result = process_file(uploaded_file, use_vision=use_vision)
        # Convert result to JSON-serializable format
        serializable_result = make_serializable(result)
        # Return JSON response
        return serializable_result
    except Exception as e:
        # Return error response
        return {"error": str(e)}
try:
    from process_file import process_file as process_file_util
    # Use the utility function instead of the local function
    process_file = process_file_util
except ImportError:
    # Define the process_file function if it's not available
    def process_file(uploaded_file, use_vision=True, custom_prompt=None):
        """Process the uploaded file and return the OCR results"""
        # Save the uploaded file to a temporary file
        with tempfile.NamedTemporaryFile(delete=False, suffix=Path(uploaded_file.name).suffix) as tmp:
            tmp.write(uploaded_file.getvalue())
            temp_path = tmp.name

        try:
            # Initialize OCR processor
            processor = StructuredOCR()

            # Determine file type from extension
            file_ext = Path(uploaded_file.name).suffix.lower()
            file_type = "pdf" if file_ext == ".pdf" else "image"

            # Process the file. The experiment page passes a custom_prompt
            # keyword, so this fallback accepts it too; it is only forwarded
            # when the installed StructuredOCR.process_file supports it.
            kwargs = {"file_type": file_type, "use_vision": use_vision}
            if custom_prompt and "custom_prompt" in inspect.signature(processor.process_file).parameters:
                kwargs["custom_prompt"] = custom_prompt
            result = processor.process_file(temp_path, **kwargs)

            # Add to processing history
            history_item = {
                "id": datetime.now().timestamp(),
                "fileName": uploaded_file.name,
                "timestamp": datetime.now().isoformat(),
                "result": result,
                "useVision": use_vision
            }
            if 'processing_history' not in st.session_state:
                st.session_state.processing_history = []
            st.session_state.processing_history.append(history_item)

            return result
        except Exception as e:
            st.error(f"Error processing document: {str(e)}")
            return None
        finally:
            # Clean up the temporary file
            if os.path.exists(temp_path):
                os.unlink(temp_path)
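
# Sketch of the expected call shape (assuming an UploadedFile-like object
# exposing .name and .getvalue(), as Streamlit's uploader provides):
#   result = process_file(uploaded_file, use_vision=True)
#   if result:
#       topics = result.get('topics', [])  # result is treated as a dict elsewhere in this app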

# Set page configuration
st.set_page_config(
    page_title="Historical OCR Workshop",
    page_icon="📜",
    layout="wide",
    initial_sidebar_state="collapsed"  # Start with sidebar collapsed for cleaner landing
)
# Custom CSS to match React dark theme and improve Streamlit integration
st.markdown("""
<style>
    /* Global theme alignment with React */
    .stApp {
        background-color: #111827; /* bg-gray-900 in Tailwind */
        color: white;
        position: relative;
    }

    /* Add subtle grid background to the entire app */
    .stApp::before {
        content: "";
        position: fixed;
        top: 0;
        left: 0;
        right: 0;
        bottom: 0;
        background-image:
            linear-gradient(rgba(55, 65, 81, 0.1) 1px, transparent 1px),
            linear-gradient(90deg, rgba(55, 65, 81, 0.1) 1px, transparent 1px);
        background-size: 25px 25px;
        opacity: 0.3;
        z-index: 0;
        pointer-events: none;
    }

    /* Make sure all text is visible */
    p, h1, h2, h3, h4, h5, h6, div, span, li, label, a {
        color: white !important;
        position: relative;
    }

    /* Add spacier typography */
    p, li {
        line-height: 1.7;
        margin-bottom: 0.8rem;
    }

    h3 {
        margin-top: 1.5rem;
        margin-bottom: 1.2rem;
        font-weight: 600;
        letter-spacing: 0.015em;
    }

    /* Fix empty-looking containers */
    div:empty {
        min-height: 0 !important;
        padding: 0 !important;
        margin: 0 !important;
    }

    /* Custom header */
    .main-header {
        background-color: #000000;
        padding: 1rem;
        border-bottom: 1px solid #374151; /* border-gray-700 */
        margin-bottom: 1.5rem;
    }

    /* Content containers */
    .content-container {
        background-color: #1f2937; /* bg-gray-800 in Tailwind */
        color: white;
        padding: 1.8rem;
        border-radius: 0.75rem;
        margin-bottom: 2rem;
        box-shadow: 0 6px 12px rgba(0,0,0,0.2);
        border: 1px solid rgba(75, 85, 99, 0.3);
        position: relative;
        overflow: hidden;
    }

    .content-container::before {
        content: "";
        position: absolute;
        top: 0;
        left: 0;
        right: 0;
        bottom: 0;
        background-image: linear-gradient(rgba(55, 65, 81, 0.2) 1px, transparent 1px),
                          linear-gradient(90deg, rgba(55, 65, 81, 0.2) 1px, transparent 1px);
        background-size: 20px 20px;
        opacity: 0.05;
        z-index: 0;
    }

    .content-container > * {
        position: relative;
        z-index: 1;
        color: white !important;
    }

    .content-container h4 {
        color: #60A5FA !important;
        margin-bottom: 1rem;
        font-size: 1.2rem;
        letter-spacing: 0.02em;
    }

    .content-container ul, .content-container ol {
        padding-left: 1.5rem;
        margin-top: 0.8rem;
        margin-bottom: 0.8rem;
    }

    .content-container li {
        margin-bottom: 0.5rem;
        line-height: 1.5;
    }

    /* Interactive elements */
    .tool-container {
        background-color: #1f2937; /* bg-gray-800 */
        color: white;
        padding: 1.5rem;
        border-radius: 0.5rem;
        border: 1px solid #374151; /* border-gray-700 */
        margin-bottom: 1.5rem;
    }

    .tool-container * {
        color: white !important;
    }

    /* Special containers */
    .key-concept {
        background-color: #374151; /* bg-gray-700 */
        padding: 0.75rem;
        border-radius: 0.5rem;
        margin: 1rem 0;
        border-left: 3px solid #3B82F6; /* border-blue-500 */
        color: white;
    }

    .key-concept * {
        color: white !important;
    }

    .research-question {
        background-color: #1E3A8A; /* bg-blue-900 */
        padding: 0.75rem;
        border-radius: 0.5rem;
        margin: 1rem 0;
        border-left: 3px solid #60A5FA; /* border-blue-400 */
        color: white;
    }

    .research-question * {
        color: white !important;
    }

    .quote-container {
        font-style: italic;
        color: #D1D5DB; /* text-gray-300 */
        padding: 0.5rem 1rem;
        border-left: 3px solid #4B5563; /* border-gray-600 */
        margin: 1rem 0;
    }

    /* Hero section */
    .hero-container {
        background: linear-gradient(135deg, #1E3A8A 0%, #2563EB 100%); /* blue-900 to blue-600 */
        color: white;
        padding: 3rem 2rem;
        border-radius: 0.75rem;
        margin-bottom: 3rem;
        box-shadow: 0 8px 16px rgba(0,0,0,0.4);
        text-align: center;
        position: relative;
        overflow: hidden;
    }

    .hero-container::before {
        content: "";
        position: absolute;
        top: 0;
        left: 0;
        right: 0;
        bottom: 0;
        background-image:
            linear-gradient(rgba(30, 58, 138, 0.8) 1px, transparent 1px),
            linear-gradient(90deg, rgba(30, 58, 138, 0.8) 1px, transparent 1px);
        background-size: 20px 20px;
        opacity: 0.2;
        z-index: 0;
    }

    .hero-title {
        font-size: 2.5rem;
        font-weight: 700;
        margin-bottom: 1rem;
        position: relative;
        z-index: 1;
    }

    .hero-subtitle {
        font-size: 1.25rem;
        opacity: 0.9;
        max-width: 700px;
        margin: 0 auto;
        position: relative;
        z-index: 1;
    }

    /* File upload styling */
    .upload-container {
        border: 2px dashed #4B5563; /* border-gray-600 */
        padding: 1.5rem;
        text-align: center;
        border-radius: 0.5rem;
        margin-bottom: 1rem;
        background-color: #374151; /* bg-gray-700 */
        color: white;
    }

    /* History cards */
    .history-card {
        padding: 0.75rem;
        background-color: #374151; /* bg-gray-700 */
        color: white;
        border-radius: 0.25rem;
        border: 1px solid #4B5563; /* border-gray-600 */
        margin-bottom: 0.5rem;
    }

    /* Override Streamlit defaults */
    .stTextInput > div > div > input {
        background-color: #374151; /* bg-gray-700 */
        color: white !important;
    }

    .stSelectbox > div > div > div {
        background-color: #374151; /* bg-gray-700 */
        color: white !important;
    }

    .stCheckbox > div > label {
        color: white !important;
    }

    /* Fix empty containers */
    .tool-container:empty {
        display: none;
    }

    /* Ensure all text is visible */
    div, span, p, h1, h2, h3, h4, h5, h6, label, li {
        color: white !important;
    }

    /* Tab panel content */
    .stTabs [data-baseweb="tab-panel"] * {
        color: white !important;
    }

    /* Button styling */
    .stButton > button {
        background-color: #2563EB; /* bg-blue-600 */
        color: white;
    }

    .stButton > button:hover {
        background-color: #1D4ED8; /* bg-blue-700 */
    }

    /* Make sure all text is readable */
    p, h1, h2, h3, h4, h5, h6, span, label {
        color: white;
    }

    .stMarkdown a {
        color: #93C5FD; /* text-blue-300 */
    }

    /* Tabs */
    .stTabs [data-baseweb="tab"] {
        color: white;
    }

    .stTabs [data-baseweb="tab-highlight"] {
        background-color: #2563EB; /* bg-blue-600 */
    }

    /* Expander */
    .streamlit-expanderHeader {
        color: white;
        background-color: #1f2937; /* bg-gray-800 */
    }

    /* Sidebar */
    [data-testid="stSidebar"] {
        background-color: #111827; /* bg-gray-900 */
    }

    [data-testid="stSidebar"] .stMarkdown {
        color: white;
    }
</style>
""", unsafe_allow_html=True)
# Initialize session state for workshop progress
if 'current_module' not in st.session_state:
    st.session_state.current_module = 1
if 'processing_history' not in st.session_state:
    st.session_state.processing_history = []
if 'workshop_started' not in st.session_state:
    st.session_state.workshop_started = False


def navigate_to_module(module_number):
    """Navigate to a specific module"""
    st.session_state.current_module = module_number
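
# The navigation callbacks only mutate session state; the page itself is
# redrawn either by Streamlit's automatic rerun after an on_click callback
# or by the explicit st.rerun() calls used alongside direct button checks.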

# Welcome/Start screen if workshop hasn't been started
if not st.session_state.workshop_started:
    # Hero section with eye-catching design
    st.markdown("""
    <div class="hero-container">
        <h1 class="hero-title">Historical OCR Workshop</h1>
        <p class="hero-subtitle">Unlock the potential of historical documents with modern OCR technology</p>
    </div>
    """, unsafe_allow_html=True)

    # Introduction with cleaner layout
    col1, col2 = st.columns([3, 2])

    with col1:
        st.markdown("""
        <div class="content-container">
            <h3>Workshop Overview</h3>
            This interactive workshop explores the application of OCR technology to historical documents,
            combining theoretical understanding with practical experience. Designed for historians,
            archivists, and digital humanities scholars, it offers both conceptual frameworks and hands-on skills.
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="key-concept">
            <h4>What is OCR?</h4>
            Optical Character Recognition (OCR) technology enables computers to extract text from images and documents.
            Modern OCR uses AI vision models to understand both the text and its visual context, making it powerful for
            historical research and digital humanities.
        </div>
        """, unsafe_allow_html=True)

    with col2:
        # Add an engaging research question to connect with historians
        st.markdown("""
        <div class="research-question">
            <h4>For Historians:</h4>
            How might OCR technology transform our access to and interpretation of historical documents?
            What new research questions become possible when large archives become machine-readable?
        </div>
        """, unsafe_allow_html=True)

        # Display sample historical document images in a better format
        input_dir = Path(__file__).parent / "input"
        sample_images = [
            {"path": input_dir / "letter-1.jpg", "caption": "Historical Letter"},
            {"path": input_dir / "recipe.jpg", "caption": "Historical Recipe"}
        ]

        # Try to find any of the sample images
        for sample in sample_images:
            if sample["path"].exists():
                try:
                    from PIL import Image
                    with Image.open(sample["path"]) as img:
                        # Add a better styled border and shadow
                        st.markdown("""
                        <div style="
                            border: 1px solid rgba(75, 85, 99, 0.6);
                            padding: 12px;
                            border-radius: 8px;
                            margin-bottom: 1rem;
                            box-shadow: 0 6px 15px rgba(0,0,0,0.3);
                            background-color: #1f2937;
                            position: relative;
                        ">
                        """, unsafe_allow_html=True)
                        st.image(img, caption=sample["caption"], width=280)
                        st.markdown("""
                        <p style="
                            font-size: 0.85rem;
                            opacity: 0.8;
                            margin-top: 8px;
                            font-style: italic;
                            text-align: center;
                        ">Sample document for OCR analysis</p>
                        </div>
                        """, unsafe_allow_html=True)
                    break  # Only show one image
                except Exception:
                    pass

    # What you'll learn section combined with Workshop Modules in parallel columns
    col1, col2 = st.columns(2)

    with col1:
        st.markdown('<h3 class="workshop-heading" style="margin-bottom:1.5rem; padding-bottom:0.5rem; border-bottom:1px solid rgba(75, 85, 99, 0.5);">What You\'ll Learn</h3>', unsafe_allow_html=True)

        st.markdown("""
        <div class="content-container">
            <h4><i class="fas fa-book-open"></i> Conceptual Understanding</h4>
            - Text-image relationships in historical documents
            - Evolution of OCR technology
            - AI vision models for document analysis
            - Historical typography challenges
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="content-container">
            <h4><i class="fas fa-microscope"></i> Methodological Approaches</h4>
            - Critical frameworks for OCR in historical research
            - Hybrid computational-traditional methods
            - Error analysis and interpretation
            - Contextual reading strategies
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="content-container">
            <h4><i class="fas fa-tools"></i> Practical Skills</h4>
            - Processing historical documents with OCR
            - Analyzing and structuring extracted information
            - Integrating OCR into research workflows
            - Building searchable archives
        </div>
        """, unsafe_allow_html=True)

    with col2:
        # Workshop modules with visually appealing cards
        st.markdown('<h3 class="workshop-heading" style="margin-bottom:1.5rem; padding-bottom:0.5rem; border-bottom:1px solid rgba(75, 85, 99, 0.5);">Workshop Modules</h3>', unsafe_allow_html=True)

        # Add some styling for the module cards
        st.markdown("""
        <style>
            .module-card {
                background-color: #1f2937; /* bg-gray-800 */
                border-radius: 10px;
                box-shadow: 0 4px 8px rgba(0,0,0,0.2);
                padding: 1.5rem;
                margin-bottom: 1.5rem;
                transition: all 0.3s ease;
                border-left: 4px solid #3B82F6; /* border-blue-500 */
                color: white;
                position: relative;
                overflow: hidden;
            }

            .module-card::before {
                content: "";
                position: absolute;
                top: 0;
                left: 0;
                right: 0;
                bottom: 0;
                background-image: linear-gradient(rgba(55, 65, 81, 0.2) 1px, transparent 1px),
                                  linear-gradient(90deg, rgba(55, 65, 81, 0.2) 1px, transparent 1px);
                background-size: 16px 16px;
                opacity: 0.05;
                z-index: 0;
            }

            .module-card > * {
                position: relative;
                z-index: 1;
            }

            .module-card:hover {
                transform: translateY(-5px);
                box-shadow: 0 10px 20px rgba(0,0,0,0.25);
                border-left-color: #60A5FA;
            }

            .module-number {
                background-color: #3B82F6; /* bg-blue-500 */
                color: white;
                font-weight: bold;
                padding: 0.4rem 0.8rem;
                border-radius: 20px;
                font-size: 0.9rem;
                display: inline-block;
                margin-bottom: 12px;
                box-shadow: 0 2px 4px rgba(0,0,0,0.2);
            }

            .module-title {
                font-weight: 600;
                margin-bottom: 1rem;
                font-size: 1.25rem;
                color: white;
                letter-spacing: 0.015em;
            }

            .module-card p {
                line-height: 1.6;
                opacity: 0.9;
                font-size: 0.95rem;
            }
        </style>
        """, unsafe_allow_html=True)

    # Modules inside the col2 from earlier
    with col2:
        st.markdown("""
        <div class="module-card">
            <div class="module-number">Module 1</div>
            <div class="module-title">Introduction and Problematization</div>
            <p>Explore the challenges of historical document digitization and the potential of OCR technologies
            to transform historical research. Examine key problems and opportunities in historical OCR.</p>
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="module-card">
            <div class="module-number">Module 2</div>
            <div class="module-title">Text-Image Relations in Historical Archives</div>
            <p>Analyze the complex relationships between text and images in historical documents,
            from typography and layout to marginalia and decorative elements.</p>
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="module-card">
            <div class="module-number">Module 3</div>
            <div class="module-title">OCR Technology and Historical Documents</div>
            <p>Understand the evolution of OCR technology from pattern matching to modern AI vision-language models,
            and how they address the unique challenges of historical documents.</p>
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="module-card">
            <div class="module-number">Module 4</div>
            <div class="module-title">Methodological Approaches</div>
            <p>Develop hybrid methodologies that combine computational processing with traditional
            historical research practices, balancing distant and close reading.</p>
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="module-card">
            <div class="module-number">Module 5</div>
            <div class="module-title">Interactive OCR Experiment</div>
            <p>Gain hands-on experience processing historical documents with OCR technology,
            analyzing results, and comparing different approaches.</p>
        </div>
        """, unsafe_allow_html=True)

        st.markdown("""
        <div class="module-card">
            <div class="module-number">Module 6</div>
            <div class="module-title">Conclusion and Future Directions</div>
            <p>Synthesize workshop insights and explore future directions for OCR in historical research,
            from large-scale corpus analysis to computational paleography.</p>
        </div>
        """, unsafe_allow_html=True)

    # Engaging quote to inspire participation with citation - in a better styled container
    st.markdown("""
    <div style="
        background: linear-gradient(to right, rgba(30, 58, 138, 0.3), rgba(37, 99, 235, 0.1));
        border-left: 4px solid #3B82F6;
        padding: 1.5rem 2rem;
        border-radius: 8px;
        margin: 2.5rem 0;
        position: relative;
        font-style: italic;
        box-shadow: 0 4px 12px rgba(0,0,0,0.2);
    ">
        <div style="
            position: absolute;
            left: 20px;
            top: -18px;
            font-size: 2rem;
            color: #60A5FA;
            opacity: 0.7;
        ">"</div>
        <p style="
            font-size: 1.15rem;
            line-height: 1.7;
            max-width: 800px;
            margin: 0 auto;
            text-align: center;
            color: #E5E7EB !important;
        ">The digital turn in historical research is not just about converting analog to digital;
        it's about transforming how we access, analyze, and interpret the past.</p>
        <div style="
            text-align: right;
            margin-top: 1rem;
            color: #9CA3AF !important;
            opacity: 0.9;
            font-size: 0.9rem;
        ">— Dr. Jane Winters, Professor of Digital Humanities</div>
    </div>
    """, unsafe_allow_html=True)

    # Feature highlight before call to action with better styling
    st.markdown("""
    <div style="
        background: linear-gradient(135deg, #1E3A8A 0%, #1E40AF 100%);
        border-radius: 12px;
        padding: 2rem;
        margin: 3rem 0;
        border-top: 5px solid #3B82F6;
        color: white;
        box-shadow: 0 8px 20px rgba(0,0,0,0.3);
        position: relative;
        overflow: hidden;
    ">
        <div style="
            position: absolute;
            top: 0;
            right: 0;
            bottom: 0;
            left: 0;
            background-image:
                linear-gradient(rgba(30, 58, 138, 0.2) 1px, transparent 1px),
                linear-gradient(90deg, rgba(30, 58, 138, 0.2) 1px, transparent 1px);
            background-size: 20px 20px;
            opacity: 0.1;
        "></div>
        <h3 style="
            margin-top: 0;
            color: white !important;
            font-size: 1.5rem;
            margin-bottom: 1.5rem;
            position: relative;
            z-index: 1;
        ">Workshop Highlights</h3>
        <div style="
            display: grid;
            grid-template-columns: 1fr 1fr;
            gap: 1.5rem;
            position: relative;
            z-index: 1;
        ">
            <div style="
                background-color: rgba(30, 64, 175, 0.5);
                padding: 1rem;
                border-radius: 8px;
                border-left: 3px solid #60A5FA;
            ">
                <h4 style="
                    margin-top: 0;
                    color: #93C5FD !important;
                    font-size: 1.1rem;
                ">Interactive Learning</h4>
                <p style="
                    margin-bottom: 0;
                    opacity: 0.9;
                    font-size: 0.95rem;
                ">Hands-on document processing with real-time feedback and analysis</p>
            </div>
            <div style="
                background-color: rgba(30, 64, 175, 0.5);
                padding: 1rem;
                border-radius: 8px;
                border-left: 3px solid #60A5FA;
            ">
                <h4 style="
                    margin-top: 0;
                    color: #93C5FD !important;
                    font-size: 1.1rem;
                ">Real Historical Documents</h4>
                <p style="
                    margin-bottom: 0;
                    opacity: 0.9;
                    font-size: 0.95rem;
                ">Work with authentic materials spanning different eras and formats</p>
            </div>
            <div style="
                background-color: rgba(30, 64, 175, 0.5);
                padding: 1rem;
                border-radius: 8px;
                border-left: 3px solid #60A5FA;
            ">
                <h4 style="
                    margin-top: 0;
                    color: #93C5FD !important;
                    font-size: 1.1rem;
                ">Vision AI Models</h4>
                <p style="
                    margin-bottom: 0;
                    opacity: 0.9;
                    font-size: 0.95rem;
                ">Experience state-of-the-art OCR technology powered by advanced AI</p>
            </div>
            <div style="
                background-color: rgba(30, 64, 175, 0.5);
                padding: 1rem;
                border-radius: 8px;
                border-left: 3px solid #60A5FA;
            ">
                <h4 style="
                    margin-top: 0;
                    color: #93C5FD !important;
                    font-size: 1.1rem;
                ">Research Applications</h4>
                <p style="
                    margin-bottom: 0;
                    opacity: 0.9;
                    font-size: 0.95rem;
                ">Learn to integrate OCR into historical research workflows</p>
            </div>
        </div>
    </div>
    """, unsafe_allow_html=True)

    # Enhanced start button with dynamic styling and clear call to action
    st.markdown("""
    <div style="
        text-align: center;
        margin: 3.5rem 0;
        padding: 2rem;
        background: linear-gradient(180deg, rgba(31, 41, 55, 0.6) 0%, rgba(17, 24, 39, 0.8) 100%);
        border-radius: 12px;
        border: 1px solid rgba(75, 85, 99, 0.3);
        box-shadow: 0 10px 25px rgba(0,0,0,0.2);
    ">
        <h3 style="
            margin-bottom: 1.5rem;
            font-size: 1.5rem;
            color: white !important;
        ">Ready to Start Your Journey?</h3>
        <button id="start-button" style="
            background: linear-gradient(90deg, #2563EB 0%, #1D4ED8 100%);
            color: white;
            border: none;
            padding: 0.8rem 2rem;
            font-size: 1.1rem;
            font-weight: 500;
            border-radius: 8px;
            cursor: pointer;
            transition: all 0.3s ease;
            box-shadow: 0 4px 12px rgba(37, 99, 235, 0.3);
            margin-bottom: 1rem;
            width: 280px;
        " onclick="document.getElementById('streamlit-button').click()">Begin Workshop Journey</button>
        <p style="
            text-align: center;
            margin-top: 1rem;
            font-size: 0.95rem;
            color: #9CA3AF !important;
        ">No installation required • Start immediately • Interactive experience</p>
    </div>
    <script>
        // Animation for the button
        document.getElementById('start-button').addEventListener('mouseover', function() {
            this.style.transform = 'translateY(-3px)';
            this.style.boxShadow = '0 6px 15px rgba(37, 99, 235, 0.4)';
        });
        document.getElementById('start-button').addEventListener('mouseout', function() {
            this.style.transform = 'translateY(0)';
            this.style.boxShadow = '0 4px 12px rgba(37, 99, 235, 0.3)';
        });
    </script>
    """, unsafe_allow_html=True)

    # Hidden button to trigger the workshop start
    col1, col2, col3 = st.columns([1, 1, 1])
    with col2:
        if st.button("Begin Workshop", key="streamlit-button", use_container_width=True, type="primary"):
            st.session_state.workshop_started = True
            st.rerun()
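
    # Note: st.markdown sanitizes <script> tags and widget keys are not DOM
    # ids, so the decorative HTML button above cannot actually trigger the
    # Streamlit button; the visible "Begin Workshop" button is what drives
    # the state change. The same caveat applies to the onclick handlers on
    # the sidebar navigation cards further down.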

# Display workshop navigation sidebar only if workshop has started
elif st.session_state.workshop_started:
    # Define input directory for images
    input_dir = Path(__file__).parent / "input"

    # Enhanced sidebar navigation
    with st.sidebar:
        st.markdown("<h1 style='margin-bottom:15px;'>Workshop Navigation</h1>", unsafe_allow_html=True)

        # Improved visual header with logo/image
        st.markdown("<div style='display:flex; align-items:center; margin-bottom:20px;'>", unsafe_allow_html=True)
        # Add a visual element with better sizing/styling
        workflow_path = input_dir / "workflow.jpg"
        if workflow_path.exists():
            try:
                from PIL import Image
                with Image.open(workflow_path) as img:
                    st.image(img, width=160, output_format="PNG")
            except Exception:
                pass
        st.markdown("</div>", unsafe_allow_html=True)

        # Show enhanced progress indicator
        current_module = st.session_state.current_module
        st.markdown(f"<div style='margin-bottom:15px;'><b>Your Progress:</b> Module {current_module} of 6</div>", unsafe_allow_html=True)
        st.progress(current_module / 6)

        # More visually appealing module navigation
        modules = [
            "Introduction",
            "Text-Image Relations",
            "OCR Technology",
            "Methodological Approaches",
            "Interactive OCR Experiment",
            "Conclusion"
        ]

        # Custom styling for navigation buttons
        st.markdown("""
        <style>
            .nav-button {
                padding: 8px 12px;
                margin-bottom: 8px;
                border-radius: 6px;
                background-color: #f5f5f5;
                display: block;
                text-decoration: none;
                color: #333;
                font-weight: 500;
                border-left: 3px solid transparent;
                transition: all 0.2s;
            }
            .nav-button:hover {
                background-color: #e6e6e6;
            }
            .nav-button.active {
                background-color: #e8f0fe;
                border-left: 3px solid #0d3c84;
                font-weight: 600;
            }
            .nav-section {
                margin: 20px 0 10px 0;
                font-weight: 600;
                color: #555;
            }
        </style>
        """, unsafe_allow_html=True)

        # Group into clearer sections
        st.markdown("<div class='nav-section'>Theory & Concepts</div>", unsafe_allow_html=True)
        for i in range(1, 4):  # Modules 1-3
            active_class = "active" if i == current_module else ""
            st.markdown(f"""
            <div class="nav-button {active_class}" onclick="document.getElementById('nav_{i}').click()">
                <span style="display:inline-block; width:22px; text-align:center; margin-right:8px;
                      background-color:{'#0d3c84' if i == current_module else '#ddd'}; color:{'white' if i == current_module else '#555'};
                      border-radius:11px; font-size:0.8rem; font-weight:bold;">{i}</span>
                {modules[i-1]}
            </div>
            """, unsafe_allow_html=True)
            # Hidden button to handle the click
            if st.button(f"{i}", key=f"nav_{i}"):
                navigate_to_module(i)
                st.rerun()

        st.markdown("<div class='nav-section'>Application & Practice</div>", unsafe_allow_html=True)
        for i in range(4, 7):  # Modules 4-6
            active_class = "active" if i == current_module else ""
            st.markdown(f"""
            <div class="nav-button {active_class}" onclick="document.getElementById('nav_{i}').click()">
                <span style="display:inline-block; width:22px; text-align:center; margin-right:8px;
                      background-color:{'#0d3c84' if i == current_module else '#ddd'}; color:{'white' if i == current_module else '#555'};
                      border-radius:11px; font-size:0.8rem; font-weight:bold;">{i}</span>
                {modules[i-1]}
            </div>
            """, unsafe_allow_html=True)
            # Hidden button to handle the click
            if st.button(f"{i}", key=f"nav_{i}"):
                navigate_to_module(i)
                st.rerun()

        st.markdown("---")

        # Enhanced quick jump button
        st.markdown("""
        <style>
            .jump-button {
                background-color: #f0f7ff;
                padding: 10px;
                border-radius: 6px;
                border-left: 3px solid #0d3c84;
                margin-bottom: 15px;
                cursor: pointer;
            }
            .jump-button:hover {
                background-color: #e3f0ff;
            }
        </style>
        """, unsafe_allow_html=True)
        st.markdown("""
        <div class="jump-button" onclick="document.getElementById('jump_exp').click()">
            <span style="font-weight:500;">📊 Jump to OCR Experiment</span>
        </div>
        """, unsafe_allow_html=True)
        # Hidden button for jump
        if st.button("Jump to Experiment", key="jump_exp"):
            navigate_to_module(5)
            st.rerun()

        # Workshop information in a cleaner collapsible section
        with st.expander("About the Workshop"):
            st.markdown("""
            This interactive workshop explores OCR technology for historical documents.

            **How to use this workshop:**
            1. Navigate through modules sequentially
            2. Expand content sections to read more
            3. Try the interactive OCR experiment
            4. Reflect on research questions

            For help or more information, use the reference materials in Module 6.
            """)

        # Enhanced progress tracking
        if st.session_state.processing_history:
            with st.expander("Your Activity"):
                st.markdown(f"<b>Documents processed:</b> {len(st.session_state.processing_history)}", unsafe_allow_html=True)

                # Show the most recent document processed with better formatting
                latest = st.session_state.processing_history[-1]
                st.markdown(f"""
                <div style="background:#f9f9f9; padding:8px; border-radius:4px; margin-top:10px;">
                    <b>Latest document:</b> {latest['fileName']}<br>
                    <span style="font-size:0.9rem; color:#666;">Processed with {'vision model' if latest['useVision'] else 'basic OCR'}</span>
                </div>
                """, unsafe_allow_html=True)

    # Main content based on current module
    if st.session_state.current_module == 1:
        # MODULE 1: Introduction
        st.title("Module 1: Introduction and Problematization")

        col1, col2 = st.columns([2, 1])

        with col1:
            st.markdown("""
            ## Historical OCR Workshop

            ### The Problem

            Historical documents present unique challenges for OCR technology:

            - Varying typography and handwriting styles
            - Document degradation and damage
            - Complex layouts and formatting
            - Multiple languages and archaic terminology
            - Illustrations and decorative elements
            """)

        with col2:
            st.markdown("""
            ### Workshop Goals

            By the end of this workshop, you will:

            1. Understand text-image relationships in historical archives
            2. Learn about advanced OCR technology
            3. Explore methodological approaches
            4. Gain hands-on experience with OCR tools
            5. Develop research integration strategies
            """)

        # Next button
        st.button("Next: Text-Image Relations", key="next_to_2", on_click=navigate_to_module, args=(2,))

    elif st.session_state.current_module == 2:
        # MODULE 2: Text-Image Relations
        st.title("Module 2: Text-Image Relations in Historical Archives")

        col1, col2 = st.columns([1, 1])

        with col1:
            st.markdown("""
            ### Textual Elements

            - **Typography**: Varying fonts, sizes, and styles
            - **Layout**: Columns, margins, and spacing
            - **Marginalia**: Notes, comments, and additions
            - **Decorative Text**: Illuminated letters and calligraphy
            """)

            st.markdown("""
            ### Visual Elements

            - **Illustrations**: Diagrams, maps, and artistic representations
            - **Watermarks**: Hidden identifiers that help date and locate documents
            - **Damage**: Tears, stains, and fading affecting legibility
            - **Material Features**: Paper quality and physical dimensions
            """)

        with col2:
            st.markdown("""
            ### Interdependence

            The relationship between text and image in historical documents exists on a complex spectrum:

            - Text functions as image (decorative headings)
            - Images function as text (symbolic representations)
            - Layout creates meaning through visual organization
            - Material conditions affect both textual and visual elements
            """)

            st.image("https://upload.wikimedia.org/wikipedia/commons/thumb/0/0c/Book_of_Kells_folio_292r.jpg/800px-Book_of_Kells_folio_292r.jpg",
                     caption="Book of Kells - Example of text-image integration")

        st.markdown("""
        ### OCR Challenges

        These complex text-image relationships create particular challenges for OCR:

        1. **Distinguishing Text from Decoration**: Where does ornamental text end and functional text begin?
        2. **Handling Illustrations**: Should they be processed as images or described as text?
        3. **Interpreting Layout**: How to capture the significance of spacing and organization?
        4. **Preserving Context**: Maintaining the relationship between textual and visual elements
        """)

        # Navigation buttons
        col1, col2 = st.columns(2)
        with col1:
            st.button("Previous: Introduction", key="prev_to_1", on_click=navigate_to_module, args=(1,))
        with col2:
            st.button("Next: OCR Technology", key="next_to_3", on_click=navigate_to_module, args=(3,))

    elif st.session_state.current_module == 3:
        # MODULE 3: OCR Technology
        st.title("Module 3: OCR Technology and Historical Documents")

        col1, col2 = st.columns([1, 1])

        with col1:
            st.markdown("""
            ### Traditional OCR Approaches

            1. **Pattern Matching**: Early OCR compared characters to templates
            2. **Feature Extraction**: Identifying key features of characters
            3. **Statistical Models**: Using probabilities to improve recognition
            """)

            st.markdown("""
            ### Modern AI-Enhanced OCR

            1. **Neural Networks**: Deep learning models trained on vast datasets
            2. **Computer Vision**: Advanced image processing techniques
            3. **Language Models**: Contextual understanding to resolve ambiguities
            4. **Multimodal Models**: Integration of text, layout, and visual understanding
            """)

        with col2:
            st.markdown("""
            ### Challenges with Historical Documents

            Historical materials present unique difficulties:

            - **Typography Variation**: Non-standardized fonts and styles
            - **Historical Language**: Archaic vocabulary and grammar
            - **Layout Complexity**: Non-linear arrangements
            - **Document Degradation**: Fading, tears, stains, and damage
            - **Material Artifacts**: Paper texture, binding shadows, etc.
            """)

            st.image("https://cdn.dribbble.com/users/412119/screenshots/16353886/media/82e593c60a5e4d460db917236eab6ece.jpg",
                     caption="OCR processing layers")

        # Display processing history if available
        if st.session_state.processing_history:
            with st.expander("Your OCR Processing History"):
                st.markdown("You've already processed the following documents:")
                for item in st.session_state.processing_history:
                    st.markdown(f"**{item['fileName']}** - {datetime.fromisoformat(item['timestamp']).strftime('%Y-%m-%d %H:%M')}")
                    col1, col2 = st.columns(2)
                    with col1:
                        st.write(f"**Topics:** {', '.join(item['result'].get('topics', ['Unknown']))}")
                    with col2:
                        st.write(f"**Vision model used:** {'Yes' if item['useVision'] else 'No'}")

                # Quick link to experiment
                st.button("Jump to OCR Experiment", key="jump_to_5", on_click=navigate_to_module, args=(5,))

        # Navigation buttons
        col1, col2 = st.columns(2)
        with col1:
            st.button("Previous: Text-Image Relations", key="prev_to_2", on_click=navigate_to_module, args=(2,))
        with col2:
            st.button("Next: Methodological Approaches", key="next_to_4", on_click=navigate_to_module, args=(4,))

    elif st.session_state.current_module == 4:
        # MODULE 4: Methodological Approaches
        st.title("Module 4: Methodological Approaches")

        col1, col2 = st.columns([1, 1])

        with col1:
            st.markdown("""
            ### Hybrid Methodologies

            1. **Computational + Human Reading**
               - OCR for initial processing and discovery
               - Human review for context and interpretation
               - Iterative refinement of computational outputs

            2. **Close + Distant Reading**
               - Distant reading through large-scale OCR processing
               - Close reading of selected passages
               - Zooming between scales of analysis
            """)

            # Reference to diagram.jpg
            input_dir = Path(__file__).parent / "input"
            diagram_path = input_dir / "diagram.jpg"
            if diagram_path.exists():
                try:
                    # Load image file directly from disk
                    from PIL import Image
                    with Image.open(diagram_path) as img:
                        st.image(img, caption="Historical VLM architecture", use_container_width=True)
                except Exception:
                    pass

        with col2:
            st.markdown("""
            ### Mistral-OCR-Latest: State-of-the-Art

            The Mistral-OCR model represents a significant advancement:

            - **Multimodal Understanding**: Processes both visual and textual information
            - **Contextual Awareness**: Considers historical context
            - **Layout Recognition**: Preserves complex document structures
            - **Historical Font Adaptation**: Trained on diverse historical typography
            """)

            # Reference to workflow.jpg
            workflow_path = input_dir / "workflow.jpg"
            if workflow_path.exists():
                try:
                    # Load image file directly from disk
                    from PIL import Image
                    with Image.open(workflow_path) as img:
                        st.image(img, caption="Mistral OCR workflow", use_container_width=True)
                except Exception:
                    pass

        st.markdown("""
        ### Practical Workflow

        A typical historical OCR workflow with Mistral-OCR includes:

        1. **Selection**: Choosing appropriate documents
        2. **Preprocessing**: Enhancing images before OCR
        3. **OCR Processing**: Running documents through vision-enhanced OCR
        4. **Post-processing**: Cleaning up outputs and structured extraction
        5. **Verification**: Cross-checking results against originals
        6. **Integration**: Incorporating OCR outputs into research materials
        """)

        # Navigation buttons
        col1, col2 = st.columns(2)
        with col1:
            st.button("Previous: OCR Technology", key="prev_to_3", on_click=navigate_to_module, args=(3,))
        with col2:
            st.button("Next: Interactive OCR Experiment", key="next_to_5", on_click=navigate_to_module, args=(5,))

    elif st.session_state.current_module == 5:
        # MODULE 5: Interactive OCR Experiment
        st.title("Module 5: Interactive OCR Experiment")

        # More modular design with sequenced steps
        st.markdown("""
        <div class="workshop-container">
            This interactive module allows you to process historical documents with OCR and analyze the results.
            Follow the sequenced steps below to experiment with historical document analysis.
        </div>
        """, unsafe_allow_html=True)

        # Tabbed interface for different activities
        experiment_tab, compare_tab, analyze_tab = st.tabs(["Process Documents", "Compare Results", "Analysis Guide"])

        with experiment_tab:
            # Import additional libraries for enhanced functionality
            try:
                from pdf2image import convert_from_bytes
                pdf_support = True
            except ImportError:
                pdf_support = False
                st.warning("PDF preview functionality is limited. The pdf2image module is required for PDF previews.")

            # OCR tool in a compact layout
            col1, col2 = st.columns([1, 1])

            with col1:
                st.markdown('<div class="tool-container" style="color:white !important; background-color:#1f2937; padding:1.5rem; border-radius:0.5rem; border:1px solid #374151;">', unsafe_allow_html=True)
                st.markdown("<h3 style='color:white !important;'>Step 1: Select Document & Options</h3>", unsafe_allow_html=True)

                # Processing options
                use_vision = st.checkbox("Use Vision Model", value=True,
                                         help="Use the vision model for improved analysis")

                # Additional prompt for the model
                st.markdown("### Custom Research Prompt (Optional)")
                st.markdown("""Provide additional instructions to guide the OCR analysis.
                Focus on specific aspects of historical research you're interested in.""")

                custom_prompt = st.text_area("Research Prompt",
                                             placeholder="E.g., Focus on identifying dates and historical figures; Analyze the writing style for period-specific terminology; Highlight any cultural or social indicators of the time period...",
                                             help="Optional instructions to guide the analysis of the historical document")

                # Example preset documents selection
                input_dir = Path(__file__).parent / "input"
                if input_dir.exists():
                    sample_files = list(input_dir.glob("*.jpg")) + list(input_dir.glob("*.png")) + list(input_dir.glob("*.pdf"))
                    if sample_files:
                        st.markdown("#### Sample Documents")
                        sample_options = ["Upload my own document"] + [f.name for f in sample_files]
                        sample_choice = st.selectbox("Choose a document:", sample_options)

                        if sample_choice != "Upload my own document":
                            selected_file = next((f for f in sample_files if f.name == sample_choice), None)
                            if selected_file:
                                # Store the selected sample file in session state
                                with open(selected_file, "rb") as f:
                                    file_bytes = f.read()
                                st.session_state.sample_file = {
                                    "name": selected_file.name,
                                    "bytes": file_bytes
                                }

                                # Preview the selected sample
                                if selected_file.suffix.lower() == ".pdf" and pdf_support:
                                    try:
                                        with st.spinner("Generating PDF preview..."):
                                            images = convert_from_bytes(file_bytes, first_page=1, last_page=1, dpi=150)
                                            if images:
                                                # Convert PIL image to bytes for Streamlit
                                                first_page = images[0]
                                                img_bytes = io.BytesIO()
                                                first_page.save(img_bytes, format='JPEG')
                                                img_bytes.seek(0)
                                                st.image(img_bytes, caption=f"Preview: {selected_file.name}", use_container_width=True)
                                    except Exception:
                                        st.info(f"PDF selected: {selected_file.name}")
                                else:
                                    # For images display directly
                                    try:
                                        from PIL import Image
                                        img = Image.open(BytesIO(file_bytes))
                                        st.image(img, caption=f"Preview: {selected_file.name}", use_container_width=True)
                                    except Exception:
                                        st.info(f"Selected: {selected_file.name}")
                        else:
                            # Clear the sample file if "Upload my own" is selected
                            if 'sample_file' in st.session_state:
                                del st.session_state.sample_file

                            # File uploader with styling matched to React theme
                            st.markdown('<div class="upload-container">', unsafe_allow_html=True)
                            uploaded_file = st.file_uploader("Choose a file", type=["pdf", "png", "jpg", "jpeg"], label_visibility="collapsed")
                            if uploaded_file is None:
                                st.markdown("### Upload a document to get started")
                                st.markdown("Supported formats: PDF, JPG, PNG")
                            else:
                                # Display the uploaded file
                                file_ext = Path(uploaded_file.name).suffix.lower()
                                if file_ext == ".pdf" and pdf_support:
                                    try:
                                        # Convert first page of PDF to image for preview
                                        pdf_bytes = uploaded_file.getvalue()
                                        with st.spinner("Generating PDF preview..."):
                                            images = convert_from_bytes(pdf_bytes, first_page=1, last_page=1, dpi=150)
                                            if images:
                                                # Convert PIL image to bytes for Streamlit
                                                first_page = images[0]
                                                img_bytes = io.BytesIO()
                                                first_page.save(img_bytes, format='JPEG')
                                                img_bytes.seek(0)
                                                # Display the PDF preview
                                                st.image(img_bytes, caption=f"PDF Preview: {uploaded_file.name}", use_container_width=True)
                                            else:
                                                st.info(f"PDF uploaded: {uploaded_file.name}")
                                    except Exception:
                                        # Simply show the file name without an error message
                                        st.info(f"PDF uploaded: {uploaded_file.name}")
                                elif file_ext != ".pdf":
                                    st.image(uploaded_file, use_container_width=True)
                                else:
                                    st.info(f"PDF uploaded: {uploaded_file.name}")
                            st.markdown('</div>', unsafe_allow_html=True)
                    else:
                        # No sample files found, just show the uploader
                        st.markdown('<div class="upload-container">', unsafe_allow_html=True)
                        uploaded_file = st.file_uploader("Choose a file", type=["pdf", "png", "jpg", "jpeg"], label_visibility="collapsed")
                        if uploaded_file is None:
                            st.markdown("### Upload a document to get started")
                            st.markdown("Supported formats: PDF, JPG, PNG")
                        else:
                            # Display the uploaded file preview
                            file_ext = Path(uploaded_file.name).suffix.lower()
                            if file_ext == ".pdf" and pdf_support:
                                try:
                                    # PDF preview logic
                                    pdf_bytes = uploaded_file.getvalue()
                                    with st.spinner("Generating PDF preview..."):
                                        images = convert_from_bytes(pdf_bytes, first_page=1, last_page=1, dpi=150)
                                        if images:
                                            first_page = images[0]
                                            img_bytes = io.BytesIO()
                                            first_page.save(img_bytes, format='JPEG')
                                            img_bytes.seek(0)
                                            st.image(img_bytes, caption=f"PDF Preview: {uploaded_file.name}", use_container_width=True)
                                        else:
                                            st.info(f"PDF uploaded: {uploaded_file.name}")
                                except Exception:
                                    st.info(f"PDF uploaded: {uploaded_file.name}")
                            elif file_ext != ".pdf":
                                st.image(uploaded_file, use_container_width=True)
                            else:
                                st.info(f"PDF uploaded: {uploaded_file.name}")
                        st.markdown('</div>', unsafe_allow_html=True)
                else:
                    # Input directory doesn't exist, just show the uploader
                    st.markdown('<div class="upload-container">', unsafe_allow_html=True)
                    uploaded_file = st.file_uploader("Choose a file", type=["pdf", "png", "jpg", "jpeg"], label_visibility="collapsed")
                    if uploaded_file is None:
                        st.markdown("### Upload a document to get started")
                        st.markdown("Supported formats: PDF, JPG, PNG")
                    st.markdown('</div>', unsafe_allow_html=True)

                # Step 2: Process document
                st.subheader("Step 2: Process the Document")

                # Get the file to process (either uploaded or sample).
                # The 'sample_choice' in locals() guard avoids a NameError when
                # a sample file lingers in session state but no sample documents
                # were found on this run.
                file_to_process = None
                if 'sample_file' in st.session_state and 'sample_choice' in locals() and sample_choice != "Upload my own document":
                    # Create a FileUploader-like object from the sample file
                    class SampleFileObject:
                        def __init__(self, name, data):
                            self.name = name
                            self._data = data

                        def getvalue(self):
                            return self._data

                    file_to_process = SampleFileObject(
                        st.session_state.sample_file["name"],
                        st.session_state.sample_file["bytes"]
                    )
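
                    # SampleFileObject mirrors just the slice of Streamlit's
                    # UploadedFile interface that process_file relies on
                    # (.name and .getvalue()), so samples and uploads share
                    # one code path.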
                elif 'uploaded_file' in locals() and uploaded_file is not None:
                    file_to_process = uploaded_file

                # Process button (disabled if no file selected)
                process_button = st.button(
                    "Process Document",
                    disabled=file_to_process is None,
                    use_container_width=True
                )

                if process_button and file_to_process is not None:
                    with st.spinner("Processing document..."):
                        try:
                            # Process the file
                            result = process_file(file_to_process, use_vision, custom_prompt=custom_prompt if custom_prompt else None)
                            if result:
                                st.success("Document processed successfully!")
                                # Store result in session state for display in the right column
                                st.session_state.current_result = result
                                st.rerun()  # Refresh to show result
                            else:
                                st.error("Failed to process document.")
                        except Exception as e:
                            st.error(f"Error processing document: {str(e)}")

                st.markdown('</div>', unsafe_allow_html=True)

                # Experiment instructions in a compact format
                st.markdown('<div class="key-concept" style="background-color:#374151; padding:0.75rem; border-radius:0.5rem; margin:1rem 0; border-left:3px solid #3B82F6; color:white;">', unsafe_allow_html=True)
                st.markdown("<h3 style='color:white !important;'>Experiment Instructions</h3>", unsafe_allow_html=True)
                st.markdown("""
                1. **Step 1:** Select a document and choose your options
                2. **Step 2:** Process the document with the selected options
                3. **Step 3:** Analyze the results in the panel on the right
                4. **Step 4:** Try again with different settings (e.g., toggle vision model)
                5. **Step 5:** Compare results between different runs
                """)
                st.markdown('</div>', unsafe_allow_html=True)

            with col2:
                st.markdown('<div class="tool-container" style="color:white !important; background-color:#1f2937; padding:1.5rem; border-radius:0.5rem; border:1px solid #374151;">', unsafe_allow_html=True)
                st.markdown("<h3 style='color:white !important;'>Step 3: View Results</h3>", unsafe_allow_html=True)

                if 'current_result' in st.session_state and st.session_state.current_result:
                    result = st.session_state.current_result

                    # File info in a compact format
                    st.markdown(f"**File:** {result.get('file_name', 'Unknown')}")

                    # Horizontal display of metadata
                    col1, col2 = st.columns(2)
                    with col1:
                        if 'languages' in result and result['languages']:
                            languages = [lang for lang in result['languages'] if lang]
                            if languages:
                                st.markdown(f"**Languages:** {', '.join(languages)}")
                    with col2:
                        if 'topics' in result and result['topics']:
                            st.markdown(f"**Topics:** {', '.join(result['topics'])}")

                    # Create tabs for different views with inline styling to ensure visibility
                    tab1, tab2 = st.tabs(["Structured View", "Raw JSON"])
                    st.markdown("""
                    <style>
                    .stTabs [data-baseweb="tab-panel"] * {color: white !important;}
                    </style>
                    """, unsafe_allow_html=True)

                    with tab1:
                        # Display in a more user-friendly format based on the content structure
                        if 'ocr_contents' in result:
                            if isinstance(result['ocr_contents'], dict):
                                for section, content in result['ocr_contents'].items():
                                    if content:  # Only display non-empty sections
                                        st.markdown(f"<h4 style='color:white !important;'>{section.replace('_', ' ').title()}</h4>", unsafe_allow_html=True)
                                        if isinstance(content, str):
                                            st.markdown(f"<p style='color:white !important;'>{content}</p>", unsafe_allow_html=True)
                                        elif isinstance(content, list):
                                            for item in content:
                                                if isinstance(item, str):
                                                    st.markdown(f"<p style='color:white !important;'>- {item}</p>", unsafe_allow_html=True)
                                                elif isinstance(item, dict):
                                                    st.markdown("<div style='color:white !important;'>", unsafe_allow_html=True)
                                                    st.json(item)
                                                    st.markdown("</div>", unsafe_allow_html=True)
                                        elif isinstance(content, dict):
                                            for k, v in content.items():
                                                st.markdown(f"<p style='color:white !important;'><strong>{k}:</strong> {v}</p>", unsafe_allow_html=True)

                    with tab2:
                        # Show the raw JSON for developers
                        # Convert to serializable format first
                        serializable_result = make_serializable(result)
                        st.json(serializable_result)

                    # Download options
                    st.markdown("### Export Results")
                    col1, col2 = st.columns(2)
                    with col1:
                        # Export as JSON (using the serializable converter)
                        serializable_result = make_serializable(result)
                        json_bytes = json.dumps(serializable_result, indent=2).encode()
                        st.download_button(
                            label="Download JSON",
                            data=json_bytes,
                            file_name="ocr_results.json",
                            mime="application/json",
                            use_container_width=True
                        )
                    with col2:
                        # Export as text
                        if 'ocr_contents' in result and isinstance(result['ocr_contents'], dict) and 'content' in result['ocr_contents']:
                            text_content = result['ocr_contents']['content']
                            st.download_button(
                                label="Download Text",
                                data=text_content.encode(),
                                file_name="ocr_text.txt",
                                mime="text/plain",
                                use_container_width=True
                            )
                else:
                    st.markdown("""
                    <div style="background-color:#1f2937; padding:1rem; border-radius:0.5rem;">
                        <h3 style="color:white !important;">Results will appear here</h3>
                        <p style="color:white !important;">Upload and process a document to see the OCR results in this panel.</p>
                        <p style="color:white !important;">The OCR tool will:</p>
                        <ol style="color:white !important;">
                            <li style="color:white !important;">Extract text from your document</li>
                            <li style="color:white !important;">Identify languages and topics</li>
                            <li style="color:white !important;">Provide structured content analysis</li>
                            <li style="color:white !important;">Generate downloadable results</li>
                        </ol>
                    </div>
                    """, unsafe_allow_html=True)

                st.markdown('</div>', unsafe_allow_html=True)

            # Processing history
            if st.session_state.processing_history:
                st.markdown('<div class="tool-container" style="color:white !important; background-color:#1f2937; padding:1.5rem; border-radius:0.5rem; border:1px solid #374151;">', unsafe_allow_html=True)
                st.markdown("<h3 style='color:white !important;'>Step 4: Review Processing History</h3>", unsafe_allow_html=True)

                # Most recent result summary
                latest = st.session_state.processing_history[-1]
                st.markdown(f"**Latest Document:** {latest['fileName']}")
                st.markdown(f"**Processed at:** {datetime.fromisoformat(latest['timestamp']).strftime('%Y-%m-%d %H:%M')}")
                st.markdown(f"**Vision model used:** {'Yes' if latest['useVision'] else 'No'}")

                # Full history in expander
                with st.expander("View Complete Processing History"):
                    for i, item in enumerate(reversed(st.session_state.processing_history)):
                        st.markdown(f"""
                        <div class="history-card" style="padding:0.75rem; background-color:#374151; color:white; border-radius:0.25rem; border:1px solid #4B5563; margin-bottom:0.5rem;">
                            <strong style="color:white !important;">{item['fileName']}</strong><br>
                            <span style="color:white !important;">{datetime.fromisoformat(item['timestamp']).strftime('%Y-%m-%d %H:%M')} -
                            Vision model: {'Yes' if item['useVision'] else 'No'}</span>
                        </div>
                        """, unsafe_allow_html=True)

                        # Add option to view a previous result
                        if st.button("View This Result", key=f"view_history_{i}"):
                            st.session_state.current_result = item['result']
                            st.rerun()

                st.markdown('</div>', unsafe_allow_html=True)
# Compare tab for side-by-side comparison | |
with compare_tab: | |
st.subheader("Compare OCR Results") | |
if len(st.session_state.processing_history) >= 2: | |
st.markdown(""" | |
Select two processing results to compare side by side. This allows you to see | |
how different options (like using the vision model) affect OCR quality. | |
""") | |
# Create selection dropdowns for the documents | |
col1, col2 = st.columns(2) | |
with col1: | |
# First document selector | |
doc_options_1 = [f"{i+1}: {item['fileName']} ({'Vision' if item['useVision'] else 'No Vision'})" | |
for i, item in enumerate(st.session_state.processing_history)] | |
doc_choice_1 = st.selectbox("First Document:", doc_options_1, key="compare_doc_1") | |
doc_index_1 = int(doc_choice_1.split(":")[0]) - 1 | |
with col2: | |
# Second document selector | |
doc_options_2 = [f"{i+1}: {item['fileName']} ({'Vision' if item['useVision'] else 'No Vision'})" | |
for i, item in enumerate(st.session_state.processing_history)] | |
default_index = min(1, len(st.session_state.processing_history) - 1) # Default to second item | |
doc_choice_2 = st.selectbox("Second Document:", doc_options_2, key="compare_doc_2", index=default_index) | |
doc_index_2 = int(doc_choice_2.split(":")[0]) - 1 | |
# Retrieve the selected documents | |
doc1 = st.session_state.processing_history[doc_index_1] | |
doc2 = st.session_state.processing_history[doc_index_2] | |
# Show comparison | |
col1, col2 = st.columns(2) | |
with col1: | |
st.markdown(f"### Document 1: {doc1['fileName']}") | |
st.markdown(f"**Processed at:** {datetime.fromisoformat(doc1['timestamp']).strftime('%Y-%m-%d %H:%M')}") | |
st.markdown(f"**Vision model used:** {'Yes' if doc1['useVision'] else 'No'}") | |
# Display content summary, escaping the raw OCR text so stray characters cannot break the HTML wrapper
if 'ocr_contents' in doc1['result'] and isinstance(doc1['result']['ocr_contents'], dict):
if 'content' in doc1['result']['ocr_contents']:
import html
content = str(doc1['result']['ocr_contents']['content'])
preview = html.escape(content[:500]) + ('...' if len(content) > 500 else '')
# Display the first 500 characters with word wrap
st.markdown(f"""
<div style="max-height: 300px; overflow-y: auto; word-wrap: break-word;
border: 1px solid #ddd; padding: 1rem; background-color: #f9f9f9;">
{preview}
</div>
""", unsafe_allow_html=True)
with col2: | |
st.markdown(f"### Document 2: {doc2['fileName']}") | |
st.markdown(f"**Processed at:** {datetime.fromisoformat(doc2['timestamp']).strftime('%Y-%m-%d %H:%M')}") | |
st.markdown(f"**Vision model used:** {'Yes' if doc2['useVision'] else 'No'}") | |
# Display content summary, escaping the raw OCR text so stray characters cannot break the HTML wrapper
if 'ocr_contents' in doc2['result'] and isinstance(doc2['result']['ocr_contents'], dict):
if 'content' in doc2['result']['ocr_contents']:
import html
content = str(doc2['result']['ocr_contents']['content'])
preview = html.escape(content[:500]) + ('...' if len(content) > 500 else '')
# Display the first 500 characters with word wrap
st.markdown(f"""
<div style="max-height: 300px; overflow-y: auto; word-wrap: break-word;
border: 1px solid #ddd; padding: 1rem; background-color: #f9f9f9;">
{preview}
</div>
""", unsafe_allow_html=True)
# Comparison analysis | |
if doc1['fileName'] == doc2['fileName'] and doc1['useVision'] != doc2['useVision']: | |
st.markdown(""" | |
<div class="key-concept"> | |
<h3>Vision vs. Non-Vision Model Comparison</h3> | |
<p>You're comparing the same document processed with different models. | |
This is an excellent way to evaluate the impact of vision capabilities on OCR accuracy.</p> | |
<p>Look for these differences:</p> | |
<ul> | |
<li>Completeness of extracted text</li> | |
<li>Accuracy of layout understanding</li> | |
<li>Recognition of complex elements (tables, figures)</li> | |
<li>Topic and language detection accuracy</li> | |
</ul> | |
</div> | |
""", unsafe_allow_html=True) | |
else: | |
st.markdown(""" | |
<div class="research-question"> | |
<h3>Need More Documents to Compare</h3> | |
<p>Process at least two documents to enable side-by-side comparison. Try processing | |
the same document with and without the vision model to see the differences in OCR quality.</p> | |
</div> | |
""", unsafe_allow_html=True) | |
# Analysis tab for guidance on working with OCR results | |
with analyze_tab: | |
st.subheader("Analysis Guide") | |
st.markdown(""" | |
<div class="workshop-container"> | |
<h3>How to Analyze OCR Results</h3> | |
<p>This guide helps you assess the quality and usefulness of OCR output for historical research.</p> | |
</div> | |
""", unsafe_allow_html=True) | |
st.markdown(""" | |
### Evaluating OCR Quality | |
When analyzing OCR results from historical documents, consider these key factors: | |
1. **Text Accuracy** | |
- Check for common OCR errors (e.g., mistaking "e" for "c", "l" for "1"); a small interactive example follows after this list
- Assess recognition of period-specific typography and writing styles | |
- Evaluate handling of degraded or damaged text areas | |
2. **Structure Preservation** | |
- Does the OCR maintain paragraph and section breaks? | |
- Are columns and tabular data correctly preserved? | |
- How well are page transitions handled? | |
3. **Special Elements** | |
- Recognition of footnotes, marginalia, and annotations | |
- Handling of illustrations, diagrams, and decorative elements | |
- Treatment of watermarks, signatures, and stamps | |
4. **Metadata Extraction** | |
- Accuracy of detected languages, topics, and document type | |
- Identification of dates, names, and key entities | |
- Recognition of document purpose and context | |
""") | |
col1, col2 = st.columns(2) | |
with col1: | |
st.markdown(""" | |
### Common OCR Challenges in Historical Documents | |
- **Typography Variations**: Historical fonts and writing styles that differ from modern text | |
- **Material Degradation**: Fading, stains, tears, and other damage affecting legibility | |
- **Handwritten Elements**: Marginalia, signatures, and handwritten annotations | |
- **Complex Layouts**: Multi-column formats, non-linear reading order, and decorative elements | |
- **Language and Terminology**: Archaic terms, specialized vocabulary, and multilingual content | |
""") | |
with col2: | |
st.markdown(""" | |
### Making the Most of OCR Results | |
- **Contextual Reading**: Use historical context to interpret unclear passages | |
- **Error Patterns**: Identify and mentally correct for systematic OCR errors | |
- **Hybrid Analysis**: Combine OCR-based search with close reading of original images | |
- **Comparative Processing**: Try different OCR settings and models on the same document | |
- **Iterative Refinement**: Use insights from each document to improve future processing | |
""") | |
st.markdown(""" | |
### Research Integration | |
Once you've obtained and analyzed OCR results from historical documents, consider these approaches for integrating them into your research: | |
1. **Digital Corpus Building**: Create searchable collections of processed texts | |
2. **Computational Analysis**: Apply text mining, topic modeling, or network analysis (see the word-frequency sketch after this section)
3. **Cross-Document Linking**: Identify connections across multiple sources | |
4. **Annotation and Enrichment**: Add context, translations, or explanatory notes | |
5. **Collaborative Research**: Share processed texts with other researchers

Remember that OCR is a tool to assist your research, not to replace careful reading and analysis. The most effective approaches combine computational methods with traditional historical research practices.
""") | |
# Example of what to look for | |
if st.session_state.processing_history: | |
with st.expander("Example Analysis from Your Documents"): | |
# Pick the latest document | |
latest = st.session_state.processing_history[-1] | |
st.markdown(f""" | |
#### Sample Analysis for: {latest['fileName']} | |
**Document Context:** | |
- Languages: {', '.join(latest['result'].get('languages', ['Unknown']))} | |
- Topics: {', '.join(latest['result'].get('topics', ['Unknown']))} | |
- Vision model used: {'Yes' if latest['useVision'] else 'No'} | |
**What to Look For:** | |
1. Check how well the model identified key topics and languages | |
2. Evaluate the completeness of extracted text | |
3. Note any systematic errors in text recognition | |
4. Assess how well document structure was preserved | |
""") | |
# Navigation buttons | |
col1, col2 = st.columns(2) | |
with col1: | |
st.button("Previous: Methodological Approaches", key="prev_to_4", on_click=navigate_to_module, args=(4,)) | |
with col2: | |
st.button("Next: Conclusion", key="next_to_6", on_click=navigate_to_module, args=(6,)) | |
else: # Module 6 | |
# MODULE 6: Conclusion | |
st.title("Module 6: Conclusion and Future Directions") | |
col1, col2 = st.columns([3, 2]) | |
with col1: | |
st.markdown(""" | |
### Workshop Summary | |
Throughout this workshop, we've explored: | |
1. **Text-Image Interdependence**: The complex relationship between textual and visual elements | |
2. **OCR Technology**: The evolution of OCR and its application to historical materials | |
3. **Methodological Approaches**: Hybrid strategies for working with historical texts | |
4. **Practical Application**: Hands-on experience with OCR processing tools | |
""") | |
st.markdown(""" | |
### Key Takeaways | |
1. **OCR is Not Perfect**: Even advanced AI models face challenges with historical documents | |
2. **Context Matters**: Vision-enhanced models provide better results by understanding document context | |
3. **Hybrid Approaches**: Combining computational methods with traditional research yields best results | |
4. **Critical Evaluation**: Always evaluate OCR outputs with awareness of limitations | |
5. **Structured Extraction**: Modern OCR goes beyond text recognition to understand document structure | |
""") | |
with col2: | |
# Display statistics if there's processing history | |
if st.session_state.processing_history: | |
st.subheader("Your Workshop Statistics") | |
# Calculate statistics | |
total_docs = len(st.session_state.processing_history) | |
vision_docs = sum(1 for item in st.session_state.processing_history if item['useVision'])
non_vision_docs = total_docs - vision_docs | |
# Create metrics for statistics | |
col1, col2 = st.columns(2) | |
with col1: | |
st.metric("Documents Processed", total_docs) | |
st.metric("With Vision Model", vision_docs) | |
with col2: | |
st.metric("Without Vision Model", non_vision_docs) | |
# Topics word cloud | |
if total_docs > 0: | |
st.subheader("Topics Encountered") | |
all_topics = [] | |
for item in st.session_state.processing_history: | |
if 'topics' in item['result']: | |
all_topics.extend(item['result']['topics']) | |
if all_topics: | |
# Count topic frequencies
topic_counts = {}
for topic in all_topics:
topic_counts[topic] = topic_counts.get(topic, 0) + 1
# Display as a bar chart (st.bar_chart renders vertical bars)
st.bar_chart(topic_counts)
st.subheader("Future Directions") | |
col1, col2 = st.columns(2) | |
with col1: | |
st.markdown(""" | |
### Technological Developments | |
- **Multimodal AI models**: Increasingly sophisticated understanding | |
- **Historical font training**: Models trained on historical typography | |
- **Document intelligence**: Enhanced understanding of structures | |
- **Collaborative correction**: Platforms for collective improvement | |
""") | |
with col2: | |
st.markdown(""" | |
### Research Applications | |
- **Large-scale corpus analysis**: Processing entire archives | |
- **Multilingual historical research**: Working across languages | |
- **Image-text integration**: New methodologies for visual analysis | |
- **Computational paleography**: AI-assisted handwriting analysis | |
""") | |
st.markdown(""" | |
### Additional Resources | |
- **[Mistral AI Documentation](https://docs.mistral.ai/)**: Learn more about the OCR models used in this workshop | |
- **[Transkribus](https://readcoop.eu/transkribus/)**: Platform for historical document transcription | |
- **[OCR-D](https://ocr-d.de/en/)**: Coordinated OCR research project for historical documents | |
- **[Historical OCR Research Papers](https://scholar.google.com/scholar?q=historical+OCR)**: Academic research on historical OCR | |
""") | |
# Reset button to start over | |
if st.button("Start Workshop Again", key="reset_workshop", use_container_width=True): | |
st.session_state.current_module = 1 | |
st.rerun() | |
# Handle API requests from the React frontend.
# NOTE: Streamlit does not expose the URL path, so the endpoint is signalled via a
# query parameter here; the name 'endpoint' is an assumed convention that the client
# must send (see the hedged client sketch at the end of this file).
if st.query_params.get('endpoint', '') == 'api/process':
# Process the API request | |
result = process_api_request() | |
if result: | |
# Return the result as JSON | |
# Make sure result is serializable | |
serializable_result = make_serializable(result) | |
st.json(serializable_result) | |
else: | |
st.json({"error": "Invalid request"}) |