Files

162 lines
4.8 KiB
Python

"""
Lazy loader for compressed interlinear Bible data.
Decompresses and loads the data on first access.
Optimized for fly.io production deployment.
"""
import gzip
import json
import logging
from pathlib import Path
from typing import Optional, Dict, List
logger = logging.getLogger(__name__)
_interlinear_data = None
_load_failed = False
# Map site book names to interlinear data book names
BOOK_NAME_MAP = {
"Song of Solomon": "Solomon's Song",
}
def _normalize_book_name(book: str) -> str:
"""Normalize book name for interlinear data lookup."""
return BOOK_NAME_MAP.get(book, book)
def _load_interlinear_data():
"""Load and decompress interlinear data from gzipped JSON file"""
global _interlinear_data, _load_failed
if _interlinear_data is not None:
return _interlinear_data
# If loading previously failed, return empty dict to avoid repeated errors
if _load_failed:
logger.warning("Interlinear data loading previously failed, returning empty data")
return {}
data_file = Path(__file__).parent / "data" / "interlinear.json.gz"
try:
logger.info(f"Loading interlinear data from {data_file}...")
if not data_file.exists():
raise FileNotFoundError(f"Interlinear data file not found: {data_file}")
with gzip.open(data_file, 'rt', encoding='utf-8') as f:
_interlinear_data = json.load(f)
logger.info(f"Successfully loaded {len(_interlinear_data)} verses")
return _interlinear_data
except Exception as e:
_load_failed = True
logger.error(f"Failed to load interlinear data: {e}", exc_info=True)
_interlinear_data = {}
return _interlinear_data
def get_interlinear_data(book: str, chapter: int, verse: int) -> Optional[List[Dict]]:
"""Get interlinear data for a specific verse"""
data = _load_interlinear_data()
normalized_book = _normalize_book_name(book)
key = f"{normalized_book}:{chapter}:{verse}"
return data.get(key)
def has_interlinear_data(book: str, chapter: int, verse: int) -> bool:
"""Check if interlinear data exists for a verse"""
data = _load_interlinear_data()
normalized_book = _normalize_book_name(book)
key = f"{normalized_book}:{chapter}:{verse}"
return key in data
def get_all_interlinear_verses() -> List[Dict]:
"""Get list of all verses with interlinear data"""
data = _load_interlinear_data()
verses = []
for key in sorted(data.keys()):
book, chapter, verse = key.split(":")
verses.append({
"book": book,
"chapter": int(chapter),
"verse": int(verse),
"ref": f"{book} {chapter}:{verse}"
})
return verses
def preload_data():
"""
Preload interlinear data at startup to warm the cache.
Call this during application initialization to avoid first-request delays.
"""
logger.info("Preloading interlinear data to warm cache...")
data = _load_interlinear_data()
if data:
logger.info(f"Cache warmed successfully with {len(data)} verses")
else:
logger.warning("Cache warming completed but no data loaded")
def find_verses_by_strongs(strongs_number: str, limit: int = 50) -> List[Dict]:
"""
Find all verses containing a specific Strong's number.
Args:
strongs_number: A Strong's number like "H7999" or "G3056"
limit: Maximum number of results to return
Returns:
List of dicts with verse reference and the word occurrence
"""
data = _load_interlinear_data()
if not data:
return []
strongs_number = strongs_number.upper().strip()
results = []
for key, words in data.items():
if len(results) >= limit:
break
for word in words:
if word.get("strongs") == strongs_number:
book, chapter, verse = key.split(":")
results.append({
"book": book,
"chapter": int(chapter),
"verse": int(verse),
"reference": f"{book} {chapter}:{verse}",
"url": f"/book/{book}/chapter/{chapter}/verse/{verse}",
"original": word.get("original", ""),
"english": word.get("english", ""),
})
break # Only count each verse once
if len(results) >= limit:
break
return results
def count_strongs_occurrences(strongs_number: str) -> int:
"""Count total occurrences of a Strong's number in the interlinear data."""
data = _load_interlinear_data()
if not data:
return 0
strongs_number = strongs_number.upper().strip()
count = 0
for key, words in data.items():
for word in words:
if word.get("strongs") == strongs_number:
count += 1
return count