Add per-line meter detection

CMU stress markers -> stress string per line, scored against the
classical feet (iamb, trochee, anapest, dactyl, amphibrach) with
flexible monosyllables. Syllable count + best-fit meter shown in the
toolbar readout for the caret line.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
This commit is contained in:
2026-06-07 01:12:34 -04:00
parent 84bae60dff
commit 7a1e0e2953
3 changed files with 90 additions and 3 deletions
+59 -1
View File
@@ -247,6 +247,56 @@ def slant_key(word: str) -> str | None:
return "gv:" + (m.group(0) if m else tail)
# --------------------------------------------------------------------------
# meter
# --------------------------------------------------------------------------
FEET = {
"iambic": "01", "trochaic": "10", "anapestic": "001",
"dactylic": "100", "amphibrachic": "010",
}
METER_NAMES = {1: "monometer", 2: "dimeter", 3: "trimeter", 4: "tetrameter",
5: "pentameter", 6: "hexameter", 7: "heptameter", 8: "octameter"}
def line_meter(line: str) -> dict | None:
"""Syllable count and best-fit metrical foot for a line.
Stress comes from the CMU markers (1/2 stressed, 0 unstressed).
Monosyllables flex in real speech, so function words read as
unstressed and content monosyllables as wildcards.
"""
stress = ""
for w in WORD_RE.findall(line):
ph = phones_for(w)
if not ph:
stress += "x" # unknown word: one flexible syllable, at least
continue
syls = [p[-1] for p in ph.split() if p[-1].isdigit()]
if len(syls) == 1:
stress += "0" if w.lower() in STOPWORDS else "x"
else:
stress += "".join("1" if s in "12" else "0" for s in syls)
n = len(stress)
if n == 0:
return None
best_label, best_score = None, 0.0
if n >= 4: # too short to call a meter
for name, foot in FEET.items():
pat = (foot * (n // len(foot) + 1))[:n] # final foot may truncate
score = sum(a == "x" or a == b for a, b in zip(stress, pat)) / n
if score > best_score:
feet_count = round(n / len(foot))
meter = METER_NAMES.get(feet_count, f"{feet_count}-foot")
best_label, best_score = f"{name} {meter}", score
return {
"syl": n,
"stress": stress,
"label": best_label if best_score >= 0.75 else None,
"score": round(best_score, 2),
}
# --------------------------------------------------------------------------
# analysis
# --------------------------------------------------------------------------
@@ -483,8 +533,16 @@ def analyze(draft: Draft):
"slant": t["slant"] or groups_out[t["gid"]]["slant"]}
for t in [*tokens, *phrases] if t["gid"] is not None
]
meter = []
for i, line in enumerate(lines):
if sids[i] is None:
continue
m = line_meter(line)
if m:
meter.append({"l": i, **m})
return {"lines": lines, "tokens": toks_out,
"groups": groups_out, "stanzas": stanzas}
"groups": groups_out, "stanzas": stanzas, "meter": meter}
# --------------------------------------------------------------------------
+6 -2
View File
@@ -414,9 +414,13 @@ function buildReadout(){
schemeReadout.innerHTML = '<span class="offline">backend offline — run: uv run uvicorn app:app</span>';
return;
}
const parts = [];
const ln = caretLine();
const m = analysis && analysis.meter ? analysis.meter.find(x=>x.l===ln) : null;
if(m) parts.push(`${m.syl} syl` + (m.label ? ` · ${m.label}` : ''));
const st = caretStanza();
if(!st || !st.scheme){ schemeReadout.innerHTML = ''; return; }
schemeReadout.innerHTML = `stanza scheme &nbsp;<b>${st.scheme.toUpperCase().split('').join(' ')}</b>`;
if(st && st.scheme) parts.push(`scheme <b>${st.scheme.toUpperCase().split('').join(' ')}</b>`);
schemeReadout.innerHTML = parts.join(' &nbsp;&nbsp; ');
}
function buildLegend(){
+25
View File
@@ -190,3 +190,28 @@ def test_stanzas_and_legend():
def test_blank_lines_split_stanzas():
res = analyze(Draft(text="the cat\na hat\n\nso blue\nso true"))
assert [s["scheme"] for s in res["stanzas"]] == ["aa", "aa"]
# ------------------------------------------------------------------ meter
def meter_of(line: str) -> dict:
res = analyze(Draft(text=line))
return res["meter"][0]
def test_iambic_pentameter():
m = meter_of("Shall I compare thee to a summer's day")
assert m["syl"] == 10
assert m["label"] == "iambic pentameter"
def test_trochaic_tetrameter():
m = meter_of("Tyger Tyger burning bright")
assert m["syl"] == 7 # catalectic — final unstressed syllable dropped
assert m["label"] == "trochaic tetrameter"
def test_syllables_always_reported():
m = meter_of("the city hums in amber under fading light")
assert m["syl"] == 12
assert m["stress"]