html shell.ts

97.61% Statements 82/84
86.2% Branches 50/58
100% Functions 10/10
98.76% Lines 80/81
Press n or j to go to the next uncovered block, b, p or k for the previous block.

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587  
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16x
 
 
16x
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16x
 
 
 
 
 
 
 
 
 
 
562x
562x
563x
563x
1x
 
562x
 
 
562x
 
 
 
 
 
 
 
16x
 
 
 
 
 
 
 
 
562x
562x
562x
 
 
 
 
 
 
 
 
 
 
 
 
281x
281x
 
 
 
 
 
 
 
 
 
 
3x
3x
2x
 
3x
3x
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
281x
281x
281x
281x
281x
 
 
 
 
 
281x
 
 
281x
281x
281x
281x
 
 
 
 
 
281x
 
 
 
 
 
 
 
281x
 
281x
 
281x
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
281x
281x
281x
281x
281x
281x
281x
281x
281x
281x
281x
281x
 
 
 
281x
281x
281x
281x
281x
 
 
281x
281x
 
281x
281x
 
281x
 
 
 
 
 
 
 
 
 
281x
 
 
281x
281x
281x
281x
 
 
 
 
 
 
 
 
 
 
281x
 
 
 
 
 
 
 
 
 
 
281x
 
 
 
 
 
281x
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
281x
3x
 
 
281x
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
157x
 
 
 
 
3x
 
 
 
 
 
 
 
281x
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
281x
281x
 
968x
 
281x
 
 
281x
281x
281x
 
281x
 
 
 
 
 
 
 
281x
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
  // SPDX-FileCopyrightText: 2024-2026 Hack23 AB
// SPDX-License-Identifier: Apache-2.0
 
/**
 * @module Aggregator/Html/Shell
 * @description Render the full article HTML document with the shared
 * site chrome — site header, language switcher, skip link, theme toggle,
 * breadcrumb, JSON-LD `NewsArticle` + `BreadcrumbList`, and footer. The
 * shell pulls localized labels from `constants/languages.js` and
 * composes the chrome from `templates/section-builders.ts`, so
 * localisation, a11y, and CSP stay consistent with the rest of the
 * site.
 */
 
import { BASE_URL, BUILD_SHORT, MERMAID_VERSION } from '../../constants/config.js';
import { buildHeadFreshnessTags } from '../../constants/build-info-meta.js';
import {
  ALL_LANGUAGES,
  PAGE_TITLES,
  SKIP_LINK_TEXTS,
  ARTICLE_NAV_LABELS,
  BACK_TO_NEWS_LABELS,
  VIEW_SOURCE_MARKDOWN_LABELS,
  FOOTER_SITEMAP_LABELS,
  FOOTER_POLITICAL_INTELLIGENCE_LABELS,
  PROGRESSIVE_DISCLOSURE_LABELS,
  getLocalizedString,
  getTextDirection,
} from '../../constants/languages.js';
import { buildOgLocaleTags } from '../../constants/og-locales.js';
import { ORG_SAME_AS, buildTwitterAttributionTags } from '../../constants/social-handles.js';
import type { LanguageCode } from '../../types/index.js';
import { escapeHTML } from '../../utils/file-utils.js';
import {
  buildResponsiveIconLinks,
  buildResponsiveSocialImageMeta,
  buildSiteFooter,
  buildSiteHeader,
  buildPageBanner,
} from '../../templates/section-builders.js';
import { getPoliticalIntelligenceFilename } from '../../generators/political-intelligence.js';
import { getSitemapFilename } from '../../generators/sitemap/index.js';
import { buildRssAlternateLink } from '../../templates/sections/rss-discovery.js';
import {
  truncateHeadline,
  getTitleSeparator,
  buildPageTitle,
  getLocalizedArticleType,
  getLocalizedArticleTypePlain,
} from './headline.js';
import { clampForBudget } from '../metadata/seo-budgets.js';
import {
  getArticleFilename,
  buildArticleHreflangLinks,
  buildLanguageSwitcher,
} from './hreflang.js';
import { buildArticleToc, type ArticleTocEntry } from './toc.js';
import { blobUrl } from '../infra/github-urls.js';
import { applyReaderFriendlyTransform } from '../reader-friendly-transform.js';
import {
  buildLayerReadingTimes,
  buildProgressiveDisclosureBody,
  type LayerReadingTimes,
} from '../progressive-disclosure.js';
 
export type { ArticleTocEntry } from './toc.js';
 
/**
 * Publisher organization name. Emitted as the `name` of the JSON-LD
 * `author` and `publisher` nodes and as the content of the `author`,
 * `publisher`, and `article:author` meta tags.
 */
export const PUBLISHER_NAME = 'Hack23 AB';
 
/**
 * Canonical (non-localized) site name. Used as the JSON-LD `isPartOf`
 * name, as the first `BreadcrumbList` item, and as the fallback when the
 * localized page title yields no site-title segment.
 */
export const SITE_NAME = 'EU Parliament Monitor';
 
/**
 * Inputs for {@link wrapArticleHtml}. Every field is read-only; the
 * renderer never mutates the options object.
 */
export interface WrapArticleOptions {
  /**
   * Target language (used for `<html lang>`, meta, nav labels). Values
   * not present in `ALL_LANGUAGES` are rendered as `en`.
   */
  readonly lang: LanguageCode;
  /**
   * Logical article slug (no lang suffix, no extension). Example:
   * `2026-01-15-breaking`. Used to build the canonical URL, the
   * `<link rel="alternate">` hreflang set, and the language switcher.
   */
  readonly articleSlug: string;
  /** Pre-rendered HTML body fragment (from `renderMarkdown`). */
  readonly body: string;
  /**
   * Enable reader-friendly post-processing for rendered HTML body text.
   * Defaults to `true` for public HTML output; only an explicit `false`
   * disables the transform.
   */
  readonly readerFriendly?: boolean;
  /**
   * Article title — shown in `<title>`, the article `<h1>`, the last
   * breadcrumb item, the JSON-LD headline, and OG/Twitter meta.
   */
  readonly title: string;
  /**
   * Article description — shown in `<meta name="description">`, the
   * JSON-LD `description`, and the visible article dek. Also the
   * OG/Twitter fallback when `extendedDescription` is absent.
   */
  readonly description: string;
  /**
   * Optional: longer (up to ~300 chars) editorial summary lifted from
   * the language-specific executive brief BLUF. When provided, used
   * for `og:description` and `twitter:description`; falls back to
   * `description` when absent. Lets social-card previews show the
   * full BLUF paragraph while the short `<meta description>` stays
   * within Google's ~160-char snippet budget.
   */
  readonly extendedDescription?: string;
  /**
   * SEO keywords — shown in `<meta name="keywords">` and joined into the
   * JSON-LD `keywords` string.
   */
  readonly keywords?: readonly string[];
  /**
   * Canonical ISO date of the run (YYYY-MM-DD). Emitted as both the
   * published and the modified date in meta tags and JSON-LD.
   */
  readonly date: string;
  /**
   * Article type slug (e.g. `breaking`, `motions`). Resolved to a
   * localized label for the article kicker, `article:section`, and the
   * JSON-LD `articleSection`.
   */
  readonly articleType: string;
  /**
   * Optional: repo-relative path to the aggregated source Markdown file so
   * readers can open the exact input the HTML was rendered from. Rendered
   * as an in-article `<p class="article-source-md">` link carrying
   * `rel="alternate" type="text/markdown"` and pointing at the blob URL
   * derived from this path.
   */
  readonly sourceMarkdownRelPath?: string;
  /**
   * Optional: ordered list of top-level H2 sections emitted into the
   * article body. Used to render the article-level table-of-contents
   * sidebar. When omitted (or empty) the sidebar is not rendered.
   */
  readonly toc?: readonly ArticleTocEntry[];
  /**
   * Optional: total number of articles available site-wide. When provided
   * the shared site footer surfaces a `<p class="footer-stats">{n} articles
   * available</p>` line that matches the `index.html` chrome; otherwise
   * the line is omitted.
   */
  readonly articleCount?: number;
  /**
   * Optional: URLs of source artifacts included in the aggregated article.
   * Emitted as `isBasedOn` in the JSON-LD `NewsArticle` schema for provenance.
   * An empty list emits no `isBasedOn` property.
   */
  readonly isBasedOn?: readonly string[];
  /**
   * Optional: real-world organizations (political groups, media outlets,
   * institutions) named in the article's intelligence and media-framing
   * artifacts. Emitted as JSON-LD `mentions` Organization entries to give
   * search engines and AI overviews high-precision entity grounding.
   * Currently only extractable from the English intelligence corpus; the
   * same list is reused across every language variant because the entities
   * are language-independent proper nouns. Leading list numbering is
   * stripped from each label and labels that end up empty are dropped.
   */
  readonly mentions?: readonly string[];
  /**
   * Optional precomputed reading-time estimates per disclosure layer.
   * When absent they are derived from the body's per-layer word counts.
   */
  readonly readingTimes?: LayerReadingTimes;
}
 
/**
 * Per-surface SEO clamps for one article render. Each field is the
 * exact string emitted into the corresponding HTML/JSON-LD surface,
 * pre-clamped to the budget in
 * `src/aggregator/metadata/seo-budgets.ts`.
 *
 * Extracted from {@link wrapArticleHtml} to keep that function's
 * cognitive complexity within limits while still funnelling every
 * SEO surface through a single source of truth.
 */
interface SeoClampedSurfaces {
  /** Text of the document `<title>` element. */
  readonly pageTitle: string;
  /** Content of the `og:title` meta tag. */
  readonly ogTitleClamped: string;
  /** Content of the `twitter:title` meta tag. */
  readonly twitterTitleClamped: string;
  /** Content of `<meta name="description">` and the JSON-LD `description`. */
  readonly metaDescriptionClamped: string;
  /** Content of the `og:description` meta tag. */
  readonly ogDescriptionClamped: string;
  /** Content of the `twitter:description` meta tag. */
  readonly twitterDescriptionClamped: string;
  /** Alt text handed to the responsive social-image meta builder. */
  readonly imageAltClamped: string;
  /** JSON-LD `NewsArticle.headline` (the truncated title). */
  readonly jsonLdHeadline: string;
  /**
   * JSON-LD `alternativeHeadline`: the full trimmed title. Present only
   * when truncation removed more than five characters from it.
   */
  readonly alternativeHeadline?: string;
}
 
/**
 * Editorial separator punctuation (em dash, en dash, pipe, colon,
 * semicolon, comma, hyphen) that may dangle after a `Published …` tail
 * has been removed. Whitespace is deliberately not listed here:
 * `trimTrailingSeparators` tests for it separately with `\s`.
 */
const TRAILING_SEPARATOR_CHARS = new Set(['\u2014', '\u2013', '|', ':', ';', ',', '-']);
 
/**
 * Strip trailing whitespace and editorial separator punctuation with a
 * single right-to-left scan. Each character is inspected on its own, so
 * the cost stays linear in the length of the removed tail and no
 * backtracking-prone `/[\s…]+$/` quantifier is ever run over the input.
 *
 * @param value - Text whose trailing separators should be removed
 * @returns `value` without trailing whitespace/separator characters
 */
function trimTrailingSeparators(value: string): string {
  let keep = value.length;
  for (; keep > 0; keep -= 1) {
    const last = value.charAt(keep - 1);
    const isRemovable = TRAILING_SEPARATOR_CHARS.has(last) || /\s/u.test(last);
    if (!isRemovable) {
      // First character worth keeping: everything to its left stays.
      break;
    }
  }
  return value.slice(0, keep);
}
 
/**
 * End-anchored `Published YYYY-MM-DD` tail matcher. The leading `Published`
 * literal keeps the match deterministic (no ambiguous leading-whitespace
 * quantifier), so it is linear on uncontrolled input.
 *
 * Matching is case-insensitive (`i`) and tolerates one optional trailing
 * period plus trailing whitespace before the end of the string. The
 * pattern carries no `g`/`y` flag, so repeated `.test()` / `.replace()`
 * calls share no `lastIndex` state.
 */
const PUBLISHED_DATE_TAIL_RE = /Published\s+\d{4}-\d{2}-\d{2}\.?\s*$/iu;
 
/**
 * Remove leaked `Published YYYY-MM-DD` tails from social descriptions.
 *
 * The tail is removed first, then any whitespace or separator
 * punctuation left dangling in front of it is trimmed, and finally
 * leading whitespace is dropped.
 *
 * @param value - Raw description candidate
 * @returns Description with trailing publication-date boilerplate removed;
 *          the empty string when `value` is empty
 */
function stripPublishedDateTail(value: string): string {
  // Guard clause: nothing to strip from an empty description.
  if (!value) return '';
  const withoutTail = value.replace(PUBLISHED_DATE_TAIL_RE, '');
  return trimTrailingSeparators(withoutTail).trim();
}
 
/**
 * Resolve a publish-date-safe description: prefer the stripped value, and
 * only fall back to the original when no `Published …` tail was present.
 * When the original was *only* a publish-date tail, stripping yields an
 * empty string and we must not re-introduce the leaked tail.
 *
 * @param value - Raw description candidate
 * @returns Stripped description; the empty string when the original was
 *          tail-only; otherwise the original `value` unchanged
 */
function safeDescriptionWithoutPublishedTail(value: string): string {
  const stripped = stripPublishedDateTail(value);
  if (stripped) return stripped;
  // Stripping left nothing. If that is because the input was purely a
  // `Published …` tail, return empty rather than leaking the tail back.
  return PUBLISHED_DATE_TAIL_RE.test(value) ? '' : value;
}
 
/**
 * Remove list numbering that leaked into a JSON-LD mention label.
 *
 * Dotted hierarchy markers (`1.`, `1.2.`, …) are peeled off one at a
 * time, then a single bare leading number followed by whitespace and a
 * single leftover leading dot are removed.
 *
 * @param name - Raw mention label
 * @returns Mention label without leading numeric hierarchy markers
 */
function sanitizeMentionName(name: string): string {
  let label = name.trim();
  for (;;) {
    const marker = /^\d+\./u.exec(label);
    if (marker === null) {
      break;
    }
    // Drop the matched `N.` marker and any whitespace that followed it.
    label = label.slice(marker[0].length).trimStart();
  }
  const withoutBareNumber = label.replace(/^\d+\s+/u, '');
  const withoutLeadingDot = withoutBareNumber.replace(/^\.\s*/u, '');
  return withoutLeadingDot.trim();
}
 
/**
 * Derive every SEO surface string for one article render, each clamped
 * to its own budget. See
 * `analysis/methodologies/seo-headers-policy.md` § 1.1 for the
 * documented sources of every cap.
 *
 * @param options - The {@link WrapArticleOptions} carrying title /
 *                  description / extendedDescription
 * @param lang - Validated publishing locale (already coerced to a
 *               supported `LanguageCode`)
 * @param siteTitle - Resolved localized site title used as the brand
 *                    suffix
 * @returns One {@link SeoClampedSurfaces} record per article render
 */
function computeSeoClamps(
  options: WrapArticleOptions,
  lang: LanguageCode,
  siteTitle: string
): SeoClampedSurfaces {
  const { title, description, extendedDescription } = options;

  const metaSource = safeDescriptionWithoutPublishedTail(description);
  const pageTitle = buildPageTitle(title, lang, siteTitle);
  const ogTitleClamped = clampForBudget(title, lang, 'ogTitle');
  const twitterTitleClamped = clampForBudget(title, lang, 'twitterTitle');
  const metaDescriptionClamped = clampForBudget(metaSource, lang, 'metaDescription');

  // Social cards favour the longer BLUF paragraph so previews show the
  // full lede. A missing or empty extended description — or one that is
  // nothing but a `Published …` tail — falls back to the short meta
  // description.
  const socialCandidate = extendedDescription ? extendedDescription : metaSource;
  const socialSource = stripPublishedDateTail(socialCandidate) || metaSource;
  const ogDescriptionClamped = clampForBudget(socialSource, lang, 'ogDescription');
  const twitterDescriptionClamped = clampForBudget(socialSource, lang, 'twitterDescription');

  const brandedTitle = `${title}${getTitleSeparator(lang)}${siteTitle}`;
  const imageAltClamped = clampForBudget(brandedTitle, lang, 'imageAlt');

  const jsonLdHeadline = truncateHeadline(title);

  const surfaces: SeoClampedSurfaces = {
    pageTitle,
    ogTitleClamped,
    twitterTitleClamped,
    metaDescriptionClamped,
    ogDescriptionClamped,
    twitterDescriptionClamped,
    imageAltClamped,
    jsonLdHeadline,
  };

  // Schema.org's `NewsArticle.alternativeHeadline` carries the long-form
  // variant of `headline`. It is only worth emitting when truncation
  // removed more than a handful of characters; the 5-char threshold
  // avoids trivially redundant pairs where only trailing whitespace or
  // punctuation was trimmed.
  const fullTitle = title.trim();
  const droppedChars = fullTitle.length - jsonLdHeadline.length;
  if (droppedChars > 5) {
    return { ...surfaces, alternativeHeadline: fullTitle };
  }
  return surfaces;
}
 
/**
 * Render the full article HTML document with the shared chrome.
 *
 * The document consists of the `<head>` (SEO/OG/Twitter meta, hreflang
 * and RSS alternates, icons, freshness tags, a single JSON-LD script
 * holding the `NewsArticle` and `BreadcrumbList` nodes), the site
 * header and page banner, the article navigation, the optional
 * table of contents, the article hero and body, and the site footer.
 *
 * Every caller-supplied value interpolated into markup is passed through
 * `escapeHTML`, including the run date and the canonical URL (which
 * embeds the caller-supplied slug). Values placed in JSON-LD are
 * serialized with `JSON.stringify` and have `<` rewritten to `\u003c` so
 * the payload cannot close the surrounding `<script>` element.
 *
 * @param options - {@link WrapArticleOptions} describing the article and its
 *                  rendered body content
 * @returns Complete `<!DOCTYPE html>` document ready to be written to disk
 */
export function wrapArticleHtml(options: WrapArticleOptions): string {
  // Unknown language codes are rendered as English rather than rejected.
  const safeLang = ALL_LANGUAGES.includes(options.lang) ? options.lang : ('en' as LanguageCode);
  const dir = getTextDirection(safeLang);
  const siteTitle = getLocalizedString(PAGE_TITLES, safeLang).split(' - ')[0] ?? SITE_NAME;
  const skipLinkText = getLocalizedString(SKIP_LINK_TEXTS, safeLang);
  const canonicalUrl = `${BASE_URL}/news/${getArticleFilename(options.articleSlug, safeLang)}`;
  // Markup-safe variants of the two caller-derived values that are
  // interpolated into attributes/text below. The raw values are still
  // used for JSON-LD, where `JSON.stringify` does the encoding.
  const safeCanonicalUrl = escapeHTML(canonicalUrl);
  const safeDate = escapeHTML(options.date);
  const safeSiteName = escapeHTML(SITE_NAME);
  const indexHref = safeLang === 'en' ? '../index.html' : `../index-${safeLang}.html`;
  const hreflangLinks = buildArticleHreflangLinks(options.articleSlug);
  const langSwitcher = buildLanguageSwitcher(options.articleSlug, safeLang);
  const sourceMdLabel = getLocalizedString(VIEW_SOURCE_MARKDOWN_LABELS, safeLang);
  const articleNavLabel = getLocalizedString(ARTICLE_NAV_LABELS, safeLang);
  const backToNewsLabel = getLocalizedString(BACK_TO_NEWS_LABELS, safeLang);
  const politicalIntelligenceLabel = getLocalizedString(
    FOOTER_POLITICAL_INTELLIGENCE_LABELS,
    safeLang
  );
  const sitemapLabel = getLocalizedString(FOOTER_SITEMAP_LABELS, safeLang);
  const politicalIntelligenceHref = `../${getPoliticalIntelligenceFilename(safeLang)}`;
  const sitemapHref = `../${getSitemapFilename(safeLang)}`;
  const sourceMdHref = options.sourceMarkdownRelPath ? blobUrl(options.sourceMarkdownRelPath) : '';
  const sourceMdLink = options.sourceMarkdownRelPath
    ? `<p class="article-source-md"><a href="${escapeHTML(sourceMdHref)}" rel="alternate" type="text/markdown"><svg class="icon icon-inline" width="16" height="16" viewBox="0 0 24 24" role="img" aria-hidden="true" focusable="false"><path d="M9 5H7a2 2 0 0 0-2 2v10a2 2 0 0 0 2 2h10a2 2 0 0 0 2-2v-2M12 3h6a2 2 0 0 1 2 2v6M10 14 20 4" fill="none" stroke="currentColor" stroke-width="1.8" stroke-linecap="round" stroke-linejoin="round"/></svg> ${escapeHTML(sourceMdLabel)}</a></p>`
    : '';
  const tocHtml = buildArticleToc(options.toc ?? [], safeLang);
  const articleMainClass = tocHtml.length > 0 ? 'article-main--with-toc' : 'article-main--no-toc';

  const articleSectionLabel = getLocalizedArticleTypePlain(options.articleType, safeLang);
  const disclosureBody = buildProgressiveDisclosureBody(options.body, safeLang);
  // Only an explicit `false` opts out of the reader-friendly transform.
  const transformedBodyHtml =
    options.readerFriendly === false
      ? disclosureBody.bodyHtml
      : applyReaderFriendlyTransform(disclosureBody.bodyHtml);

  // JSON-LD `wordCount` (Google's NewsArticle structured-data validator
  // emits a warning when this is missing) is the sum of the per-layer
  // word counts reported by the progressive-disclosure builder.
  const wordCount =
    disclosureBody.wordCounts.quick +
    disclosureBody.wordCounts.analysis +
    disclosureBody.wordCounts.intelligence;
  const readingTimes = options.readingTimes ?? buildLayerReadingTimes(disclosureBody.wordCounts);
  const disclosureLabels = getLocalizedString(PROGRESSIVE_DISCLOSURE_LABELS, safeLang);
  const min = disclosureLabels.minutesAbbr;
  const readingTimeLine = `⏱️ ${disclosureLabels.quickRead}: ${readingTimes.quickRead}${min} · ${disclosureLabels.fullAnalysis}: ${readingTimes.fullAnalysis}${min} · ${disclosureLabels.completeIntelligence}: ${readingTimes.completeIntelligence}${min}`;

  // Pre-compute the per-surface SEO-budget-clamped variants of title
  // and description. Each surface gets its own clamp tuned to the
  // documented platform envelope (Google/Bing SERP, Facebook/LinkedIn
  // OG, Twitter card) and the script family (Latin / CJK / RTL —
  // CJK glyphs render at ~2× Latin pixel width, so the same byte
  // count occupies twice the SERP width). See
  // `src/aggregator/metadata/seo-budgets.ts` for the budget table and
  // `analysis/methodologies/seo-headers-policy.md` § 1.1 for the
  // documented sources of every cap.
  const seoClamps = computeSeoClamps(options, safeLang, siteTitle);
  const {
    pageTitle,
    ogTitleClamped,
    twitterTitleClamped,
    metaDescriptionClamped,
    ogDescriptionClamped,
    twitterDescriptionClamped,
    imageAltClamped,
    jsonLdHeadline,
    alternativeHeadline,
  } = seoClamps;

  // Build the JSON-LD image graph. Google requires NewsArticle.image
  // to be an array (or single ImageObject) with explicit width/height
  // covering at least one of the 1:1, 4:3, 16:9 aspect ratios for
  // Top Stories carousel eligibility.
  const jsonLdImages = [
    {
      '@type': 'ImageObject',
      url: `${BASE_URL}/images/og-image-1200.jpg`,
      width: 1200,
      height: 630,
    },
    {
      '@type': 'ImageObject',
      url: `${BASE_URL}/images/og-image-1200.webp`,
      width: 1200,
      height: 630,
    },
    {
      '@type': 'ImageObject',
      url: `${BASE_URL}/images/og-image-1200.avif`,
      width: 1200,
      height: 630,
    },
  ];
  const sanitizedMentions = (options.mentions ?? [])
    .map((name) => sanitizeMentionName(name))
    .filter(Boolean);

  // Normalize keywords once so the `<meta name="keywords">` tag and the
  // JSON-LD `keywords` string always agree (trimmed, blanks removed).
  const keywords = (options.keywords ?? []).map((keyword) => keyword.trim()).filter(Boolean);

  const jsonLd = {
    '@context': 'https://schema.org',
    '@type': 'NewsArticle',
    headline: jsonLdHeadline,
    ...(alternativeHeadline ? { alternativeHeadline } : {}),
    description: metaDescriptionClamped,
    datePublished: options.date,
    dateModified: options.date,
    inLanguage: safeLang,
    url: canonicalUrl,
    mainEntityOfPage: { '@type': 'WebPage', '@id': canonicalUrl },
    image: jsonLdImages,
    author: {
      '@type': 'NewsMediaOrganization',
      name: PUBLISHER_NAME,
      url: 'https://hack23.com',
      sameAs: [...ORG_SAME_AS],
    },
    publisher: {
      '@type': 'NewsMediaOrganization',
      name: PUBLISHER_NAME,
      url: 'https://hack23.com',
      logo: { '@type': 'ImageObject', url: `${BASE_URL}/images/apple-touch-icon.png` },
      sameAs: [...ORG_SAME_AS],
    },
    articleSection: articleSectionLabel,
    wordCount,
    keywords: keywords.join(', '),
    speakable: {
      '@type': 'SpeakableSpecification',
      cssSelector: ['.article-dek', '.article-body > p:first-of-type'],
    },
    isPartOf: {
      '@type': 'WebSite',
      name: SITE_NAME,
      url: BASE_URL,
    },
    ...(options.isBasedOn && options.isBasedOn.length > 0
      ? {
          isBasedOn: options.isBasedOn.map((url) => ({ '@type': 'CreativeWork', url })),
        }
      : {}),
    ...(sanitizedMentions.length > 0
      ? {
          mentions: sanitizedMentions.map((name) => ({
            '@type': 'Organization',
            name,
          })),
        }
      : {}),
  };

  const breadcrumbLd = {
    '@context': 'https://schema.org',
    '@type': 'BreadcrumbList',
    itemListElement: [
      {
        '@type': 'ListItem',
        position: 1,
        name: SITE_NAME,
        item: BASE_URL,
      },
      {
        '@type': 'ListItem',
        position: 2,
        name: articleSectionLabel,
        item: `${BASE_URL}/news/`,
      },
      {
        '@type': 'ListItem',
        position: 3,
        name: options.title,
        item: canonicalUrl,
      },
    ],
  };

  const structuredData = [jsonLd, breadcrumbLd];
  // Escaping `<` keeps any `</script>` or `<!--` sequence inside the data
  // from terminating or corrupting the inline script element.
  const jsonLdString = JSON.stringify(structuredData).replace(/</g, '\\u003c');

  const keywordsMeta =
    keywords.length > 0
      ? `  <meta name="keywords" content="${escapeHTML(keywords.join(', '))}">\n`
      : '';
  const ogLocaleTags = buildOgLocaleTags(safeLang);
  const twitterAttribution = buildTwitterAttributionTags();
  const twitterAttributionBlock = twitterAttribution ? `\n${twitterAttribution}` : '';

  const header = buildSiteHeader({
    lang: safeLang,
    pathPrefix: '../',
    homeHref: indexHref,
    siteTitle,
    languageSwitcherHtml: langSwitcher,
  });

  return `<!DOCTYPE html>
<html lang="${safeLang}" dir="${dir}">
<head>
  <meta charset="UTF-8">
  <meta name="viewport" content="width=device-width, initial-scale=1.0">
  <meta http-equiv="X-Content-Type-Options" content="nosniff">
  <meta http-equiv="Content-Language" content="${safeLang}">
  <meta name="referrer" content="no-referrer">
  <title>${escapeHTML(pageTitle)}</title>
  <meta name="description" content="${escapeHTML(metaDescriptionClamped)}">
${keywordsMeta}  <meta name="robots" content="index, follow, max-snippet:-1, max-image-preview:large">
  <meta name="author" content="${PUBLISHER_NAME}">
  <meta name="publisher" content="${PUBLISHER_NAME}">
  <meta name="date" content="${safeDate}">
  <meta property="article:published_time" content="${safeDate}">
  <meta property="article:modified_time" content="${safeDate}">
  <meta property="article:section" content="${escapeHTML(articleSectionLabel)}">
  <meta property="article:author" content="${PUBLISHER_NAME}">
  <meta property="article:publisher" content="https://hack23.com">
  <link rel="canonical" href="${safeCanonicalUrl}">
${hreflangLinks}
  ${buildRssAlternateLink(safeLang, `${BASE_URL}/`)}
  <link rel="preconnect" href="https://hack23.com" crossorigin>
  <meta property="og:type" content="article">
  <meta property="og:title" content="${escapeHTML(ogTitleClamped)}">
  <meta property="og:description" content="${escapeHTML(ogDescriptionClamped)}">
  <meta property="og:url" content="${safeCanonicalUrl}">
  <meta property="og:site_name" content="${safeSiteName}">
${ogLocaleTags}
${buildResponsiveSocialImageMeta(imageAltClamped)}
  <meta name="twitter:card" content="summary_large_image">
  <meta name="twitter:title" content="${escapeHTML(twitterTitleClamped)}">
  <meta name="twitter:description" content="${escapeHTML(twitterDescriptionClamped)}">${twitterAttributionBlock}
${buildResponsiveIconLinks('../')}
  <link rel="manifest" href="../site.webmanifest">
  <meta name="color-scheme" content="light dark">
  <meta name="theme-color" content="#003399" media="(prefers-color-scheme: light)">
  <meta name="theme-color" content="#0a1a38" media="(prefers-color-scheme: dark)">
  <link rel="stylesheet" href="../styles.css?v=${BUILD_SHORT}">
${buildHeadFreshnessTags('../')}
  <script type="application/ld+json">${jsonLdString}</script>
  <script type="module" src="../js/mermaid-init.js?v=${MERMAID_VERSION}" defer></script>
  <script src="../js/article-runtime.js" defer></script>
</head>
<body>
  <a href="#main" class="skip-link">${escapeHTML(skipLinkText)}</a>
  <div class="reading-progress" aria-hidden="true"></div>
 
  ${header}
 
  ${buildPageBanner('../')}
 
  <main id="main" class="site-main article-main ${articleMainClass}">
    <nav class="article-top-nav" aria-label="${escapeHTML(articleNavLabel)}">
      <a class="article-top-nav__link article-top-nav__link--primary" href="${indexHref}">${escapeHTML(backToNewsLabel)}</a>
      <a class="article-top-nav__link" href="${politicalIntelligenceHref}">🧠 ${escapeHTML(politicalIntelligenceLabel)}</a>
      <a class="article-top-nav__link" href="${sitemapHref}">🗺️ ${escapeHTML(sitemapLabel)}</a>
    </nav>
${tocHtml}    <article class="article-body" lang="${safeLang}">
      <header class="article-hero">
        <p class="article-kicker">${escapeHTML(getLocalizedArticleType(options.articleType, safeLang))}</p>
        <h1>${escapeHTML(options.title)}</h1>
        <p class="article-dek">${escapeHTML(options.description)}</p>
        <p class="article-reading-times" aria-label="${escapeHTML(disclosureLabels.readingTimeAria)}">${escapeHTML(readingTimeLine)}</p>
        <p class="article-meta"><time datetime="${safeDate}">${safeDate}</time> · ${safeSiteName}</p>
      </header>
      ${sourceMdLink}
      ${transformedBodyHtml}
    </article>
  </main>
 
  ${buildSiteFooter({ lang: safeLang, pathPrefix: '../', ...(typeof options.articleCount === 'number' ? { articleCount: options.articleCount } : {}) })}
</body>
</html>`;
}