136 lines
3.7 KiB
Python
136 lines
3.7 KiB
Python
import lxml.etree as ET
|
|
from fastapi import APIRouter, FastAPI, Response
|
|
from fastapi.middleware.cors import CORSMiddleware
|
|
|
|
from formex_viewer.formex4 import FormexArticleConverter
|
|
from formex_viewer.main import (
|
|
CellarClient,
|
|
CellarIdentifier,
|
|
ContentType,
|
|
Language,
|
|
SystemName,
|
|
)
|
|
|
|
origins = [
|
|
"http://localhost:5173",
|
|
]
|
|
app = FastAPI()
|
|
app.add_middleware(
|
|
CORSMiddleware,
|
|
allow_origins=origins,
|
|
allow_credentials=True,
|
|
allow_methods=["*"],
|
|
allow_headers=["*"],
|
|
)
|
|
|
|
type CacheKey = tuple[str, Language]
|
|
|
|
CACHE: dict[CacheKey, str] = {}
|
|
|
|
|
|
def _get_fmx4_data(celex_id: str, language: Language) -> ET.Element:
|
|
"""
|
|
Fetch the FMX4 data from the server.
|
|
"""
|
|
|
|
if (celex_id, language) in CACHE:
|
|
return CACHE[(celex_id, language)]
|
|
|
|
client = CellarClient(language)
|
|
cellar_id = CellarIdentifier(
|
|
system_name=SystemName.CELEX,
|
|
system_id=celex_id,
|
|
)
|
|
fmx4_data = client.publication_text(cellar_id, ContentType.ZIP_FMX4)
|
|
|
|
xml = ET.fromstring(fmx4_data.encode("utf-8"))
|
|
CACHE[(celex_id, language)] = xml
|
|
|
|
return xml
|
|
|
|
|
|
api_router = APIRouter()
|
|
|
|
|
|
@api_router.get("/{celex_id}/articles")
|
|
def article_ids(celex_id: str, language: Language = Language.ENG):
|
|
"""
|
|
Fetch the article IDs from the server.
|
|
"""
|
|
xml = _get_fmx4_data(celex_id, language)
|
|
|
|
article_xpath = "//ARTICLE/@IDENTIFIER"
|
|
article_ids = xml.xpath(article_xpath)
|
|
article_ids = [int(article_id.lstrip("0")) for article_id in article_ids]
|
|
article_ids.sort()
|
|
return article_ids
|
|
|
|
|
|
@api_router.get("/{celex_id}/toc/{language}")
|
|
def toc(celex_id: str, language: Language = Language.ENG):
|
|
def _handle_division(division: ET.Element, level: int):
|
|
title = ti_el[0] if (ti_el := division.xpath("TITLE/TI//text()")) else ""
|
|
subtitle = sti_el[0] if (sti_el := division.xpath("TITLE/STI//text()")) else ""
|
|
|
|
subdivisions = []
|
|
for subdivision in division.xpath("DIVISION") or []:
|
|
subdivisions.append(_handle_division(subdivision, level + 1))
|
|
|
|
articles = []
|
|
for article in division.xpath("ARTICLE") or []:
|
|
art_id = article.get("IDENTIFIER")
|
|
if not art_id:
|
|
continue
|
|
art_title = ti_el[0] if (ti_el := article.xpath("TI.ART//text()")) else ""
|
|
art_subtitle = (
|
|
sti_el[0] if (sti_el := article.xpath("STI.ART//text()")) else ""
|
|
)
|
|
articles.append(
|
|
{
|
|
"id": int(art_id.lstrip("0")),
|
|
"type": "article",
|
|
"title": art_title,
|
|
"subtitle": art_subtitle,
|
|
}
|
|
)
|
|
|
|
return {
|
|
"type": "division",
|
|
"title": title,
|
|
"subtitle": subtitle,
|
|
"level": level,
|
|
"content": subdivisions + articles,
|
|
}
|
|
|
|
"""
|
|
Fetch the table of contents from the server.
|
|
"""
|
|
xml = _get_fmx4_data(celex_id, language)
|
|
toc = []
|
|
|
|
for division in xml.xpath("//ENACTING.TERMS/DIVISION"):
|
|
toc.append(_handle_division(division, 0))
|
|
|
|
return toc
|
|
|
|
|
|
@api_router.get("/{celex_id}/articles/{article_id}/{language}")
|
|
def article(celex_id: str, article_id: int, language: Language = Language.ENG):
|
|
"""
|
|
Fetch an article from the server.
|
|
"""
|
|
xml = _get_fmx4_data(celex_id, language)
|
|
|
|
article_xpath = "//ARTICLE"
|
|
articles = xml.xpath(article_xpath)
|
|
for article in articles:
|
|
num = article.get("IDENTIFIER").lstrip("0")
|
|
if num == str(article_id):
|
|
return Response(
|
|
FormexArticleConverter().convert_article(article),
|
|
media_type="text/html",
|
|
)
|
|
|
|
|
|
app.include_router(api_router, prefix="/api")
|