progress and add typing extensions

2023-06-22 17:45:15 +02:00 · 2023-06-22 17:45:15 +02:00 · a24224c6ee
commit a24224c6ee
parent 23d8702dbe
4 changed files with 73 additions and 47 deletions
--- a/poetry.lock
+++ b/poetry.lock
@ -103,6 +103,17 @@ files = [
    {file = "text_unidecode-1.3-py2.py3-none-any.whl", hash = "sha256:1311f10e8b895935241623731c2ba64f4c455287888b18189350b67134a822e8"},
 ]
 [[package]]
 name = "typing-extensions"
 version = "4.6.3"
 description = "Backported and Experimental Type Hints for Python 3.7+"
 optional = false
 python-versions = ">=3.7"
 files = [
    {file = "typing_extensions-4.6.3-py3-none-any.whl", hash = "sha256:88a4153d8505aabbb4e13aacb7c486c2b4a33ca3b3f807914a9b4c844c471c26"},
    {file = "typing_extensions-4.6.3.tar.gz", hash = "sha256:d91d5919357fe7f681a9f2b5b4cb2a5f1ef0a1e9f59c4d8ff0d3491e05c0ffd5"},
 ]
 [[package]]
 name = "unidecode"
 version = "1.3.6"
@ -117,4 +128,4 @@ files = [
 [metadata]
 lock-version = "2.0"
 python-versions = "^3.9"
-content-hash = "b2f6a06875c1c40404e891bf9765fab11ecf7fbf04a486962c27f71b3084857a"
+content-hash = "aa57e8d6b431eddf09f5e5fe90196a965781c9b020aeb0d8ac3b7c5bd34a51a4"
--- a/pyproject.toml
+++ b/pyproject.toml
@ -27,6 +27,7 @@ pyyaml = "^6.0"
 python-slugify = {extras = ["unidecode"], version = "^8.0.1"}
 pymysql = "^1.0.3"
 peewee = "^3.16.2"
 typing-extensions = "^4.6.3"
 [tool.poetry.scripts]
 spip2md = "spip2md.lib:cli"
--- a/spip2md/convert.py
+++ b/spip2md/convert.py
@ -19,6 +19,7 @@ and methods to convert them to Markdown + YAML, static site structure
 """
 import logging
 from os.path import basename, splitext
 from typing_extensions import Self
 from slugify import slugify
@ -35,22 +36,6 @@ from spip2md.spip_models import (
 )
 # Unique Spip object ID
 class ObjId:
    _id: int
    _type: type
    def __init__(self, obj_id: int, type_string: str) -> None:
        self._id = obj_id
        self._type_str = type_string
    def __hash__(self):
        return hash((self._id, self._type_str))
    def __eq__(self, other: "ObjId"):
        return (self._id, self._type_str) == (other._id, other._type_str)
 class ConvertableDocument:
    _log_c: logging.Logger  # Logger for conversion operations
    _cfg: Configuration  # Global configuration
@ -58,6 +43,7 @@ class ConvertableDocument:
    # Converted fields
    _src: str  # URL
    _slug: str = ""  # URL
    _id: int
    class Meta:
        table_name: str = "spip_document"  # Define the name of the Spip DB table
@ -80,18 +66,17 @@ class ConvertableRedactional:
    _cfg: Configuration  # Global configuration
    _spip_obj: SpipArticles | SpipRubriques  # The Spip Article this is representing
    _depth: int  # Depth
-    _children: dict[
+    _children: dict[tuple[str, int], ConvertableDocument] = {}  # Children
        ObjId, "ConvertableDocument | ConvertableRedactional"
    ] = {}  # documents
    _index: dict[ObjId, ObjId] = {}  # Index of the next-hop subsection to ObjId obj
    _id: int
    _lang: str
    _authors: tuple[SpipAuteurs, ...]
    _tags: tuple[SpipMots, ...]
    # Initialize documents related to self
-    def documents(self, limit: int = 10**3) -> dict[ObjId, ConvertableDocument]:
+    def documents(
-        print(
+        self, limit: int = 10**3
    ) -> dict[tuple[str, int], ConvertableDocument]:
        self._log_c.debug(
            "Initialize documents.\n"
            + f"Section: {self._spip_obj.titre}, Depth : {self._depth}"
        )
@ -108,11 +93,11 @@ class ConvertableRedactional:
            )
        ]
        # Store them mutably
-        return {ObjId(d._id, "document"): d for d in documents}
+        return {("document", d._id): d for d in documents}
    # Initialize self authors
    def authors(self) -> tuple[SpipAuteurs, ...]:
-        print("Initialize authors")
+        self._log_c.debug("Initialize authors")
        return (
            SpipAuteurs.select()
            .join(
@ -124,7 +109,7 @@ class ConvertableRedactional:
    # Initialize self tags
    def tags(self) -> tuple[SpipMots]:
-        print("Initialize tags")
+        self._log_c.debug("Initialize tags")
        return (
            SpipMots.select()
            .join(
@ -137,7 +122,6 @@ class ConvertableRedactional:
 class ConvertableArticle(ConvertableRedactional):
    _fileprefix: str = "index"
    _children: dict[ObjId, ConvertableDocument] = {}  # documents
    # Converted fields
    _surtitle: str  # Content
    _title: str  # Content
@ -161,21 +145,29 @@ class ConvertableArticle(ConvertableRedactional):
        self._draft = spip_obj.statut != "publie"
        self._children |= self.documents()  # Retreive documents & add them to the index
    # Return children and itself in order to be indexed by the parent
    def index(
        self,
    ) -> dict[tuple[str, int], tuple[str, int]]:
        return {child_key: ("article", self._id) for child_key in self._children}
 # Define Section as an Article that can contain other Articles or Sections
 class ConvertableSection(ConvertableRedactional):
    _fileprefix: str = "_index"  # Prefix of written Markdown files
    # sub-sections, documents, articles
    _children: dict[
-        ObjId, "ConvertableSection | ConvertableArticle | ConvertableDocument"
+        tuple[str, int], "ConvertableSection | ConvertableArticle | ConvertableDocument"
    ] = {}
    # Routing table to objects
    _index: dict[tuple[str, int], tuple[str, int]] = {}
    class Meta:
        table_name: str = "spip_rubriques"  # Define the name of the Spip DB table
    # Get articles of this section
    def articles(self, limit: int = 10**6):
-        print(
+        self._log_c.debug(
            "Initialize articles.\n"
            + f"Section: {self._spip_obj.titre}, Depth : {self._depth}"
        )
@ -188,18 +180,17 @@ class ConvertableSection(ConvertableRedactional):
                .limit(limit)
            )
        ]
-        # Add these articles children to self index
+        # Add these articles and their children to self index
-        for art in articles:
+        for article in articles:
-            for doc in art._children:
+            self._index |= article.index()
                self._index[ObjId(doc._id, "document")] = ObjId(art._id, "article")
        # Store them mutably
-        return {ObjId(a._id, "article"): a for a in articles}
+        return {("article", art._id): art for art in articles}
    # Get subsections of this section
    def sections(self, limit: int = 10**6):
-        print(
+        self._log_c.debug(
-            "Initialize subsections.\n"
+            "Initialize subsections of\n"
-            + f"Section: {self._spip_obj.titre}, Depth : {self._depth}"
+            + f"section {self._spip_obj.titre} of depth {self._depth}"
        )
        sections = [
            ConvertableSection(sec, self._cfg, self._depth)
@ -211,10 +202,12 @@ class ConvertableSection(ConvertableRedactional):
            )
        ]
        # Add these sections’s indexes to self index, replacing next hop with section
-        for sec in sections:
+        for section in sections:
-            self._index |= {obj: ObjId(sec._id, "section") for obj in sec._index.keys()}
+            self._index |= {
                obj_key: ("section", section._id) for obj_key in section._index
            }
        # Store them mutably
-        return {ObjId(s._id, "section"): s for s in sections}
+        return {("section", sec._id): sec for sec in sections}
    def __init__(self, spip_obj: SpipRubriques, cfg: Configuration, parent_depth: int):
        self._log_c = logging.getLogger(cfg.name + ".convert.section")
@ -232,14 +225,14 @@ class ConvertableSection(ConvertableRedactional):
 class ConvertableSite:
    _log_c: logging.Logger  # Logger for conversion operations
    _cfg: Configuration  # Global configuration
-    _children: dict[ObjId, ConvertableSection] = {}  # Root sections
+    _children: dict[tuple[str, int], ConvertableSection] = {}  # Root sections
-    _index: dict[ObjId, ObjId] = {}  # Routing table to nested objects
+    _index: dict[tuple[str, int], tuple[str, int]] = {}  # Routing table to objects
    _id: int = 0  # Parent ID of root sections
    _depth: int = 0  # Depth
-    def sections(self) -> dict[ObjId, ConvertableSection]:
+    def sections(self) -> dict[tuple[str, int], ConvertableSection]:
-        print("Initialize ROOT sections")
+        self._log_c.debug("Initialize ROOT sections")
        # Get all sections of parentID root_id
        sections = [
            ConvertableSection(sec, self._cfg, self._depth)
@ -249,10 +242,15 @@ class ConvertableSite:
                .order_by(SpipRubriques.date.desc())
            )
        ]
        # Add these sections’s indexes to self index, replacing next hop with section
-        for sec in sections:
+        # do this while outputting it as the children
-            self._index |= {obj: ObjId(sec._id, "section") for obj in sec._index.keys()}
+        def sec_to_index(section: ConvertableSection):
-        return {ObjId(s._id, "section"): s for s in sections}
+            for obj_key in section._index:
                self._index[obj_key] = ("section", section._id)
            return ("section", section._id)
        return {sec_to_index(subsection): subsection for subsection in sections}
    def __init__(self, cfg: Configuration) -> None:
        self._log_c = logging.getLogger(cfg.name + ".convert.site")
--- a/spip2md/test.py
+++ b/spip2md/test.py
@ -0,0 +1,16 @@
 # File for test purposes, mainly in interactive python
 from spip2md.config import Configuration
 from spip2md.convert import (
    ConvertableSite,
 )
 from spip2md.spip_models import DB
 cfg = Configuration()  # Get the configuration
 DB.init(  # type: ignore
    cfg.db, host=cfg.db_host, user=cfg.db_user, password=cfg.db_pass
 )
 SITE = ConvertableSite(cfg)
 ID = ("document", 1293)