From faf9e3734ae700886e9b9ac71025e559ae77af13 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 25 Oct 2022 16:47:20 +0200
Subject: [PATCH 01/47] [skip ci] [WIP] Alternative Card implementation

This is a suggestion to address the issues discussed on #72

Description

The proposed model card implementation would allow users to dynamically
add sections or overwrite them.

This is not a complete implementation, but it already covers most of
the features we currently have and then some.

On top of these features, it would be possible to add more features like
creating a default Card with placeholders, just like the existing
template, or the possibility to delete existing sections or to retrieve
the result of a certain section.

Implementation

The underlying data structure consists of a dict and a Section
dataclass.

All data is stored in a _data attribute with the type dict[str,
Section]. The dataclass holds the section contents, i.e. the section
title, the section content, and subsections, which again have the same
type. It's thus a recursive data structure. Section title and dict key
are identical, which is mostly for convenience.

With this refactor, there are no separate data containers anymore for
eval results, template sections, extra sections, etc. They are all
treated the same.

IMHO, this greatly simplifies the code overall. The only complex
function that's left is the one needed to traverse the tree holding the
data, and even that is just 14 LOC.

Demo

To see how the new class can be used, take a look at the main function.
The resulting Card can be seen here:

https://huggingface.co/skops-ci/hf_hub_example-fcc0d6fe-d072-4f94-8fdb-6bf3bb917bca
---
 skops/card/_card_alternative.py | 361 ++++++++++++++++++++++++++++++++
 1 file changed, 361 insertions(+)
 create mode 100644 skops/card/_card_alternative.py
diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
new file mode 100644
index 00000000..656ae18c
--- /dev/null
+++ b/skops/card/_card_alternative.py
@@ -0,0 +1,361 @@
+from __future__ import annotations
+
+import re
+from dataclasses import dataclass, field
+from pathlib import Path
+from reprlib import Repr
+from typing import Any, Iterator, Protocol
+
+from huggingface_hub import CardData
+from sklearn.utils import estimator_html_repr
+from tabulate import tabulate  # type: ignore
+
+from skops.card._model_card import PlotSection, TableSection
+
+aRepr = Repr()
+aRepr.maxother = 79
+aRepr.maxstring = 79
+
+
+def split_subsection_names(key: str) -> list[str]:
+    return key.split("/")
+
+
+def _clean_table(table: str) -> str:
+    # replace line breaks "\n" with html tag <br />, however, leave end-of-line
+    # line breaks (eol_lb) intact
+    eol_lb = "|\n"
+    placeholder = "$%!?"  # arbitrary sting that never appears naturally
+    table = (
+        table.replace(eol_lb, placeholder)
+        .replace("\n", "<br />")
+        .replace(placeholder, eol_lb)
+    )
+    return table
+
+
+@dataclass
+class Section:
+    title: str
+    content: Formattable | str | None = None
+    subsections: dict[str, Section] = field(default_factory=dict)
+
+
+class Formattable(Protocol):
+    def format(self) -> str:
+        ...
+
+
+class Card:
+    @classmethod
+    def make_default(
+        cls, model, model_diagram: bool = True, metadata: CardData | None = None
+    ):
+        """Add a bunch of default sections, yet to be implemented"""
+        raise NotImplementedError
+
+    def __init__(
+        self, model, model_diagram: bool = True, metadata: CardData | None = None
+    ):
+        self.model = model
+        self.model_diagram = model_diagram
+        self.metadata = metadata or CardData()
+
+        self._data: dict[str, Section] = {}
+        self._metrics: dict[str, float | int] = {}
+        self._reset()
+
+    def _reset(self) -> None:
+        self._add_model(self.model)
+
+        model_file = self.metadata.to_dict().get("model_file")
+        if model_file:
+            self._add_get_started_code(model_file)
+
+        self._add_model_section()
+        self._add_hyperparams()
+
+    def add(self, **kwargs: str) -> "Card":
+        for key, val in kwargs.items():
+            self._add_single(key, val)
+        return self
+
+    def _add_single(self, key: str, val: Formattable | str) -> None:
+        section = self._data
+        *subsection_names, leaf_node_name = split_subsection_names(key)
+        for subsection_name in subsection_names:
+            section_maybe = section.get(subsection_name)
+
+            # there are already subsections
+            if section_maybe is not None:
+                section = section_maybe.subsections
+                continue
+
+            # no subsection, create
+            entry = Section(title=subsection_name)
+            section[subsection_name] = entry
+            section = entry.subsections
+
+        if leaf_node_name in section:
+            # entry exists, only overwrite content
+            section[leaf_node_name].content = val
+        else:
+            # entry does not exist, create a new one
+            section[leaf_node_name] = Section(title=leaf_node_name, content=val)
+
+    def _add_model(self, model) -> None:
+        model = getattr(self, "model", None)
+        if model is None:
+            return
+
+        model_str = self._strip_blank(repr(model))
+        model_repr = aRepr.repr(f"model={model_str},").strip('"').strip("'")
+        self._add_single("Model description", model_repr)
+
+    def _add_model_section(self) -> None:
+        if not self.model_diagram:
+            return
+
+        model_plot_div = re.sub(r"\n\s+", "", str(estimator_html_repr(self.model)))
+        if model_plot_div.count("sk-top-container") == 1:
+            model_plot_div = model_plot_div.replace(
+                "sk-top-container", 'sk-top-container" style="overflow: auto;'
+            )
+        self._add_single("Model Plot", model_plot_div)
+
+    def _add_hyperparams(self) -> None:
+        hyperparameter_dict = self.model.get_params(deep=True)
+        table = _clean_table(
+            tabulate(
+                list(hyperparameter_dict.items()),
+                headers=["Hyperparameter", "Value"],
+                tablefmt="github",
+            )
+        )
+        self._add_single("Model description/Training Procedure/Hyperparameters", table)
+
+    def add_plot(self, folded=False, **kwargs: str) -> "Card":
+        for plot_name, plot_path in kwargs.items():
+            section = PlotSection(alt_text=plot_name, path=plot_path, folded=folded)
+            self._add_single(plot_name, section)
+        return self
+
+    def add_table(self, folded: bool = False, **kwargs: dict["str", list[Any]]) -> Card:
+        for key, val in kwargs.items():
+            section = TableSection(table=val, folded=folded)
+            self._add_single(key, section)
+        return self
+
+    def add_metrics(self, **kwargs: int | float) -> "Card":
+        self._metrics.update(kwargs)
+        self._add_metrics(self._metrics)
+        return self
+
+    def _add_metrics(self, metrics: dict[str, float | int]) -> None:
+        table = tabulate(
+            list(metrics.items()),
+            headers=["Metric", "Value"],
+            tablefmt="github",
+        )
+        self._add_single("Model description/Evaluation Results", table)
+
+    def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
+        for key, val in metadata.to_dict().items() if metadata else {}:
+            if key == "widget":
+                yield "metadata.widget={...},"
+                continue
+
+            yield aRepr.repr(f"metadata.{key}={val},").strip('"').strip("'")
+
+    @staticmethod
+    def _strip_blank(text) -> str:
+        # remove new lines and multiple spaces
+        text = text.replace("\n", " ")
+        text = re.sub(r"\s+", r" ", text)
+        return text
+
+    def _generate_content(self, data, depth: int = 1) -> Iterator[str]:
+        for val in data.values():
+            title = f"{depth * '#'} {val.title}"
+            yield title
+
+            if isinstance(val.content, str):
+                yield val.content
+            elif val.content is not None:  # is Formattable
+                yield val.content.format()
+
+            if val.subsections:
+                yield from self._generate_content(val.subsections, depth=depth + 1)
+
+    def __str__(self) -> str:
+        return self.__repr__()
+
+    def __repr__(self) -> str:
+        metadata_repr = "\n".join(
+            "  " + line for line in self._generate_metadata(self.metadata)
+        )
+        content_repr = "\n\n".join(
+            "  " + line for line in self._generate_content(self._data)
+        )
+
+        complete_repr = "Card(\n"
+        if metadata_repr:
+            complete_repr += metadata_repr + "\n"
+        if content_repr:
+            complete_repr += content_repr + "\n"
+        complete_repr += ")"
+        return complete_repr
+
+    def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
+        lines = [
+            "import json",
+            "import pandas as pd",
+        ]
+        if file_name.endswith(".skops"):
+            lines += [
+                "from skops.io import load",
+                f'model = load("{file_name}")',
+            ]
+        else:  # pickle
+            lines += [
+                "import pickle",
+                f"with open('{file_name}') as f:",
+                indent + "model = pickle.load(f)",
+            ]
+
+        lines += [
+            'with open("config.json") as f:',
+            indent + "config = json.load(f)",
+            'clf.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))',
+        ]
+        self._add_single("How to Get Started with the Model", "\n".join(lines))
+
+    def _generate_card(self) -> Iterator[str]:
+        if self.metadata:
+            yield f"---\n{self.metadata.to_yaml()}\n---"
+
+        for line in self._generate_content(self._data):
+            yield "\n" + line
+
+    def save(self, path: str | Path) -> None:
+        """Save the model card.
+
+        This method renders the model card in markdown format and then saves it
+        as the specified file.
+
+        Parameters
+        ----------
+        path: str, or Path
+            Filepath to save your card.
+
+        Notes
+        -----
+        The keys in model card metadata can be seen `here
+        <https://huggingface.co/docs/hub/models-cards#model-card-metadata>`__.
+        """
+        with open(path, "w") as f:
+            f.write("\n".join(self._generate_card()))
+
+    def render(self) -> str:
+        """Render the final model card as a string.
+
+        Returns
+        -------
+        card : str
+            The rendered model card with all placeholders filled and all extra
+            sections inserted.
+        """
+        return "\n".join(self._generate_card())
+
+
+def main():
+    import os
+    import pickle
+    import tempfile
+    from uuid import uuid4
+
+    import matplotlib.pyplot as plt
+    import sklearn
+    from huggingface_hub import HfApi
+    from sklearn.datasets import load_iris
+    from sklearn.linear_model import LogisticRegression
+    from sklearn.pipeline import Pipeline
+    from sklearn.preprocessing import StandardScaler
+
+    from skops import hub_utils
+    from skops.card import metadata_from_config
+
+    X, y = load_iris(return_X_y=True, as_frame=True)
+
+    model = Pipeline(
+        [("scaler", StandardScaler()), ("clf", LogisticRegression(random_state=123))]
+    ).fit(X, y)
+
+    pkl_file = tempfile.mkstemp(suffix=".pkl", prefix="skops-test")[1]
+    with open(pkl_file, "wb") as f:
+        pickle.dump(model, f)
+
+    with tempfile.TemporaryDirectory(prefix="skops-test") as destination_path:
+        hub_utils.init(
+            model=pkl_file,
+            requirements=[f"scikit-learn=={sklearn.__version__}"],
+            dst=destination_path,
+            task="tabular-classification",
+            data=X,
+        )
+        card = Card(model, metadata=metadata_from_config(destination_path))
+
+        # add a placeholder for figures
+        card.add(Plots="")
+
+        # add arbitrary sections, overwrite them, etc.
+        card.add(hi="howdy")
+        card.add(**{"parent section/child section": "child content"})
+        card.add(**{"foo": "bar", "spam": "eggs"})
+        # change content of "hi" section
+        card.add(**{"hi/german": "guten tag", "hi/french": "salut"})
+        card.add(**{"very/deeply/nested/section": "but why?"})
+
+        # add metrics
+        card.add_metrics(**{"acc": 0.1})
+
+        # insert the plot in the "Plot" section we inserted above
+        plt.plot([4, 5, 6, 7])
+        plt.savefig(Path(destination_path) / "fig1.png")
+        card.add_plot(**{"Plots/A beautiful plot": "fig1.png"})
+
+        # add table
+        table = {"split": [1, 2, 3], "score": [4, 5, 6]}
+        card.add_table(
+            folded=True,
+            **{"Model description/Training Procedure/Yet another table": table},
+        )
+
+        # more metrics
+        card.add_metrics(**{"f1": 0.2, "roc": 123})
+
+        # add content for "Model description" section, which has subsections but
+        # otherwise no content
+        card.add(**{"Model description": "This is a fantastic model"})
+
+        card.save(Path(destination_path) / "README.md")
+        print(destination_path)
+
+        # pushing to Hub
+        token = os.environ["HF_HUB_TOKEN"]
+        repo_name = f"hf_hub_example-{uuid4()}"
+        user_name = HfApi().whoami(token=token)["name"]
+        repo_id = f"{user_name}/{repo_name}"
+        print(f"Creating and pushing to repo: {repo_id}")
+        hub_utils.push(
+            repo_id=repo_id,
+            source=destination_path,
+            token=token,
+            commit_message="testing model cards",
+            create_remote=True,
+            private=False,
+        )
+
+
+if __name__ == "__main__":
+    main()

From cc229a209bfaf272242a656c9ebe9537db75afd1 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Mon, 31 Oct 2022 17:57:48 +0100
Subject: [PATCH 02/47] [WIP] Further align new model card design

Added a test that shows that the new card produces the same output as
the old card (except for a few non-deterministic parts). This includes
most of the idiosyncrasies of the old card we might want to change in
the future (e.g. inconsistent capitalization, use of empty lines). Some
of the more problematic behaviors of the old card class were, however,
fixed (e.g. creating an empty metrics table when there are no metrics).

The other tests have been reworked to use the new card features to make
them more precise. Often, that means that instead of having a very weak
test like "assert 'foo' in card.render()", it is now possible to select
the exact section and check that it equals the expected output.

This work is still unfinished; specifically, it still lacks tests for
the card repr and for the newly added features.
---
 skops/card/_card_alternative.py           | 174 ++++-
 skops/card/_model_card.py                 |  20 +-
 skops/card/default_template.md            |   2 +-
 skops/card/tests/test_card.py             |   2 +-
 skops/card/tests/test_card_alternative.py | 761 ++++++++++++++++++++++
 5 files changed, 913 insertions(+), 46 deletions(-)
 create mode 100644 skops/card/tests/test_card_alternative.py

diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index 656ae18c..8326c10f 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -1,6 +1,7 @@
 from __future__ import annotations
 
 import re
+import textwrap
 from dataclasses import dataclass, field
 from pathlib import Path
 from reprlib import Repr
@@ -17,6 +18,43 @@
 aRepr.maxstring = 79
 
 
+DEFAULT_TEMPLATE = {
+    "Model description": "[More Information Needed]",
+    "Model description/Intended uses & limitations": "[More Information Needed]",
+    "Model description/Training Procedure/Hyperparameters": """The model is trained with below hyperparameters.
+
+<details>
+<summary> Click to expand </summary>
+
+{{ hyperparameter_table }}
+
+</details>""",
+    "Model description/Training Procedure/Model Plot": "The model plot is below.",
+    "Model description/Evaluation Results": """You can find the details about evaluation process and the evaluation results.
+
+
+
+[More Information Needed]""",
+    "How to Get Started with the Model": """Use the code below to get started with the model.
+
+```python
+[More Information Needed]
+```""",
+    "Model Card Authors": """This model card is written by following authors:
+
+[More Information Needed]""",
+    "Model Card Contact": """You can contact the model card authors through following channels:
+[More Information Needed]""",
+    "Citation": """Below you can find information related to citation.
+
+**BibTeX:**
+```
+[More Information Needed]
+```
+""",
+}
+
+
 def split_subsection_names(key: str) -> list[str]:
     return key.split("/")
 
@@ -47,27 +85,24 @@ def format(self) -> str:
 
 
 class Card:
-    @classmethod
-    def make_default(
-        cls, model, model_diagram: bool = True, metadata: CardData | None = None
-    ):
-        """Add a bunch of default sections, yet to be implemented"""
-        raise NotImplementedError
-
     def __init__(
-        self, model, model_diagram: bool = True, metadata: CardData | None = None
+        self,
+        model,
+        model_diagram: bool = True,
+        metadata: CardData | None = None,
+        prefill: bool = True,
     ):
         self.model = model
         self.model_diagram = model_diagram
         self.metadata = metadata or CardData()
 
         self._data: dict[str, Section] = {}
-        self._metrics: dict[str, float | int] = {}
+        if prefill:
+            self._fill_default_sections()
+        self._metrics: dict[str, str | float | int] = {}
         self._reset()
 
     def _reset(self) -> None:
-        self._add_model(self.model)
-
         model_file = self.metadata.to_dict().get("model_file")
         if model_file:
             self._add_get_started_code(model_file)
@@ -75,14 +110,22 @@ def _reset(self) -> None:
         self._add_model_section()
         self._add_hyperparams()
 
+    def _fill_default_sections(self) -> None:
+        self.add(**DEFAULT_TEMPLATE)
+
     def add(self, **kwargs: str) -> "Card":
         for key, val in kwargs.items():
             self._add_single(key, val)
         return self
 
-    def _add_single(self, key: str, val: Formattable | str) -> None:
+    def _select(
+        self, subsection_names: list[str], create: bool = True
+    ) -> dict[str, Section]:
+        """TODO"""
         section = self._data
-        *subsection_names, leaf_node_name = split_subsection_names(key)
+        if not subsection_names:
+            return section
+
         for subsection_name in subsection_names:
             section_maybe = section.get(subsection_name)
 
@@ -91,10 +134,31 @@ def _add_single(self, key: str, val: Formattable | str) -> None:
                 section = section_maybe.subsections
                 continue
 
-            # no subsection, create
-            entry = Section(title=subsection_name)
-            section[subsection_name] = entry
-            section = entry.subsections
+            if create:
+                # no subsection, create
+                entry = Section(title=subsection_name)
+                section[subsection_name] = entry
+                section = entry.subsections
+            else:
+                raise KeyError(f"Section titles {subsection_name} does not exist")
+
+        return section
+
+    def select(self, key: str | list[str]) -> Section:
+        assert key  # TODO
+
+        if isinstance(key, str):
+            subsection_names = split_subsection_names(key)
+        else:
+            subsection_names = key
+
+        parent_section = self._select(subsection_names[:-1], create=False)
+        return parent_section[subsection_names[-1]]
+
+    def _add_single(self, key: str, val: Formattable | str) -> None:
+        section = self._data
+        *subsection_names, leaf_node_name = split_subsection_names(key)
+        section = self._select(subsection_names)
 
         if leaf_node_name in section:
             # entry exists, only overwrite content
@@ -121,7 +185,11 @@ def _add_model_section(self) -> None:
             model_plot_div = model_plot_div.replace(
                 "sk-top-container", 'sk-top-container" style="overflow: auto;'
             )
-        self._add_single("Model Plot", model_plot_div)
+        template = "The model plot is below.\n\n{}"
+        self._add_single(
+            "Model description/Training Procedure/Model Plot",
+            template.format(model_plot_div),
+        )
 
     def _add_hyperparams(self) -> None:
         hyperparameter_dict = self.model.get_params(deep=True)
@@ -132,12 +200,26 @@ def _add_hyperparams(self) -> None:
                 tablefmt="github",
             )
         )
-        self._add_single("Model description/Training Procedure/Hyperparameters", table)
+        template = textwrap.dedent(
+            """        The model is trained with below hyperparameters.
+
+        <details>
+        <summary> Click to expand </summary>
+
+        {}
+
+        </details>"""
+        )
+        self._add_single(
+            "Model description/Training Procedure/Hyperparameters",
+            template.format(table),
+        )
 
     def add_plot(self, folded=False, **kwargs: str) -> "Card":
-        for plot_name, plot_path in kwargs.items():
+        for section_name, plot_path in kwargs.items():
+            plot_name = split_subsection_names(section_name)[-1]
             section = PlotSection(alt_text=plot_name, path=plot_path, folded=folded)
-            self._add_single(plot_name, section)
+            self._add_single(section_name, section)
         return self
 
     def add_table(self, folded: bool = False, **kwargs: dict["str", list[Any]]) -> Card:
@@ -146,18 +228,25 @@ def add_table(self, folded: bool = False, **kwargs: dict["str", list[Any]]) -> C
             self._add_single(key, section)
         return self
 
-    def add_metrics(self, **kwargs: int | float) -> "Card":
+    def add_metrics(self, **kwargs: str | int | float) -> "Card":
         self._metrics.update(kwargs)
         self._add_metrics(self._metrics)
         return self
 
-    def _add_metrics(self, metrics: dict[str, float | int]) -> None:
+    def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
         table = tabulate(
             list(metrics.items()),
             headers=["Metric", "Value"],
             tablefmt="github",
         )
-        self._add_single("Model description/Evaluation Results", table)
+        template = textwrap.dedent(
+            """        You can find the details about evaluation process and the evaluation results.
+
+
+
+        {}"""
+        )
+        self._add_single("Model description/Evaluation Results", template.format(table))
 
     def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
         for key, val in metadata.to_dict().items() if metadata else {}:
@@ -174,7 +263,9 @@ def _strip_blank(text) -> str:
         text = re.sub(r"\s+", r" ", text)
         return text
 
-    def _generate_content(self, data, depth: int = 1) -> Iterator[str]:
+    def _generate_content(
+        self, data: dict[str, Section], depth: int = 1
+    ) -> Iterator[str]:
         for val in data.values():
             title = f"{depth * '#'} {val.title}"
             yield title
@@ -207,28 +298,41 @@ def __repr__(self) -> str:
         return complete_repr
 
     def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
-        lines = [
+        is_skops_format = file_name.endswith(".skops")  # else, assume pickle
+
+        lines = ["```python"]
+        if is_skops_format:
+            lines += ["from skops.io import load"]
+        else:
+            lines += ["import joblib"]
+
+        lines += [
             "import json",
             "import pandas as pd",
         ]
-        if file_name.endswith(".skops"):
+        if is_skops_format:
             lines += [
                 "from skops.io import load",
                 f'model = load("{file_name}")',
             ]
         else:  # pickle
-            lines += [
-                "import pickle",
-                f"with open('{file_name}') as f:",
-                indent + "model = pickle.load(f)",
-            ]
+            lines += [f"model = joblib.load({file_name})"]
 
         lines += [
             'with open("config.json") as f:',
             indent + "config = json.load(f)",
-            'clf.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))',
+            'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))',
+            "```",
         ]
-        self._add_single("How to Get Started with the Model", "\n".join(lines))
+        template = textwrap.dedent(
+            """        Use the code below to get started with the model.
+
+        {}
+        """
+        )
+        self._add_single(
+            "How to Get Started with the Model", template.format("\n".join(lines))
+        )
 
     def _generate_card(self) -> Iterator[str]:
         if self.metadata:
@@ -261,7 +365,7 @@ def render(self) -> str:
 
         Returns
         -------
-        card : str
+        result : str
             The rendered model card with all placeholders filled and all extra
             sections inserted.
         """
diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index c978e670..22f782e3 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -395,20 +395,20 @@ def _generate_card(self) -> ModelCard:
                     template_sections["get_started_code"] = (
                         "from skops.io import load\nimport json\n"
                         "import pandas as pd\n"
-                        f'clf = load("{model_file}")\n'
+                        f'model = load("{model_file}")\n'
                         'with open("config.json") as f:\n   '
                         " config ="
                         " json.load(f)\n"
-                        'clf.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))'
+                        'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))'
                     )
                 else:
                     template_sections["get_started_code"] = (
-                        "import joblib\nimport json\nimport pandas as pd\nclf ="
+                        "import joblib\nimport json\nimport pandas as pd\nmodel ="
                         f' joblib.load({model_file})\nwith open("config.json") as'
                         " f:\n   "
                         " config ="
                         " json.load(f)\n"
-                        'clf.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))'
+                        'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))'
                     )
         if self.model_diagram is True:
             model_plot_div = re.sub(r"\n\s+", "", str(estimator_html_repr(self.model)))
@@ -419,11 +419,13 @@ def _generate_card(self) -> ModelCard:
             model_plot: str | None = model_plot_div
         else:
             model_plot = None
-        template_sections["eval_results"] = tabulate(
-            list(self._eval_results.items()),
-            headers=["Metric", "Value"],
-            tablefmt="github",
-        )
+
+        if self._eval_results:  # only add metrics if there are any
+            template_sections["eval_results"] = tabulate(
+                list(self._eval_results.items()),
+                headers=["Metric", "Value"],
+                tablefmt="github",
+            )
 
         # if template path is not given, use default
         if template_sections.get("template_path") is None:
diff --git a/skops/card/default_template.md b/skops/card/default_template.md
index edbc8d49..91141dfe 100644
--- a/skops/card/default_template.md
+++ b/skops/card/default_template.md
@@ -29,7 +29,7 @@ The model plot is below.
 
 {{ model_plot }}
 
-## Evaluation Results
+## Evaluation Results
 
 You can find the details about evaluation process and the evaluation results.
 
diff --git a/skops/card/tests/test_card.py b/skops/card/tests/test_card.py
index e2ed4596..4cb6d4ec 100644
--- a/skops/card/tests/test_card.py
+++ b/skops/card/tests/test_card.py
@@ -222,7 +222,7 @@ def test_code_autogeneration_skops(
     filename = metadata["model_file"]
     with open(Path(destination_path) / "README.md") as f:
         read_buffer = f.read()
-        assert f'clf = load("{filename}")' in read_buffer
+        assert f'model = load("{filename}")' in read_buffer
 
         # test if the model doesn't overflow the huggingface models page
         assert read_buffer.count("sk-top-container") == 1
diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
new file mode 100644
index 00000000..b723b3e2
--- /dev/null
+++ b/skops/card/tests/test_card_alternative.py
@@ -0,0 +1,761 @@
+import copy
+import os
+import pickle
+import tempfile
+from itertools import zip_longest
+from pathlib import Path
+
+import matplotlib.pyplot as plt
+import numpy as np
+import pytest
+import sklearn
+from huggingface_hub import CardData, metadata_load
+from sklearn.datasets import load_iris
+from sklearn.linear_model import LinearRegression, LogisticRegression
+from sklearn.tree import DecisionTreeClassifier
+
+import skops
+from skops import hub_utils
+from skops.card import metadata_from_config
+from skops.card._card_alternative import Card
+from skops.card._model_card import PlotSection, TableSection
+from skops.io import dump
+
+
+def fit_model():
+    X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
+    y = np.dot(X, np.array([1, 2])) + 3
+    reg = LinearRegression().fit(X, y)
+    return reg
+
+
+@pytest.fixture
+def model_card(model_diagram=True):
+    model = fit_model()
+    card = Card(model, model_diagram)
+    yield card
+
+
+@pytest.fixture
+def iris_data():
+    X, y = load_iris(return_X_y=True, as_frame=True)
+    yield X, y
+
+
+@pytest.fixture
+def iris_estimator(iris_data):
+    X, y = iris_data
+    est = LogisticRegression(solver="liblinear").fit(X, y)
+    yield est
+
+
+@pytest.fixture
+def iris_pkl_file(iris_estimator):
+    fd, pkl_file = tempfile.mkstemp(suffix=".pkl", prefix="skops-test")
+    with open(fd, "wb") as f:  # open() takes ownership of fd and closes it
+        pickle.dump(iris_estimator, f)
+    yield pkl_file
+
+
+@pytest.fixture
+def iris_skops_file(iris_estimator):
+    skops_folder = tempfile.mkdtemp()
+    model_name = "model.skops"
+    skops_path = Path(skops_folder) / model_name
+    dump(iris_estimator, skops_path)
+    yield skops_path
+
+
+def _create_model_card_from_saved_model(
+    destination_path,
+    iris_estimator,
+    iris_data,
+    save_file,
+):
+    X, y = iris_data
+    hub_utils.init(
+        model=save_file,
+        requirements=[f"scikit-learn=={sklearn.__version__}"],
+        dst=destination_path,
+        task="tabular-classification",
+        data=X,
+    )
+    card = Card(iris_estimator, metadata=metadata_from_config(destination_path))
+    card.save(Path(destination_path) / "README.md")
+    return card
+
+
+@pytest.fixture
+def skops_model_card_metadata_from_config(
+    destination_path, iris_estimator, iris_skops_file, iris_data
+):
+    yield _create_model_card_from_saved_model(
+        destination_path, iris_estimator, iris_data, iris_skops_file
+    )
+
+
+@pytest.fixture
+def pkl_model_card_metadata_from_config(
+    destination_path, iris_estimator, iris_pkl_file, iris_data
+):
+    yield _create_model_card_from_saved_model(
+        destination_path, iris_estimator, iris_data, iris_pkl_file
+    )
+
+
+@pytest.fixture
+def destination_path():
+    with tempfile.TemporaryDirectory(prefix="skops-test") as dir_path:
+        yield Path(dir_path)
+
+
+def test_save_model_card(destination_path, model_card):
+    model_card.save(Path(destination_path) / "README.md")
+    assert (Path(destination_path) / "README.md").exists()
+
+
+def test_select_existing_section():
+    # TODO
+    pass
+
+
+def test_select_non_existing_section_raises():
+    # TODO
+    pass
+
+
+def test_hyperparameter_table(destination_path, model_card):
+    section_name = "Model description/Training Procedure/Hyperparameters"
+    text_hyperparams = model_card.select(section_name).content
+    expected = "\n".join(
+        [
+            "The model is trained with below hyperparameters.",
+            "",
+            "<details>",
+            "<summary> Click to expand </summary>",
+            "",
+            "| Hyperparameter   | Value      |",
+            "|------------------|------------|",
+            "| copy_X           | True       |",
+            "| fit_intercept    | True       |",
+            "| n_jobs           |            |",
+            "| normalize        | deprecated |",
+            "| positive         | False      |",
+            "",
+            "</details>",
+        ]
+    )
+    assert text_hyperparams == expected
+
+
+def _strip_multiple_chars(text, char):
+    # _strip_multiple_chars("hi    there", " ") == "hi there"
+    # _strip_multiple_chars("|---|--|", "-") == "|-|-|"
+    while char + char in text:
+        text = text.replace(char + char, char)
+    return text
+
+
+def test_hyperparameter_table_with_line_break(destination_path):
+    # Hyperparameters can contain values with line breaks, "\n", in them. In
+    # that case, the markdown table is broken. Check that the hyperparameter
+    # table we create properly replaces the "\n" with "<br />".
+    class EstimatorWithLbInParams:
+        def get_params(self, deep=False):
+            return {"fit_intercept": True, "n_jobs": "line\nwith\nbreak"}
+
+    model_card = Card(EstimatorWithLbInParams())
+    section_name = "Model description/Training Procedure/Hyperparameters"
+    text_hyperparams = model_card.select(section_name).content
+
+    # remove multiple whitespaces, as they're not important
+    text_cleaned = _strip_multiple_chars(text_hyperparams, " ")
+    assert "| n_jobs | line<br />with<br />break |" in text_cleaned
+
+
+def test_plot_model(destination_path, model_card):
+    text_plot = model_card.select(
+        "Model description/Training Procedure/Model Plot"
+    ).content
+    # don't compare whole text, as it's quite long and non-deterministic
+    assert text_plot.startswith("The model plot is below.\n\n<style>#sk-container-id")
+    assert "<style>" in text_plot
+    assert text_plot.endswith(
+        "<pre>LinearRegression()</pre></div></div></div></div></div>"
+    )
+
+
+def test_plot_model_false(destination_path, model_card):
+    model = fit_model()
+    model_card = Card(model, model_diagram=False)
+    text_plot = model_card.select(
+        "Model description/Training Procedure/Model Plot"
+    ).content
+    assert text_plot == "The model plot is below."
+
+
+def test_add_new_section(destination_path, model_card):
+    model_card = model_card.add(**{"A new section": "sklearn FTW"})
+    section = model_card.select("A new section")
+    assert section.content == "sklearn FTW"
+
+
+def test_add_content_to_existing_section(destination_path, model_card):
+    section = model_card.select("Model description")
+    num_subsection_before = len(section.subsections)
+
+    # add content to "Model description" section
+    model_card = model_card.add(**{"Model description": "sklearn FTW"})
+    section = model_card.select("Model description")
+    num_subsection_after = len(section.subsections)
+
+    assert num_subsection_before == num_subsection_after
+    assert section.content == "sklearn FTW"
+
+
+@pytest.mark.skip  # FIXME: remove
+def test_template_sections_not_mutated_by_save(destination_path, model_card):
+    template_sections_before = copy.deepcopy(model_card._template_sections)
+    model_card.save(Path(destination_path) / "README.md")
+    template_sections_after = copy.deepcopy(model_card._template_sections)
+    assert template_sections_before == template_sections_after
+
+
+def test_add_plot(destination_path, model_card):
+    plt.plot([4, 5, 6, 7])
+    plt.savefig(Path(destination_path) / "fig1.png")
+    model_card = model_card.add_plot(fig1="fig1.png")
+    plot_content = model_card.select("fig1").content.format()
+    assert plot_content == "![fig1](fig1.png)"
+
+
+@pytest.mark.skip  # FIXME: remove
+def test_temporary_plot(destination_path, model_card):
+    # test if the additions are made to a temporary template file
+    # and not to default template or template provided
+    root = skops.__path__
+    # read original template
+    with open(Path(root[0]) / "card" / "default_template.md") as f:
+        default_template = f.read()
+    plt.plot([4, 5, 6, 7])
+    plt.savefig(Path(destination_path) / "fig1.png")
+    model_card.add_plot(fig1="fig1.png")
+    model_card.save(Path(destination_path) / "README.md")
+    # check if default template is not modified
+    with open(Path(root[0]) / "card" / "default_template.md") as f:
+        default_template_post = f.read()
+    assert default_template == default_template_post
+
+
+def test_adding_metadata(destination_path, model_card):
+    # test if the metadata is added to the card
+    model_card.metadata.tags = "dummy"
+    metadata = list(model_card._generate_metadata(model_card.metadata))
+    assert len(metadata) == 1
+    assert metadata[0] == "metadata.tags=dummy,"
+
+
+@pytest.mark.xfail(reason="Waiting for update of model attribute")
+def test_override_model(model_card):
+    # test that the model can be overridden and dependent sections are updated
+    hyperparams_before = model_card.select(
+        "Model description/Training Procedure/Hyperparameters"
+    ).content
+    model_card.model = DecisionTreeClassifier()
+    hyperparams_after = model_card.select(
+        "Model description/Training Procedure/Hyperparameters"
+    ).content
+
+    assert hyperparams_before != hyperparams_after
+    assert "fit_intercept" not in hyperparams_before
+    assert "min_samples_leaf" in hyperparams_after
+
+
+def test_add_metrics(destination_path, model_card):
+    model_card.add_metrics(**{"acc": "0.1"})  # str
+    model_card.add_metrics(f1=0.1)  # float
+    model_card.add_metrics(awesomeness=123)  # int
+
+    eval_metric_content = model_card.select(
+        "Model description/Evaluation Results"
+    ).content
+    expected = "\n".join(
+        [
+            "| Metric      |   Value |",
+            "|-------------|---------|",
+            "| acc         |     0.1 |",
+            "| f1          |     0.1 |",
+            "| awesomeness |   123   |",
+        ]
+    )
+    assert eval_metric_content.endswith(expected)
+
+
+def test_code_autogeneration(destination_path, pkl_model_card_metadata_from_config):
+    # test if getting started code is automatically generated
+    metadata = metadata_load(local_path=Path(destination_path) / "README.md")
+    filename = metadata["model_file"]
+    with open(Path(destination_path) / "README.md") as f:
+        assert f"joblib.load({filename})" in f.read()
+
+
+def test_code_autogeneration_skops(
+    destination_path, skops_model_card_metadata_from_config
+):
+    # test if getting started code is automatically generated for skops format
+    metadata = metadata_load(local_path=Path(destination_path) / "README.md")
+    filename = metadata["model_file"]
+    with open(Path(destination_path) / "README.md") as f:
+        read_buffer = f.read()
+        assert f'model = load("{filename}")' in read_buffer
+
+        # test if the model doesn't overflow the huggingface models page
+        assert read_buffer.count("sk-top-container") == 1
+        assert 'style="overflow: auto;' in read_buffer
+
+
+def test_metadata_from_config_tabular_data(
+    pkl_model_card_metadata_from_config, destination_path
+):
+    # test if widget data is correctly set in the README
+    metadata = metadata_load(local_path=Path(destination_path) / "README.md")
+    assert "widget" in metadata
+
+    expected_data = {
+        "structuredData": {
+            "petal length (cm)": [1.4, 1.4, 1.3],
+            "petal width (cm)": [0.2, 0.2, 0.2],
+            "sepal length (cm)": [5.1, 4.9, 4.7],
+            "sepal width (cm)": [3.5, 3.0, 3.2],
+        }
+    }
+    assert metadata["widget"] == expected_data
+
+    for tag in ["sklearn", "skops", "tabular-classification"]:
+        assert tag in metadata["tags"]
+
+
+@pytest.mark.skip  # FIXME
+class TestCardRepr:
+    """Test __str__ and __repr__ methods of Card, which are identical for now"""
+
+    @pytest.fixture
+    def card(self):
+        model = LinearRegression(fit_intercept=False)
+        card = Card(model=model)
+        card.add(
+            model_description="A description",
+            model_card_authors="Jane Doe",
+        )
+        card.add_plot(
+            roc_curve="ROC_curve.png",
+            confusion_matrix="confusion_matrix.jpg",
+        )
+        card.add_table(search_results={"split": [1, 2, 3], "score": [4, 5, 6]})
+        return card
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_card_repr(self, card: Card, meth):
+        result = meth(card)
+        expected = (
+            "Card(\n"
+            "  model=LinearRegression(fit_intercept=False),\n"
+            "  model_description='A description',\n"
+            "  model_card_authors='Jane Doe',\n"
+            "  roc_curve='ROC_curve.png',\n"
+            "  confusion_matrix='confusion_matrix.jpg',\n"
+            "  search_results=Table(3x2),\n"
+            ")"
+        )
+        assert result == expected
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_very_long_lines_are_shortened(self, card: Card, meth):
+        card.add(my_section="very long line " * 100)
+        result = meth(card)
+        expected = (
+            "Card(\n  model=LinearRegression(fit_intercept=False),\n"
+            "  model_description='A description',\n  model_card_authors='Jane Doe',\n"
+            "  my_section='very long line very lon...line very long line very long line"
+            " ',\n"
+            "  roc_curve='ROC_curve.png',\n"
+            "  confusion_matrix='confusion_matrix.jpg',\n"
+            "  search_results=Table(3x2),\n"
+            ")"
+        )
+        assert result == expected
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_without_model_attribute(self, card: Card, meth):
+        del card.model
+        result = meth(card)
+        expected = (
+            "Card(\n"
+            "  model_description='A description',\n"
+            "  model_card_authors='Jane Doe',\n"
+            "  roc_curve='ROC_curve.png',\n"
+            "  confusion_matrix='confusion_matrix.jpg',\n"
+            "  search_results=Table(3x2),\n"
+            ")"
+        )
+        assert result == expected
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_no_template_sections(self, card: Card, meth):
+        card._template_sections = {}  # type: ignore
+        result = meth(card)
+        expected = (
+            "Card(\n"
+            "  model=LinearRegression(fit_intercept=False),\n"
+            "  roc_curve='ROC_curve.png',\n"
+            "  confusion_matrix='confusion_matrix.jpg',\n"
+            "  search_results=Table(3x2),\n"
+            ")"
+        )
+        assert result == expected
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_no_extra_sections(self, card: Card, meth):
+        card._extra_sections = []  # type: ignore
+        result = meth(card)
+        expected = (
+            "Card(\n"
+            "  model=LinearRegression(fit_intercept=False),\n"
+            "  model_description='A description',\n"
+            "  model_card_authors='Jane Doe',\n"
+            ")"
+        )
+        assert result == expected
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_template_section_val_not_str(self, card: Card, meth):
+        card._template_sections["model_description"] = [1, 2, 3]  # type: ignore
+        result = meth(card)
+        expected = (
+            "Card(\n"
+            "  model=LinearRegression(fit_intercept=False),\n"
+            "  model_description=[1, 2, 3],\n"
+            "  model_card_authors='Jane Doe',\n"
+            "  roc_curve='ROC_curve.png',\n"
+            "  confusion_matrix='confusion_matrix.jpg',\n"
+            "  search_results=Table(3x2),\n"
+            ")"
+        )
+        assert result == expected
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_extra_sections_val_not_str(self, card: Card, meth):
+        card._extra_sections.append(("some section", {1: 2}))  # type: ignore
+        result = meth(card)
+        expected = (
+            "Card(\n"
+            "  model=LinearRegression(fit_intercept=False),\n"
+            "  model_description='A description',\n"
+            "  model_card_authors='Jane Doe',\n"
+            "  roc_curve='ROC_curve.png',\n"
+            "  confusion_matrix='confusion_matrix.jpg',\n"
+            "  search_results=Table(3x2),\n"
+            "  some section={1: 2},\n"
+            ")"
+        )
+        assert result == expected
+
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_with_metadata(self, card: Card, meth):
+        metadata = CardData(
+            language="fr",
+            license="bsd",
+            library_name="sklearn",
+            tags=["sklearn", "tabular-classification"],
+            foo={"bar": 123},
+            widget={"something": "very-long"},
+        )
+        card.metadata = metadata
+        expected = (
+            "Card(\n"
+            "  model=LinearRegression(fit_intercept=False),\n"
+            "  metadata.language=fr,\n"
+            "  metadata.license=bsd,\n"
+            "  metadata.library_name=sklearn,\n"
+            "  metadata.tags=['sklearn', 'tabular-classification'],\n"
+            "  metadata.foo={'bar': 123},\n"
+            "  metadata.widget={...},\n"
+            "  model_description='A description',\n"
+            "  model_card_authors='Jane Doe',\n"
+            "  roc_curve='ROC_curve.png',\n"
+            "  confusion_matrix='confusion_matrix.jpg',\n"
+            "  search_results=Table(3x2),\n"
+            ")"
+        )
+        result = meth(card)
+        assert result == expected
+
+
+class TestPlotSection:
+    def test_format_path_is_str(self):
+        section = PlotSection(alt_text="some title", path="path/plot.png")
+        expected = "![some title](path/plot.png)"
+        assert section.format() == expected
+
+    def test_format_path_is_pathlib(self):
+        section = PlotSection(alt_text="some title", path=Path("path") / "plot.png")
+        expected = f"![some title](path{os.path.sep}plot.png)"
+        assert section.format() == expected
+
+    @pytest.mark.parametrize("meth", [str, repr])
+    def test_str_and_repr(self, meth):
+        section = PlotSection(alt_text="some title", path="path/plot.png")
+        expected = "'path/plot.png'"
+        assert meth(section) == expected
+
+    def test_str(self):
+        section = PlotSection(alt_text="some title", path="path/plot.png")
+        expected = "'path/plot.png'"
+        assert str(section) == expected
+
+    @pytest.mark.parametrize("folded", [True, False])
+    def test_folded(self, folded):
+        section = PlotSection(
+            alt_text="some title", path="path/plot.png", folded=folded
+        )
+        output = section.format()
+        if folded:
+            assert "<details>" in output
+        else:
+            assert "<details>" not in output
+
+
+class TestTableSection:
+    @pytest.fixture
+    def table_dict(self):
+        return {"split": [1, 2, 3], "score": [4, 5, 6]}
+
+    def test_table_is_dict(self, table_dict):
+        section = TableSection(table=table_dict)
+        expected = """|   split |   score |
+|---------|---------|
+|       1 |       4 |
+|       2 |       5 |
+|       3 |       6 |"""
+        assert section.format() == expected
+
+    def test_table_is_dataframe(self, table_dict):
+        pd = pytest.importorskip("pandas")
+        df = pd.DataFrame(table_dict)
+        section = TableSection(table=df)
+        expected = """|   split |   score |
+|---------|---------|
+|       1 |       4 |
+|       2 |       5 |
+|       3 |       6 |"""
+        assert section.format() == expected
+
+    @pytest.mark.parametrize("meth", [str, repr])
+    def test_str_and_repr_table_is_dict(self, table_dict, meth):
+        section = TableSection(table=table_dict)
+        expected = "Table(3x2)"
+        assert meth(section) == expected
+
+    @pytest.mark.parametrize("meth", [str, repr])
+    def test_str_and_repr_table_is_dataframe(self, table_dict, meth):
+        pd = pytest.importorskip("pandas")
+        df = pd.DataFrame(table_dict)
+        section = TableSection(table=df)
+        expected = "Table(3x2)"
+        assert meth(section) == expected
+
+    @pytest.mark.parametrize("table", [{}, {"col": []}, "pandas"])
+    def test_raise_error_empty_table(self, table):
+        # Test no columns, no rows, empty df
+        if table == "pandas":
+            pd = pytest.importorskip("pandas")
+            table = pd.DataFrame([])
+
+        msg = "Empty table added"
+        with pytest.raises(ValueError, match=msg):
+            TableSection(table=table)
+
+    def test_pandas_not_installed(self, table_dict, pandas_not_installed):
+        # use pandas_not_installed fixture from conftest.py to pretend that
+        # pandas is not installed
+        section = TableSection(table=table_dict)
+        assert section._is_pandas_df is False
+
+    @pytest.mark.parametrize("folded", [True, False])
+    def test_folded(self, table_dict, folded):
+        section = TableSection(table=table_dict, folded=folded)
+        output = section.format()
+        if folded:
+            assert "<details>" in output
+        else:
+            assert "<details>" not in output
+
+    def test_line_break_in_entry(self, table_dict):
+        # Line breaks are not allowed inside markdown tables, so check that
+        # they're removed. We test 3 conditions here:
+
+        # 1. custom object with line breaks in repr
+        # 2. string with line break in the middle
+        # 3. string with line break at start, middle, and end
+
+        # Note that for the latter, tabulate will automatically strip the line
+        # breaks from the start and end.
+        class LineBreakInRepr:
+            """Custom object whose repr has a line break"""
+
+            def __repr__(self) -> str:
+                return "obj\nwith lb"
+
+        table_dict["with break"] = [
+            LineBreakInRepr(),
+            "hi\nthere",
+            """
+entry with
+line breaks
+""",
+        ]
+        section = TableSection(table=table_dict)
+        expected = """| split | score | with break |
+|-|-|-|
+| 1 | 4 | obj<br />with lb |
+| 2 | 5 | hi<br />there |
+| 3 | 6 | entry with<br />line breaks |"""
+
+        result = section.format()
+        # remove multiple whitespaces and dashes, as they're not important
+        result = _strip_multiple_chars(result, " ")
+        result = _strip_multiple_chars(result, "-")
+        assert result == expected
+
+
+def make_card(card_type, file_path: Path, fill_content: bool = True):
+    """Create a model card for an iris pipeline and save it to ``file_path``.
+
+    ``card_type="old"`` uses the existing ``skops.card.Card``; any other value
+    uses the alternative ``Card``. With ``fill_content=True``, metrics, a plot,
+    a table and author/contact/citation texts are added before saving.
+
+    ``hub_utils.init`` is pointed at the parent directory of ``file_path``.
+    """
+    from sklearn.pipeline import Pipeline
+    from sklearn.preprocessing import StandardScaler
+
+    from skops.card import Card as CardOld
+
+    if card_type == "old":
+        card_cls = CardOld  # type: ignore
+    else:
+        card_cls = Card  # type: ignore
+
+    destination_path = file_path.parent
+    X, y = load_iris(return_X_y=True, as_frame=True)
+
+    model = Pipeline(
+        [("scaler", StandardScaler()), ("clf", LogisticRegression(random_state=123))]
+    ).fit(X, y)
+
+    fd, pkl_file = tempfile.mkstemp(suffix=".pkl", prefix="skops-test")
+    with open(fd, "wb") as f:  # open() takes ownership of fd and closes it
+        pickle.dump(model, f)
+
+    hub_utils.init(
+        model=pkl_file,
+        requirements=[f"scikit-learn=={sklearn.__version__}"],
+        dst=destination_path,
+        task="tabular-classification",
+        data=X,
+    )
+    card = card_cls(model, metadata=metadata_from_config(destination_path))
+
+    if fill_content:
+        # add metrics
+        card.add_metrics(**{"acc": "0.1"})
+
+        plt.plot([4, 5, 6, 7])
+        plt.savefig(Path(destination_path) / "fig1.png")
+        if card_type == "old":
+            card.add_plot(**{"A beautiful plot": "fig1.png"})
+        else:
+            # old card always adds additional content in an extra section
+            card.add_plot(**{"Additional Content/A beautiful plot": "fig1.png"})
+
+        # add table
+        table = {"split": [1, 2, 3], "score": [4, 5, 6]}
+        if card_type == "old":
+            card.add_table(
+                folded=True,
+                **{"Yet another table": table},
+            )
+        else:
+            # old card always adds additional content in an extra section
+            card.add_table(
+                folded=True, **{"Additional Content/Yet another table": table}
+            )
+
+        # add authors and contacts
+        if card_type == "old":
+            # old card requires to use the placeholder variable name
+            card.add(
+                **{
+                    "model_card_authors": "Alice and Bob",
+                    "model_card_contact": "alice@example.com",
+                    "citation_bibtex": "Holy Cow, Nature, 2022-10",
+                }
+            )
+        else:
+            # new card uses the section titles instead and overrides the
+            # existing content
+            card.add(
+                **{
+                    "Model Card Authors": (
+                        "This model card is written by following authors:\n\n"
+                        "Alice and Bob"
+                    ),
+                    "Model Card Contact": (
+                        "You can contact the model card authors through following"
+                        " channels:\nalice@example.com"
+                    ),
+                    "Citation": (
+                        "Below you can find information related to citation.\n\n"
+                        "**BibTeX:**\n"
+                        "```\nHoly Cow, Nature, 2022-10\n```\n"
+                    ),
+                }
+            )
+
+        # more metrics
+        card.add_metrics(**{"f1": "0.2", "roc": "123"})
+
+    card.save(file_path)
+
+
+@pytest.mark.parametrize("fill_content", [False, True])
+def test_old_and_new_card_identical(fill_content):
+    # The old and the new card must render the same README line by line, except
+    # for lines whose file names or diagram ids may differ between runs.
+    with tempfile.TemporaryDirectory(prefix="skops-test") as destination_path:
+        file_path = Path(destination_path) / "README-old.md"
+        make_card("old", file_path, fill_content=fill_content)
+        card_old = file_path.read_text()
+
+    with tempfile.TemporaryDirectory(prefix="skops-test") as destination_path:
+        file_path = Path(destination_path) / "README-new.md"
+        make_card("new", file_path, fill_content=fill_content)
+        card_new = file_path.read_text()
+
+    lines_old, lines_new = card_old.split("\n"), card_new.split("\n")
+    for line0, line1 in zip_longest(lines_old, lines_new, fillvalue=""):
+        # actual file name may differ, so only compare start of line
+        if line0.startswith("model_file: skops-"):
+            assert line1.startswith("model_file: skops-")
+            continue
+        if line0.startswith("model = joblib.load(skops-test"):
+            assert line1.startswith("model = joblib.load(skops-test")
+            continue
+
+        # model diagram is not deterministic, e.g. ids
+        if line0.startswith("<style>#sk-container-id"):
+            assert line1.startswith("<style>#sk-container-id")
+            continue
+
+        assert line0 == line1

From 166e33dc5914a252099e459a9a1776b0af9c1098 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 1 Nov 2022 15:28:08 +0100
Subject: [PATCH 03/47] Make tests pass

Some refactoring to clean up things, rework repr, make repr tests pass.
---
 skops/card/_card_alternative.py           | 155 ++++++++++++--------
 skops/card/_model_card.py                 |  11 +-
 skops/card/tests/test_card_alternative.py | 168 ++++++++--------------
 3 files changed, 158 insertions(+), 176 deletions(-)

diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index 8326c10f..20698a02 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -17,41 +17,28 @@
 aRepr.maxother = 79
 aRepr.maxstring = 79
 
+CONTENT_PLACEHOLDER = "[More Information Needed]"
+"""When there is a section but no content, show this"""
 
 DEFAULT_TEMPLATE = {
-    "Model description": "[More Information Needed]",
-    "Model description/Intended uses & limitations": "[More Information Needed]",
-    "Model description/Training Procedure/Hyperparameters": """The model is trained with below hyperparameters.
-
-<details>
-<summary> Click to expand </summary>
-
-{{ hyperparameter_table }}
-
-</details>""",
-    "Model description/Training Procedure/Model Plot": "The model plot is below.",
-    "Model description/Evaluation Results": """You can find the details about evaluation process and the evaluation results.
-
-
-
-[More Information Needed]""",
-    "How to Get Started with the Model": """Use the code below to get started with the model.
-
-```python
-[More Information Needed]
-```""",
-    "Model Card Authors": """This model card is written by following authors:
-
-[More Information Needed]""",
-    "Model Card Contact": """You can contact the model card authors through following channels:
-[More Information Needed]""",
-    "Citation": """Below you can find information related to citation.
-
-**BibTeX:**
-```
-[More Information Needed]
-```
-""",
+    "Model description": CONTENT_PLACEHOLDER,
+    "Model description/Intended uses & limitations": CONTENT_PLACEHOLDER,
+    "Model description/Training Procedure": "",
+    "Model description/Training Procedure/Hyperparameters": CONTENT_PLACEHOLDER,
+    "Model description/Training Procedure/Model Plot": CONTENT_PLACEHOLDER,
+    "Model description/Evaluation Results": CONTENT_PLACEHOLDER,
+    "How to Get Started with the Model": CONTENT_PLACEHOLDER,
+    "Model Card Authors": (
+        f"This model card is written by following authors:\n\n{CONTENT_PLACEHOLDER}"
+    ),
+    "Model Card Contact": (
+        "You can contact the model card authors through following channels:\n"
+        f"{CONTENT_PLACEHOLDER}"
+    ),
+    "Citation": (
+        "Below you can find information related to citation.\n\n**BibTeX:**\n```\n"
+        f"{CONTENT_PLACEHOLDER}\n```"
+    ),
 }
 
 
@@ -75,7 +62,7 @@ def _clean_table(table: str) -> str:
 @dataclass
 class Section:
     title: str
-    content: Formattable | str | None = None
+    content: Formattable | str
     subsections: dict[str, Section] = field(default_factory=dict)
 
 
@@ -100,6 +87,9 @@ def __init__(
         if prefill:
             self._fill_default_sections()
         self._metrics: dict[str, str | float | int] = {}
+        # TODO: This is for compatibility with old model card but having an
+        # empty table by default is kinda pointless
+        self.add_metrics()
         self._reset()
 
     def _reset(self) -> None:
@@ -113,7 +103,7 @@ def _reset(self) -> None:
     def _fill_default_sections(self) -> None:
         self.add(**DEFAULT_TEMPLATE)
 
-    def add(self, **kwargs: str) -> "Card":
+    def add(self, **kwargs: str | Formattable) -> "Card":
         for key, val in kwargs.items():
             self._add_single(key, val)
         return self
@@ -136,7 +126,7 @@ def _select(
 
             if create:
                 # no subsection, create
-                entry = Section(title=subsection_name)
+                entry = Section(title=subsection_name, content="")
                 section[subsection_name] = entry
                 section = entry.subsections
             else:
@@ -177,7 +167,11 @@ def _add_model(self, model) -> None:
         self._add_single("Model description", model_repr)
 
     def _add_model_section(self) -> None:
+        section_title = "Model description/Training Procedure/Model Plot"
+        default_content = "The model plot is below."
+
         if not self.model_diagram:
+            self._add_single(section_title, default_content)
             return
 
         model_plot_div = re.sub(r"\n\s+", "", str(estimator_html_repr(self.model)))
@@ -185,11 +179,8 @@ def _add_model_section(self) -> None:
             model_plot_div = model_plot_div.replace(
                 "sk-top-container", 'sk-top-container" style="overflow: auto;'
             )
-        template = "The model plot is below.\n\n{}"
-        self._add_single(
-            "Model description/Training Procedure/Model Plot",
-            template.format(model_plot_div),
-        )
+        content = f"{default_content}\n\n{model_plot_div}"
+        self._add_single(section_title, content)
 
     def _add_hyperparams(self) -> None:
         hyperparameter_dict = self.model.get_params(deep=True)
@@ -256,13 +247,6 @@ def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
 
             yield aRepr.repr(f"metadata.{key}={val},").strip('"').strip("'")
 
-    @staticmethod
-    def _strip_blank(text) -> str:
-        # remove new lines and multiple spaces
-        text = text.replace("\n", " ")
-        text = re.sub(r"\s+", r" ", text)
-        return text
-
     def _generate_content(
         self, data: dict[str, Section], depth: int = 1
     ) -> Iterator[str]:
@@ -278,22 +262,74 @@ def _generate_content(
             if val.subsections:
                 yield from self._generate_content(val.subsections, depth=depth + 1)
 
+    def _iterate_content(
+        self, data: dict[str, Section], parent_section: str = ""
+    ) -> Iterator[tuple[str, Formattable | str]]:
+        for val in data.values():
+            if parent_section:
+                title = "/".join((parent_section, val.title))
+            else:
+                title = val.title
+
+            yield title, val.content
+
+            if val.subsections:
+                yield from self._iterate_content(val.subsections, parent_section=title)
+
+    @staticmethod
+    def _strip_blank(text: str) -> str:
+        # remove new lines and multiple spaces
+        text = text.replace("\n", " ")
+        text = re.sub(r"\s+", r" ", text)
+        return text
+
+    def _format_repr(self, text: str) -> str:
+        # Remove new lines, multiple spaces, quotation marks, and cap line length
+        text = self._strip_blank(text)
+        return aRepr.repr(text).strip('"').strip("'")
+
     def __str__(self) -> str:
         return self.__repr__()
 
     def __repr__(self) -> str:
-        metadata_repr = "\n".join(
-            "  " + line for line in self._generate_metadata(self.metadata)
-        )
-        content_repr = "\n\n".join(
-            "  " + line for line in self._generate_content(self._data)
-        )
+        # repr for the model
+        model = getattr(self, "model", None)
+        if model:
+            model_repr = self._format_repr(f"model={repr(model)}")
+        else:
+            model_repr = None
+
+        # repr for metadata
+        metadata_reprs = []
+        for key, val in self.metadata.to_dict().items() if self.metadata else {}:
+            if key == "widget":
+                metadata_reprs.append("metadata.widget={...},")
+                continue
+
+            metadata_reprs.append(self._format_repr(f"metadata.{key}={val},"))
+        metadata_repr = "\n".join(metadata_reprs)
+
+        # repr for contents
+        content_reprs = []
+        for title, content in self._iterate_content(self._data):
+            if not content:
+                continue
+            if isinstance(content, str) and content.rstrip().endswith(
+                CONTENT_PLACEHOLDER
+            ):
+                # if content is just some default text, no need to show it
+                continue
+            content_reprs.append(self._format_repr(f"{title}={content},"))
+        content_repr = "\n".join(content_reprs)
 
+        # combine all parts
         complete_repr = "Card(\n"
-        if metadata_repr:
-            complete_repr += metadata_repr + "\n"
-        if content_repr:
-            complete_repr += content_repr + "\n"
+        if model_repr:
+            complete_repr += textwrap.indent(model_repr, "  ") + "\n"
+        if metadata_reprs:
+            complete_repr += textwrap.indent(metadata_repr, "  ") + "\n"
+        if content_reprs:
+            complete_repr += textwrap.indent(content_repr, "  ") + "\n"
         complete_repr += ")"
         return complete_repr
 
@@ -339,7 +375,8 @@ def _generate_card(self) -> Iterator[str]:
             yield f"---\n{self.metadata.to_yaml()}\n---"
 
         for line in self._generate_content(self._data):
-            yield "\n" + line
+            if line:
+                yield "\n" + line
 
     def save(self, path: str | Path) -> None:
         """Save the model card.
diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index 22f782e3..3fdf8ab1 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -420,12 +420,11 @@ def _generate_card(self) -> ModelCard:
         else:
             model_plot = None
 
-        if self._eval_results:  # only add metrics if there are any
-            template_sections["eval_results"] = tabulate(
-                list(self._eval_results.items()),
-                headers=["Metric", "Value"],
-                tablefmt="github",
-            )
+        template_sections["eval_results"] = tabulate(
+            list(self._eval_results.items()),
+            headers=["Metric", "Value"],
+            tablefmt="github",
+        )
 
         # if template path is not given, use default
         if template_sections.get("template_path") is None:
diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
index b723b3e2..b22d88fc 100644
--- a/skops/card/tests/test_card_alternative.py
+++ b/skops/card/tests/test_card_alternative.py
@@ -2,6 +2,7 @@
 import os
 import pickle
 import tempfile
+import textwrap
 from itertools import zip_longest
 from pathlib import Path
 
@@ -335,7 +336,6 @@ def test_metadata_from_config_tabular_data(
         assert tag in metadata["tags"]
 
 
-@pytest.mark.skip  # FIXME
 class TestCardRepr:
     """Test __str__ and __repr__ methods of Card, which are identical for now"""
 
@@ -343,125 +343,75 @@ class TestCardRepr:
     def card(self):
         model = LinearRegression(fit_intercept=False)
         card = Card(model=model)
+        card.add(Figures="")
         card.add(
-            model_description="A description",
-            model_card_authors="Jane Doe",
+            **{
+                "Model Description": "A description",
+                "Model Card Authors": "Jane Doe",
+            }
         )
         card.add_plot(
-            roc_curve="ROC_curve.png",
-            confusion_matrix="confusion_matrix.jpg",
+            **{
+                "Figures/ROC": "ROC.png",
+                "Figures/Confusion matrix": "confusion_matrix.jpg",
+            }
         )
-        card.add_table(search_results={"split": [1, 2, 3], "score": [4, 5, 6]})
+        card.add_table(**{"Search Results": {"split": [1, 2, 3], "score": [4, 5, 6]}})
         return card
 
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_card_repr(self, card: Card, meth):
-        result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
+    @pytest.fixture
+    def expected_lines(self):
+        card_repr = """
+        Card(
+          model=LinearRegression(fit_intercept=False)
+          Model description/Training Procedure/...ed | | positive | False | </details>,
+          Model description/Training Procedure/...</pre></div></div></div></div></div>,
+          Model description/Evaluation Results=...ric | Value | |----------|---------|,
+          Model Card Authors=Jane Doe,
+          Citation=Below you can find informati...** ``` [More Information Needed] ```,
+          Figures/ROC='ROC.png',
+          Figures/Confusion matrix='confusion_matrix.jpg',
+          Model Description=A description,
+          Search Results=Table(3x2),
         )
-        assert result == expected
+        """
+        expected = textwrap.dedent(card_repr).strip()
+        return expected.split("\n")
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_very_long_lines_are_shortened(self, card: Card, meth):
-        card.add(my_section="very long line " * 100)
+    def test_card_repr(self, card: Card, meth, expected_lines):
         result = meth(card)
-        expected = (
-            "Card(\n  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n  model_card_authors='Jane Doe',\n"
-            "  my_section='very long line very lon...line very long line very long line"
-            " ',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
+        expected = "\n".join(expected_lines)
         assert result == expected
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_without_model_attribute(self, card: Card, meth):
-        del card.model
-        result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
-        assert result == expected
+    def test_very_long_lines_are_shortened(self, card: Card, meth, expected_lines):
+        card.add(my_section="very long line " * 100)
 
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_no_template_sections(self, card: Card, meth):
-        card._template_sections = {}  # type: ignore
-        result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
+        # expected results contain 1 line at the very end
+        extra_line = (
+            "  my_section=very long line very long l... "
+            "line very long line very long line ,"
         )
-        assert result == expected
+        expected_lines.insert(-1, extra_line)
+        expected = "\n".join(expected_lines)
 
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_no_extra_sections(self, card: Card, meth):
-        card._extra_sections = []  # type: ignore
         result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            ")"
-        )
         assert result == expected
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_template_section_val_not_str(self, card: Card, meth):
-        card._template_sections["model_description"] = [1, 2, 3]  # type: ignore
-        result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description=[1, 2, 3],\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
-        assert result == expected
+    def test_without_model_attribute(self, card: Card, meth, expected_lines):
+        del card.model
+
+        # remove line 1 from expected results, which corresponds to the model
+        del expected_lines[1]
+        expected = "\n".join(expected_lines)
 
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_extra_sections_val_not_str(self, card: Card, meth):
-        card._extra_sections.append(("some section", {1: 2}))  # type: ignore
         result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            "  some section={1: 2},\n"
-            ")"
-        )
         assert result == expected
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_with_metadata(self, card: Card, meth):
+    def test_with_metadata(self, card: Card, meth, expected_lines):
         metadata = CardData(
             language="fr",
             license="bsd",
@@ -471,22 +421,18 @@ def test_with_metadata(self, card: Card, meth):
             widget={"something": "very-long"},
         )
         card.metadata = metadata
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  metadata.language=fr,\n"
-            "  metadata.license=bsd,\n"
-            "  metadata.library_name=sklearn,\n"
-            "  metadata.tags=['sklearn', 'tabular-classification'],\n"
-            "  metadata.foo={'bar': 123},\n"
-            "  metadata.widget={...},\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
+
+        # metadata comes after model line, i.e. position 2
+        extra_lines = [
+            "  metadata.language=fr,",
+            "  metadata.license=bsd,",
+            "  metadata.library_name=sklearn,",
+            "  metadata.tags=['sklearn', 'tabular-classification'],",
+            "  metadata.foo={'bar': 123},",
+            "  metadata.widget={...},",
+        ]
+        expected = "\n".join(expected_lines[:2] + extra_lines + expected_lines[2:])
+
         result = meth(card)
         assert result == expected
 

From a90e3a5311730389e83b1972a9db1b22448a26fc Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 1 Nov 2022 18:13:07 +0100
Subject: [PATCH 04/47] Add tests for new functionalities and docstrings

---
 skops/card/_card_alternative.py           | 407 +++++++++++++++++++---
 skops/card/tests/test_card_alternative.py | 286 ++++++++++++---
 2 files changed, 601 insertions(+), 92 deletions(-)

diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index 20698a02..d12e30f4 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -1,11 +1,12 @@
 from __future__ import annotations
 
 import re
+import sys
 import textwrap
 from dataclasses import dataclass, field
 from pathlib import Path
 from reprlib import Repr
-from typing import Any, Iterator, Protocol
+from typing import Any, Iterator
 
 from huggingface_hub import CardData
 from sklearn.utils import estimator_html_repr
@@ -13,6 +14,12 @@
 
 from skops.card._model_card import PlotSection, TableSection
 
+if sys.version_info >= (3, 8):
+    from typing import Protocol
+else:
+    from typing_extensions import Protocol
+
+
 aRepr = Repr()
 aRepr.maxother = 79
 aRepr.maxstring = 79
@@ -43,7 +50,40 @@
 
 
 def split_subsection_names(key: str) -> list[str]:
-    return key.split("/")
+    placeholder = "$%!?"  # arbitrary string that never appears naturally
+    key = key.replace("\\/", placeholder)
+    splits = key.split("/")
+    return [part.replace(placeholder, "/") for part in splits]
+
+
+def _getting_started_code(
+    file_name: str, is_skops_format: bool = False, indent="    "
+) -> list[str]:
+    # get lines of code required to load the model
+    lines: list[str] = []
+    if is_skops_format:
+        lines += ["from skops.io import load"]
+    else:
+        lines += ["import joblib"]
+
+    lines += [
+        "import json",
+        "import pandas as pd",
+    ]
+    if is_skops_format:
+        lines += [
+            "from skops.io import load",
+            f'model = load("{file_name}")',
+        ]
+    else:  # pickle
+        lines += [f"model = joblib.load({file_name})"]
+
+    lines += [
+        'with open("config.json") as f:',
+        indent + "config = json.load(f)",
+        'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))',
+    ]
+    return lines
 
 
 def _clean_table(table: str) -> str:
@@ -72,6 +112,129 @@ def format(self) -> str:
 
 
 class Card:
+    """Model card class that will be used to generate model card.
+
+    This class can be used to write information and plots to model card and save
+    it. This class by default generates an interactive plot of the model and a
+    table of hyperparameters. Some default sections are added by default.
+
+    Parameters
+    ----------
+    model: estimator object
+        Model that will be documented.
+
+    model_diagram: bool, default=True
+        Set to True if model diagram should be plotted in the card.
+
+    metadata: CardData, optional
+        ``CardData`` object. The contents of this object are saved as metadata
+        at the beginning of the output file, and used by Hugging Face Hub.
+
+        You can use :func:`~skops.card.metadata_from_config` to create an
+        instance pre-populated with necessary information based on the contents
+        of the ``config.json`` file, which itself is created by
+        :func:`skops.hub_utils.init`.
+
+    prefill: bool (default=True)
+        Whether to add default sections or not.
+
+    Attributes
+    ----------
+    model: estimator object
+        The scikit-learn compatible model that will be documented.
+
+    metadata: CardData
+        Metadata to be stored at the beginning of the saved model card, as
+        metadata to be understood by the Hugging Face Hub.
+
+    Examples
+    --------
+    >>> from sklearn.metrics import (
+    ...     ConfusionMatrixDisplay,
+    ...     confusion_matrix,
+    ...     accuracy_score,
+    ...     f1_score
+    ... )
+    >>> import tempfile
+    >>> from pathlib import Path
+    >>> from sklearn.datasets import load_iris
+    >>> from sklearn.linear_model import LogisticRegression
+    >>> from skops.card._card_alternative import Card  # TODO
+    >>> X, y = load_iris(return_X_y=True)
+    >>> model = LogisticRegression(solver="liblinear", random_state=0).fit(X, y)
+    >>> model_card = Card(model)
+    >>> model_card.metadata.license = "mit"
+    >>> y_pred = model.predict(X)
+    >>> model_card.add_metrics(**{
+    ...     "accuracy": accuracy_score(y, y_pred),
+    ...     "f1 score": f1_score(y, y_pred, average="micro"),
+    ... })
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+    )
+    >>> cm = confusion_matrix(y, y_pred,labels=model.classes_)
+    >>> disp = ConfusionMatrixDisplay(
+    ...     confusion_matrix=cm,
+    ...     display_labels=model.classes_
+    ... )
+    >>> disp.plot()
+    <sklearn.metrics._plot.confusion_matrix.ConfusionMatrixDisplay object at ...>
+    >>> disp.figure_.savefig("confusion_matrix.png")
+    ...
+    >>> model_card.add_plot(confusion_matrix="confusion_matrix.png")
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      confusion_matrix='confusion_matrix.png',
+    )
+    >>> # add new content to the existing section "Model description"
+    >>> model_card.add(**{"Model description": "This is the best model"})
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description=This is the best model,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      confusion_matrix='confusion_matrix.png',
+    )
+    >>> # add content to a new section
+    >>> model_card.add(**{"A new section": "Please rate my model"})
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description=This is the best model,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      confusion_matrix='confusion_matrix.png',
+      A new section=Please rate my model,
+    )
+    >>> # add new subsection to an existing section by using "/"
+    >>> model_card.add(**{"Model description/Model name": "This model is called Bob"})
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description=This is the best model,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      Model description/Model name=This model is called Bob,
+      confusion_matrix='confusion_matrix.png',
+      A new section=Please rate my model,
+    )
+    >>> # save the card to a README.md file
+    >>> with tempfile.TemporaryDirectory() as tmpdir:
+    ...     model_card.save((Path(tmpdir) / "README.md"))
+    """
+
     def __init__(
         self,
         model,
@@ -84,13 +247,13 @@ def __init__(
         self.metadata = metadata or CardData()
 
         self._data: dict[str, Section] = {}
+        self._metrics: dict[str, str | float | int] = {}
         if prefill:
             self._fill_default_sections()
-        self._metrics: dict[str, str | float | int] = {}
-        # TODO: This is for compatibility with old model card but having an
-        # empty table by default is kinda pointless
-        self.add_metrics()
-        self._reset()
+            # TODO: This is for compatibility with old model card but having an
+            # empty table by default is kinda pointless
+            self.add_metrics()
+            self._reset()
 
     def _reset(self) -> None:
         model_file = self.metadata.to_dict().get("model_file")
@@ -104,6 +267,37 @@ def _fill_default_sections(self) -> None:
         self.add(**DEFAULT_TEMPLATE)
 
     def add(self, **kwargs: str | Formattable) -> "Card":
+        """Add new section(s) to the model card.
+
+        Add one or multiple sections to the model card. The section names are
+        taken from the keys and the contents are taken from the values.
+
+        To add to an existing section, use a ``"/"`` in the section name, e.g.:
+
+        ``card.add(**{"Existing section/New section": "content"})``.
+
+        If the parent section does not exist, it will be added automatically.
+
+        To add a section with ``"/"`` in its title (i.e. not intended as a
+        subsection), escape the slash like so, ``"\\/"``, e.g.:
+
+        ``card.add(**{"A section with\\/a slash in the title": "content"})``.
+
+        If a section of the given name already exists, its content will be
+        overwritten.
+
+        Parameters
+        ----------
+        **kwargs : dict
+            The keys of the dictionary serve as the section title and the values
+            as the section content. It's possible to add to existing sections.
+
+        Returns
+        -------
+        self : object
+            Card object.
+
+        """
         for key, val in kwargs.items():
             self._add_single(key, val)
         return self
@@ -111,7 +305,6 @@ def add(self, **kwargs: str | Formattable) -> "Card":
     def _select(
         self, subsection_names: list[str], create: bool = True
     ) -> dict[str, Section]:
-        """TODO"""
         section = self._data
         if not subsection_names:
             return section
@@ -130,23 +323,100 @@ def _select(
                 section[subsection_name] = entry
                 section = entry.subsections
             else:
-                raise KeyError(f"Section titles {subsection_name} does not exist")
+                raise KeyError(f"Section {subsection_name} does not exist")
 
         return section
 
     def select(self, key: str | list[str]) -> Section:
-        assert key  # TODO
+        """Select a section from the model card.
+
+        To select a subsection of an existing section, use a ``"/"`` in the
+        section name, e.g.:
+
+        ``card.select("Existing section/New section")``.
+
+        Alternatively, a list of strings can be passed:
+
+        ``card.select(["Existing section", "New section"])``.
+
+        Parameters
+        ----------
+        key : str or list of str
+            The name of the (sub)section to select. When selecting a subsection,
+            either use a ``"/"`` in the name to separate the parent and child
+            sections, or pass a list of strings.
+
+        Returns
+        -------
+        section : Section
+            A dataclass containing all information relevant to the selected
+            section. Those are the title, the content, and subsections (in a
+            dict).
+
+        Raises
+        ------
+        KeyError
+            If the given section name was not found, a ``KeyError`` is raised.
+
+        """
+        if not key:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
+
+        if isinstance(key, str):
+            *subsection_names, leaf_node_name = split_subsection_names(key)
+        else:
+            *subsection_names, leaf_node_name = key
+
+        if not leaf_node_name:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
+
+        parent_section = self._select(subsection_names, create=False)
+        return parent_section[leaf_node_name]
+
+    def delete(self, key: str | list[str]) -> None:
+        """Delete a section from the model card.
+
+        To delete a subsection of an existing section, use a ``"/"`` in the
+        section name, e.g.:
+
+        ``card.delete("Existing section/New section")``.
+
+        Alternatively, a list of strings can be passed:
+
+        ``card.delete(["Existing section", "New section"])``.
+
+        Parameters
+        ----------
+        key : str or list of str
+            The name of the (sub)section to delete. When deleting a subsection,
+            either use a ``"/"`` in the name to separate the parent and child
+            sections, or pass a list of strings.
+
+        Raises
+        ------
+        KeyError
+            If the given section name was not found, a ``KeyError`` is raised.
+
+        """
+        if not key:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
 
         if isinstance(key, str):
-            subsection_names = split_subsection_names(key)
+            *subsection_names, leaf_node_name = split_subsection_names(key)
         else:
-            subsection_names = key
+            *subsection_names, leaf_node_name = key
+
+        if not key:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
 
-        parent_section = self._select(subsection_names[:-1], create=False)
-        return parent_section[subsection_names[-1]]
+        parent_section = self._select(subsection_names, create=False)
+        del parent_section[leaf_node_name]
 
     def _add_single(self, key: str, val: Formattable | str) -> None:
-        section = self._data
         *subsection_names, leaf_node_name = split_subsection_names(key)
         section = self._select(subsection_names)
 
@@ -207,6 +477,27 @@ def _add_hyperparams(self) -> None:
         )
 
     def add_plot(self, folded=False, **kwargs: str) -> "Card":
+        """Add plots to the model card.
+
+        Parameters
+        ----------
+        folded: bool (default=False)
+            If set to ``True``, the plot will be enclosed in a ``details`` tag.
+            That means the content is folded by default and users have to click
+            to show the content. This option is useful if the added plot is
+            large.
+
+        **kwargs : dict
+            The arguments should be of the form `name=plot_path`, where `name`
+            is the name of the plot and `plot_path` is the path to the plot,
+            relative to the root of the project. The plots should have already
+            been saved under the project's folder.
+
+        Returns
+        -------
+        self : object
+            Card object.
+        """
         for section_name, plot_path in kwargs.items():
             plot_name = split_subsection_names(section_name)[-1]
             section = PlotSection(alt_text=plot_name, path=plot_path, folded=folded)
@@ -214,12 +505,68 @@ def add_plot(self, folded=False, **kwargs: str) -> "Card":
         return self
 
     def add_table(self, folded: bool = False, **kwargs: dict["str", list[Any]]) -> Card:
+        """Add a table to the model card.
+
+        Add a table to the model card. This can be especially useful when you
+        are using cross validation with sklearn. E.g. you can directly pass the
+        result from calling :func:`sklearn.model_selection.cross_validate` or
+        the ``cv_results_`` attribute from any of the hyperparameter searches,
+        such as :class:`sklearn.model_selection.GridSearchCV`.
+
+        Moreover, you can pass any pandas :class:`pandas.DataFrame` to this
+        method and it will be rendered in the model card. You may consider
+        selecting only a part of the table if it's too big:
+
+        .. code:: python
+
+            search = GridSearchCV(...)
+            search.fit(X, y)
+            df = pd.DataFrame(search.cv_results_)
+            # show only top 10 highest scores
+            df = df.sort_values(["mean_test_score"], ascending=False).head(10)
+            model_card = skops.card.Card(...)
+            model_card.add_table(**{"Hyperparameter search results top 10": df})
+
+        Parameters
+        ----------
+        folded: bool (default=False)
+            If set to ``True``, the table will be enclosed in a ``details`` tag.
+            That means the content is folded by default and users have to click
+            to show the content. This option is useful if the added table is
+            large.
+
+        **kwargs : dict
+            The keys should be strings, which will be used as the section
+            headers, and the values should be tables. Tables can be dicts with
+            the keys being strings that represent the column names, and the
+            values being lists that represent the entries for each row.
+            Alternatively, the table can be a :class:`pandas.DataFrame`. The
+            table must not be empty.
+
+        Returns
+        -------
+        self : object
+            Card object.
+
+        """
         for key, val in kwargs.items():
             section = TableSection(table=val, folded=folded)
             self._add_single(key, section)
         return self
 
     def add_metrics(self, **kwargs: str | int | float) -> "Card":
+        """Add metric values to the model card.
+
+        Parameters
+        ----------
+        **kwargs : dict
+            A dictionary of the form ``{metric name: metric value}``.
+
+        Returns
+        -------
+        self : object
+            Card object.
+        """
         self._metrics.update(kwargs)
         self._add_metrics(self._metrics)
         return self
@@ -314,7 +661,7 @@ def __repr__(self) -> str:
         for title, content in self._iterate_content(self._data):
             if not content:
                 continue
-            if isinstance(content, str) and content.rstrip().endswith(
+            if isinstance(content, str) and content.rstrip("`").rstrip().endswith(
                 CONTENT_PLACEHOLDER
             ):
                 # if content is just some default text, no need to show it
@@ -335,31 +682,11 @@ def __repr__(self) -> str:
 
     def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
         is_skops_format = file_name.endswith(".skops")  # else, assume pickle
+        lines = _getting_started_code(
+            file_name, is_skops_format=is_skops_format, indent=indent
+        )
+        lines = ["```python"] + lines + ["```"]
 
-        lines = ["```python"]
-        if is_skops_format:
-            lines += ["from skops.io import load"]
-        else:
-            lines += ["import joblib"]
-
-        lines += [
-            "import json",
-            "import pandas as pd",
-        ]
-        if is_skops_format:
-            lines += [
-                "from skops.io import load",
-                f'model = load("{file_name}")',
-            ]
-        else:  # pickle
-            lines += [f"model = joblib.load({file_name})"]
-
-        lines += [
-            'with open("config.json") as f:',
-            indent + "config = json.load(f)",
-            'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))',
-            "```",
-        ]
         template = textwrap.dedent(
             """        Use the code below to get started with the model.
 
diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
index b22d88fc..d019b7d5 100644
--- a/skops/card/tests/test_card_alternative.py
+++ b/skops/card/tests/test_card_alternative.py
@@ -1,4 +1,3 @@
-import copy
 import os
 import pickle
 import tempfile
@@ -15,7 +14,6 @@
 from sklearn.linear_model import LinearRegression, LogisticRegression
 from sklearn.tree import DecisionTreeClassifier
 
-import skops
 from skops import hub_utils
 from skops.card import metadata_from_config
 from skops.card._card_alternative import Card
@@ -115,17 +113,7 @@ def test_save_model_card(destination_path, model_card):
     assert (Path(destination_path) / "README.md").exists()
 
 
-def test_select_existing_section():
-    # TODO
-    pass
-
-
-def test_select_non_existing_section_raises():
-    # TODO
-    pass
-
-
-def test_hyperparameter_table(destination_path, model_card):
+def test_hyperparameter_table(model_card):
     section_name = "Model description/Training Procedure/Hyperparameters"
     text_hyperparams = model_card.select(section_name).content
     expected = "\n".join(
@@ -157,7 +145,7 @@ def _strip_multiple_chars(text, char):
     return text
 
 
-def test_hyperparameter_table_with_line_break(destination_path):
+def test_hyperparameter_table_with_line_break():
     # Hyperparameters can contain values with line breaks, "\n", in them. In
     # that case, the markdown table is broken. Check that the hyperparameter
     # table we create properly replaces the "\n" with "<br />".
@@ -174,7 +162,7 @@ def get_params(self, deep=False):
     assert "| n_jobs | line<br />with<br />break |" in text_cleaned
 
 
-def test_plot_model(destination_path, model_card):
+def test_plot_model(model_card):
     text_plot = model_card.select(
         "Model description/Training Procedure/Model Plot"
     ).content
@@ -186,7 +174,7 @@ def test_plot_model(destination_path, model_card):
     )
 
 
-def test_plot_model_false(destination_path, model_card):
+def test_plot_model_false(model_card):
     model = fit_model()
     model_card = Card(model, model_diagram=False)
     text_plot = model_card.select(
@@ -195,31 +183,219 @@ def test_plot_model_false(destination_path, model_card):
     assert text_plot == "The model plot is below."
 
 
-def test_add_new_section(destination_path, model_card):
-    model_card = model_card.add(**{"A new section": "sklearn FTW"})
-    section = model_card.select("A new section")
-    assert section.content == "sklearn FTW"
+class TestSelect:
+    """Selecting sections from the model card"""
 
+    def test_select_existing_section(self, model_card):
+        section = model_card.select("Model description")
+        assert section.title == "Model description"
 
-def test_add_content_to_existing_section(destination_path, model_card):
-    section = model_card.select("Model description")
-    num_subsection_before = len(section.subsections)
+    def test_select_existing_subsection(self, model_card):
+        section = model_card.select("Model description/Training Procedure")
+        assert section.title == "Training Procedure"
 
-    # add content to "Model description" section
-    model_card = model_card.add(**{"Model description": "sklearn FTW"})
-    section = model_card.select("Model description")
-    num_subsection_after = len(section.subsections)
+        section = model_card.select(["Model description", "Training Procedure"])
+        assert section.title == "Training Procedure"
 
-    assert num_subsection_before == num_subsection_after
-    assert section.content == "sklearn FTW"
+    def test_select_non_existing_section_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select("non-existing section")
 
+    def test_select_non_existing_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select("Model description/non-existing subsection")
 
-@pytest.mark.skip  # FIXME: remove
-def test_template_sections_not_mutated_by_save(destination_path, model_card):
-    template_sections_before = copy.deepcopy(model_card._template_sections)
-    model_card.save(Path(destination_path) / "README.md")
-    template_sections_after = copy.deepcopy(model_card._template_sections)
-    assert template_sections_before == template_sections_after
+        with pytest.raises(KeyError):
+            model_card.select(["Model description", "non-existing subsection"])
+
+    def test_select_non_existing_subsubsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select(
+                "Model description/Training Procedure/non-existing sub-subsection"
+            )
+
+        with pytest.raises(KeyError):
+            model_card.select(
+                [
+                    "Model description",
+                    "Training Procedure",
+                    "non-existing sub-subsection",
+                ]
+            )
+
+    def test_select_non_existing_section_and_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select(["non-existing section", "non-existing subsection"])
+
+    def test_select_empty_key_raises(self, model_card):
+        msg = r"Section name cannot be empty but got ''"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select("")
+
+        msg = r"Section name cannot be empty but got '\[\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select([])
+
+    def test_select_empty_key_subsection_raises(self, model_card):
+        msg = r"Section name cannot be empty but got 'Model description/'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select("Model description/")
+
+        msg = r"Section name cannot be empty but got '\['Model description', ''\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select(["Model description", ""])
+
+    def test_default_sections_empty_card(self, model_card):
+        # Without prefill, the card should not contain the default sections
+        from skops.card._card_alternative import DEFAULT_TEMPLATE
+
+        # model_card (which is prefilled) contains all default sections
+        for key in DEFAULT_TEMPLATE:
+            model_card.select(key)
+
+        # empty card does not contain those sections
+        model = fit_model()
+        card_empty = Card(model, model_diagram=False, prefill=False)
+        for key in DEFAULT_TEMPLATE:
+            with pytest.raises(KeyError):
+                card_empty.select(key)
+
+
+class TestAdd:
+    """Adding sections and subsections"""
+
+    def test_add_new_section(self, model_card):
+        model_card = model_card.add(**{"A new section": "sklearn FTW"})
+        section = model_card.select("A new section")
+        assert section.title == "A new section"
+        assert section.content == "sklearn FTW"
+
+    def test_add_new_subsection(self, model_card):
+        model_card = model_card.add(
+            **{"Model description/A new section": "sklearn FTW"}
+        )
+        section = model_card.select("Model description/A new section")
+        assert section.title == "A new section"
+        assert section.content == "sklearn FTW"
+
+        # make sure that the new subsection is the last subsection
+        subsections = model_card._data["Model description"].subsections
+        assert len(subsections) > 1  # exclude trivial case of only one subsection
+
+        last_subsection = list(subsections.values())[-1]
+        assert last_subsection is section
+
+    def test_add_new_section_and_subsection(self, model_card):
+        model_card = model_card.add(**{"A new section/A new subsection": "sklearn FTW"})
+
+        section = model_card.select("A new section")
+        assert section.title == "A new section"
+        assert section.content == ""
+
+        subsection = model_card.select("A new section/A new subsection")
+        assert subsection.title == "A new subsection"
+        assert subsection.content == "sklearn FTW"
+
+    def test_add_new_section_with_slash_in_name(self, model_card):
+        model_card = model_card.add(**{"A new\\/section": "sklearn FTW"})
+        section = model_card.select("A new\\/section")
+        assert section.title == "A new/section"
+        assert section.content == "sklearn FTW"
+
+    def test_add_new_subsection_with_slash_in_name(self, model_card):
+        model_card = model_card.add(
+            **{"Model description/A new\\/section": "sklearn FTW"}
+        )
+        section = model_card.select("Model description/A new\\/section")
+        assert section.title == "A new/section"
+        assert section.content == "sklearn FTW"
+
+    def test_add_content_to_existing_section(self, model_card):
+        # Add content (not new sections) to an existing section. Make sure that
+        # existing subsections are not affected by this
+        section = model_card.select("Model description")
+        num_subsection_before = len(section.subsections)
+        assert num_subsection_before > 0  # exclude trivial case of empty sections
+
+        # add content to "Model description" section
+        model_card = model_card.add(**{"Model description": "sklearn FTW"})
+        section = model_card.select("Model description")
+        num_subsection_after = len(section.subsections)
+
+        assert num_subsection_before == num_subsection_after
+        assert section.content == "sklearn FTW"
+
+
+class TestDelete:
+    """Deleting sections and subsections"""
+
+    def test_delete_section(self, model_card):
+        model_card.select("Model description")
+        model_card.delete("Model description")
+        with pytest.raises(KeyError):
+            model_card.select("Model description")
+
+    def test_delete_subsection(self, model_card):
+        model_card.select("Model description/Training Procedure")
+        model_card.delete("Model description/Training Procedure")
+        with pytest.raises(KeyError):
+            model_card.select("Model description/Training Procedure")
+        # parent section still exists
+        model_card.delete("Model description")
+
+    def test_delete_subsubsection(self, model_card):
+        model_card.select("Model description/Training Procedure/Hyperparameters")
+        model_card.delete("Model description/Training Procedure/Hyperparameters")
+        with pytest.raises(KeyError):
+            model_card.select("Model description/Training Procedure/Hyperparameters")
+        # parent section still exists
+        model_card.delete("Model description/Training Procedure")
+
+    def test_delete_section_with_slash_in_name(self, model_card):
+        model_card.add(**{"A new\\/section": "some content"})
+        model_card.select("A new\\/section")
+        model_card.delete("A new\\/section")
+        with pytest.raises(KeyError):
+            model_card.select("A new\\/section")
+
+    def test_delete_non_existing_section_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete("non-existing section")
+
+    def test_delete_non_existing_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete("Model description/non-existing subsection")
+
+        with pytest.raises(KeyError):
+            model_card.delete(["Model description", "non-existing subsection"])
+
+    def test_delete_non_existing_subsubsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete(
+                "Model description/Training Procedure/non-existing sub-subsection"
+            )
+
+        with pytest.raises(KeyError):
+            model_card.delete(
+                [
+                    "Model description",
+                    "Training Procedure",
+                    "non-existing sub-subsection",
+                ]
+            )
+
+    def test_delete_non_existing_section_and_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete(["non-existing section", "non-existing subsection"])
+
+    def test_delete_empty_key_raises(self, model_card):
+        msg = r"Section name cannot be empty but got ''"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete("")
+
+        msg = r"Section name cannot be empty but got '\[\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete([])
 
 
 def test_add_plot(destination_path, model_card):
@@ -230,25 +406,15 @@ def test_add_plot(destination_path, model_card):
     assert plot_content == "![fig1](fig1.png)"
 
 
-@pytest.mark.skip  # FIXME: remove
-def test_temporary_plot(destination_path, model_card):
-    # test if the additions are made to a temporary template file
-    # and not to default template or template provided
-    root = skops.__path__
-    # read original template
-    with open(Path(root[0]) / "card" / "default_template.md") as f:
-        default_template = f.read()
+def test_add_plot_to_existing_section(destination_path, model_card):
     plt.plot([4, 5, 6, 7])
     plt.savefig(Path(destination_path) / "fig1.png")
-    model_card.add_plot(fig1="fig1.png")
-    model_card.save(Path(destination_path) / "README.md")
-    # check if default template is not modified
-    with open(Path(root[0]) / "card" / "default_template.md") as f:
-        default_template_post = f.read()
-    assert default_template == default_template_post
+    model_card = model_card.add_plot(**{"Model description/Figure 1": "fig1.png"})
+    plot_content = model_card.select("Model description/Figure 1").content.format()
+    assert plot_content == "![Figure 1](fig1.png)"
 
 
-def test_adding_metadata(destination_path, model_card):
+def test_adding_metadata(model_card):
     # test if the metadata is added to the card
     model_card.metadata.tags = "dummy"
     metadata = list(model_card._generate_metadata(model_card.metadata))
@@ -292,7 +458,9 @@ def test_add_metrics(destination_path, model_card):
     assert eval_metric_content.endswith(expected)
 
 
-def test_code_autogeneration(destination_path, pkl_model_card_metadata_from_config):
+def test_code_autogeneration(
+    model_card, destination_path, pkl_model_card_metadata_from_config
+):
     # test if getting started code is automatically generated
     metadata = metadata_load(local_path=Path(destination_path) / "README.md")
     filename = metadata["model_file"]
@@ -368,7 +536,6 @@ def expected_lines(self):
           Model description/Training Procedure/...</pre></div></div></div></div></div>,
           Model description/Evaluation Results=...ric | Value | |----------|---------|,
           Model Card Authors=Jane Doe,
-          Citation=Below you can find informati...** ``` [More Information Needed] ```,
           Figures/ROC='ROC.png',
           Figures/Confusion matrix='confusion_matrix.jpg',
           Model Description=A description,
@@ -384,6 +551,21 @@ def test_card_repr(self, card: Card, meth, expected_lines):
         expected = "\n".join(expected_lines)
         assert result == expected
 
+    @pytest.mark.parametrize("meth", [repr, str])
+    def test_card_repr_empty_card(self, meth):
+        """Without prefill, the repr should be empty"""
+        model = fit_model()
+        card = Card(model, model_diagram=False, prefill=False)
+        result = meth(card)
+        expected = textwrap.dedent(
+            """
+        Card(
+          model=LinearRegression()
+        )
+        """
+        ).strip()
+        assert result == expected
+
     @pytest.mark.parametrize("meth", [repr, str])
     def test_very_long_lines_are_shortened(self, card: Card, meth, expected_lines):
         card.add(my_section="very long line " * 100)

From fcbd0dfd6d9b34ad6f75cd61c0fc0851842680d1 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 2 Nov 2022 12:32:05 +0100
Subject: [PATCH 05/47] Adjust tests to work with older sklearn versions

---
 skops/card/tests/test_card_alternative.py | 48 ++++++++++++++++++++---
 1 file changed, 42 insertions(+), 6 deletions(-)

diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
index d019b7d5..02355acf 100644
--- a/skops/card/tests/test_card_alternative.py
+++ b/skops/card/tests/test_card_alternative.py
@@ -116,7 +116,30 @@ def test_save_model_card(destination_path, model_card):
 def test_hyperparameter_table(model_card):
     section_name = "Model description/Training Procedure/Hyperparameters"
     text_hyperparams = model_card.select(section_name).content
-    expected = "\n".join(
+
+    # expected outcome depends on sklearn version, since one parameter becomes
+    # deprecated.
+    # TODO: remove when dropping sklearn 0.24. "normalize" parameter will be
+    # removed completely in sklearn 1.2.
+    expected_old = "\n".join(
+        [
+            "The model is trained with below hyperparameters.",
+            "",
+            "<details>",
+            "<summary> Click to expand </summary>",
+            "",
+            "| Hyperparameter   | Value   |",
+            "|------------------|---------|",
+            "| copy_X           | True    |",
+            "| fit_intercept    | True    |",
+            "| n_jobs           |         |",
+            "| normalize        | False   |",
+            "| positive         | False   |",
+            "",
+            "</details>",
+        ]
+    )
+    expected_new = "\n".join(
         [
             "The model is trained with below hyperparameters.",
             "",
@@ -134,7 +157,7 @@ def test_hyperparameter_table(model_card):
             "</details>",
         ]
     )
-    assert text_hyperparams == expected
+    assert (text_hyperparams == expected_old) or (text_hyperparams == expected_new)
 
 
 def _strip_multiple_chars(text, char):
@@ -167,7 +190,7 @@ def test_plot_model(model_card):
         "Model description/Training Procedure/Model Plot"
     ).content
     # don't compare whole text, as it's quite long and non-deterministic
-    assert text_plot.startswith("The model plot is below.\n\n<style>#sk-container-id")
+    assert text_plot.startswith("The model plot is below.\n\n<style>#sk-")
     assert "<style>" in text_plot
     assert text_plot.endswith(
         "<pre>LinearRegression()</pre></div></div></div></div></div>"
@@ -543,7 +566,20 @@ def expected_lines(self):
         )
         """
         expected = textwrap.dedent(card_repr).strip()
-        return expected.split("\n")
+        lines = expected.split("\n")
+
+        # TODO: remove when dropping sklearn v0.24 and when dropping v1.1 and
+        # below. This is because the "normalize" parameter was changed after
+        # v0.24 and will be removed completely in sklearn v1.2.
+        major, minor, *_ = sklearn.__version__.split(".")
+        if int(major) < 1:
+            lines[2] = (
+                "  Model description/Training Procedure/...se | | positive | False | "
+                "</details>,"
+            )
+        elif int(minor) >= 2:
+            del lines[2]
+        return lines
 
     @pytest.mark.parametrize("meth", [repr, str])
     def test_card_repr(self, card: Card, meth, expected_lines):
@@ -882,8 +918,8 @@ def test_old_and_new_card_identical(fill_content):
             continue
 
         # model diagram is not deterministic, e.g. ids
-        if line0.startswith("<style>#sk-container-id"):
-            assert line1.startswith("<style>#sk-container-id")
+        if line0.startswith("<style>#sk-"):
+            assert line1.startswith("<style>#sk-")
             continue
 
         assert line0 == line1

From 4f10f806d0ba9296da64f3c2e2ac3f36f992d51f Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 2 Nov 2022 12:34:24 +0100
Subject: [PATCH 06/47] Adjust examples to new card, more docs

Also some better type annotations.
---
 examples/plot_model_card.py     | 37 ++++++++-------
 skops/card/_card_alternative.py | 84 ++++++++++++++++++++++++++++-----
 skops/card/_model_card.py       |  2 +-
 3 files changed, 93 insertions(+), 30 deletions(-)

diff --git a/examples/plot_model_card.py b/examples/plot_model_card.py
index 4acdfd1b..46e9a8bc 100644
--- a/examples/plot_model_card.py
+++ b/examples/plot_model_card.py
@@ -29,7 +29,8 @@
 )
 from sklearn.model_selection import HalvingGridSearchCV, train_test_split
 
-from skops import card, hub_utils
+from skops import hub_utils
+from skops.card._card_alternative import Card, metadata_from_config
 
 # %%
 # Data
@@ -91,7 +92,7 @@
 # :func:`.hub_utils.init` above. We will see below how we can populate the model
 # card with useful information.
 
-model_card = card.Card(model, metadata=card.metadata_from_config(Path(local_repo)))
+model_card = Card(model, metadata=metadata_from_config(Path(local_repo)))
 
 # %%
 # Add more information
@@ -103,17 +104,19 @@
 model_card.metadata.license = "mit"
 limitations = "This model is not ready to be used in production."
 model_description = (
-    "This is a HistGradientBoostingClassifier model trained on breast cancer dataset."
-    " It's trained with Halving Grid Search Cross Validation, with parameter grids on"
-    " max_leaf_nodes and max_depth."
+    "This is a `HistGradientBoostingClassifier` model trained on breast cancer "
+    "dataset. It's trained with `HalvingGridSearchCV`, with parameter grids on "
+    "`max_leaf_nodes` and `max_depth`."
 )
 model_card_authors = "skops_user"
-citation_bibtex = "bibtex\n@inproceedings{...,year={2020}}"
+citation_bibtex = "**BibTeX**\n\n```\n@inproceedings{...,year={2020}}\n```"
 model_card.add(
-    citation_bibtex=citation_bibtex,
-    model_card_authors=model_card_authors,
-    limitations=limitations,
-    model_description=model_description,
+    **{
+        "Citation": citation_bibtex,
+        "Model Card Authors": model_card_authors,
+        "Model description": model_description,
+        "Model description/Intended uses & limitations": limitations,
+    }
 )
 
 # %%
@@ -132,10 +135,10 @@
 
 y_pred = model.predict(X_test)
 eval_descr = (
-    "The model is evaluated on test data using accuracy and F1-score with macro"
-    " average."
+    "The model is evaluated on test data using accuracy and F1-score with "
+    "macro average."
 )
-model_card.add(eval_method=eval_descr)
+model_card.add(**{"Model description/Evaluation Results": eval_descr})
 
 accuracy = accuracy_score(y_test, y_pred)
 f1 = f1_score(y_test, y_pred, average="micro")
@@ -146,7 +149,9 @@
 disp.plot()
 
 disp.figure_.savefig(Path(local_repo) / "confusion_matrix.png")
-model_card.add_plot(**{"Confusion matrix": "confusion_matrix.png"})
+model_card.add_plot(
+    **{"Model description/Evaluation Results/Confusion Matrix": "confusion_matrix.png"}
+)
 
 cv_results = model.cv_results_
 clf_report = classification_report(
@@ -160,8 +165,8 @@
 model_card.add_table(
     folded=True,
     **{
-        "Hyperparameter search results": cv_results,
-        "Classification report": clf_report,
+        "Model description/Evaluation Results/Hyperparameter search results": cv_results,
+        "Model description/Evaluation Results/Classification report": clf_report,
     },
 )
 
diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index d12e30f4..66aca84a 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -6,12 +6,13 @@
 from dataclasses import dataclass, field
 from pathlib import Path
 from reprlib import Repr
-from typing import Any, Iterator
+from typing import Any, Iterator, Sequence
 
 from huggingface_hub import CardData
 from sklearn.utils import estimator_html_repr
 from tabulate import tabulate  # type: ignore
 
+from skops.card import metadata_from_config
 from skops.card._model_card import PlotSection, TableSection
 
 if sys.version_info >= (3, 8):
@@ -50,10 +51,39 @@
 
 
 def split_subsection_names(key: str) -> list[str]:
+    """Split a string containing multiple sections into a list of strings for
+    each.
+
+    The separator is ``"/"``. To avoid splitting on ``"/"``, escape it using
+    ``"\\/"``.
+
+    Examples
+    --------
+    >>> split_subsection_names("Section A")
+    ["Section A"]
+    >>> split_subsection_names("Section A/Section B/Section C")
+    ["Section A", "Section B", "Section C"]
+    >>> split_subsection_names("A section containing \\/ a slash")
+    ["A section containing / a slash"]
+    >>> split_subsection_names("Spaces are / stripped")
+    ["Spaces are", "stripped"]
+
+    Parameters
+    ----------
+    key : str
+        The section name consisting potentially of multiple subsections. It has
+        to be ensured beforehand that this is not an empty string.
+
+    Returns
+    -------
+    parts : list of str
+        The individual (sub)sections.
+
+    """
     placeholder = "$%!?"  # arbitrary sting that never appears naturally
     key = key.replace("\\/", placeholder)
-    splits = key.split("/")
-    return [part.replace(placeholder, "/") for part in splits]
+    parts = (part.strip() for part in key.split("/"))
+    return [part.replace(placeholder, "/") for part in parts]
 
 
 def _getting_started_code(
@@ -101,6 +131,22 @@ def _clean_table(table: str) -> str:
 
 @dataclass
 class Section:
+    """Building block of the model card.
+
+    The model card is represented internally as a dict with keys being strings
+    and values being Sections. The key is identical to the section title.
+
+    Additionally, the section may hold content in the form of strings (can be an
+    empty string) or a ``Formattable``, which is simply an object with a
+    ``format`` method that returns a string.
+
+    Finally, the section can contain subsections, which again are dicts of
+    string keys and section values (the dict can be empty). Therefore, the model
+    card representation forms a tree structure, making use of the fact that dict
+    order is preserved.
+
+    """
+
     title: str
     content: Formattable | str
     subsections: dict[str, Section] = field(default_factory=dict)
@@ -303,7 +349,7 @@ def add(self, **kwargs: str | Formattable) -> "Card":
         return self
 
     def _select(
-        self, subsection_names: list[str], create: bool = True
+        self, subsection_names: Sequence[str], create: bool = True
     ) -> dict[str, Section]:
         section = self._data
         if not subsection_names:
@@ -327,7 +373,7 @@ def _select(
 
         return section
 
-    def select(self, key: str | list[str]) -> Section:
+    def select(self, key: str | Sequence[str]) -> Section:
         """Select a section from the model card.
 
         To select a subsection of an existing section, use a ``"/"`` in the
@@ -375,7 +421,7 @@ def select(self, key: str | list[str]) -> Section:
         parent_section = self._select(subsection_names, create=False)
         return parent_section[leaf_node_name]
 
-    def delete(self, key: str | list[str]) -> None:
+    def delete(self, key: str | Sequence[str]) -> None:
         """Delete a section from the model card.
 
         To delete a subsection of an existing section, use a ``"/"`` in the
@@ -479,6 +525,9 @@ def _add_hyperparams(self) -> None:
     def add_plot(self, folded=False, **kwargs: str) -> "Card":
         """Add plots to the model card.
 
+        The plot should be saved on the file system and the path passed as
+        value.
+
         Parameters
         ----------
         folded: bool (default=False)
@@ -488,15 +537,17 @@ def add_plot(self, folded=False, **kwargs: str) -> "Card":
             large.
 
         **kwargs : dict
-            The arguments should be of the form `name=plot_path`, where `name`
-            is the name of the plot and `plot_path` is the path to the plot,
-            relative to the root of the project. The plots should have already
-            been saved under the project's folder.
+            The arguments should be of the form ``name=plot_path``, where
+            ``name`` is the name of the plot and section, and ``plot_path`` is
+            the path to the plot on the file system, relative to the root of the
+            project. The plots should have already been saved under the
+            project's folder.
 
         Returns
         -------
         self : object
             Card object.
+
         """
         for section_name, plot_path in kwargs.items():
             plot_name = split_subsection_names(section_name)[-1]
@@ -587,6 +638,7 @@ def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
         self._add_single("Model description/Evaluation Results", template.format(table))
 
     def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
+        """Yield metadata in yaml format"""
         for key, val in metadata.to_dict().items() if metadata else {}:
             if key == "widget":
                 yield "metadata.widget={...},"
@@ -597,13 +649,14 @@ def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
     def _generate_content(
         self, data: dict[str, Section], depth: int = 1
     ) -> Iterator[str]:
+        """Yield title and (formatted) contents"""
         for val in data.values():
             title = f"{depth * '#'} {val.title}"
             yield title
 
             if isinstance(val.content, str):
                 yield val.content
-            elif val.content is not None:  # is Formattable
+            else:  # is a Formattable
                 yield val.content.format()
 
             if val.subsections:
@@ -612,6 +665,7 @@ def _generate_content(
     def _iterate_content(
         self, data: dict[str, Section], parent_section: str = ""
     ) -> Iterator[tuple[str, Formattable | str]]:
+        """Yield tuples of title and (non-formatted) content"""
         for val in data.values():
             if parent_section:
                 title = "/".join((parent_section, val.title))
@@ -705,6 +759,9 @@ def _generate_card(self) -> Iterator[str]:
             if line:
                 yield "\n" + line
 
+        # add an empty line at the end
+        yield ""
+
     def save(self, path: str | Path) -> None:
         """Save the model card.
 
@@ -751,7 +808,6 @@ def main():
     from sklearn.preprocessing import StandardScaler
 
     from skops import hub_utils
-    from skops.card import metadata_from_config
 
     X, y = load_iris(return_X_y=True, as_frame=True)
 
@@ -780,6 +836,8 @@ def main():
         card.add(hi="howdy")
         card.add(**{"parent section/child section": "child content"})
         card.add(**{"foo": "bar", "spam": "eggs"})
+        # add section with a "/" in title
+        card.add(**{"A section with a \\/ in the title": "This works"})
         # change content of "hi" section
         card.add(**{"hi/german": "guten tag", "hi/french": "salut"})
         card.add(**{"very/deeply/nested/section": "but why?"})
@@ -787,7 +845,7 @@ def main():
         # add metrics
         card.add_metrics(**{"acc": 0.1})
 
-        # insert the plot in the "Plot" section we inserted above
+        # insert the plot in the "Plot" section created above
         plt.plot([4, 5, 6, 7])
         plt.savefig(Path(destination_path) / "fig1.png")
         card.add_plot(**{"Plots/A beautiful plot": "fig1.png"})
diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index 3fdf8ab1..a7d10dec 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -32,7 +32,7 @@ def _clean_table(table: str) -> str:
     # replace line breaks "\n" with html tag <br />, however, leave end-of-line
     # line breaks (eol_lb) intact
     eol_lb = "|\n"
-    placeholder = "$%!?"  # arbitrary sting that never appears naturally
+    placeholder = "$%!?"  # arbitrary string that never appears naturally
     table = (
         table.replace(eol_lb, placeholder)
         .replace("\n", "<br />")

From 0f5df2e5bb3e4177ffc186cd0891d87cee294d40 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 2 Nov 2022 13:54:47 +0100
Subject: [PATCH 07/47] Continue fixing tests

---
 skops/card/_card_alternative.py           | 10 +--
 skops/card/tests/test_card_alternative.py | 87 +++++++++++------------
 2 files changed, 48 insertions(+), 49 deletions(-)

diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index 66aca84a..bc96b94d 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -51,7 +51,7 @@
 
 
 def split_subsection_names(key: str) -> list[str]:
-    """Split a string containing multiple sections into a list of strings for
+    r"""Split a string containing multiple sections into a list of strings for
     each.
 
     The separator is ``"/"``. To avoid splitting on ``"/"``, escape it using
@@ -60,13 +60,13 @@ def split_subsection_names(key: str) -> list[str]:
     Examples
     --------
     >>> split_subsection_names("Section A")
-    ["Section A"]
+    ['Section A']
     >>> split_subsection_names("Section A/Section B/Section C")
-    ["Section A", "Section B", "Section C"]
+    ['Section A', 'Section B', 'Section C']
     >>> split_subsection_names("A section containg \\/ a slash")
-    ["A section containg \\/ a slash"]
+    ['A section containg / a slash']
     >>> split_subsection_names("Spaces are / stripped")
-    ["Spaces are", "stripped"]
+    ['Spaces are', 'stripped']
 
     Parameters
     ----------
diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
index 02355acf..ec589015 100644
--- a/skops/card/tests/test_card_alternative.py
+++ b/skops/card/tests/test_card_alternative.py
@@ -115,49 +115,43 @@ def test_save_model_card(destination_path, model_card):
 
 def test_hyperparameter_table(model_card):
     section_name = "Model description/Training Procedure/Hyperparameters"
-    text_hyperparams = model_card.select(section_name).content
-
-    # expected outcome depends on sklearn version, since one parameter becomes
-    # deprecated.
-    # TODO: remove when dropping sklearn 0.24. "normalize" Parameter will be
-    # removed completely in sklearn 1.2.
-    expected_old = "\n".join(
-        [
-            "The model is trained with below hyperparameters.",
-            "",
-            "<details>",
-            "<summary> Click to expand </summary>",
-            "",
-            "| Hyperparameter   | Value   |",
-            "|------------------|---------|",
-            "| copy_X           | True    |",
-            "| fit_intercept    | True    |",
-            "| n_jobs           |         |",
-            "| normalize        | False   |",
-            "| positive         | False   |",
-            "",
-            "</details>",
-        ]
-    )
-    expected_new = "\n".join(
-        [
-            "The model is trained with below hyperparameters.",
-            "",
-            "<details>",
-            "<summary> Click to expand </summary>",
-            "",
-            "| Hyperparameter   | Value      |",
-            "|------------------|------------|",
-            "| copy_X           | True       |",
-            "| fit_intercept    | True       |",
-            "| n_jobs           |            |",
-            "| normalize        | deprecated |",
-            "| positive         | False      |",
-            "",
-            "</details>",
-        ]
-    )
-    assert (text_hyperparams == expected_old) or (text_hyperparams == expected_new)
+    result = model_card.select(section_name).content
+
+    lines = [
+        "The model is trained with below hyperparameters.",
+        "",
+        "<details>",
+        "<summary> Click to expand </summary>",
+        "",
+        "| Hyperparameter   | Value   |",
+        "|------------------|---------|",
+        "| copy_X           | True    |",
+        "| fit_intercept    | True    |",
+        "| n_jobs           |         |",
+        "| normalize        | False   |",
+        "| positive         | False   |",
+        "",
+        "</details>",
+    ]
+    # TODO: remove when dropping sklearn v0.24 and when dropping v1.1 and
+    # below. This is because the "normalize" parameter was changed after
+    # v0.24 will be removed completely in sklearn v1.2.
+    major, minor, *_ = sklearn.__version__.split(".")
+    major, minor = int(major), int(minor)
+    if (major >= 1) and (minor < 2):
+        lines[10] = "| normalize        | deprecated |"
+    elif (major >= 1) and (minor >= 2):
+        del lines[10]
+    expected = "\n".join(lines)
+
+    # remove multiple whitespaces and dashes, as they're not important and may
+    # differ depending on OS
+    expected = _strip_multiple_chars(expected, " ")
+    expected = _strip_multiple_chars(expected, "-")
+    result = _strip_multiple_chars(result, " ")
+    result = _strip_multiple_chars(result, "-")
+
+    assert result == expected
 
 
 def _strip_multiple_chars(text, char):
@@ -573,12 +567,17 @@ def expected_lines(self):
         # v0.24 will be removed completely in sklearn v1.2.
         major, minor, *_ = sklearn.__version__.split(".")
         if int(major) < 1:
+            # v0.24: "deprecated" -> "False"
             lines[2] = (
                 "  Model description/Training Procedure/...se | | positive | False | "
                 "</details>,"
             )
         elif int(minor) >= 2:
-            del lines[2]
+            # >= v1.2: remove argument completely
+            lines[2] = (
+                "  Model description/Training Procedure/... | | | positive | False | "
+                "</details>,"
+            )
         return lines
 
     @pytest.mark.parametrize("meth", [repr, str])

From 6212d67bb8a9ebafaccf0e9a48edb5f898e92116 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 2 Nov 2022 14:30:45 +0100
Subject: [PATCH 08/47] Try fixing Windows error by specifying encoding

---
 skops/card/_card_alternative.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index bc96b94d..aa9367d5 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -778,7 +778,7 @@ def save(self, path: str | Path) -> None:
         The keys in model card metadata can be seen `here
         <https://huggingface.co/docs/hub/models-cards#model-card-metadata>`__.
         """
-        with open(path, "w") as f:
+        with open(path, "w", encoding="utf-8") as f:
             f.write("\n".join(self._generate_card()))
 
     def render(self) -> str:

From 80d218d65740d6663fe81fa21757e008ebdaca79 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 2 Nov 2022 15:49:38 +0100
Subject: [PATCH 09/47] Adjust doctest: confusion matrix not stored in cwd

---
 skops/card/_card_alternative.py | 18 ++++++++++--------
 1 file changed, 10 insertions(+), 8 deletions(-)

diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index aa9367d5..58bf743a 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -229,16 +229,19 @@ class Card:
     ... )
     >>> disp.plot()
     <sklearn.metrics._plot.confusion_matrix.ConfusionMatrixDisplay object at ...>
-    >>> disp.figure_.savefig("confusion_matrix.png")
+    >>> tmp_path = Path(tempfile.mkdtemp(prefix="skops-"))
+    >>> disp.figure_.savefig(tmp_path / "confusion_matrix.png")
     ...
-    >>> model_card.add_plot(confusion_matrix="confusion_matrix.png")
+    >>> model_card.add_plot(**{
+    ...     "Model description/Confusion Matrix": tmp_path / "confusion_matrix.png"
+    ... })
     Card(
       model=LogisticRegression(random_state=0, solver='liblinear')
       metadata.license=mit,
       Model description/Training Procedure/... | | warm_start | False | </details>,
       Model description/Training Procedure/...</pre></div></div></div></div></div>,
       Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      confusion_matrix='confusion_matrix.png',
+      Model description/Confusion Matrix=...confusion_matrix.png'),
     )
     >>> # add new content to the existing section "Model description"
     >>> model_card.add(**{"Model description": "This is the best model"})
@@ -249,7 +252,7 @@ class Card:
       Model description/Training Procedure/... | | warm_start | False | </details>,
       Model description/Training Procedure/...</pre></div></div></div></div></div>,
       Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      confusion_matrix='confusion_matrix.png',
+      Model description/Confusion Matrix=...confusion_matrix.png'),
     )
     >>> # add content to a new section
     >>> model_card.add(**{"A new section": "Please rate my model"})
@@ -260,7 +263,7 @@ class Card:
       Model description/Training Procedure/... | | warm_start | False | </details>,
       Model description/Training Procedure/...</pre></div></div></div></div></div>,
       Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      confusion_matrix='confusion_matrix.png',
+      Model description/Confusion Matrix=...confusion_matrix.png'),
       A new section=Please rate my model,
     )
     >>> # add new subsection to an existing section by using "/"
@@ -272,13 +275,12 @@ class Card:
       Model description/Training Procedure/... | | warm_start | False | </details>,
       Model description/Training Procedure/...</pre></div></div></div></div></div>,
       Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      Model description/Confusion Matrix=...confusion_matrix.png'),
       Model description/Model name=This model is called Bob,
-      confusion_matrix='confusion_matrix.png',
       A new section=Please rate my model,
     )
     >>> # save the card to a README.md file
-    >>> with tempfile.TemporaryDirectory() as tmpdir:
-    ...     model_card.save((Path(tmpdir) / "README.md"))
+    >>> model_card.save(tmp_path / "README.md")
     """
 
     def __init__(

From c6c8042da6d355bfb1c003e91a146bda095c218b Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 2 Nov 2022 15:50:42 +0100
Subject: [PATCH 10/47] Increase test coverage

---
 skops/card/_card_alternative.py           | 43 ++++++++---------------
 skops/card/tests/test_card_alternative.py | 34 ++++++++++++++++++
 2 files changed, 48 insertions(+), 29 deletions(-)

diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
index 58bf743a..326f7d3e 100644
--- a/skops/card/_card_alternative.py
+++ b/skops/card/_card_alternative.py
@@ -16,9 +16,9 @@
 from skops.card._model_card import PlotSection, TableSection
 
 if sys.version_info >= (3, 8):
-    from typing import Protocol
+    from typing import Protocol  # pragma: no cover
 else:
-    from typing_extensions import Protocol
+    from typing_extensions import Protocol  # pragma: no cover
 
 
 aRepr = Repr()
@@ -154,7 +154,7 @@ class Section:
 
 class Formattable(Protocol):
     def format(self) -> str:
-        ...
+        ...  # pragma: no cover
 
 
 class Card:
@@ -457,7 +457,7 @@ def delete(self, key: str | Sequence[str]) -> None:
         else:
             *subsection_names, leaf_node_name = key
 
-        if not key:
+        if not leaf_node_name:
             msg = f"Section name cannot be empty but got '{key}'"
             raise KeyError(msg)
 
@@ -475,15 +475,6 @@ def _add_single(self, key: str, val: Formattable | str) -> None:
             # entry does not exist, create a new one
             section[leaf_node_name] = Section(title=leaf_node_name, content=val)
 
-    def _add_model(self, model) -> None:
-        model = getattr(self, "model", None)
-        if model is None:
-            return
-
-        model_str = self._strip_blank(repr(model))
-        model_repr = aRepr.repr(f"model={model_str},").strip('"').strip("'")
-        self._add_single("Model description", model_repr)
-
     def _add_model_section(self) -> None:
         section_title = "Model description/Training Procedure/Model Plot"
         default_content = "The model plot is below."
@@ -524,7 +515,7 @@ def _add_hyperparams(self) -> None:
             template.format(table),
         )
 
-    def add_plot(self, folded=False, **kwargs: str) -> "Card":
+    def add_plot(self, *, folded=False, **kwargs: str) -> "Card":
         """Add plots to the model card.
 
         The plot should be saved on the file system and the path passed as
@@ -557,7 +548,9 @@ def add_plot(self, folded=False, **kwargs: str) -> "Card":
             self._add_single(section_name, section)
         return self
 
-    def add_table(self, folded: bool = False, **kwargs: dict["str", list[Any]]) -> Card:
+    def add_table(
+        self, *, folded: bool = False, **kwargs: dict["str", list[Any]]
+    ) -> Card:
         """Add a table to the model card.
 
         Add a table to the model card. This can be especially useful when you
@@ -642,10 +635,6 @@ def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
     def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
         """Yield metadata in yaml format"""
         for key, val in metadata.to_dict().items() if metadata else {}:
-            if key == "widget":
-                yield "metadata.widget={...},"
-                continue
-
             yield aRepr.repr(f"metadata.{key}={val},").strip('"').strip("'")
 
     def _generate_content(
@@ -680,15 +669,10 @@ def _iterate_content(
                 yield from self._iterate_content(val.subsections, parent_section=title)
 
     @staticmethod
-    def _strip_blank(text: str) -> str:
-        # remove new lines and multiple spaces
+    def _format_repr(text: str) -> str:
+        # Remove new lines, multiple spaces, quotation marks, and cap line length
         text = text.replace("\n", " ")
         text = re.sub(r"\s+", r" ", text)
-        return text
-
-    def _format_repr(self, text: str) -> str:
-        # Remove new lines, multiple spaces, quotation marks, and cap line length
-        text = self._strip_blank(text)
         return aRepr.repr(text).strip('"').strip("'")
 
     def __str__(self) -> str:
@@ -754,7 +738,7 @@ def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
         )
 
     def _generate_card(self) -> Iterator[str]:
-        if self.metadata:
+        if self.metadata.to_dict():
             yield f"---\n{self.metadata.to_yaml()}\n---"
 
         for line in self._generate_content(self._data):
@@ -795,7 +779,8 @@ def render(self) -> str:
         return "\n".join(self._generate_card())
 
 
-def main():
+def main():  # pragma: no cover
+    # TODO: remove
     import os
     import pickle
     import tempfile
@@ -886,4 +871,4 @@ def main():
 
 
 if __name__ == "__main__":
-    main()
+    main()  # pragma: no cover
diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
index ec589015..8b0155de 100644
--- a/skops/card/tests/test_card_alternative.py
+++ b/skops/card/tests/test_card_alternative.py
@@ -200,6 +200,31 @@ def test_plot_model_false(model_card):
     assert text_plot == "The model plot is below."
 
 
+def test_render(model_card, destination_path):
+    file_name = destination_path / "README.md"
+    model_card.save(file_name)
+    with open(file_name, "r") as f:
+        loaded = f.read()
+
+    rendered = model_card.render()
+    assert loaded == rendered
+
+
+def test_with_metadata(model_card):
+    model_card.metadata.foo = "something"
+    model_card.metadata.bar = "something else"
+    rendered = model_card.render()
+    expected = textwrap.dedent(
+        """
+        ---
+        foo: something
+        bar: something else
+        ---
+        """
+    ).strip()
+    assert rendered.startswith(expected)
+
+
 class TestSelect:
     """Selecting sections from the model card"""
 
@@ -414,6 +439,15 @@ def test_delete_empty_key_raises(self, model_card):
         with pytest.raises(KeyError, match=msg):
             model_card.delete([])
 
+    def test_delete_empty_key_subsection_raises(self, model_card):
+        msg = r"Section name cannot be empty but got 'Model description/'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete("Model description/")
+
+        msg = r"Section name cannot be empty but got '\['Model description', ''\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete(["Model description", ""])
+
 
 def test_add_plot(destination_path, model_card):
     plt.plot([4, 5, 6, 7])

From e7a2ae3e0e56738423962df53dd4535a11da33ea Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Thu, 3 Nov 2022 12:08:07 +0100
Subject: [PATCH 11/47] Try fixing test failure on Windows

---
 skops/card/tests/test_card_alternative.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
index 8b0155de..5cb5407f 100644
--- a/skops/card/tests/test_card_alternative.py
+++ b/skops/card/tests/test_card_alternative.py
@@ -203,7 +203,7 @@ def test_plot_model_false(model_card):
 def test_render(model_card, destination_path):
     file_name = destination_path / "README.md"
     model_card.save(file_name)
-    with open(file_name, "r") as f:
+    with open(file_name, "r", encoding="utf-8") as f:
         loaded = f.read()
 
     rendered = model_card.render()

From 2a6aab09ee15999656bce8259e633ddcb32e615a Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Thu, 10 Nov 2022 13:09:30 +0100
Subject: [PATCH 12/47] Replace old by new Card implementation

---
 docs/model_card.rst                       |  64 +-
 examples/plot_model_card.py               |   2 +-
 skops/card/_card_alternative.py           | 874 --------------------
 skops/card/_model_card.py                 | 749 ++++++++++++-----
 skops/card/tests/test_card.py             | 601 ++++++++++----
 skops/card/tests/test_card_alternative.py | 958 ----------------------
 6 files changed, 1031 insertions(+), 2217 deletions(-)
 delete mode 100644 skops/card/_card_alternative.py
 delete mode 100644 skops/card/tests/test_card_alternative.py

diff --git a/docs/model_card.rst b/docs/model_card.rst
index c1fe0fac..7a6c124d 100644
--- a/docs/model_card.rst
+++ b/docs/model_card.rst
@@ -42,32 +42,30 @@ to touch it yourself.
 
 The markdown part does not necessarily need to follow any specification in
 terms of information passed, which gives the user a lot of flexibility. The
-markdown part of the ``README.md`` file is generated from a Jinja template
-with slots that you can inject your content in. ``skops`` has a default
-template which includes the following slots for free text sections:
-
-- ``"model_description"``: A description of the model.
-- ``"limitations"``: Intended use for the model, limitations and potential
-  biases. This section should also include risks of using models in certain
-  domains if relevant.
-- ``"get_started_code"``: Code the user can run to load and use the model.
-- ``"model_card_authors"``: Authors of the model card. This section includes
-  authors of the model card, while ``"citation_bibtex"`` includes citations
-  related to the model if relevant.
-- ``"model_card_contact"``: Contact information of people whom can be reached
+markdown part of the ``README.md`` file comes with a couple of defaults provided
+by ``skops``, which includes the following slots for free text sections:
+
+- ``"Model description"``: A description of the model.
+- ``"Intended uses & limitations"``: Intended use for the model, limitations and
+  potential biases. This section should also include risks of using models in
+  certain domains if relevant.
+- ``"How to Get Started with the Model"``: Code the user can run to load and use
+  the model.
+- ``"Model Card Authors"``: Authors of the model card. This section includes
+  authors of the model card.
+- ``"Model Card Contact"``: Contact information of people whom can be reached
   out, in case of questions about the model or the model card.
-- ``"citation_bibtex"``: Bibtex style citations for the model or resources used
-  to train the model.
-- ``"eval_methods"``: Details about evaluation process of the model.
-- ``"eval_results"``: Evaluation results that are later parsed as a table by
-  :class:`skops.card.Card`.
+- ``"Citation"``: Bibtex style citations for the model or resources used to
+  train the model.
+- ``"Evaluation Results"``: Evaluation results that are later parsed as a table
+  by :class:`skops.card.Card`.
 
 
 The template also contains the following sections that are automatically
 generated by ``skops``.
 
-- ``"hyperparameter_table"``: Hyperparameters of the model.
-- ``"model_plot"``: A diagram of the model, most relevant in case the model is
+- ``"Hyperparameters"``: Hyperparameters of the model.
+- ``"Model Plot"``: A diagram of the model, most relevant in case the model is
   a complex scikit-learn :class:`~sklearn.pipeline.Pipeline`.
 
 Furthermore, it is possible to add plots and tables to the model card. To add
@@ -77,5 +75,31 @@ dictionaries with the key being the header and the values being list of row
 entries, or a pandas ``DataFrame``; use the :meth:`.Card.add_table` method for
 this.
 
+To add content to an existing subsection, or to create a new subsection, use a
+``"/"`` to separate the section names. For example, to add a subsection called
+``"Figures"`` to the existing section ``"Model description"``, and then add
+some subsections with plots below it, call the :meth:`Card.add` and
+:meth:`Card.add_plot` methods like this:
+
+.. code-block:: python
+
+    card.add(**{"Model description/Figures": "Here are some nice figures"})
+    card.add_plot(**{
+        "Model description/Figures/Confusion Matrix": "path-to-confusion-matrix.png",
+        "Model description/Figures/ROC": "path-to-roc.png",
+    })
+
+Furthermore, you can select existing sections (as well as their subsections)
+using :meth:`Card.select`, and you can delete sections using
+:meth:`Card.delete`:
+
+.. code-block:: python
+
+    section = card.select("Model description/Figures")
+    print(section.content)  # 'Here are some nice figures'
+    print(section.subsections)
+    card.delete("Model description/Figures/ROC")
+
+
 To see how you can use the API in ``skops`` to create a model card, please
 refer to :ref:`sphx_glr_auto_examples_plot_model_card.py`.
diff --git a/examples/plot_model_card.py b/examples/plot_model_card.py
index 46e9a8bc..7a5ff3b3 100644
--- a/examples/plot_model_card.py
+++ b/examples/plot_model_card.py
@@ -30,7 +30,7 @@
 from sklearn.model_selection import HalvingGridSearchCV, train_test_split
 
 from skops import hub_utils
-from skops.card._card_alternative import Card, metadata_from_config
+from skops.card import Card, metadata_from_config
 
 # %%
 # Data
diff --git a/skops/card/_card_alternative.py b/skops/card/_card_alternative.py
deleted file mode 100644
index 326f7d3e..00000000
--- a/skops/card/_card_alternative.py
+++ /dev/null
@@ -1,874 +0,0 @@
-from __future__ import annotations
-
-import re
-import sys
-import textwrap
-from dataclasses import dataclass, field
-from pathlib import Path
-from reprlib import Repr
-from typing import Any, Iterator, Sequence
-
-from huggingface_hub import CardData
-from sklearn.utils import estimator_html_repr
-from tabulate import tabulate  # type: ignore
-
-from skops.card import metadata_from_config
-from skops.card._model_card import PlotSection, TableSection
-
-if sys.version_info >= (3, 8):
-    from typing import Protocol  # pragma: no cover
-else:
-    from typing_extensions import Protocol  # pragma: no cover
-
-
-aRepr = Repr()
-aRepr.maxother = 79
-aRepr.maxstring = 79
-
-CONTENT_PLACEHOLDER = "[More Information Needed]"
-"""When there is a section but no content, show this"""
-
-DEFAULT_TEMPLATE = {
-    "Model description": CONTENT_PLACEHOLDER,
-    "Model description/Intended uses & limitations": CONTENT_PLACEHOLDER,
-    "Model description/Training Procedure": "",
-    "Model description/Training Procedure/Hyperparameters": CONTENT_PLACEHOLDER,
-    "Model description/Training Procedure/Model Plot": CONTENT_PLACEHOLDER,
-    "Model description/Evaluation Results": CONTENT_PLACEHOLDER,
-    "How to Get Started with the Model": CONTENT_PLACEHOLDER,
-    "Model Card Authors": (
-        f"This model card is written by following authors:\n\n{CONTENT_PLACEHOLDER}"
-    ),
-    "Model Card Contact": (
-        "You can contact the model card authors through following channels:\n"
-        f"{CONTENT_PLACEHOLDER}"
-    ),
-    "Citation": (
-        "Below you can find information related to citation.\n\n**BibTeX:**\n```\n"
-        f"{CONTENT_PLACEHOLDER}\n```"
-    ),
-}
-
-
-def split_subsection_names(key: str) -> list[str]:
-    r"""Split a string containing multiple sections into a list of strings for
-    each.
-
-    The separator is ``"/"``. To avoid splitting on ``"/"``, escape it using
-    ``"\\/"``.
-
-    Examples
-    --------
-    >>> split_subsection_names("Section A")
-    ['Section A']
-    >>> split_subsection_names("Section A/Section B/Section C")
-    ['Section A', 'Section B', 'Section C']
-    >>> split_subsection_names("A section containg \\/ a slash")
-    ['A section containg / a slash']
-    >>> split_subsection_names("Spaces are / stripped")
-    ['Spaces are', 'stripped']
-
-    Parameters
-    ----------
-    key : str
-        The section name consisting potentially of multiple subsections. It has
-        to be ensured beforhand that this is not an empty string.
-
-    Returns
-    -------
-    parts : list of str
-        The individual (sub)sections.
-
-    """
-    placeholder = "$%!?"  # arbitrary sting that never appears naturally
-    key = key.replace("\\/", placeholder)
-    parts = (part.strip() for part in key.split("/"))
-    return [part.replace(placeholder, "/") for part in parts]
-
-
-def _getting_started_code(
-    file_name: str, is_skops_format: bool = False, indent="    "
-) -> list[str]:
-    # get lines of code required to load the model
-    lines: list[str] = []
-    if is_skops_format:
-        lines += ["from skops.io import load"]
-    else:
-        lines += ["import joblib"]
-
-    lines += [
-        "import json",
-        "import pandas as pd",
-    ]
-    if is_skops_format:
-        lines += [
-            "from skops.io import load",
-            f'model = load("{file_name}")',
-        ]
-    else:  # pickle
-        lines += [f"model = joblib.load({file_name})"]
-
-    lines += [
-        'with open("config.json") as f:',
-        indent + "config = json.load(f)",
-        'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))',
-    ]
-    return lines
-
-
-def _clean_table(table: str) -> str:
-    # replace line breaks "\n" with html tag <br />, however, leave end-of-line
-    # line breaks (eol_lb) intact
-    eol_lb = "|\n"
-    placeholder = "$%!?"  # arbitrary sting that never appears naturally
-    table = (
-        table.replace(eol_lb, placeholder)
-        .replace("\n", "<br />")
-        .replace(placeholder, eol_lb)
-    )
-    return table
-
-
-@dataclass
-class Section:
-    """Building block of the model card.
-
-    The model card is represented internally as a dict with keys being strings
-    and values being Sections. The key is identical to the section title.
-
-    Additionally, the section may hold content in the form of strings (can be an
-    empty string) or a ``Formattable``, which is simply an object with a
-    ``format`` method that returns a string.
-
-    Finally, the section can contain subsections, which again are dicts of
-    string keys and section values (the dict can be empty). Therefore, the model
-    card representation forms a tree structure, making use of the fact that dict
-    order is preserved.
-
-    """
-
-    title: str
-    content: Formattable | str
-    subsections: dict[str, Section] = field(default_factory=dict)
-
-
-class Formattable(Protocol):
-    def format(self) -> str:
-        ...  # pragma: no cover
-
-
-class Card:
-    """Model card class that will be used to generate model card.
-
-    This class can be used to write information and plots to model card and save
-    it. This class by default generates an interactive plot of the model and a
-    table of hyperparameters. Some default sections are added by default.
-
-    Parameters
-    ----------
-    model: estimator object
-        Model that will be documented.
-
-    model_diagram: bool, default=True
-        Set to True if model diagram should be plotted in the card.
-
-    metadata: CardData, optional
-        ``CardData`` object. The contents of this object are saved as metadata
-        at the beginning of the output file, and used by Hugging Face Hub.
-
-        You can use :func:`~skops.card.metadata_from_config` to create an
-        instance pre-populated with necessary information based on the contents
-        of the ``config.json`` file, which itself is created by
-        :func:`skops.hub_utils.init`.
-
-    prefill: bool (default=True)
-        Whether to add default sections or not.
-
-    Attributes
-    ----------
-    model: estimator object
-        The scikit-learn compatible model that will be documented.
-
-    metadata: CardData
-        Metadata to be stored at the beginning of the saved model card, as
-        metadata to be understood by the Hugging Face Hub.
-
-    Examples
-    --------
-    >>> from sklearn.metrics import (
-    ...     ConfusionMatrixDisplay,
-    ...     confusion_matrix,
-    ...     accuracy_score,
-    ...     f1_score
-    ... )
-    >>> import tempfile
-    >>> from pathlib import Path
-    >>> from sklearn.datasets import load_iris
-    >>> from sklearn.linear_model import LogisticRegression
-    >>> from skops.card._card_alternative import Card  # TODO
-    >>> X, y = load_iris(return_X_y=True)
-    >>> model = LogisticRegression(solver="liblinear", random_state=0).fit(X, y)
-    >>> model_card = Card(model)
-    >>> model_card.metadata.license = "mit"
-    >>> y_pred = model.predict(X)
-    >>> model_card.add_metrics(**{
-    ...     "accuracy": accuracy_score(y, y_pred),
-    ...     "f1 score": f1_score(y, y_pred, average="micro"),
-    ... })
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-    )
-    >>> cm = confusion_matrix(y, y_pred,labels=model.classes_)
-    >>> disp = ConfusionMatrixDisplay(
-    ...     confusion_matrix=cm,
-    ...     display_labels=model.classes_
-    ... )
-    >>> disp.plot()
-    <sklearn.metrics._plot.confusion_matrix.ConfusionMatrixDisplay object at ...>
-    >>> tmp_path = Path(tempfile.mkdtemp(prefix="skops-"))
-    >>> disp.figure_.savefig(tmp_path / "confusion_matrix.png")
-    ...
-    >>> model_card.add_plot(**{
-    ...     "Model description/Confusion Matrix": tmp_path / "confusion_matrix.png"
-    ... })
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      Model description/Confusion Matrix=...confusion_matrix.png'),
-    )
-    >>> # add new content to the existing section "Model description"
-    >>> model_card.add(**{"Model description": "This is the best model"})
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description=This is the best model,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      Model description/Confusion Matrix=...confusion_matrix.png'),
-    )
-    >>> # add content to a new section
-    >>> model_card.add(**{"A new section": "Please rate my model"})
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description=This is the best model,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      Model description/Confusion Matrix=...confusion_matrix.png'),
-      A new section=Please rate my model,
-    )
-    >>> # add new subsection to an existing section by using "/"
-    >>> model_card.add(**{"Model description/Model name": "This model is called Bob"})
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description=This is the best model,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      Model description/Confusion Matrix=...confusion_matrix.png'),
-      Model description/Model name=This model is called Bob,
-      A new section=Please rate my model,
-    )
-    >>> # save the card to a README.md file
-    >>> model_card.save(tmp_path / "README.md")
-    """
-
-    def __init__(
-        self,
-        model,
-        model_diagram: bool = True,
-        metadata: CardData | None = None,
-        prefill: bool = True,
-    ):
-        self.model = model
-        self.model_diagram = model_diagram
-        self.metadata = metadata or CardData()
-
-        self._data: dict[str, Section] = {}
-        self._metrics: dict[str, str | float | int] = {}
-        if prefill:
-            self._fill_default_sections()
-            # TODO: This is for compatibility with old model card but having an
-            # empty table by default is kinda pointless
-            self.add_metrics()
-            self._reset()
-
-    def _reset(self) -> None:
-        model_file = self.metadata.to_dict().get("model_file")
-        if model_file:
-            self._add_get_started_code(model_file)
-
-        self._add_model_section()
-        self._add_hyperparams()
-
-    def _fill_default_sections(self) -> None:
-        self.add(**DEFAULT_TEMPLATE)
-
-    def add(self, **kwargs: str | Formattable) -> "Card":
-        """Add new section(s) to the model card.
-
-        Add one or multiple sections to the model card. The section names are
-        taken from the keys and the contents are taken from the values.
-
-        To add to an existing section, use a ``"/"`` in the section name, e.g.:
-
-        ``card.add(**{"Existing section/New section": "content"})``.
-
-        If the parent section does not exist, it will be added automatically.
-
-        To add a section with ``"/"`` in its title (i.e. not inteded as a
-        subsection), escape the slash like so, ``"\\/"``, e.g.:
-
-        ``card.add(**{"A section with\\/a slash in the title": "content"})``.
-
-        If a section of the given name already exists, its content will be
-        overwritten.
-
-        Parameters
-        ----------
-        **kwargs : dict
-            The keys of the dictionary serve as the section title and the values
-            as the section content. It's possible to add to existing sections.
-
-        Returns
-        -------
-        self : object
-            Card object.
-
-        """
-        for key, val in kwargs.items():
-            self._add_single(key, val)
-        return self
-
-    def _select(
-        self, subsection_names: Sequence[str], create: bool = True
-    ) -> dict[str, Section]:
-        section = self._data
-        if not subsection_names:
-            return section
-
-        for subsection_name in subsection_names:
-            section_maybe = section.get(subsection_name)
-
-            # there are already subsections
-            if section_maybe is not None:
-                section = section_maybe.subsections
-                continue
-
-            if create:
-                # no subsection, create
-                entry = Section(title=subsection_name, content="")
-                section[subsection_name] = entry
-                section = entry.subsections
-            else:
-                raise KeyError(f"Section {subsection_name} does not exist")
-
-        return section
-
-    def select(self, key: str | Sequence[str]) -> Section:
-        """Select a section from the model card.
-
-        To select a subsection of an existing section, use a ``"/"`` in the
-        section name, e.g.:
-
-        ``card.select("Existing section/New section")``.
-
-        Alternatively, a list of strings can be passed:
-
-        ``card.select(["Existing section", "New section"])``.
-
-        Parameters
-        ----------
-        key : str or list of str
-            The name of the (sub)section to select. When selecting a subsection,
-            either use a ``"/"`` in the name to separate the parent and child
-            sections, or pass a list of strings.
-
-        Returns
-        -------
-        self : Section
-            A dataclass containing all information relevant to the selected
-            section. Those are the title, the content, and subsections (in a
-            dict).
-
-        Raises
-        ------
-        KeyError
-            If the given section name was not found, a ``KeyError`` is raised.
-
-        """
-        if not key:
-            msg = f"Section name cannot be empty but got '{key}'"
-            raise KeyError(msg)
-
-        if isinstance(key, str):
-            *subsection_names, leaf_node_name = split_subsection_names(key)
-        else:
-            *subsection_names, leaf_node_name = key
-
-        if not leaf_node_name:
-            msg = f"Section name cannot be empty but got '{key}'"
-            raise KeyError(msg)
-
-        parent_section = self._select(subsection_names, create=False)
-        return parent_section[leaf_node_name]
-
-    def delete(self, key: str | Sequence[str]) -> None:
-        """Delete a section from the model card.
-
-        To delete a subsection of an existing section, use a ``"/"`` in the
-        section name, e.g.:
-
-        ``card.delete("Existing section/New section")``.
-
-        Alternatively, a list of strings can be passed:
-
-        ``card.delete(["Existing section", "New section"])``.
-
-        Parameters
-        ----------
-        key : str or list of str
-            The name of the (sub)section to select. When selecting a subsection,
-            either use a ``"/"`` in the name to separate the parent and child
-            sections, or pass a list of strings.
-
-        Raises
-        ------
-        KeyError
-            If the given section name was not found, a ``KeyError`` is raised.
-
-        """
-        if not key:
-            msg = f"Section name cannot be empty but got '{key}'"
-            raise KeyError(msg)
-
-        if isinstance(key, str):
-            *subsection_names, leaf_node_name = split_subsection_names(key)
-        else:
-            *subsection_names, leaf_node_name = key
-
-        if not leaf_node_name:
-            msg = f"Section name cannot be empty but got '{key}'"
-            raise KeyError(msg)
-
-        parent_section = self._select(subsection_names, create=False)
-        del parent_section[leaf_node_name]
-
-    def _add_single(self, key: str, val: Formattable | str) -> None:
-        *subsection_names, leaf_node_name = split_subsection_names(key)
-        section = self._select(subsection_names)
-
-        if leaf_node_name in section:
-            # entry exists, only overwrite content
-            section[leaf_node_name].content = val
-        else:
-            # entry does not exist, create a new one
-            section[leaf_node_name] = Section(title=leaf_node_name, content=val)
-
-    def _add_model_section(self) -> None:
-        section_title = "Model description/Training Procedure/Model Plot"
-        default_content = "The model plot is below."
-
-        if not self.model_diagram:
-            self._add_single(section_title, default_content)
-            return
-
-        model_plot_div = re.sub(r"\n\s+", "", str(estimator_html_repr(self.model)))
-        if model_plot_div.count("sk-top-container") == 1:
-            model_plot_div = model_plot_div.replace(
-                "sk-top-container", 'sk-top-container" style="overflow: auto;'
-            )
-        content = f"{default_content}\n\n{model_plot_div}"
-        self._add_single(section_title, content)
-
-    def _add_hyperparams(self) -> None:
-        hyperparameter_dict = self.model.get_params(deep=True)
-        table = _clean_table(
-            tabulate(
-                list(hyperparameter_dict.items()),
-                headers=["Hyperparameter", "Value"],
-                tablefmt="github",
-            )
-        )
-        template = textwrap.dedent(
-            """        The model is trained with below hyperparameters.
-
-        <details>
-        <summary> Click to expand </summary>
-
-        {}
-
-        </details>"""
-        )
-        self._add_single(
-            "Model description/Training Procedure/Hyperparameters",
-            template.format(table),
-        )
-
-    def add_plot(self, *, folded=False, **kwargs: str) -> "Card":
-        """Add plots to the model card.
-
-        The plot should be saved on the file system and the path passed as
-        value.
-
-        Parameters
-        ----------
-        folded: bool (default=False)
-            If set to ``True``, the plot will be enclosed in a ``details`` tag.
-            That means the content is folded by default and users have to click
-            to show the content. This option is useful if the added plot is
-            large.
-
-        **kwargs : dict
-            The arguments should be of the form ``name=plot_path``, where
-            ``name`` is the name of the plot and section, and ``plot_path`` is
-            the path to the plot on the file system, relative to the root of the
-            project. The plots should have already been saved under the
-            project's folder.
-
-        Returns
-        -------
-        self : object
-            Card object.
-
-        """
-        for section_name, plot_path in kwargs.items():
-            plot_name = split_subsection_names(section_name)[-1]
-            section = PlotSection(alt_text=plot_name, path=plot_path, folded=folded)
-            self._add_single(section_name, section)
-        return self
-
-    def add_table(
-        self, *, folded: bool = False, **kwargs: dict["str", list[Any]]
-    ) -> Card:
-        """Add a table to the model card.
-
-        Add a table to the model card. This can be especially useful when you
-        using cross validation with sklearn. E.g. you can directly pass the
-        result from calling :func:`sklearn.model_selection.cross_validate` or
-        the ``cv_results_`` attribute from any of the hyperparameter searches,
-        such as :class:`sklearn.model_selection.GridSearchCV`.
-
-        Morevoer, you can pass any pandas :class:`pandas.DataFrame` to this
-        method and it will be rendered in the model card. You may consider
-        selecting only a part of the table if it's too big:
-
-        .. code:: python
-
-            search = GridSearchCV(...)
-            search.fit(X, y)
-            df = pd.DataFrame(search.cv_results_)
-            # show only top 10 highest scores
-            df = df.sort_values(["mean_test_score"], ascending=False).head(10)
-            model_card = skops.card.Card(...)
-            model_card.add_table(**{"Hyperparameter search results top 10": df})
-
-        Parameters
-        ----------
-        folded: bool (default=False)
-            If set to ``True``, the table will be enclosed in a ``details`` tag.
-            That means the content is folded by default and users have to click
-            to show the content. This option is useful if the added table is
-            large.
-
-        **kwargs : dict
-            The keys should be strings, which will be used as the section
-            headers, and the values should be tables. Tables can be either dicts
-            with the key being strings that represent the column name, and the
-            values being lists that represent the entries for each row.
-            Alternatively, the table can be a :class:`pandas.DataFrame`. The
-            table must not be empty.
-
-        Returns
-        -------
-        self : object
-            Card object.
-
-        """
-        for key, val in kwargs.items():
-            section = TableSection(table=val, folded=folded)
-            self._add_single(key, section)
-        return self
-
-    def add_metrics(self, **kwargs: str | int | float) -> "Card":
-        """Add metric values to the model card.
-
-        Parameters
-        ----------
-        **kwargs : dict
-            A dictionary of the form ``{metric name: metric value}``.
-
-        Returns
-        -------
-        self : object
-            Card object.
-        """
-        self._metrics.update(kwargs)
-        self._add_metrics(self._metrics)
-        return self
-
-    def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
-        table = tabulate(
-            list(metrics.items()),
-            headers=["Metric", "Value"],
-            tablefmt="github",
-        )
-        template = textwrap.dedent(
-            """        You can find the details about evaluation process and the evaluation results.
-
-
-
-        {}"""
-        )
-        self._add_single("Model description/Evaluation Results", template.format(table))
-
-    def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
-        """Yield metadata in yaml format"""
-        for key, val in metadata.to_dict().items() if metadata else {}:
-            yield aRepr.repr(f"metadata.{key}={val},").strip('"').strip("'")
-
-    def _generate_content(
-        self, data: dict[str, Section], depth: int = 1
-    ) -> Iterator[str]:
-        """Yield title and (formatted) contents"""
-        for val in data.values():
-            title = f"{depth * '#'} {val.title}"
-            yield title
-
-            if isinstance(val.content, str):
-                yield val.content
-            else:  # is a Formattable
-                yield val.content.format()
-
-            if val.subsections:
-                yield from self._generate_content(val.subsections, depth=depth + 1)
-
-    def _iterate_content(
-        self, data: dict[str, Section], parent_section: str = ""
-    ) -> Iterator[tuple[str, Formattable | str]]:
-        """Yield tuples of title and (non-formatted) content"""
-        for val in data.values():
-            if parent_section:
-                title = "/".join((parent_section, val.title))
-            else:
-                title = val.title
-
-            yield title, val.content
-
-            if val.subsections:
-                yield from self._iterate_content(val.subsections, parent_section=title)
-
-    @staticmethod
-    def _format_repr(text: str) -> str:
-        # Remove new lines, multiple spaces, quotation marks, and cap line length
-        text = text.replace("\n", " ")
-        text = re.sub(r"\s+", r" ", text)
-        return aRepr.repr(text).strip('"').strip("'")
-
-    def __str__(self) -> str:
-        return self.__repr__()
-
-    def __repr__(self) -> str:
-        # repr for the model
-        model = getattr(self, "model", None)
-        if model:
-            model_repr = self._format_repr(f"model={repr(model)}")
-        else:
-            model_repr = None
-
-        # repr for metadata
-        metadata_reprs = []
-        for key, val in self.metadata.to_dict().items() if self.metadata else {}:
-            if key == "widget":
-                metadata_reprs.append("metadata.widget={...},")
-                continue
-
-            metadata_reprs.append(self._format_repr(f"metadata.{key}={val},"))
-        metadata_repr = "\n".join(metadata_reprs)
-
-        # repr for contents
-        content_reprs = []
-        for title, content in self._iterate_content(self._data):
-            if not content:
-                continue
-            if isinstance(content, str) and content.rstrip("`").rstrip().endswith(
-                CONTENT_PLACEHOLDER
-            ):
-                # if content is just some default text, no need to show it
-                continue
-            content_reprs.append(self._format_repr(f"{title}={content},"))
-        content_repr = "\n".join(content_reprs)
-
-        # combine all parts
-        complete_repr = "Card(\n"
-        if model_repr:
-            complete_repr += textwrap.indent(model_repr, "  ") + "\n"
-        if metadata_reprs:
-            complete_repr += textwrap.indent(metadata_repr, "  ") + "\n"
-        if content_reprs:
-            complete_repr += textwrap.indent(content_repr, "  ") + "\n"
-        complete_repr += ")"
-        return complete_repr
-
-    def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
-        is_skops_format = file_name.endswith(".skops")  # else, assume pickle
-        lines = _getting_started_code(
-            file_name, is_skops_format=is_skops_format, indent=indent
-        )
-        lines = ["```python"] + lines + ["```"]
-
-        template = textwrap.dedent(
-            """        Use the code below to get started with the model.
-
-        {}
-        """
-        )
-        self._add_single(
-            "How to Get Started with the Model", template.format("\n".join(lines))
-        )
-
-    def _generate_card(self) -> Iterator[str]:
-        if self.metadata.to_dict():
-            yield f"---\n{self.metadata.to_yaml()}\n---"
-
-        for line in self._generate_content(self._data):
-            if line:
-                yield "\n" + line
-
-        # add an empty line add the end
-        yield ""
-
-    def save(self, path: str | Path) -> None:
-        """Save the model card.
-
-        This method renders the model card in markdown format and then saves it
-        as the specified file.
-
-        Parameters
-        ----------
-        path: str, or Path
-            Filepath to save your card.
-
-        Notes
-        -----
-        The keys in model card metadata can be seen `here
-        <https://huggingface.co/docs/hub/models-cards#model-card-metadata>`__.
-        """
-        with open(path, "w", encoding="utf-8") as f:
-            f.write("\n".join(self._generate_card()))
-
-    def render(self) -> str:
-        """Render the final model card as a string.
-
-        Returns
-        -------
-        result : str
-            The rendered model card with all placeholders filled and all extra
-            sections inserted.
-        """
-        return "\n".join(self._generate_card())
-
-
-def main():  # pragma: no cover
-    # TODO: remove
-    import os
-    import pickle
-    import tempfile
-    from uuid import uuid4
-
-    import matplotlib.pyplot as plt
-    import sklearn
-    from huggingface_hub import HfApi
-    from sklearn.datasets import load_iris
-    from sklearn.linear_model import LogisticRegression
-    from sklearn.pipeline import Pipeline
-    from sklearn.preprocessing import StandardScaler
-
-    from skops import hub_utils
-
-    X, y = load_iris(return_X_y=True, as_frame=True)
-
-    model = Pipeline(
-        [("scaler", StandardScaler()), ("clf", LogisticRegression(random_state=123))]
-    ).fit(X, y)
-
-    pkl_file = tempfile.mkstemp(suffix=".pkl", prefix="skops-test")[1]
-    with open(pkl_file, "wb") as f:
-        pickle.dump(model, f)
-
-    with tempfile.TemporaryDirectory(prefix="skops-test") as destination_path:
-        hub_utils.init(
-            model=pkl_file,
-            requirements=[f"scikit-learn=={sklearn.__version__}"],
-            dst=destination_path,
-            task="tabular-classification",
-            data=X,
-        )
-        card = Card(model, metadata=metadata_from_config(destination_path))
-
-        # add a placeholder for figures
-        card.add(Plots="")
-
-        # add arbitrary sections, overwrite them, etc.
-        card.add(hi="howdy")
-        card.add(**{"parent section/child section": "child content"})
-        card.add(**{"foo": "bar", "spam": "eggs"})
-        # add section with a "/" in title
-        card.add(**{"A section with a \\/ in the title": "This works"})
-        # change content of "hi" section
-        card.add(**{"hi/german": "guten tag", "hi/french": "salut"})
-        card.add(**{"very/deeply/nested/section": "but why?"})
-
-        # add metrics
-        card.add_metrics(**{"acc": 0.1})
-
-        # insert the plot in the "Plot" section created above
-        plt.plot([4, 5, 6, 7])
-        plt.savefig(Path(destination_path) / "fig1.png")
-        card.add_plot(**{"Plots/A beautiful plot": "fig1.png"})
-
-        # add table
-        table = {"split": [1, 2, 3], "score": [4, 5, 6]}
-        card.add_table(
-            folded=True,
-            **{"Model description/Training Procedure/Yet another table": table},
-        )
-
-        # more metrics
-        card.add_metrics(**{"f1": 0.2, "roc": 123})
-
-        # add content for "Model description" section, which has subsections but
-        # otherwise no content
-        card.add(**{"Model description": "This is a fantastic model"})
-
-        card.save(Path(destination_path) / "README.md")
-        print(destination_path)
-
-        # pushing to Hub
-        token = os.environ["HF_HUB_TOKEN"]
-        repo_name = f"hf_hub_example-{uuid4()}"
-        user_name = HfApi().whoami(token=token)["name"]
-        repo_id = f"{user_name}/{repo_name}"
-        print(f"Creating and pushing to repo: {repo_id}")
-        hub_utils.push(
-            repo_id=repo_id,
-            source=destination_path,
-            token=token,
-            commit_message="testing model cards",
-            create_remote=True,
-            private=False,
-        )
-
-
-if __name__ == "__main__":
-    main()  # pragma: no cover
diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index a7d10dec..aa19982a 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -1,20 +1,22 @@
 from __future__ import annotations
 
-import copy
 import json
 import re
-import shutil
-import tempfile
-from dataclasses import dataclass
+import sys
+import textwrap
+from dataclasses import dataclass, field
 from pathlib import Path
 from reprlib import Repr
-from typing import Any, Optional, Union
+from typing import Any, Iterator, Sequence, Union
 
-from huggingface_hub import CardData, ModelCard
+from huggingface_hub import CardData
 from sklearn.utils import estimator_html_repr
 from tabulate import tabulate  # type: ignore
 
-import skops
+if sys.version_info >= (3, 8):
+    from typing import Protocol
+else:
+    from typing_extensions import Protocol
 
 # Repr attributes can be used to control the behavior of repr
 aRepr = Repr()
@@ -22,6 +24,31 @@
 aRepr.maxstring = 79
 
 
+CONTENT_PLACEHOLDER = "[More Information Needed]"
+"""When there is a section but no content, show this"""
+
+DEFAULT_TEMPLATE = {
+    "Model description": CONTENT_PLACEHOLDER,
+    "Model description/Intended uses & limitations": CONTENT_PLACEHOLDER,
+    "Model description/Training Procedure": "",
+    "Model description/Training Procedure/Hyperparameters": CONTENT_PLACEHOLDER,
+    "Model description/Training Procedure/Model Plot": CONTENT_PLACEHOLDER,
+    "Model description/Evaluation Results": CONTENT_PLACEHOLDER,
+    "How to Get Started with the Model": CONTENT_PLACEHOLDER,
+    "Model Card Authors": (
+        f"This model card is written by following authors:\n\n{CONTENT_PLACEHOLDER}"
+    ),
+    "Model Card Contact": (
+        "You can contact the model card authors through following channels:\n"
+        f"{CONTENT_PLACEHOLDER}"
+    ),
+    "Citation": (
+        "Below you can find information related to citation.\n\n**BibTeX:**\n```\n"
+        f"{CONTENT_PLACEHOLDER}\n```"
+    ),
+}
+
+
 def wrap_as_details(text: str, folded: bool) -> str:
     if not folded:
         return text
@@ -162,13 +189,106 @@ def metadata_from_config(config_path: Union[str, Path]) -> CardData:
     return card_data
 
 
+def split_subsection_names(key: str) -> list[str]:
+    r"""Split a string containing multiple sections into a list of strings for
+    each.
+
+    The separator is ``"/"``. To avoid splitting on ``"/"``, escape it using
+    ``"\\/"``.
+
+    Examples
+    --------
+    >>> split_subsection_names("Section A")
+    ['Section A']
+    >>> split_subsection_names("Section A/Section B/Section C")
+    ['Section A', 'Section B', 'Section C']
+    >>> split_subsection_names("A section containing \\/ a slash")
+    ['A section containing / a slash']
+    >>> split_subsection_names("Spaces are / stripped")
+    ['Spaces are', 'stripped']
+
+    Parameters
+    ----------
+    key : str
+        The section name consisting potentially of multiple subsections. It has
+        to be ensured beforehand that this is not an empty string.
+
+    Returns
+    -------
+    parts : list of str
+        The individual (sub)sections.
+
+    """
+    placeholder = "$%!?"  # arbitrary string assumed not to occur in real titles
+    key = key.replace("\\/", placeholder)
+    parts = (part.strip() for part in key.split("/"))
+    return [part.replace(placeholder, "/") for part in parts]
+
+
+def _getting_started_code(
+    file_name: str, is_skops_format: bool = False, indent="    "
+) -> list[str]:
+    """Return the lines of a code snippet that loads the model and predicts.
+
+    ``file_name`` is embedded in the snippet as a quoted string literal.
+    ``is_skops_format`` selects ``skops.io.load`` over ``joblib.load``, and
+    ``indent`` is the indentation used inside the generated ``with`` block.
+
+    The loader import is emitted exactly once, as the first line.
+    """
+    if is_skops_format:
+        load_import = "from skops.io import load"
+        load_call = f'model = load("{file_name}")'
+    else:  # pickle
+        load_import = "import joblib"
+        # quote the file name, otherwise the snippet is not valid Python
+        load_call = f'model = joblib.load("{file_name}")'
+
+    return [
+        load_import,
+        "import json",
+        "import pandas as pd",
+        load_call,
+        'with open("config.json") as f:',
+        indent + "config = json.load(f)",
+        'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))',
+    ]
+
+
+@dataclass
+class Section:
+    """Building block of the model card.
+
+    The model card is represented internally as a dict with keys being strings
+    and values being Sections. The key is identical to the section title.
+
+    Additionally, the section may hold content in the form of strings (can be an
+    empty string) or a ``Formattable``, which is simply an object with a
+    ``format`` method that returns a string.
+
+    Finally, the section can contain subsections, which again are dicts of
+    string keys and section values (the dict can be empty). Therefore, the model
+    card representation forms a tree structure, making use of the fact that dict
+    order is preserved.
+
+    """
+
+    title: str
+    content: Formattable | str
+    subsections: dict[str, Section] = field(default_factory=dict)
+
+
+class Formattable(Protocol):
+    def format(self) -> str:
+        ...  # pragma: no cover
+
+
 class Card:
     """Model card class that will be used to generate model card.
 
     This class can be used to write information and plots to model card and save
     it. This class by default generates an interactive plot of the model and a
-    table of hyperparameters. The slots to be filled are defined in the markdown
-    template.
+    table of hyperparameters. Some sections are added by default.
 
     Parameters
     ----------
@@ -187,6 +307,9 @@ class Card:
         of the ``config.json`` file, which itself is created by
         :func:`skops.hub_utils.init`.
 
+    prefill: bool (default=True)
+        Whether to add default sections or not.
+
     Attributes
     ----------
     model: estimator object
@@ -196,13 +319,6 @@ class Card:
         Metadata to be stored at the beginning of the saved model card, as
         metadata to be understood by the Hugging Face Hub.
 
-    Notes
-    -----
-    The contents of the sections of the template can be set using
-    :meth:`Card.add` method. Plots can be added to the model card using
-    :meth:`Card.add_plot`. The key you pass to :meth:`Card.add_plot` will be
-    used as the header of the plot.
-
     Examples
     --------
     >>> from sklearn.metrics import (
@@ -215,10 +331,10 @@ class Card:
     >>> from pathlib import Path
     >>> from sklearn.datasets import load_iris
     >>> from sklearn.linear_model import LogisticRegression
-    >>> from skops import card
+    >>> from skops.card import Card
     >>> X, y = load_iris(return_X_y=True)
     >>> model = LogisticRegression(solver="liblinear", random_state=0).fit(X, y)
-    >>> model_card = card.Card(model)
+    >>> model_card = Card(model)
     >>> model_card.metadata.license = "mit"
     >>> y_pred = model.predict(X)
     >>> model_card.add_metrics(**{
@@ -226,8 +342,11 @@ class Card:
     ...     "f1 score": f1_score(y, y_pred, average="micro"),
     ... })
     Card(
-      model=LogisticRegression(random_state=0, solver='liblinear'),
+      model=LogisticRegression(random_state=0, solver='liblinear')
       metadata.license=mit,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
     )
     >>> cm = confusion_matrix(y, y_pred,labels=model.classes_)
     >>> disp = ConfusionMatrixDisplay(
@@ -236,52 +355,298 @@ class Card:
     ... )
     >>> disp.plot()
     <sklearn.metrics._plot.confusion_matrix.ConfusionMatrixDisplay object at ...>
-    >>> disp.figure_.savefig("confusion_matrix.png")
+    >>> tmp_path = Path(tempfile.mkdtemp(prefix="skops-"))
+    >>> disp.figure_.savefig(tmp_path / "confusion_matrix.png")
     ...
-    >>> model_card.add_plot(confusion_matrix="confusion_matrix.png")
+    >>> model_card.add_plot(**{
+    ...     "Model description/Confusion Matrix": tmp_path / "confusion_matrix.png"
+    ... })
     Card(
-      model=LogisticRegression(random_state=0, solver='liblinear'),
+      model=LogisticRegression(random_state=0, solver='liblinear')
       metadata.license=mit,
-      confusion_matrix='confusion_matrix.png',
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      Model description/Confusion Matrix=...confusion_matrix.png'),
     )
-    >>> with tempfile.TemporaryDirectory() as tmpdir:
-    ...     model_card.save((Path(tmpdir) / "README.md"))
+    >>> # add new content to the existing section "Model description"
+    >>> model_card.add(**{"Model description": "This is the best model"})
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description=This is the best model,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      Model description/Confusion Matrix=...confusion_matrix.png'),
+    )
+    >>> # add content to a new section
+    >>> model_card.add(**{"A new section": "Please rate my model"})
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description=This is the best model,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      Model description/Confusion Matrix=...confusion_matrix.png'),
+      A new section=Please rate my model,
+    )
+    >>> # add new subsection to an existing section by using "/"
+    >>> model_card.add(**{"Model description/Model name": "This model is called Bob"})
+    Card(
+      model=LogisticRegression(random_state=0, solver='liblinear')
+      metadata.license=mit,
+      Model description=This is the best model,
+      Model description/Training Procedure/... | | warm_start | False | </details>,
+      Model description/Training Procedure/...</pre></div></div></div></div></div>,
+      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
+      Model description/Confusion Matrix=...confusion_matrix.png'),
+      Model description/Model name=This model is called Bob,
+      A new section=Please rate my model,
+    )
+    >>> # save the card to a README.md file
+    >>> model_card.save(tmp_path / "README.md")
     """
 
     def __init__(
         self,
-        model: Any,
+        model,
         model_diagram: bool = True,
-        metadata: Optional[CardData] = None,
+        metadata: CardData | None = None,
+        prefill: bool = True,
     ) -> None:
         self.model = model
         self.model_diagram = model_diagram
-        self._eval_results = {}  # type: ignore
-        self._template_sections: dict[str, str] = {}
-        self._extra_sections: list[tuple[str, Any]] = []
         self.metadata = metadata or CardData()
 
-    def add(self, **kwargs: str) -> "Card":
-        """Takes values to fill model card template.
+        self._data: dict[str, Section] = {}
+        self._metrics: dict[str, str | float | int] = {}
+        if prefill:
+            self._fill_default_sections()
+            # TODO: This is for parity with old model card but having an empty
+            # table by default is kinda pointless
+            self.add_metrics()
+            self._reset()
+
+    def _reset(self) -> None:
+        model_file = self.metadata.to_dict().get("model_file")
+        if model_file:
+            self._add_get_started_code(model_file)
+
+        self._add_model_section()
+        self._add_hyperparams()
+
+    def _fill_default_sections(self) -> None:
+        self.add(**DEFAULT_TEMPLATE)
+
+    def add(self, **kwargs: str | Formattable) -> "Card":
+        """Add new section(s) to the model card.
+
+        Add one or multiple sections to the model card. The section names are
+        taken from the keys and the contents are taken from the values.
+
+        To add to an existing section, use a ``"/"`` in the section name, e.g.:
+
+        ``card.add(**{"Existing section/New section": "content"})``.
+
+        If the parent section does not exist, it will be added automatically.
+
+        To add a section with ``"/"`` in its title (i.e. not intended as a
+        subsection), escape the slash like so, ``"\\/"``, e.g.:
+
+        ``card.add(**{"A section with\\/a slash in the title": "content"})``.
+
+        If a section of the given name already exists, its content will be
+        overwritten.
 
         Parameters
         ----------
         **kwargs : dict
-            Parameters to be set for the model card. These parameters
-            need to be sections of the underlying `jinja` template used.
+            The keys of the dictionary serve as the section title and the values
+            as the section content. It's possible to add to existing sections.
 
         Returns
         -------
         self : object
             Card object.
+
         """
-        for section, value in kwargs.items():
-            self._template_sections[section] = value
+        for key, val in kwargs.items():
+            self._add_single(key, val)
         return self
 
-    def add_plot(self, folded=False, **kwargs: str) -> "Card":
+    def _select(
+        self, subsection_names: Sequence[str], create: bool = True
+    ) -> dict[str, Section]:
+        section = self._data
+        if not subsection_names:
+            return section
+
+        for subsection_name in subsection_names:
+            section_maybe = section.get(subsection_name)
+
+            # there are already subsections
+            if section_maybe is not None:
+                section = section_maybe.subsections
+                continue
+
+            if create:
+                # no subsection, create
+                entry = Section(title=subsection_name, content="")
+                section[subsection_name] = entry
+                section = entry.subsections
+            else:
+                raise KeyError(f"Section {subsection_name} does not exist")
+
+        return section
+
+    def select(self, key: str | Sequence[str]) -> Section:
+        """Select a section from the model card.
+
+        To select a subsection of an existing section, use a ``"/"`` in the
+        section name, e.g.:
+
+        ``card.select("Existing section/New section")``.
+
+        Alternatively, a list of strings can be passed:
+
+        ``card.select(["Existing section", "New section"])``.
+
+        Parameters
+        ----------
+        key : str or list of str
+            The name of the (sub)section to select. When selecting a subsection,
+            either use a ``"/"`` in the name to separate the parent and child
+            sections, or pass a list of strings.
+
+        Returns
+        -------
+        section : Section
+            A dataclass containing all information relevant to the selected
+            section. Those are the title, the content, and subsections (in a
+            dict).
+
+        Raises
+        ------
+        KeyError
+            If the given section name was not found, a ``KeyError`` is raised.
+
+        """
+        if not key:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
+
+        if isinstance(key, str):
+            *subsection_names, leaf_node_name = split_subsection_names(key)
+        else:
+            *subsection_names, leaf_node_name = key
+
+        if not leaf_node_name:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
+
+        parent_section = self._select(subsection_names, create=False)
+        return parent_section[leaf_node_name]
+
+    def delete(self, key: str | Sequence[str]) -> None:
+        """Delete a section from the model card.
+
+        To delete a subsection of an existing section, use a ``"/"`` in the
+        section name, e.g.:
+
+        ``card.delete("Existing section/New section")``.
+
+        Alternatively, a list of strings can be passed:
+
+        ``card.delete(["Existing section", "New section"])``.
+
+        Parameters
+        ----------
+        key : str or list of str
+            The name of the (sub)section to delete. When deleting a subsection,
+            either use a ``"/"`` in the name to separate the parent and child
+            sections, or pass a list of strings.
+
+        Raises
+        ------
+        KeyError
+            If the given section name was not found, a ``KeyError`` is raised.
+
+        """
+        if not key:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
+
+        if isinstance(key, str):
+            *subsection_names, leaf_node_name = split_subsection_names(key)
+        else:
+            *subsection_names, leaf_node_name = key
+
+        if not leaf_node_name:
+            msg = f"Section name cannot be empty but got '{key}'"
+            raise KeyError(msg)
+
+        parent_section = self._select(subsection_names, create=False)
+        del parent_section[leaf_node_name]
+
+    def _add_single(self, key: str, val: Formattable | str) -> None:
+        *subsection_names, leaf_node_name = split_subsection_names(key)
+        section = self._select(subsection_names)
+
+        if leaf_node_name in section:
+            # entry exists, only overwrite content
+            section[leaf_node_name].content = val
+        else:
+            # entry does not exist, create a new one
+            section[leaf_node_name] = Section(title=leaf_node_name, content=val)
+
+    def _add_model_section(self) -> None:
+        section_title = "Model description/Training Procedure/Model Plot"
+        default_content = "The model plot is below."
+
+        if not self.model_diagram:
+            self._add_single(section_title, default_content)
+            return
+
+        model_plot_div = re.sub(r"\n\s+", "", str(estimator_html_repr(self.model)))
+        if model_plot_div.count("sk-top-container") == 1:
+            model_plot_div = model_plot_div.replace(
+                "sk-top-container", 'sk-top-container" style="overflow: auto;'
+            )
+        content = f"{default_content}\n\n{model_plot_div}"
+        self._add_single(section_title, content)
+
+    def _add_hyperparams(self) -> None:
+        hyperparameter_dict = self.model.get_params(deep=True)
+        table = _clean_table(
+            tabulate(
+                list(hyperparameter_dict.items()),
+                headers=["Hyperparameter", "Value"],
+                tablefmt="github",
+            )
+        )
+        template = textwrap.dedent(
+            """        The model is trained with below hyperparameters.
+
+        <details>
+        <summary> Click to expand </summary>
+
+        {}
+
+        </details>"""
+        )
+        self._add_single(
+            "Model description/Training Procedure/Hyperparameters",
+            template.format(table),
+        )
+
+    def add_plot(self, *, folded=False, **kwargs: str) -> "Card":
         """Add plots to the model card.
 
+        The plot should be saved on the file system and the path passed as
+        value.
+
         Parameters
         ----------
         folded: bool (default=False)
@@ -291,22 +656,27 @@ def add_plot(self, folded=False, **kwargs: str) -> "Card":
             large.
 
         **kwargs : dict
-            The arguments should be of the form `name=plot_path`, where `name`
-            is the name of the plot and `plot_path` is the path to the plot,
-            relative to the root of the project. The plots should have already
-            been saved under the project's folder.
+            The arguments should be of the form ``name=plot_path``, where
+            ``name`` is the name of the plot and section, and ``plot_path`` is
+            the path to the plot on the file system, relative to the root of the
+            project. The plots should have already been saved under the
+            project's folder.
 
         Returns
         -------
         self : object
             Card object.
+
         """
-        for plot_name, plot_path in kwargs.items():
+        for section_name, plot_path in kwargs.items():
+            plot_name = split_subsection_names(section_name)[-1]
             section = PlotSection(alt_text=plot_name, path=plot_path, folded=folded)
-            self._extra_sections.append((plot_name, section))
+            self._add_single(section_name, section)
         return self
 
-    def add_table(self, folded: bool = False, **kwargs: dict["str", list[Any]]) -> Card:
+    def add_table(
+        self, *, folded: bool = False, **kwargs: dict["str", list[Any]]
+    ) -> Card:
         """Add a table to the model card.
 
         Add a table to the model card. This can be especially useful when you
@@ -353,212 +723,183 @@ def add_table(self, folded: bool = False, **kwargs: dict["str", list[Any]]) -> C
         """
         for key, val in kwargs.items():
             section = TableSection(table=val, folded=folded)
-            self._extra_sections.append((key, section))
+            self._add_single(key, section)
         return self
 
-    def add_metrics(self, **kwargs: str) -> "Card":
+    def add_metrics(self, **kwargs: str | int | float) -> "Card":
         """Add metric values to the model card.
 
         Parameters
         ----------
         **kwargs : dict
-            A dictionary of the form `{metric name: metric value}`.
+            A dictionary of the form ``{metric name: metric value}``.
 
         Returns
         -------
         self : object
             Card object.
         """
-        for metric, value in kwargs.items():
-            self._eval_results[metric] = value
+        self._metrics.update(kwargs)
+        self._add_metrics(self._metrics)
         return self
 
-    def _generate_card(self) -> ModelCard:
-        """Generate the ModelCard object
-
-        Returns
-        -------
-        card : huggingface_hub.ModelCard
-            The final :class:`huggingface_hub.ModelCard` object with all
-            placeholders filled and all extra sections inserted.
-        """
-        root = skops.__path__
-
-        # add evaluation results
-
-        template_sections = copy.deepcopy(self._template_sections)
-
-        if self.metadata:
-            if self.metadata.to_dict().get("model_file"):
-                model_file = self.metadata.to_dict().get("model_file")
-                if model_file.endswith(".skops"):
-                    template_sections["get_started_code"] = (
-                        "from skops.io import load\nimport json\n"
-                        "import pandas as pd\n"
-                        f'model = load("{model_file}")\n'
-                        'with open("config.json") as f:\n   '
-                        " config ="
-                        " json.load(f)\n"
-                        'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))'
-                    )
-                else:
-                    template_sections["get_started_code"] = (
-                        "import joblib\nimport json\nimport pandas as pd\nmodel ="
-                        f' joblib.load({model_file})\nwith open("config.json") as'
-                        " f:\n   "
-                        " config ="
-                        " json.load(f)\n"
-                        'model.predict(pd.DataFrame.from_dict(config["sklearn"]["example_input"]))'
-                    )
-        if self.model_diagram is True:
-            model_plot_div = re.sub(r"\n\s+", "", str(estimator_html_repr(self.model)))
-            if model_plot_div.count("sk-top-container") == 1:
-                model_plot_div = model_plot_div.replace(
-                    "sk-top-container", 'sk-top-container" style="overflow: auto;'
-                )
-            model_plot: str | None = model_plot_div
-        else:
-            model_plot = None
-
-        template_sections["eval_results"] = tabulate(
-            list(self._eval_results.items()),
+    def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
+        table = tabulate(
+            list(metrics.items()),
             headers=["Metric", "Value"],
             tablefmt="github",
         )
+        template = textwrap.dedent(
+            """        You can find the details about evaluation process and the evaluation results.
 
-        # if template path is not given, use default
-        if template_sections.get("template_path") is None:
-            template_sections["template_path"] = str(
-                Path(root[0]) / "card" / "default_template.md"
-            )
-
-        # copying the template so that the original template is not touched/changed
-        # append plot_name if any plots are provided, at the end of the template
-        with tempfile.TemporaryDirectory() as tmpdirname:
-            shutil.copyfile(
-                template_sections["template_path"],
-                f"{tmpdirname}/temporary_template.md",
-            )
-            #  create a temporary template with the additional plots
-            template_sections["template_path"] = f"{tmpdirname}/temporary_template.md"
-            # add extra sections at the end of the template
-            with open(template_sections["template_path"], "a") as template:
-                if self._extra_sections:
-                    template.write("\n\n# Additional Content\n")
-
-                for key, val in self._extra_sections:
-                    formatted = val.format()
-                    template.write(f"\n## {key}\n\n{formatted}\n")
-
-            card = ModelCard.from_template(
-                card_data=self.metadata,
-                hyperparameter_table=self._extract_estimator_config(),
-                model_plot=model_plot,
-                **template_sections,
-            )
-        return card
-
-    def save(self, path: str | Path) -> None:
-        """Save the model card.
-
-        This method renders the model card in markdown format and then saves it
-        as the specified file.
-
-        Parameters
-        ----------
-        path: str, or Path
-            Filepath to save your card.
-
-        Notes
-        -----
-        The keys in model card metadata can be seen `here
-        <https://huggingface.co/docs/hub/models-cards#model-card-metadata>`__.
-        """
-        card = self._generate_card()
-        card.save(path)
-
-    def render(self) -> str:
-        """Render the final model card as a string.
-
-        Returns
-        -------
-        card : str
-            The rendered model card with all placeholders filled and all extra
-            sections inserted.
-        """
-        card = self._generate_card()
-        return str(card)
 
-    def _extract_estimator_config(self) -> str:
-        """Extracts estimator hyperparameters and renders them into a vertical table.
 
-        Returns
-        -------
-        str:
-            Markdown table of hyperparameters.
-        """
-        hyperparameter_dict = self.model.get_params(deep=True)
-        return _clean_table(
-            tabulate(
-                list(hyperparameter_dict.items()),
-                headers=["Hyperparameter", "Value"],
-                tablefmt="github",
-            )
+        {}"""
         )
+        self._add_single("Model description/Evaluation Results", template.format(table))
+
+    def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
+        """Yield one abbreviated ``metadata.<key>=<value>,`` repr per metadata item"""
+        for key, val in metadata.to_dict().items() if metadata else {}:
+            yield aRepr.repr(f"metadata.{key}={val},").strip('"').strip("'")
+
+    def _generate_content(
+        self, data: dict[str, Section], depth: int = 1
+    ) -> Iterator[str]:
+        """Yield title and (formatted) contents"""
+        for val in data.values():
+            title = f"{depth * '#'} {val.title}"
+            yield title
+
+            if isinstance(val.content, str):
+                yield val.content
+            else:  # is a Formattable
+                yield val.content.format()
+
+            if val.subsections:
+                yield from self._generate_content(val.subsections, depth=depth + 1)
+
+    def _iterate_content(
+        self, data: dict[str, Section], parent_section: str = ""
+    ) -> Iterator[tuple[str, Formattable | str]]:
+        """Yield tuples of title and (non-formatted) content"""
+        for val in data.values():
+            if parent_section:
+                title = "/".join((parent_section, val.title))
+            else:
+                title = val.title
+
+            yield title, val.content
+
+            if val.subsections:
+                yield from self._iterate_content(val.subsections, parent_section=title)
 
     @staticmethod
-    def _strip_blank(text) -> str:
-        # remove new lines and multiple spaces
+    def _format_repr(text: str) -> str:
+        # Remove new lines, multiple spaces, quotation marks, and cap line length
         text = text.replace("\n", " ")
         text = re.sub(r"\s+", r" ", text)
-        return text
+        return aRepr.repr(text).strip('"').strip("'")
 
     def __str__(self) -> str:
         return self.__repr__()
 
     def __repr__(self) -> str:
-        # create repr for model
+        # repr for the model
         model = getattr(self, "model", None)
         if model:
-            model_str = self._strip_blank(repr(model))
-            model_repr = aRepr.repr(f"  model={model_str},").strip('"').strip("'")
+            model_repr = self._format_repr(f"model={repr(model)}")
         else:
             model_repr = None
 
-        # metadata
+        # repr for metadata
         metadata_reprs = []
         for key, val in self.metadata.to_dict().items() if self.metadata else {}:
             if key == "widget":
-                metadata_reprs.append("  metadata.widget={...},")
+                metadata_reprs.append("metadata.widget={...},")
                 continue
 
-            metadata_reprs.append(
-                aRepr.repr(f"  metadata.{key}={val},").strip('"').strip("'")
-            )
+            metadata_reprs.append(self._format_repr(f"metadata.{key}={val},"))
         metadata_repr = "\n".join(metadata_reprs)
 
-        # normal sections
-        template_reprs = []
-        for key, val in self._template_sections.items():
-            val = self._strip_blank(repr(val))
-            template_reprs.append(aRepr.repr(f"  {key}={val},").strip('"').strip("'"))
-        template_repr = "\n".join(template_reprs)
-
-        # figures
-        figure_reprs = []
-        for key, val in self._extra_sections:
-            val = self._strip_blank(repr(val))
-            figure_reprs.append(aRepr.repr(f"  {key}={val},").strip('"').strip("'"))
-        figure_repr = "\n".join(figure_reprs)
+        # repr for contents
+        content_reprs = []
+        for title, content in self._iterate_content(self._data):
+            if not content:
+                continue
+            if isinstance(content, str) and content.rstrip("`").rstrip().endswith(
+                CONTENT_PLACEHOLDER
+            ):
+                # if content is just some default text, no need to show it
+                continue
+            content_reprs.append(self._format_repr(f"{title}={content},"))
+        content_repr = "\n".join(content_reprs)
 
+        # combine all parts
         complete_repr = "Card(\n"
         if model_repr:
-            complete_repr += model_repr + "\n"
+            complete_repr += textwrap.indent(model_repr, "  ") + "\n"
         if metadata_reprs:
-            complete_repr += metadata_repr + "\n"
-        if template_repr:
-            complete_repr += template_repr + "\n"
-        if figure_repr:
-            complete_repr += figure_repr + "\n"
+            complete_repr += textwrap.indent(metadata_repr, "  ") + "\n"
+        if content_reprs:
+            complete_repr += textwrap.indent(content_repr, "  ") + "\n"
         complete_repr += ")"
         return complete_repr
+
+    def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
+        is_skops_format = file_name.endswith(".skops")  # else, assume pickle
+        lines = _getting_started_code(
+            file_name, is_skops_format=is_skops_format, indent=indent
+        )
+        lines = ["```python"] + lines + ["```"]
+
+        template = textwrap.dedent(
+            """        Use the code below to get started with the model.
+
+        {}
+        """
+        )
+        self._add_single(
+            "How to Get Started with the Model", template.format("\n".join(lines))
+        )
+
+    def _generate_card(self) -> Iterator[str]:
+        if self.metadata.to_dict():
+            yield f"---\n{self.metadata.to_yaml()}\n---"
+
+        for line in self._generate_content(self._data):
+            if line:
+                yield "\n" + line
+
+        # add an empty line at the end
+        yield ""
+
+    def save(self, path: str | Path) -> None:
+        """Save the model card.
+
+        This method renders the model card in markdown format and then saves it
+        as the specified file.
+
+        Parameters
+        ----------
+        path: str, or Path
+            Filepath to save your card.
+
+        Notes
+        -----
+        The keys in model card metadata can be seen `here
+        <https://huggingface.co/docs/hub/models-cards#model-card-metadata>`__.
+        """
+        with open(path, "w", encoding="utf-8") as f:
+            f.write("\n".join(self._generate_card()))
+
+    def render(self) -> str:
+        """Render the final model card as a string.
+
+        Returns
+        -------
+        result : str
+            The rendered model card with all placeholders filled and all extra
+            sections inserted.
+        """
+        return "\n".join(self._generate_card())
diff --git a/skops/card/tests/test_card.py b/skops/card/tests/test_card.py
index 4cb6d4ec..f9ba237b 100644
--- a/skops/card/tests/test_card.py
+++ b/skops/card/tests/test_card.py
@@ -1,7 +1,7 @@
-import copy
 import os
 import pickle
 import tempfile
+import textwrap
 from pathlib import Path
 
 import matplotlib.pyplot as plt
@@ -11,11 +11,11 @@
 from huggingface_hub import CardData, metadata_load
 from sklearn.datasets import load_iris
 from sklearn.linear_model import LinearRegression, LogisticRegression
+from sklearn.tree import DecisionTreeClassifier
 
-import skops
 from skops import hub_utils
-from skops.card import Card, metadata_from_config
-from skops.card._model_card import PlotSection, TableSection
+from skops.card import metadata_from_config
+from skops.card._model_card import Card, PlotSection, TableSection
 from skops.io import dump
 
 
@@ -111,9 +111,45 @@ def test_save_model_card(destination_path, model_card):
     assert (Path(destination_path) / "README.md").exists()
 
 
-def test_hyperparameter_table(destination_path, model_card):
-    model_card = model_card.render()
-    assert "fit_intercept" in model_card
+def test_hyperparameter_table(model_card):
+    section_name = "Model description/Training Procedure/Hyperparameters"
+    result = model_card.select(section_name).content
+
+    lines = [
+        "The model is trained with below hyperparameters.",
+        "",
+        "<details>",
+        "<summary> Click to expand </summary>",
+        "",
+        "| Hyperparameter   | Value   |",
+        "|------------------|---------|",
+        "| copy_X           | True    |",
+        "| fit_intercept    | True    |",
+        "| n_jobs           |         |",
+        "| normalize        | False   |",
+        "| positive         | False   |",
+        "",
+        "</details>",
+    ]
+    # TODO: remove when dropping sklearn v0.24 and when dropping v1.1 and
+    # below. This is because the "normalize" parameter was changed after
+    # v0.24 and will be removed completely in sklearn v1.2.
+    major, minor, *_ = sklearn.__version__.split(".")
+    major, minor = int(major), int(minor)
+    if (major >= 1) and (minor < 2):
+        lines[10] = "| normalize        | deprecated |"
+    elif (major >= 1) and (minor >= 2):
+        del lines[10]
+    expected = "\n".join(lines)
+
+    # remove multiple whitespaces and dashes, as they're not important and may
+    # differ depending on OS
+    expected = _strip_multiple_chars(expected, " ")
+    expected = _strip_multiple_chars(expected, "-")
+    result = _strip_multiple_chars(result, " ")
+    result = _strip_multiple_chars(result, "-")
+
+    assert result == expected
 
 
 def _strip_multiple_chars(text, char):
@@ -124,7 +160,7 @@ def _strip_multiple_chars(text, char):
     return text
 
 
-def test_hyperparameter_table_with_line_break(destination_path):
+def test_hyperparameter_table_with_line_break():
     # Hyperparameters can contain values with line breaks, "\n", in them. In
     # that case, the markdown table is broken. Check that the hyperparameter
     # table we create properly replaces the "\n" with "<br />".
@@ -133,80 +169,347 @@ def get_params(self, deep=False):
             return {"fit_intercept": True, "n_jobs": "line\nwith\nbreak"}
 
     model_card = Card(EstimatorWithLbInParams())
-    model_card = model_card.render()
+    section_name = "Model description/Training Procedure/Hyperparameters"
+    text_hyperparams = model_card.select(section_name).content
+
     # remove multiple whitespaces, as they're not important
-    model_card = _strip_multiple_chars(model_card, " ")
-    assert "| n_jobs | line<br />with<br />break |" in model_card
+    text_cleaned = _strip_multiple_chars(text_hyperparams, " ")
+    assert "| n_jobs | line<br />with<br />break |" in text_cleaned
+
+
+def test_plot_model(model_card):
+    text_plot = model_card.select(
+        "Model description/Training Procedure/Model Plot"
+    ).content
+    # don't compare whole text, as it's quite long and non-deterministic
+    assert text_plot.startswith("The model plot is below.\n\n<style>#sk-")
+    assert "<style>" in text_plot
+    assert text_plot.endswith(
+        "<pre>LinearRegression()</pre></div></div></div></div></div>"
+    )
 
 
-def test_plot_model(destination_path, model_card):
-    model_card = model_card.render()
-    assert "<style>" in model_card
+def test_plot_model_false(model_card):
+    model = fit_model()
+    model_card = Card(model, model_diagram=False)
+    text_plot = model_card.select(
+        "Model description/Training Procedure/Model Plot"
+    ).content
+    assert text_plot == "The model plot is below."
+
+
+def test_render(model_card, destination_path):
+    file_name = destination_path / "README.md"
+    model_card.save(file_name)
+    with open(file_name, "r", encoding="utf-8") as f:
+        loaded = f.read()
+
+    rendered = model_card.render()
+    assert loaded == rendered
+
+
+def test_with_metadata(model_card):
+    model_card.metadata.foo = "something"
+    model_card.metadata.bar = "something else"
+    rendered = model_card.render()
+    expected = textwrap.dedent(
+        """
+        ---
+        foo: something
+        bar: something else
+        ---
+        """
+    ).strip()
+    assert rendered.startswith(expected)
+
+
+class TestSelect:
+    """Selecting sections from the model card"""
+
+    def test_select_existing_section(self, model_card):
+        section = model_card.select("Model description")
+        assert section.title == "Model description"
+
+    def test_select_existing_subsection(self, model_card):
+        section = model_card.select("Model description/Training Procedure")
+        assert section.title == "Training Procedure"
+
+        section = model_card.select(["Model description", "Training Procedure"])
+        assert section.title == "Training Procedure"
+
+    def test_select_non_existing_section_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select("non-existing section")
+
+    def test_select_non_existing_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select("Model description/non-existing subsection")
+
+        with pytest.raises(KeyError):
+            model_card.select(["Model description", "non-existing subsection"])
+
+    def test_select_non_existing_subsubsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select(
+                "Model description/Training Procedure/non-existing sub-subsection"
+            )
+
+        with pytest.raises(KeyError):
+            model_card.select(
+                [
+                    "Model description",
+                    "Training Procedure",
+                    "non-existing sub-subsection",
+                ]
+            )
+
+    def test_select_non_existing_section_and_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.select(["non-existing section", "non-existing subsection"])
+
+    def test_select_empty_key_raises(self, model_card):
+        msg = r"Section name cannot be empty but got ''"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select("")
+
+        msg = r"Section name cannot be empty but got '\[\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select([])
+
+    def test_select_empty_key_subsection_raises(self, model_card):
+        msg = r"Section name cannot be empty but got 'Model description/'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select("Model description/")
+
+        msg = r"Section name cannot be empty but got '\['Model description', ''\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.select(["Model description", ""])
+
+    def test_default_sections_empty_card(self, model_card):
+        # Without prefill, the card should not contain the default sections
+        from skops.card._model_card import DEFAULT_TEMPLATE
+
+        # model_card (which is prefilled) contains all default sections
+        for key in DEFAULT_TEMPLATE:
+            model_card.select(key)
+
+        # empty card does not contain those sections
+        model = fit_model()
+        card_empty = Card(model, model_diagram=False, prefill=False)
+        for key in DEFAULT_TEMPLATE:
+            with pytest.raises(KeyError):
+                card_empty.select(key)
+
+
+class TestAdd:
+    """Adding sections and subsections"""
+
+    def test_add_new_section(self, model_card):
+        model_card = model_card.add(**{"A new section": "sklearn FTW"})
+        section = model_card.select("A new section")
+        assert section.title == "A new section"
+        assert section.content == "sklearn FTW"
+
+    def test_add_new_subsection(self, model_card):
+        model_card = model_card.add(
+            **{"Model description/A new section": "sklearn FTW"}
+        )
+        section = model_card.select("Model description/A new section")
+        assert section.title == "A new section"
+        assert section.content == "sklearn FTW"
 
+        # make sure that the new subsection is the last subsection
+        subsections = model_card._data["Model description"].subsections
+        assert len(subsections) > 1  # exclude trivial case of only one subsection
 
-def test_plot_model_false(destination_path, model_card):
-    model = fit_model()
-    model_card = Card(model, model_diagram=False).render()
-    assert "<style>" not in model_card
+        last_subsection = list(subsections.values())[-1]
+        assert last_subsection is section
 
+    def test_add_new_section_and_subsection(self, model_card):
+        model_card = model_card.add(**{"A new section/A new subsection": "sklearn FTW"})
 
-def test_add(destination_path, model_card):
-    model_card = model_card.add(model_description="sklearn FTW").render()
-    assert "sklearn FTW" in model_card
+        section = model_card.select("A new section")
+        assert section.title == "A new section"
+        assert section.content == ""
 
+        subsection = model_card.select("A new section/A new subsection")
+        assert subsection.title == "A new subsection"
+        assert subsection.content == "sklearn FTW"
 
-def test_template_sections_not_mutated_by_save(destination_path, model_card):
-    template_sections_before = copy.deepcopy(model_card._template_sections)
-    model_card.save(Path(destination_path) / "README.md")
-    template_sections_after = copy.deepcopy(model_card._template_sections)
-    assert template_sections_before == template_sections_after
+    def test_add_new_section_with_slash_in_name(self, model_card):
+        model_card = model_card.add(**{"A new\\/section": "sklearn FTW"})
+        section = model_card.select("A new\\/section")
+        assert section.title == "A new/section"
+        assert section.content == "sklearn FTW"
+
+    def test_add_new_subsection_with_slash_in_name(self, model_card):
+        model_card = model_card.add(
+            **{"Model description/A new\\/section": "sklearn FTW"}
+        )
+        section = model_card.select("Model description/A new\\/section")
+        assert section.title == "A new/section"
+        assert section.content == "sklearn FTW"
+
+    def test_add_content_to_existing_section(self, model_card):
+        # Add content (not new sections) to an existing section. Make sure that
+        # existing subsections are not affected by this
+        section = model_card.select("Model description")
+        num_subsection_before = len(section.subsections)
+        assert num_subsection_before > 0  # exclude trivial case of empty sections
+
+        # add content to "Model description" section
+        model_card = model_card.add(**{"Model description": "sklearn FTW"})
+        section = model_card.select("Model description")
+        num_subsection_after = len(section.subsections)
+
+        assert num_subsection_before == num_subsection_after
+        assert section.content == "sklearn FTW"
+
+
+class TestDelete:
+    """Deleting sections and subsections"""
+
+    def test_delete_section(self, model_card):
+        model_card.select("Model description")
+        model_card.delete("Model description")
+        with pytest.raises(KeyError):
+            model_card.select("Model description")
+
+    def test_delete_subsection(self, model_card):
+        model_card.select("Model description/Training Procedure")
+        model_card.delete("Model description/Training Procedure")
+        with pytest.raises(KeyError):
+            model_card.select("Model description/Training Procedure")
+        # parent section still exists
+        model_card.delete("Model description")
+
+    def test_delete_subsubsection(self, model_card):
+        model_card.select("Model description/Training Procedure/Hyperparameters")
+        model_card.delete("Model description/Training Procedure/Hyperparameters")
+        with pytest.raises(KeyError):
+            model_card.select("Model description/Training Procedure/Hyperparameters")
+        # parent section still exists
+        model_card.delete("Model description/Training Procedure")
+
+    def test_delete_section_with_slash_in_name(self, model_card):
+        model_card.add(**{"A new\\/section": "some content"})
+        model_card.select("A new\\/section")
+        model_card.delete("A new\\/section")
+        with pytest.raises(KeyError):
+            model_card.select("A new\\/section")
+
+    def test_delete_non_existing_section_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete("non-existing section")
+
+    def test_delete_non_existing_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete("Model description/non-existing subsection")
+
+        with pytest.raises(KeyError):
+            model_card.delete(["Model description", "non-existing subsection"])
+
+    def test_delete_non_existing_subsubsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete(
+                "Model description/Training Procedure/non-existing sub-subsection"
+            )
+
+        with pytest.raises(KeyError):
+            model_card.delete(
+                [
+                    "Model description",
+                    "Training Procedure",
+                    "non-existing sub-subsection",
+                ]
+            )
+
+    def test_delete_non_existing_section_and_subsection_raises(self, model_card):
+        with pytest.raises(KeyError):
+            model_card.delete(["non-existing section", "non-existing subsection"])
+
+    def test_delete_empty_key_raises(self, model_card):
+        msg = r"Section name cannot be empty but got ''"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete("")
+
+        msg = r"Section name cannot be empty but got '\[\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete([])
+
+    def test_delete_empty_key_subsection_raises(self, model_card):
+        msg = r"Section name cannot be empty but got 'Model description/'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete("Model description/")
+
+        msg = r"Section name cannot be empty but got '\['Model description', ''\]'"
+        with pytest.raises(KeyError, match=msg):
+            model_card.delete(["Model description", ""])
 
 
 def test_add_plot(destination_path, model_card):
     plt.plot([4, 5, 6, 7])
     plt.savefig(Path(destination_path) / "fig1.png")
-    model_card = model_card.add_plot(fig1="fig1.png").render()
-    assert "![fig1](fig1.png)" in model_card
+    model_card = model_card.add_plot(fig1="fig1.png")
+    plot_content = model_card.select("fig1").content.format()
+    assert plot_content == "![fig1](fig1.png)"
 
 
-def test_temporary_plot(destination_path, model_card):
-    # test if the additions are made to a temporary template file
-    # and not to default template or template provided
-    root = skops.__path__
-    # read original template
-    with open(Path(root[0]) / "card" / "default_template.md") as f:
-        default_template = f.read()
+def test_add_plot_to_existing_section(destination_path, model_card):
     plt.plot([4, 5, 6, 7])
     plt.savefig(Path(destination_path) / "fig1.png")
-    model_card.add_plot(fig1="fig1.png")
-    model_card.save(Path(destination_path) / "README.md")
-    # check if default template is not modified
-    with open(Path(root[0]) / "card" / "default_template.md") as f:
-        default_template_post = f.read()
-    assert default_template == default_template_post
+    model_card = model_card.add_plot(**{"Model description/Figure 1": "fig1.png"})
+    plot_content = model_card.select("Model description/Figure 1").content.format()
+    assert plot_content == "![Figure 1](fig1.png)"
 
 
-def test_metadata_keys(destination_path, model_card):
-    # test if the metadata is added on top of the card
+def test_adding_metadata(model_card):
+    # test if the metadata is added to the card
     model_card.metadata.tags = "dummy"
-    model_card = model_card.render()
-    assert "tags: dummy" in model_card
+    metadata = list(model_card._generate_metadata(model_card.metadata))
+    assert len(metadata) == 1
+    assert metadata[0] == "metadata.tags=dummy,"
+
 
+@pytest.mark.xfail(reason="Waiting for update of model attribute")
+def test_override_model(model_card):
+    # test that the model can be overridden and dependent sections are updated
+    hyperparams_before = model_card.select(
+        "Model description/Training Procedure/Hyperparameters"
+    ).content
+    model_card.model = DecisionTreeClassifier()
+    hyperparams_after = model_card.select(
+        "Model description/Training Procedure/Hyperparameters"
+    ).content
 
-def test_default_sections_save(model_card):
-    # test if the plot and hyperparameters are only added during save
-    assert "<style>" not in str(model_card)
-    assert "fit_intercept" not in str(model_card)
+    assert hyperparams_before != hyperparams_after
+    assert "fit_intercept" not in hyperparams_before
+    assert "min_samples_leaf" in hyperparams_after
 
 
 def test_add_metrics(destination_path, model_card):
-    model_card.add_metrics(**{"acc": 0.1})
-    model_card.add_metrics(f1=0.1)
-    card = model_card.render()
-    assert ("acc" in card) and ("f1" in card) and ("0.1" in card)
+    model_card.add_metrics(**{"acc": "0.1"})  # str
+    model_card.add_metrics(f1=0.1)  # float
+    model_card.add_metrics(awesomeness=123)  # int
+
+    eval_metric_content = model_card.select(
+        "Model description/Evaluation Results"
+    ).content
+    expected = "\n".join(
+        [
+            "| Metric      |   Value |",
+            "|-------------|---------|",
+            "| acc         |     0.1 |",
+            "| f1          |     0.1 |",
+            "| awesomeness |   123   |",
+        ]
+    )
+    assert eval_metric_content.endswith(expected)
 
 
-def test_code_autogeneration(destination_path, pkl_model_card_metadata_from_config):
+def test_code_autogeneration(
+    model_card, destination_path, pkl_model_card_metadata_from_config
+):
     # test if getting started code is automatically generated
     metadata = metadata_load(local_path=Path(destination_path) / "README.md")
     filename = metadata["model_file"]
@@ -257,125 +560,107 @@ class TestCardRepr:
     def card(self):
         model = LinearRegression(fit_intercept=False)
         card = Card(model=model)
+        card.add(Figures="")
         card.add(
-            model_description="A description",
-            model_card_authors="Jane Doe",
+            **{
+                "Model Description": "A description",
+                "Model Card Authors": "Jane Doe",
+            }
         )
         card.add_plot(
-            roc_curve="ROC_curve.png",
-            confusion_matrix="confusion_matrix.jpg",
+            **{
+                "Figures/ROC": "ROC.png",
+                "Figures/Confusion matrix": "confusion_matrix.jpg",
+            }
         )
-        card.add_table(search_results={"split": [1, 2, 3], "score": [4, 5, 6]})
+        card.add_table(**{"Search Results": {"split": [1, 2, 3], "score": [4, 5, 6]}})
         return card
 
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_card_repr(self, card: Card, meth):
-        result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
+    @pytest.fixture
+    def expected_lines(self):
+        card_repr = """
+        Card(
+          model=LinearRegression(fit_intercept=False)
+          Model description/Training Procedure/...ed | | positive | False | </details>,
+          Model description/Training Procedure/...</pre></div></div></div></div></div>,
+          Model description/Evaluation Results=...ric | Value | |----------|---------|,
+          Model Card Authors=Jane Doe,
+          Figures/ROC='ROC.png',
+          Figures/Confusion matrix='confusion_matrix.jpg',
+          Model Description=A description,
+          Search Results=Table(3x2),
         )
-        assert result == expected
+        """
+        expected = textwrap.dedent(card_repr).strip()
+        lines = expected.split("\n")
+
+        # TODO: remove when dropping sklearn v0.24 and when dropping v1.1 and
+        # below. This is because the "normalize" parameter was changed after
+        # v0.24 and will be removed completely in sklearn v1.2.
+        major, minor, *_ = sklearn.__version__.split(".")
+        if int(major) < 1:
+            # v0.24: "deprecated" -> "False"
+            lines[2] = (
+                "  Model description/Training Procedure/...se | | positive | False | "
+                "</details>,"
+            )
+        elif int(minor) >= 2:
+            # >= v1.2: remove argument completely
+            lines[2] = (
+                "  Model description/Training Procedure/... | | | positive | False | "
+                "</details>,"
+            )
+        return lines
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_very_long_lines_are_shortened(self, card: Card, meth):
-        card.add(my_section="very long line " * 100)
+    def test_card_repr(self, card: Card, meth, expected_lines):
         result = meth(card)
-        expected = (
-            "Card(\n  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n  model_card_authors='Jane Doe',\n"
-            "  my_section='very long line very lon...line very long line very long line"
-            " ',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
+        expected = "\n".join(expected_lines)
         assert result == expected
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_without_model_attribute(self, card: Card, meth):
-        del card.model
+    def test_card_repr_empty_card(self, meth):
+        """Without prefill, the repr should only contain the model"""
+        model = fit_model()
+        card = Card(model, model_diagram=False, prefill=False)
         result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
+        expected = textwrap.dedent(
+            """
+        Card(
+          model=LinearRegression()
         )
+        """
+        ).strip()
         assert result == expected
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_no_template_sections(self, card: Card, meth):
-        card._template_sections = {}
-        result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
-        assert result == expected
+    def test_very_long_lines_are_shortened(self, card: Card, meth, expected_lines):
+        card.add(my_section="very long line " * 100)
 
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_no_extra_sections(self, card: Card, meth):
-        card._extra_sections = []
-        result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            ")"
+        # expected results contain 1 extra line just before the closing ")"
+        extra_line = (
+            "  my_section=very long line very long l... "
+            "line very long line very long line ,"
         )
-        assert result == expected
+        expected_lines.insert(-1, extra_line)
+        expected = "\n".join(expected_lines)
 
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_template_section_val_not_str(self, card: Card, meth):
-        card._template_sections["model_description"] = [1, 2, 3]  # type: ignore
         result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description=[1, 2, 3],\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
         assert result == expected
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_extra_sections_val_not_str(self, card: Card, meth):
-        card._extra_sections.append(("some section", {1: 2}))
+    def test_without_model_attribute(self, card: Card, meth, expected_lines):
+        del card.model
+
+        # remove line 1 from expected results, which corresponds to the model
+        del expected_lines[1]
+        expected = "\n".join(expected_lines)
+
         result = meth(card)
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            "  some section={1: 2},\n"
-            ")"
-        )
         assert result == expected
 
     @pytest.mark.parametrize("meth", [repr, str])
-    def test_with_metadata(self, card: Card, meth):
+    def test_with_metadata(self, card: Card, meth, expected_lines):
         metadata = CardData(
             language="fr",
             license="bsd",
@@ -385,22 +670,18 @@ def test_with_metadata(self, card: Card, meth):
             widget={"something": "very-long"},
         )
         card.metadata = metadata
-        expected = (
-            "Card(\n"
-            "  model=LinearRegression(fit_intercept=False),\n"
-            "  metadata.language=fr,\n"
-            "  metadata.license=bsd,\n"
-            "  metadata.library_name=sklearn,\n"
-            "  metadata.tags=['sklearn', 'tabular-classification'],\n"
-            "  metadata.foo={'bar': 123},\n"
-            "  metadata.widget={...},\n"
-            "  model_description='A description',\n"
-            "  model_card_authors='Jane Doe',\n"
-            "  roc_curve='ROC_curve.png',\n"
-            "  confusion_matrix='confusion_matrix.jpg',\n"
-            "  search_results=Table(3x2),\n"
-            ")"
-        )
+
+        # metadata comes after model line, i.e. position 2
+        extra_lines = [
+            "  metadata.language=fr,",
+            "  metadata.license=bsd,",
+            "  metadata.library_name=sklearn,",
+            "  metadata.tags=['sklearn', 'tabular-classification'],",
+            "  metadata.foo={'bar': 123},",
+            "  metadata.widget={...},",
+        ]
+        expected = "\n".join(expected_lines[:2] + extra_lines + expected_lines[2:])
+
         result = meth(card)
         assert result == expected
 
diff --git a/skops/card/tests/test_card_alternative.py b/skops/card/tests/test_card_alternative.py
deleted file mode 100644
index 5cb5407f..00000000
--- a/skops/card/tests/test_card_alternative.py
+++ /dev/null
@@ -1,958 +0,0 @@
-import os
-import pickle
-import tempfile
-import textwrap
-from itertools import zip_longest
-from pathlib import Path
-
-import matplotlib.pyplot as plt
-import numpy as np
-import pytest
-import sklearn
-from huggingface_hub import CardData, metadata_load
-from sklearn.datasets import load_iris
-from sklearn.linear_model import LinearRegression, LogisticRegression
-from sklearn.tree import DecisionTreeClassifier
-
-from skops import hub_utils
-from skops.card import metadata_from_config
-from skops.card._card_alternative import Card
-from skops.card._model_card import PlotSection, TableSection
-from skops.io import dump
-
-
-def fit_model():
-    X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
-    y = np.dot(X, np.array([1, 2])) + 3
-    reg = LinearRegression().fit(X, y)
-    return reg
-
-
-@pytest.fixture
-def model_card(model_diagram=True):
-    model = fit_model()
-    card = Card(model, model_diagram)
-    yield card
-
-
-@pytest.fixture
-def iris_data():
-    X, y = load_iris(return_X_y=True, as_frame=True)
-    yield X, y
-
-
-@pytest.fixture
-def iris_estimator(iris_data):
-    X, y = iris_data
-    est = LogisticRegression(solver="liblinear").fit(X, y)
-    yield est
-
-
-@pytest.fixture
-def iris_pkl_file(iris_estimator):
-    pkl_file = tempfile.mkstemp(suffix=".pkl", prefix="skops-test")[1]
-    with open(pkl_file, "wb") as f:
-        pickle.dump(iris_estimator, f)
-    yield pkl_file
-
-
-@pytest.fixture
-def iris_skops_file(iris_estimator):
-    skops_folder = tempfile.mkdtemp()
-    model_name = "model.skops"
-    skops_path = Path(skops_folder) / model_name
-    dump(iris_estimator, skops_path)
-    yield skops_path
-
-
-def _create_model_card_from_saved_model(
-    destination_path,
-    iris_estimator,
-    iris_data,
-    save_file,
-):
-    X, y = iris_data
-    hub_utils.init(
-        model=save_file,
-        requirements=[f"scikit-learn=={sklearn.__version__}"],
-        dst=destination_path,
-        task="tabular-classification",
-        data=X,
-    )
-    card = Card(iris_estimator, metadata=metadata_from_config(destination_path))
-    card.save(Path(destination_path) / "README.md")
-    return card
-
-
-@pytest.fixture
-def skops_model_card_metadata_from_config(
-    destination_path, iris_estimator, iris_skops_file, iris_data
-):
-    yield _create_model_card_from_saved_model(
-        destination_path, iris_estimator, iris_data, iris_skops_file
-    )
-
-
-@pytest.fixture
-def pkl_model_card_metadata_from_config(
-    destination_path, iris_estimator, iris_pkl_file, iris_data
-):
-    yield _create_model_card_from_saved_model(
-        destination_path, iris_estimator, iris_data, iris_pkl_file
-    )
-
-
-@pytest.fixture
-def destination_path():
-    with tempfile.TemporaryDirectory(prefix="skops-test") as dir_path:
-        yield Path(dir_path)
-
-
-def test_save_model_card(destination_path, model_card):
-    model_card.save(Path(destination_path) / "README.md")
-    assert (Path(destination_path) / "README.md").exists()
-
-
-def test_hyperparameter_table(model_card):
-    section_name = "Model description/Training Procedure/Hyperparameters"
-    result = model_card.select(section_name).content
-
-    lines = [
-        "The model is trained with below hyperparameters.",
-        "",
-        "<details>",
-        "<summary> Click to expand </summary>",
-        "",
-        "| Hyperparameter   | Value   |",
-        "|------------------|---------|",
-        "| copy_X           | True    |",
-        "| fit_intercept    | True    |",
-        "| n_jobs           |         |",
-        "| normalize        | False   |",
-        "| positive         | False   |",
-        "",
-        "</details>",
-    ]
-    # TODO: remove when dropping sklearn v0.24 and when dropping v1.1 and
-    # below. This is because the "normalize" parameter was changed after
-    # v0.24 will be removed completely in sklearn v1.2.
-    major, minor, *_ = sklearn.__version__.split(".")
-    major, minor = int(major), int(minor)
-    if (major >= 1) and (minor < 2):
-        lines[10] = "| normalize        | deprecated |"
-    elif (major >= 1) and (minor >= 2):
-        del lines[10]
-    expected = "\n".join(lines)
-
-    # remove multiple whitespaces and dashes, as they're not important and may
-    # differ depending on OS
-    expected = _strip_multiple_chars(expected, " ")
-    expected = _strip_multiple_chars(expected, "-")
-    result = _strip_multiple_chars(result, " ")
-    result = _strip_multiple_chars(result, "-")
-
-    assert result == expected
-
-
-def _strip_multiple_chars(text, char):
-    # _strip_multiple_chars("hi    there") == "hi there"
-    # _strip_multiple_chars("|---|--|", "-") == "|-|-|"
-    while char + char in text:
-        text = text.replace(char + char, char)
-    return text
-
-
-def test_hyperparameter_table_with_line_break():
-    # Hyperparameters can contain values with line breaks, "\n", in them. In
-    # that case, the markdown table is broken. Check that the hyperparameter
-    # table we create properly replaces the "\n" with "<br />".
-    class EstimatorWithLbInParams:
-        def get_params(self, deep=False):
-            return {"fit_intercept": True, "n_jobs": "line\nwith\nbreak"}
-
-    model_card = Card(EstimatorWithLbInParams())
-    section_name = "Model description/Training Procedure/Hyperparameters"
-    text_hyperparams = model_card.select(section_name).content
-
-    # remove multiple whitespaces, as they're not important
-    text_cleaned = _strip_multiple_chars(text_hyperparams, " ")
-    assert "| n_jobs | line<br />with<br />break |" in text_cleaned
-
-
-def test_plot_model(model_card):
-    text_plot = model_card.select(
-        "Model description/Training Procedure/Model Plot"
-    ).content
-    # don't compare whole text, as it's quite long and non-deterministic
-    assert text_plot.startswith("The model plot is below.\n\n<style>#sk-")
-    assert "<style>" in text_plot
-    assert text_plot.endswith(
-        "<pre>LinearRegression()</pre></div></div></div></div></div>"
-    )
-
-
-def test_plot_model_false(model_card):
-    model = fit_model()
-    model_card = Card(model, model_diagram=False)
-    text_plot = model_card.select(
-        "Model description/Training Procedure/Model Plot"
-    ).content
-    assert text_plot == "The model plot is below."
-
-
-def test_render(model_card, destination_path):
-    file_name = destination_path / "README.md"
-    model_card.save(file_name)
-    with open(file_name, "r", encoding="utf-8") as f:
-        loaded = f.read()
-
-    rendered = model_card.render()
-    assert loaded == rendered
-
-
-def test_with_metadata(model_card):
-    model_card.metadata.foo = "something"
-    model_card.metadata.bar = "something else"
-    rendered = model_card.render()
-    expected = textwrap.dedent(
-        """
-        ---
-        foo: something
-        bar: something else
-        ---
-        """
-    ).strip()
-    assert rendered.startswith(expected)
-
-
-class TestSelect:
-    """Selecting sections from the model card"""
-
-    def test_select_existing_section(self, model_card):
-        section = model_card.select("Model description")
-        assert section.title == "Model description"
-
-    def test_select_existing_subsection(self, model_card):
-        section = model_card.select("Model description/Training Procedure")
-        assert section.title == "Training Procedure"
-
-        section = model_card.select(["Model description", "Training Procedure"])
-        assert section.title == "Training Procedure"
-
-    def test_select_non_existing_section_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.select("non-existing section")
-
-    def test_select_non_existing_subsection_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.select("Model description/non-existing subsection")
-
-        with pytest.raises(KeyError):
-            model_card.select(["Model description", "non-existing subsection"])
-
-    def test_select_non_existing_subsubsection_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.select(
-                "Model description/Training Procedure/non-existing sub-subsection"
-            )
-
-        with pytest.raises(KeyError):
-            model_card.select(
-                [
-                    "Model description",
-                    "Training Procedure",
-                    "non-existing sub-subsection",
-                ]
-            )
-
-    def test_select_non_existing_section_and_subsection_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.select(["non-existing section", "non-existing subsection"])
-
-    def test_select_empty_key_raises(self, model_card):
-        msg = r"Section name cannot be empty but got ''"
-        with pytest.raises(KeyError, match=msg):
-            model_card.select("")
-
-        msg = r"Section name cannot be empty but got '\[\]'"
-        with pytest.raises(KeyError, match=msg):
-            model_card.select([])
-
-    def test_select_empty_key_subsection_raises(self, model_card):
-        msg = r"Section name cannot be empty but got 'Model description/'"
-        with pytest.raises(KeyError, match=msg):
-            model_card.select("Model description/")
-
-        msg = r"Section name cannot be empty but got '\['Model description', ''\]'"
-        with pytest.raises(KeyError, match=msg):
-            model_card.select(["Model description", ""])
-
-    def test_default_sections_empty_card(self, model_card):
-        # Without prefill, the card should not contain the default sections
-        from skops.card._card_alternative import DEFAULT_TEMPLATE
-
-        # model_card (which is prefilled) contains all default sections
-        for key in DEFAULT_TEMPLATE:
-            model_card.select(key)
-
-        # empty card does not contain those sections
-        model = fit_model()
-        card_empty = Card(model, model_diagram=False, prefill=False)
-        for key in DEFAULT_TEMPLATE:
-            with pytest.raises(KeyError):
-                card_empty.select(key)
-
-
-class TestAdd:
-    """Adding sections and subsections"""
-
-    def test_add_new_section(self, model_card):
-        model_card = model_card.add(**{"A new section": "sklearn FTW"})
-        section = model_card.select("A new section")
-        assert section.title == "A new section"
-        assert section.content == "sklearn FTW"
-
-    def test_add_new_subsection(self, model_card):
-        model_card = model_card.add(
-            **{"Model description/A new section": "sklearn FTW"}
-        )
-        section = model_card.select("Model description/A new section")
-        assert section.title == "A new section"
-        assert section.content == "sklearn FTW"
-
-        # make sure that the new subsection is the last subsection
-        subsections = model_card._data["Model description"].subsections
-        assert len(subsections) > 1  # exclude trivial case of only one subsection
-
-        last_subsection = list(subsections.values())[-1]
-        assert last_subsection is section
-
-    def test_add_new_section_and_subsection(self, model_card):
-        model_card = model_card.add(**{"A new section/A new subsection": "sklearn FTW"})
-
-        section = model_card.select("A new section")
-        assert section.title == "A new section"
-        assert section.content == ""
-
-        subsection = model_card.select("A new section/A new subsection")
-        assert subsection.title == "A new subsection"
-        assert subsection.content == "sklearn FTW"
-
-    def test_add_new_section_with_slash_in_name(self, model_card):
-        model_card = model_card.add(**{"A new\\/section": "sklearn FTW"})
-        section = model_card.select("A new\\/section")
-        assert section.title == "A new/section"
-        assert section.content == "sklearn FTW"
-
-    def test_add_new_subsection_with_slash_in_name(self, model_card):
-        model_card = model_card.add(
-            **{"Model description/A new\\/section": "sklearn FTW"}
-        )
-        section = model_card.select("Model description/A new\\/section")
-        assert section.title == "A new/section"
-        assert section.content == "sklearn FTW"
-
-    def test_add_content_to_existing_section(self, model_card):
-        # Add content (not new sections) to an existing section. Make sure that
-        # existing subsections are not affected by this
-        section = model_card.select("Model description")
-        num_subsection_before = len(section.subsections)
-        assert num_subsection_before > 0  # exclude trivial case of empty sections
-
-        # add content to "Model description" section
-        model_card = model_card.add(**{"Model description": "sklearn FTW"})
-        section = model_card.select("Model description")
-        num_subsection_after = len(section.subsections)
-
-        assert num_subsection_before == num_subsection_after
-        assert section.content == "sklearn FTW"
-
-
-class TestDelete:
-    """Deleting sections and subsections"""
-
-    def test_delete_section(self, model_card):
-        model_card.select("Model description")
-        model_card.delete("Model description")
-        with pytest.raises(KeyError):
-            model_card.select("Model description")
-
-    def test_delete_subsection(self, model_card):
-        model_card.select("Model description/Training Procedure")
-        model_card.delete("Model description/Training Procedure")
-        with pytest.raises(KeyError):
-            model_card.select("Model description/Training Procedure")
-        # parent section still exists
-        model_card.delete("Model description")
-
-    def test_delete_subsubsection(self, model_card):
-        model_card.select("Model description/Training Procedure/Hyperparameters")
-        model_card.delete("Model description/Training Procedure/Hyperparameters")
-        with pytest.raises(KeyError):
-            model_card.select("Model description/Training Procedure/Hyperparameters")
-        # parent section still exists
-        model_card.delete("Model description/Training Procedure")
-
-    def test_delete_section_with_slash_in_name(self, model_card):
-        model_card.add(**{"A new\\/section": "some content"})
-        model_card.select("A new\\/section")
-        model_card.delete("A new\\/section")
-        with pytest.raises(KeyError):
-            model_card.select("A new\\/section")
-
-    def test_delete_non_existing_section_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.delete("non-existing section")
-
-    def test_delete_non_existing_subsection_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.delete("Model description/non-existing subsection")
-
-        with pytest.raises(KeyError):
-            model_card.delete(["Model description", "non-existing subsection"])
-
-    def test_delete_non_existing_subsubsection_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.delete(
-                "Model description/Training Procedure/non-existing sub-subsection"
-            )
-
-        with pytest.raises(KeyError):
-            model_card.delete(
-                [
-                    "Model description",
-                    "Training Procedure",
-                    "non-existing sub-subsection",
-                ]
-            )
-
-    def test_delete_non_existing_section_and_subsection_raises(self, model_card):
-        with pytest.raises(KeyError):
-            model_card.delete(["non-existing section", "non-existing subsection"])
-
-    def test_delete_empty_key_raises(self, model_card):
-        msg = r"Section name cannot be empty but got ''"
-        with pytest.raises(KeyError, match=msg):
-            model_card.delete("")
-
-        msg = r"Section name cannot be empty but got '\[\]'"
-        with pytest.raises(KeyError, match=msg):
-            model_card.delete([])
-
-    def test_delete_empty_key_subsection_raises(self, model_card):
-        msg = r"Section name cannot be empty but got 'Model description/'"
-        with pytest.raises(KeyError, match=msg):
-            model_card.delete("Model description/")
-
-        msg = r"Section name cannot be empty but got '\['Model description', ''\]'"
-        with pytest.raises(KeyError, match=msg):
-            model_card.delete(["Model description", ""])
-
-
-def test_add_plot(destination_path, model_card):
-    plt.plot([4, 5, 6, 7])
-    plt.savefig(Path(destination_path) / "fig1.png")
-    model_card = model_card.add_plot(fig1="fig1.png")
-    plot_content = model_card.select("fig1").content.format()
-    assert plot_content == "![fig1](fig1.png)"
-
-
-def test_add_plot_to_existing_section(destination_path, model_card):
-    plt.plot([4, 5, 6, 7])
-    plt.savefig(Path(destination_path) / "fig1.png")
-    model_card = model_card.add_plot(**{"Model description/Figure 1": "fig1.png"})
-    plot_content = model_card.select("Model description/Figure 1").content.format()
-    assert plot_content == "![Figure 1](fig1.png)"
-
-
-def test_adding_metadata(model_card):
-    # test if the metadata is added to the card
-    model_card.metadata.tags = "dummy"
-    metadata = list(model_card._generate_metadata(model_card.metadata))
-    assert len(metadata) == 1
-    assert metadata[0] == "metadata.tags=dummy,"
-
-
-@pytest.mark.xfail(reason="Waiting for update of model attribute")
-def test_override_model(model_card):
-    # test that the model can be overridden and dependent sections are updated
-    hyperparams_before = model_card.select(
-        "Model description/Training Procedure/Hyperparameters"
-    ).content
-    model_card.model = DecisionTreeClassifier()
-    hyperparams_after = model_card.select(
-        "Model description/Training Procedure/Hyperparameters"
-    ).content
-
-    assert hyperparams_before != hyperparams_after
-    assert "fit_intercept" not in hyperparams_before
-    assert "min_samples_leaf" in hyperparams_after
-
-
-def test_add_metrics(destination_path, model_card):
-    model_card.add_metrics(**{"acc": "0.1"})  # str
-    model_card.add_metrics(f1=0.1)  # float
-    model_card.add_metrics(awesomeness=123)  # int
-
-    eval_metric_content = model_card.select(
-        "Model description/Evaluation Results"
-    ).content
-    expected = "\n".join(
-        [
-            "| Metric      |   Value |",
-            "|-------------|---------|",
-            "| acc         |     0.1 |",
-            "| f1          |     0.1 |",
-            "| awesomeness |   123   |",
-        ]
-    )
-    assert eval_metric_content.endswith(expected)
-
-
-def test_code_autogeneration(
-    model_card, destination_path, pkl_model_card_metadata_from_config
-):
-    # test if getting started code is automatically generated
-    metadata = metadata_load(local_path=Path(destination_path) / "README.md")
-    filename = metadata["model_file"]
-    with open(Path(destination_path) / "README.md") as f:
-        assert f"joblib.load({filename})" in f.read()
-
-
-def test_code_autogeneration_skops(
-    destination_path, skops_model_card_metadata_from_config
-):
-    # test if getting started code is automatically generated for skops format
-    metadata = metadata_load(local_path=Path(destination_path) / "README.md")
-    filename = metadata["model_file"]
-    with open(Path(destination_path) / "README.md") as f:
-        read_buffer = f.read()
-        assert f'model = load("{filename}")' in read_buffer
-
-        # test if the model doesn't overflow the huggingface models page
-        assert read_buffer.count("sk-top-container") == 1
-        assert 'style="overflow: auto;' in read_buffer
-
-
-def test_metadata_from_config_tabular_data(
-    pkl_model_card_metadata_from_config, destination_path
-):
-    # test if widget data is correctly set in the README
-    metadata = metadata_load(local_path=Path(destination_path) / "README.md")
-    assert "widget" in metadata
-
-    expected_data = {
-        "structuredData": {
-            "petal length (cm)": [1.4, 1.4, 1.3],
-            "petal width (cm)": [0.2, 0.2, 0.2],
-            "sepal length (cm)": [5.1, 4.9, 4.7],
-            "sepal width (cm)": [3.5, 3.0, 3.2],
-        }
-    }
-    assert metadata["widget"] == expected_data
-
-    for tag in ["sklearn", "skops", "tabular-classification"]:
-        assert tag in metadata["tags"]
-
-
-class TestCardRepr:
-    """Test __str__ and __repr__ methods of Card, which are identical for now"""
-
-    @pytest.fixture
-    def card(self):
-        model = LinearRegression(fit_intercept=False)
-        card = Card(model=model)
-        card.add(Figures="")
-        card.add(
-            **{
-                "Model Description": "A description",
-                "Model Card Authors": "Jane Doe",
-            }
-        )
-        card.add_plot(
-            **{
-                "Figures/ROC": "ROC.png",
-                "Figures/Confusion matrix": "confusion_matrix.jpg",
-            }
-        )
-        card.add_table(**{"Search Results": {"split": [1, 2, 3], "score": [4, 5, 6]}})
-        return card
-
-    @pytest.fixture
-    def expected_lines(self):
-        card_repr = """
-        Card(
-          model=LinearRegression(fit_intercept=False)
-          Model description/Training Procedure/...ed | | positive | False | </details>,
-          Model description/Training Procedure/...</pre></div></div></div></div></div>,
-          Model description/Evaluation Results=...ric | Value | |----------|---------|,
-          Model Card Authors=Jane Doe,
-          Figures/ROC='ROC.png',
-          Figures/Confusion matrix='confusion_matrix.jpg',
-          Model Description=A description,
-          Search Results=Table(3x2),
-        )
-        """
-        expected = textwrap.dedent(card_repr).strip()
-        lines = expected.split("\n")
-
-        # TODO: remove when dropping sklearn v0.24 and when dropping v1.1 and
-        # below. This is because the "normalize" parameter was changed after
-        # v0.24 will be removed completely in sklearn v1.2.
-        major, minor, *_ = sklearn.__version__.split(".")
-        if int(major) < 1:
-            # v0.24: "deprecated" -> "False"
-            lines[2] = (
-                "  Model description/Training Procedure/...se | | positive | False | "
-                "</details>,"
-            )
-        elif int(minor) >= 2:
-            # >= v1.2: remove argument completely
-            lines[2] = (
-                "  Model description/Training Procedure/... | | | positive | False | "
-                "</details>,"
-            )
-        return lines
-
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_card_repr(self, card: Card, meth, expected_lines):
-        result = meth(card)
-        expected = "\n".join(expected_lines)
-        assert result == expected
-
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_card_repr_empty_card(self, meth):
-        """Without prefill, the repr should be empty"""
-        model = fit_model()
-        card = Card(model, model_diagram=False, prefill=False)
-        result = meth(card)
-        expected = textwrap.dedent(
-            """
-        Card(
-          model=LinearRegression()
-        )
-        """
-        ).strip()
-        assert result == expected
-
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_very_long_lines_are_shortened(self, card: Card, meth, expected_lines):
-        card.add(my_section="very long line " * 100)
-
-        # expected results contain 1 line at the very end
-        extra_line = (
-            "  my_section=very long line very long l... "
-            "line very long line very long line ,"
-        )
-        expected_lines.insert(-1, extra_line)
-        expected = "\n".join(expected_lines)
-
-        result = meth(card)
-        assert result == expected
-
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_without_model_attribute(self, card: Card, meth, expected_lines):
-        del card.model
-
-        # remove line 1 from expected results, which corresponds to the model
-        del expected_lines[1]
-        expected = "\n".join(expected_lines)
-
-        result = meth(card)
-        assert result == expected
-
-    @pytest.mark.parametrize("meth", [repr, str])
-    def test_with_metadata(self, card: Card, meth, expected_lines):
-        metadata = CardData(
-            language="fr",
-            license="bsd",
-            library_name="sklearn",
-            tags=["sklearn", "tabular-classification"],
-            foo={"bar": 123},
-            widget={"something": "very-long"},
-        )
-        card.metadata = metadata
-
-        # metadata comes after model line, i.e. position 2
-        extra_lines = [
-            "  metadata.language=fr,",
-            "  metadata.license=bsd,",
-            "  metadata.library_name=sklearn,",
-            "  metadata.tags=['sklearn', 'tabular-classification'],",
-            "  metadata.foo={'bar': 123},",
-            "  metadata.widget={...},",
-        ]
-        expected = "\n".join(expected_lines[:2] + extra_lines + expected_lines[2:])
-
-        result = meth(card)
-        assert result == expected
-
-
-class TestPlotSection:
-    def test_format_path_is_str(self):
-        section = PlotSection(alt_text="some title", path="path/plot.png")
-        expected = "![some title](path/plot.png)"
-        assert section.format() == expected
-
-    def test_format_path_is_pathlib(self):
-        section = PlotSection(alt_text="some title", path=Path("path") / "plot.png")
-        expected = f"![some title](path{os.path.sep}plot.png)"
-        assert section.format() == expected
-
-    @pytest.mark.parametrize("meth", [str, repr])
-    def test_str_and_repr(self, meth):
-        section = PlotSection(alt_text="some title", path="path/plot.png")
-        expected = "'path/plot.png'"
-        assert meth(section) == expected
-
-    def test_str(self):
-        section = PlotSection(alt_text="some title", path="path/plot.png")
-        expected = "'path/plot.png'"
-        assert str(section) == expected
-
-    @pytest.mark.parametrize("folded", [True, False])
-    def test_folded(self, folded):
-        section = PlotSection(
-            alt_text="some title", path="path/plot.png", folded=folded
-        )
-        output = section.format()
-        if folded:
-            assert "<details>" in output
-        else:
-            assert "<details>" not in output
-
-
-class TestTableSection:
-    @pytest.fixture
-    def table_dict(self):
-        return {"split": [1, 2, 3], "score": [4, 5, 6]}
-
-    def test_table_is_dict(self, table_dict):
-        section = TableSection(table=table_dict)
-        expected = """|   split |   score |
-|---------|---------|
-|       1 |       4 |
-|       2 |       5 |
-|       3 |       6 |"""
-        assert section.format() == expected
-
-    def test_table_is_dataframe(self, table_dict):
-        pd = pytest.importorskip("pandas")
-        df = pd.DataFrame(table_dict)
-        section = TableSection(table=df)
-        expected = """|   split |   score |
-|---------|---------|
-|       1 |       4 |
-|       2 |       5 |
-|       3 |       6 |"""
-        assert section.format() == expected
-
-    @pytest.mark.parametrize("meth", [str, repr])
-    def test_str_and_repr_table_is_dict(self, table_dict, meth):
-        section = TableSection(table=table_dict)
-        expected = "Table(3x2)"
-        assert meth(section) == expected
-
-    @pytest.mark.parametrize("meth", [str, repr])
-    def test_str_and_repr_table_is_dataframe(self, table_dict, meth):
-        pd = pytest.importorskip("pandas")
-        df = pd.DataFrame(table_dict)
-        section = TableSection(table=df)
-        expected = "Table(3x2)"
-        assert meth(section) == expected
-
-    @pytest.mark.parametrize("table", [{}, {"col": []}, "pandas"])
-    def test_raise_error_empty_table(self, table):
-        # Test no columns, no rows, empty df
-        if table == "pandas":
-            pd = pytest.importorskip("pandas")
-            table = pd.DataFrame([])
-
-        msg = "Empty table added"
-        with pytest.raises(ValueError, match=msg):
-            TableSection(table=table)
-
-    def test_pandas_not_installed(self, table_dict, pandas_not_installed):
-        # use pandas_not_installed fixture from conftest.py to pretend that
-        # pandas is not installed
-        section = TableSection(table=table_dict)
-        assert section._is_pandas_df is False
-
-    @pytest.mark.parametrize("folded", [True, False])
-    def test_folded(self, table_dict, folded):
-        section = TableSection(table=table_dict, folded=folded)
-        output = section.format()
-        if folded:
-            assert "<details>" in output
-        else:
-            assert "<details>" not in output
-
-    def test_line_break_in_entry(self, table_dict):
-        # Line breaks are not allowed inside markdown tables, so check that
-        # they're removed. We test 3 conditions here:
-
-        # 1. custom object with line breaks in repr
-        # 2. string with line break in the middle
-        # 3. string with line break at start, middle, and end
-
-        # Note that for the latter, tabulate will automatically strip the line
-        # breaks from the start and end.
-        class LineBreakInRepr:
-            """Custom object whose repr has a line break"""
-
-            def __repr__(self) -> str:
-                return "obj\nwith lb"
-
-        table_dict["with break"] = [
-            LineBreakInRepr(),
-            "hi\nthere",
-            """
-entry with
-line breaks
-""",
-        ]
-        section = TableSection(table=table_dict)
-        expected = """| split | score | with break |
-|-|-|-|
-| 1 | 4 | obj<br />with lb |
-| 2 | 5 | hi<br />there |
-| 3 | 6 | entry with<br />line breaks |"""
-
-        result = section.format()
-        # remove multiple whitespaces and dashes, as they're not important
-        result = _strip_multiple_chars(result, " ")
-        result = _strip_multiple_chars(result, "-")
-        assert result == expected
-
-
-def make_card(card_type, file_path: Path, fill_content: bool = True):
-    import pickle
-
-    import matplotlib.pyplot as plt
-    import sklearn
-    from sklearn.datasets import load_iris
-    from sklearn.linear_model import LogisticRegression
-    from sklearn.pipeline import Pipeline
-    from sklearn.preprocessing import StandardScaler
-
-    from skops import hub_utils
-    from skops.card import Card as CardOld
-    from skops.card import metadata_from_config
-
-    if card_type == "old":
-        card_cls = CardOld  # type: ignore
-    else:
-        card_cls = Card  # type: ignore
-
-    destination_path = file_path.parent
-    X, y = load_iris(return_X_y=True, as_frame=True)
-
-    model = Pipeline(
-        [("scaler", StandardScaler()), ("clf", LogisticRegression(random_state=123))]
-    ).fit(X, y)
-
-    pkl_file = tempfile.mkstemp(suffix=".pkl", prefix="skops-test")[1]
-    with open(pkl_file, "wb") as f:
-        pickle.dump(model, f)
-
-    hub_utils.init(
-        model=pkl_file,
-        requirements=[f"scikit-learn=={sklearn.__version__}"],
-        dst=destination_path,
-        task="tabular-classification",
-        data=X,
-    )
-    card = card_cls(model, metadata=metadata_from_config(destination_path))
-
-    if fill_content:
-        # add metrics
-        card.add_metrics(**{"acc": "0.1"})
-
-        plt.plot([4, 5, 6, 7])
-        plt.savefig(Path(destination_path) / "fig1.png")
-        if card_type == "old":
-            card.add_plot(**{"A beautiful plot": "fig1.png"})
-        else:
-            # old card always adds additional content in an extra section
-            card.add_plot(**{"Additional Content/A beautiful plot": "fig1.png"})
-
-        # add table
-        table = {"split": [1, 2, 3], "score": [4, 5, 6]}
-        if card_type == "old":
-            card.add_table(
-                folded=True,
-                **{"Yet another table": table},
-            )
-        else:
-            # old card always adds additional content in an extra section
-            card.add_table(
-                folded=True, **{"Additional Content/Yet another table": table}
-            )
-
-        # add authors and contacts
-        if card_type == "old":
-            # old card requires to use the placeholder variable name
-            card.add(
-                **{
-                    "model_card_authors": "Alice and Bob",
-                    "model_card_contact": "alice@example.com",
-                    "citation_bibtex": "Holy Cow, Nature, 2022-10",
-                }
-            )
-        else:
-            # new card uses the section titles instead and overrides the
-            # existing content
-            card.add(
-                **{
-                    "Model Card Authors": (
-                        "This model card is written by following authors:\n\n"
-                        "Alice and Bob"
-                    ),
-                    "Model Card Contact": (
-                        "You can contact the model card authors through following"
-                        " channels:\nalice@example.com"
-                    ),
-                    "Citation": (
-                        "Below you can find information related to citation.\n\n"
-                        "**BibTeX:**\n"
-                        "```\nHoly Cow, Nature, 2022-10\n```\n"
-                    ),
-                }
-            )
-
-        # more metrics
-        card.add_metrics(**{"f1": "0.2", "roc": "123"})
-
-    card.save(file_path)
-
-
-@pytest.mark.parametrize("fill_content", [False, True])
-def test_old_and_new_card_identical(fill_content):
-    import tempfile
-
-    with tempfile.TemporaryDirectory(prefix="skops-test") as destination_path:
-        file_path = Path(destination_path) / "README-old.md"
-        make_card("old", file_path, fill_content=fill_content)
-        card_old = file_path.read_text()
-
-    with tempfile.TemporaryDirectory(prefix="skops-test") as destination_path:
-        file_path = Path(destination_path) / "README-new.md"
-        make_card("new", file_path, fill_content=fill_content)
-        card_new = file_path.read_text()
-
-    lines_old, lines_new = card_old.split("\n"), card_new.split("\n")
-    for i, (line0, line1) in enumerate(zip_longest(lines_old, lines_new, fillvalue="")):
-        # actual file name may differ, so only compare start of line
-        if line0.startswith("model_file: skops-"):
-            assert line1.startswith("model_file: skops-")
-            continue
-        if line0.startswith("model = joblib.load(skops-test"):
-            assert line1.startswith("model = joblib.load(skops-test")
-            continue
-
-        # model diagram is not deterministic, e.g. ids
-        if line0.startswith("<style>#sk-"):
-            assert line1.startswith("<style>#sk-")
-            continue
-
-        assert line0 == line1

From 00b766512e4ba04f221953080bf6f05f8edca95b Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Mon, 21 Nov 2022 17:57:51 +0100
Subject: [PATCH 13/47] Address reviewer comments

- Remove noise from docstring example
- Add the comma after model repr
- Add docstrings to private methods
---
 skops/card/_model_card.py     | 86 ++++++++++++++++++++---------------
 skops/card/tests/test_card.py |  4 +-
 2 files changed, 52 insertions(+), 38 deletions(-)

diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index aa19982a..d9a027c4 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -341,13 +341,7 @@ class Card:
     ...     "accuracy": accuracy_score(y, y_pred),
     ...     "f1 score": f1_score(y, y_pred, average="micro"),
     ... })
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-    )
+    Card(...)
     >>> cm = confusion_matrix(y, y_pred,labels=model.classes_)
     >>> disp = ConfusionMatrixDisplay(
     ...     confusion_matrix=cm,
@@ -361,41 +355,17 @@ class Card:
     >>> model_card.add_plot(**{
     ...     "Model description/Confusion Matrix": tmp_path / "confusion_matrix.png"
     ... })
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      Model description/Confusion Matrix=...confusion_matrix.png'),
-    )
+    Card(...)
     >>> # add new content to the existing section "Model description"
     >>> model_card.add(**{"Model description": "This is the best model"})
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description=This is the best model,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      Model description/Confusion Matrix=...confusion_matrix.png'),
-    )
+    Card(...)
     >>> # add content to a new section
     >>> model_card.add(**{"A new section": "Please rate my model"})
-    Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
-      metadata.license=mit,
-      Model description=This is the best model,
-      Model description/Training Procedure/... | | warm_start | False | </details>,
-      Model description/Training Procedure/...</pre></div></div></div></div></div>,
-      Model description/Evaluation Results=...ccuracy | 0.96 | | f1 score | 0.96 |,
-      Model description/Confusion Matrix=...confusion_matrix.png'),
-      A new section=Please rate my model,
-    )
+    Card(...)
     >>> # add new subsection to an existing section by using "/"
     >>> model_card.add(**{"Model description/Model name": "This model is called Bob"})
     Card(
-      model=LogisticRegression(random_state=0, solver='liblinear')
+      model=LogisticRegression(random_state=0, solver='liblinear'),
       metadata.license=mit,
       Model description=This is the best model,
       Model description/Training Procedure/... | | warm_start | False | </details>,
@@ -479,6 +449,31 @@ def add(self, **kwargs: str | Formattable) -> "Card":
     def _select(
         self, subsection_names: Sequence[str], create: bool = True
     ) -> dict[str, Section]:
+        """Select a single section from the data
+
+        Parameters
+        ----------
+        subsection_names: list of str
+            The subsection names, already split into individual subsections.
+
+        create: bool (default=True)
+            Whether to create the subsection if it does not already exist or
+            not.
+
+        Returns
+        -------
+        section: dict of Section
+            A dict mapping the section key (identical to the title) to the
+            actual ``Section``, which is a dataclass that contains the actual
+            data of the section.
+
+        Raises
+        ------
+        KeyError
+            If the section does not exist and ``create=False``, raises a
+            ``KeyError``.
+
+        """
         section = self._data
         if not subsection_names:
             return section
@@ -591,6 +586,20 @@ def delete(self, key: str | Sequence[str]) -> None:
         del parent_section[leaf_node_name]
 
     def _add_single(self, key: str, val: Formattable | str) -> None:
+        """Add a single section
+
+        If the (sub)section does not exist, it is created. Otherwise, the
+        existing (sub)section is modified.
+
+        Parameters
+        ----------
+        key: str
+            The name of the (sub)section.
+
+        val: str or Formattable
+            The value to assign to the (sub)section.
+
+        """
         *subsection_names, leaf_node_name = split_subsection_names(key)
         section = self._select(subsection_names)
 
@@ -602,6 +611,7 @@ def _add_single(self, key: str, val: Formattable | str) -> None:
             section[leaf_node_name] = Section(title=leaf_node_name, content=val)
 
     def _add_model_section(self) -> None:
+        """Add model plot section, if model_diagram is set"""
         section_title = "Model description/Training Procedure/Model Plot"
         default_content = "The model plot is below."
 
@@ -618,6 +628,7 @@ def _add_model_section(self) -> None:
         self._add_single(section_title, content)
 
     def _add_hyperparams(self) -> None:
+        """Add hyperparameter section"""
         hyperparameter_dict = self.model.get_params(deep=True)
         table = _clean_table(
             tabulate(
@@ -744,6 +755,7 @@ def add_metrics(self, **kwargs: str | int | float) -> "Card":
         return self
 
     def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
+        """Add metrics to the Evaluation Results section"""
         table = tabulate(
             list(metrics.items()),
             headers=["Metric", "Value"],
@@ -808,7 +820,7 @@ def __repr__(self) -> str:
         # repr for the model
         model = getattr(self, "model", None)
         if model:
-            model_repr = self._format_repr(f"model={repr(model)}")
+            model_repr = self._format_repr(f"model={repr(model)},")
         else:
             model_repr = None
 
@@ -847,6 +859,7 @@ def __repr__(self) -> str:
         return complete_repr
 
     def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
+        """Add getting started code to the corresponding section"""
         is_skops_format = file_name.endswith(".skops")  # else, assume pickle
         lines = _getting_started_code(
             file_name, is_skops_format=is_skops_format, indent=indent
@@ -864,6 +877,7 @@ def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
         )
 
     def _generate_card(self) -> Iterator[str]:
+        """Yield sections of the model card, including the metadata"""
         if self.metadata.to_dict():
             yield f"---\n{self.metadata.to_yaml()}\n---"
 
diff --git a/skops/card/tests/test_card.py b/skops/card/tests/test_card.py
index f9ba237b..7127c131 100644
--- a/skops/card/tests/test_card.py
+++ b/skops/card/tests/test_card.py
@@ -580,7 +580,7 @@ def card(self):
     def expected_lines(self):
         card_repr = """
         Card(
-          model=LinearRegression(fit_intercept=False)
+          model=LinearRegression(fit_intercept=False),
           Model description/Training Procedure/...ed | | positive | False | </details>,
           Model description/Training Procedure/...</pre></div></div></div></div></div>,
           Model description/Evaluation Results=...ric | Value | |----------|---------|,
@@ -627,7 +627,7 @@ def test_card_repr_empty_card(self, meth):
         expected = textwrap.dedent(
             """
         Card(
-          model=LinearRegression()
+          model=LinearRegression(),
         )
         """
         ).strip()

From 8558f261ee5ad588c2c2ea5e2fa33cea6be7c34f Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 25 Nov 2022 13:43:54 +0100
Subject: [PATCH 14/47] Add TODO notes for when Python 3.7 is dropped

---
 skops/card/_model_card.py | 2 +-
 skops/utils/fixes.py      | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index d9a027c4..14b8c7b9 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -15,7 +15,7 @@
 
 if sys.version_info >= (3, 8):
     from typing import Protocol
-else:
+else:  # TODO: remove when Python 3.7 is dropped
     from typing_extensions import Protocol
 
 # Repr attributes can be used to control the behavior of repr
diff --git a/skops/utils/fixes.py b/skops/utils/fixes.py
index e9d83558..223d27dd 100644
--- a/skops/utils/fixes.py
+++ b/skops/utils/fixes.py
@@ -15,7 +15,7 @@
 if sys.version_info >= (3, 8):
     # py>=3.8
     from typing import Literal  # noqa
-else:
+else:  # TODO: remove when Python 3.7 is dropped
     # older pythons, this requires typing_extensions to be installed.
     # if you're removing this, you should also remove the dependency from
     # _min_dependencies.py

From fdb76740f198c690dd1d04df49e9557b1d6e66b1 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 25 Nov 2022 16:00:14 +0100
Subject: [PATCH 15/47] Add Hub model card template, add template arg

Users can now choose to use no template, skops template, hub template,
or their own template. Using their own template disables a lot of
prefilling (say, putting the model plot in the card) because we wouldn't
know where to put it. Users will need to call card.add for the otherwise
prefilled sections.
---
 docs/model_card.rst           |   4 +
 skops/card/_model_card.py     | 113 +++++++++++++++++---------
 skops/card/_templates.py      | 144 ++++++++++++++++++++++++++++++++++
 skops/card/tests/test_card.py |  50 ++++++++++--
 4 files changed, 268 insertions(+), 43 deletions(-)
 create mode 100644 skops/card/_templates.py

diff --git a/docs/model_card.rst b/docs/model_card.rst
index 7a6c124d..f6b0d37a 100644
--- a/docs/model_card.rst
+++ b/docs/model_card.rst
@@ -103,3 +103,7 @@ using :meth:`Card.select`, and you can delete sections using
 
 To see how you can use the API in ``skops`` to create a model card, please
 refer to :ref:`sphx_glr_auto_examples_plot_model_card.py`.
+
+Templates
+---------
+TODO
diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index 14b8c7b9..908b8050 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -4,6 +4,7 @@
 import re
 import sys
 import textwrap
+from collections.abc import Mapping
 from dataclasses import dataclass, field
 from pathlib import Path
 from reprlib import Repr
@@ -13,6 +14,13 @@
 from sklearn.utils import estimator_html_repr
 from tabulate import tabulate  # type: ignore
 
+from skops.card._templates import (
+    CONTENT_PLACEHOLDER,
+    HUB_TEMPLATE,
+    SKOPS_TEMPLATE,
+    Templates,
+)
+
 if sys.version_info >= (3, 8):
     from typing import Protocol
 else:  # TODO: remove when Python 3.7 is dropped
@@ -24,29 +32,7 @@
 aRepr.maxstring = 79
 
 
-CONTENT_PLACEHOLDER = "[More Information Needed]"
-"""When there is a section but no content, show this"""
-
-DEFAULT_TEMPLATE = {
-    "Model description": CONTENT_PLACEHOLDER,
-    "Model description/Intended uses & limitations": CONTENT_PLACEHOLDER,
-    "Model description/Training Procedure": "",
-    "Model description/Training Procedure/Hyperparameters": CONTENT_PLACEHOLDER,
-    "Model description/Training Procedure/Model Plot": CONTENT_PLACEHOLDER,
-    "Model description/Evaluation Results": CONTENT_PLACEHOLDER,
-    "How to Get Started with the Model": CONTENT_PLACEHOLDER,
-    "Model Card Authors": (
-        f"This model card is written by following authors:\n\n{CONTENT_PLACEHOLDER}"
-    ),
-    "Model Card Contact": (
-        "You can contact the model card authors through following channels:\n"
-        f"{CONTENT_PLACEHOLDER}"
-    ),
-    "Citation": (
-        "Below you can find information related to citation.\n\n**BibTeX:**\n```\n"
-        f"{CONTENT_PLACEHOLDER}\n```"
-    ),
-}
+VALID_TEMPLATES = {item.value for item in Templates}
 
 
 def wrap_as_details(text: str, folded: bool) -> str:
@@ -307,7 +293,7 @@ class Card:
         of the ``config.json`` file, which itself is created by
         :func:`skops.hub_utils.init`.
 
-    prefill: bool (default=True)
+    template: "hub", "skops" or None (default=TODO)
         Whether to add default sections or not.
 
     Attributes
@@ -384,22 +370,32 @@ def __init__(
         model,
         model_diagram: bool = True,
         metadata: CardData | None = None,
-        prefill: bool = True,
+        template: str | dict[str, str] | None = "skops",
     ) -> None:
         self.model = model
         self.model_diagram = model_diagram
         self.metadata = metadata or CardData()
+        self.template = template
 
         self._data: dict[str, Section] = {}
         self._metrics: dict[str, str | float | int] = {}
-        if prefill:
+
+        if self.template:
+            if isinstance(self.template, str) and self.template not in VALID_TEMPLATES:
+                raise ValueError(
+                    f"Unknown template {self.template}, must be "
+                    f"one of {sorted(VALID_TEMPLATES)}"
+                )
+
             self._fill_default_sections()
             # TODO: This is for parity with old model card but having an empty
             # table by default is kinda pointless
             self.add_metrics()
-            self._reset()
+            self._reset_model_descriptions()
 
-    def _reset(self) -> None:
+    def _reset_model_descriptions(self) -> None:
+        # reset everything that depends on the self.model, in case self.model
+        # changed (or might have changed)
         model_file = self.metadata.to_dict().get("model_file")
         if model_file:
             self._add_get_started_code(model_file)
@@ -408,7 +404,12 @@ def _reset(self) -> None:
         self._add_hyperparams()
 
     def _fill_default_sections(self) -> None:
-        self.add(**DEFAULT_TEMPLATE)
+        if self.template == Templates.skops.value:
+            self.add(**SKOPS_TEMPLATE)
+        elif self.template == Templates.hub.value:
+            self.add(**HUB_TEMPLATE)
+        elif isinstance(self.template, Mapping):
+            self.add(**self.template)
 
     def add(self, **kwargs: str | Formattable) -> "Card":
         """Add new section(s) to the model card.
@@ -612,6 +613,10 @@ def _add_single(self, key: str, val: Formattable | str) -> None:
 
     def _add_model_section(self) -> None:
         """Add model plot section, if model_diagram is set"""
+        if self.template != Templates.skops.value:
+            # only skops template has a default section
+            return
+
         section_title = "Model description/Training Procedure/Model Plot"
         default_content = "The model plot is below."
 
@@ -629,6 +634,10 @@ def _add_model_section(self) -> None:
 
     def _add_hyperparams(self) -> None:
         """Add hyperparameter section"""
+        if self.template != Templates.skops.value:
+            # only skops template has a default hyper parameter section
+            return
+
         hyperparameter_dict = self.model.get_params(deep=True)
         table = _clean_table(
             tabulate(
@@ -756,6 +765,13 @@ def add_metrics(self, **kwargs: str | int | float) -> "Card":
 
     def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
         """Add metrics to the Evaluation Results section"""
+        # when not using one of the default templates, there is no predetermined
+        # section to put the metrics
+        if self.template is None or isinstance(self.template, dict):
+            return
+        if self.template not in VALID_TEMPLATES:
+            return
+
         table = tabulate(
             list(metrics.items()),
             headers=["Metric", "Value"],
@@ -768,7 +784,15 @@ def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
 
         {}"""
         )
-        self._add_single("Model description/Evaluation Results", template.format(table))
+        if self.template == Templates.skops.value:
+            section = "Model description/Evaluation Results"
+        elif self.template == Templates.hub.value:
+            section = "Evaluation/Testing Data, Factors & Metrics/Metrics"
+        else:
+            # should be unreachable
+            raise ValueError(f"Unknown template {self.template}")
+
+        self._add_single(section, template.format(table))
 
     def _generate_metadata(self, metadata: CardData) -> Iterator[str]:
         """Yield metadata in yaml format"""
@@ -860,18 +884,37 @@ def __repr__(self) -> str:
 
     def _add_get_started_code(self, file_name: str, indent: str = "    ") -> None:
         """Add getting started code to the corresponding section"""
+        if self.template not in VALID_TEMPLATES:
+            # unknown template, cannot prefill
+            return
+
         is_skops_format = file_name.endswith(".skops")  # else, assume pickle
         lines = _getting_started_code(
             file_name, is_skops_format=is_skops_format, indent=indent
         )
         lines = ["```python"] + lines + ["```"]
 
-        template = textwrap.dedent(
-            """        Use the code below to get started with the model.
+        if self.template == "skops":
+            template = textwrap.dedent(
+                """            Use the code below to get started with the model.
 
-        {}
-        """
-        )
+            {}
+            """
+            )
+        elif self.template == "hub":
+            template = textwrap.dedent(
+                """               Use the code below to get started with the model.
+
+                <details>
+                <summary> Click to expand </summary>
+
+                {}
+
+                </details>"""
+            )
+        else:
+            # should be unreachable
+            raise ValueError(f"Unknown template {self.template}")
         self._add_single(
             "How to Get Started with the Model", template.format("\n".join(lines))
         )
diff --git a/skops/card/_templates.py b/skops/card/_templates.py
new file mode 100644
index 00000000..69a84032
--- /dev/null
+++ b/skops/card/_templates.py
@@ -0,0 +1,144 @@
+"""Templates for model cards"""
+
+from enum import Enum
+
+
+class Templates(Enum):
+    skops = "skops"
+    hub = "hub"
+
+
+CONTENT_PLACEHOLDER = "[More Information Needed]"
+"""When there is a section but no content, show this"""
+
+# fmt: off
+SKOPS_TEMPLATE = {
+    "Model description": CONTENT_PLACEHOLDER,
+    "Model description/Intended uses & limitations": CONTENT_PLACEHOLDER,
+    "Model description/Training Procedure": "",
+    "Model description/Training Procedure/Hyperparameters": CONTENT_PLACEHOLDER,
+    "Model description/Training Procedure/Model Plot": CONTENT_PLACEHOLDER,
+    "Model description/Evaluation Results": CONTENT_PLACEHOLDER,
+    "How to Get Started with the Model": CONTENT_PLACEHOLDER,
+    "Model Card Authors": (
+        f"This model card is written by following authors:\n\n{CONTENT_PLACEHOLDER}"
+    ),
+    "Model Card Contact": (
+        "You can contact the model card authors through following channels:\n"
+        f"{CONTENT_PLACEHOLDER}"
+    ),
+    "Citation": (
+        "Below you can find information related to citation.\n\n**BibTeX:**\n```\n"
+        f"{CONTENT_PLACEHOLDER}\n```"
+    ),
+}
+
+HUB_TEMPLATE = {
+    "Model Card": "",
+    # Provide a quick summary of what the model is/does.
+    "Model Details": "",
+    "Model Details/Model Description": "",
+    # Provide a longer summary of what this model is.
+    "Model Details/Model Description/Developed by": CONTENT_PLACEHOLDER,
+    "Model Details/Model Description/Shared by [optional]": CONTENT_PLACEHOLDER,
+    "Model Details/Model Description/Model type": CONTENT_PLACEHOLDER,
+    "Model Details/Model Description/Language(s) (NLP)": CONTENT_PLACEHOLDER,
+    "Model Details/Model Description/License": CONTENT_PLACEHOLDER,
+    "Model Details/Model Description/Finetuned from model [optional]": CONTENT_PLACEHOLDER,
+    "Model Details/Model Description/Resources for more information": CONTENT_PLACEHOLDER,
+
+    "Uses": "",
+    # Address questions around how the model is intended to be used, including
+    # the foreseeable users of the model and those affected by the model.
+    "Uses/Direct Use": CONTENT_PLACEHOLDER,
+    # This section is for the model use without fine-tuning or plugging into a
+    # larger ecosystem/app.
+    "Uses/Downstream Use [optional]": CONTENT_PLACEHOLDER,
+    # This section is for the model use when fine-tuned for a task, or when
+    # plugged into a larger ecosystem/app.
+    "Uses/Out-of-Scope Use": CONTENT_PLACEHOLDER,
+    # This section addresses misuse, malicious use, and uses that the model will
+    # not work well for.
+
+    "Bias, Risks, and Limitations": CONTENT_PLACEHOLDER,
+    # This section is meant to convey both technical and sociotechnical
+    # limitations.
+    "Bias, Risks, and Limitations/Recommendations": (
+        "Users (both direct and downstream) should be made aware of the risks, biases "
+        "and limitations of the model. More information needed for further "
+        "recommendations."
+    ),
+    # This section is meant to convey recommendations with respect to the bias,
+    # risk, and technical limitations.
+
+    "Training Details": "",
+    "Training Details/Training Data": CONTENT_PLACEHOLDER,
+    # This should link to a Data Card, perhaps with a short stub of information
+    # on what the training data is all about as well as documentation related to
+    # data pre-processing or additional filtering.
+    "Training Details/Training Procedure [optional]": "",
+    # This relates heavily to the Technical Specifications. Content here should
+    # link to that section when it is relevant to the training procedure.
+    "Training Details/Training Procedure [optional]/Preprocessing": CONTENT_PLACEHOLDER,
+    "Training Details/Training Procedure [optional]/Speeds, Sizes, Times": CONTENT_PLACEHOLDER,
+    # This section provides information about throughput, start/end time,
+    # checkpoint size if relevant, etc.
+
+    "Evaluation": "",
+    # This section describes the evaluation protocols and provides the results.
+    "Evaluation/Testing Data, Factors & Metrics": "",
+    "Evaluation/Testing Data, Factors & Metrics/Testing Data": CONTENT_PLACEHOLDER,
+    # This should link to a Data Card if possible
+    "Evaluation/Testing Data, Factors & Metrics/Factors": CONTENT_PLACEHOLDER,
+    # These are the things the evaluation is disaggregating by, e.g.,
+    # subpopulations or domains.
+    "Evaluation/Testing Data, Factors & Metrics/Metrics": CONTENT_PLACEHOLDER,
+    # These are the evaluation metrics being used, ideally with a description of
+    # why.
+    "Evaluation/Results": CONTENT_PLACEHOLDER,
+
+    "Model Examination [optional]": CONTENT_PLACEHOLDER,
+    # Relevant interpretability work for the model goes here.
+
+    "Environmental Impact": (
+        "Carbon emissions can be estimated using the "
+        "[Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) "
+        "presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700)."
+    ),
+    # Total emissions (in grams of CO2eq) and additional considerations, such as
+    # electricity usage, go here. Edit the suggested text below accordingly"
+    "Environmental Impact/Hardware Type": CONTENT_PLACEHOLDER,
+    "Environmental Impact/Hours used": CONTENT_PLACEHOLDER,
+    "Environmental Impact/Cloud Provider": CONTENT_PLACEHOLDER,
+    "Environmental Impact/Compute Region": CONTENT_PLACEHOLDER,
+    "Environmental Impact/Carbon Emitted": CONTENT_PLACEHOLDER,
+
+    "Technical Specifications [optional]": "",
+    "Technical Specifications [optional]/Model Architecture and Objective": CONTENT_PLACEHOLDER,
+    "Technical Specifications [optional]/Compute Infrastructure": CONTENT_PLACEHOLDER,
+    "Technical Specifications [optional]/Compute Infrastructure/Hardware": CONTENT_PLACEHOLDER,
+    "Technical Specifications [optional]/Compute Infrastructure/Software": CONTENT_PLACEHOLDER,
+
+    "Citation [optional]": "",
+    # If there is a paper or blog post introducing the model, the APA and Bibtex
+    # information for that should go in this section.
+    "Citation [optional]/BibTeX": CONTENT_PLACEHOLDER,
+    "Citation [optional]/APA": CONTENT_PLACEHOLDER,
+
+    "Glossary [optional]": "",
+    # If relevant, include terms and calculations in this section that can help
+    # readers understand the model or model card.
+
+    "More Information [optional]": CONTENT_PLACEHOLDER,
+    "Model Card Authors [optional]": CONTENT_PLACEHOLDER,
+    "Model Card Contact": CONTENT_PLACEHOLDER,
+    "How to Get Started with the Model": f"""Use the code below to get started with the model.
+
+<details>
+<summary> Click to expand </summary>
+
+{CONTENT_PLACEHOLDER}
+
+</details>""",
+}
+# fmt: on
diff --git a/skops/card/tests/test_card.py b/skops/card/tests/test_card.py
index 7127c131..20afe8fb 100644
--- a/skops/card/tests/test_card.py
+++ b/skops/card/tests/test_card.py
@@ -285,21 +285,55 @@ def test_select_empty_key_subsection_raises(self, model_card):
         with pytest.raises(KeyError, match=msg):
             model_card.select(["Model description", ""])
 
-    def test_default_sections_empty_card(self, model_card):
-        # Without prefill, the card should not contain the default sections
-        from skops.card._model_card import DEFAULT_TEMPLATE
+    def test_default_skops_sections_present(self, model_card):
+        from skops.card._model_card import SKOPS_TEMPLATE
 
         # model_card (which is prefilled) contains all default sections
-        for key in DEFAULT_TEMPLATE:
+        for key in SKOPS_TEMPLATE:
             model_card.select(key)
 
+    def test_default_hub_sections_present(self, model_card):
+        from skops.card._model_card import HUB_TEMPLATE
+
+        model = fit_model()
+        model_card = Card(model, model_diagram=False, template="hub")
+
+        # model_card contains all default sections
+        for key in HUB_TEMPLATE:
+            model_card.select(key)
+
+    def test_custom_template_sections_present(self, model_card):
+        template = {
+            "My awesome model": "hello",
+            "My awesome model/More details": "123",
+            "More info": "Thanks",
+        }
+        model = fit_model()
+        model_card = Card(model, model_diagram=False, template=template)
+
+        # model_card contains all default sections
+        for key in template:
+            model_card.select(key)
+
+        # no other top level sections as those defined in the template
+        assert list(model_card._data.keys()) == ["My awesome model", "More info"]
+
+    def test_default_skops_sections_empty_card(self, model_card):
+        # Without prefilled template, the card should not contain the default sections
+        from skops.card._model_card import SKOPS_TEMPLATE
+
         # empty card does not contain those sections
         model = fit_model()
-        card_empty = Card(model, model_diagram=False, prefill=False)
-        for key in DEFAULT_TEMPLATE:
+        card_empty = Card(model, model_diagram=False, template=None)
+        for key in SKOPS_TEMPLATE:
             with pytest.raises(KeyError):
                 card_empty.select(key)
 
+    def test_invalid_template_name_raises(self):
+        msg = "Unknown template does-not-exist, must be one of"
+        with pytest.raises(ValueError, match=msg):
+            Card(model=None, template="does-not-exist")
+
 
 class TestAdd:
     """Adding sections and subsections"""
@@ -620,9 +654,9 @@ def test_card_repr(self, card: Card, meth, expected_lines):
 
     @pytest.mark.parametrize("meth", [repr, str])
     def test_card_repr_empty_card(self, meth):
-        """Without prefill, the repr should be empty"""
+        """Without prefilled template, the repr should be empty"""
         model = fit_model()
-        card = Card(model, model_diagram=False, prefill=False)
+        card = Card(model, model_diagram=False, template=None)
         result = meth(card)
         expected = textwrap.dedent(
             """

From 772a659213e7ab6ad7e8665296bab7a4ae14c15f Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 30 Nov 2022 12:27:40 +0100
Subject: [PATCH 16/47] Make _add_single return the Section

This can be useful, because otherwise it takes a bit of effort to
retrieve the latest section.
---
 skops/card/_model_card.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index 908b8050..17d11b5b 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -586,7 +586,7 @@ def delete(self, key: str | Sequence[str]) -> None:
         parent_section = self._select(subsection_names, create=False)
         del parent_section[leaf_node_name]
 
-    def _add_single(self, key: str, val: Formattable | str) -> None:
+    def _add_single(self, key: str, val: Formattable | str) -> Section:
         """Add a single section
 
         If the (sub)section does not exist, it is created. Otherwise, the
@@ -611,6 +611,8 @@ def _add_single(self, key: str, val: Formattable | str) -> None:
             # entry does not exist, create a new one
             section[leaf_node_name] = Section(title=leaf_node_name, content=val)
 
+        return section[leaf_node_name]
+
     def _add_model_section(self) -> None:
         """Add model plot section, if model_diagram is set"""
         if self.template != Templates.skops.value:

From 7cfddf907510c62c6e845629b9a7372817004fea Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 30 Nov 2022 12:31:38 +0100
Subject: [PATCH 17/47] Allow tables without rows to be added

It's ugly, but there is no technical reason for prohibiting the
addition of tables without rows. (Note: columns are still required.)

This allows us to use TableSection for formatting the metrics, instead
of calling tabulate there directly. This is better, since we don't have
2 separate ways of creating metrics.
---
 skops/card/_model_card.py     | 27 ++++++++++++---------------
 skops/card/tests/test_card.py | 15 ++++++++++++---
 2 files changed, 24 insertions(+), 18 deletions(-)

diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index 17d11b5b..e7933232 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -74,7 +74,7 @@ def __repr__(self) -> str:
 class TableSection:
     """Adds a table to the model card"""
 
-    table: dict[str, list[Any]]
+    table: Mapping[str, Sequence[Any]]
     folded: bool = False
 
     def __post_init__(self) -> None:
@@ -86,17 +86,11 @@ def __post_init__(self) -> None:
             self._is_pandas_df = False
 
         if self._is_pandas_df:
-            if self.table.empty:  # type: ignore
-                raise ValueError("Empty table added")
+            ncols = len(self.table.columns)  # type: ignore
         else:
             ncols = len(self.table)
-            if ncols == 0:
-                raise ValueError("Empty table added")
-
-            key = next(iter(self.table.keys()))
-            nrows = len(self.table[key])
-            if nrows == 0:
-                raise ValueError("Empty table added")
+        if ncols == 0:
+            raise ValueError("Trying to add table with no columns")
 
     def format(self) -> str:
         if self._is_pandas_df:
@@ -774,11 +768,14 @@ def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
         if self.template not in VALID_TEMPLATES:
             return
 
-        table = tabulate(
-            list(metrics.items()),
-            headers=["Metric", "Value"],
-            tablefmt="github",
-        )
+        if self._metrics:
+            data_transposed = zip(*self._metrics.items())  # make column oriented
+            inp = {key: val for key, val in zip(["Metric", "Value"], data_transposed)}
+            table = TableSection(inp).format()
+        else:
+            # create empty table
+            table = TableSection({"Metric": [], "Value": []}).format()
+
         template = textwrap.dedent(
             """        You can find the details about evaluation process and the evaluation results.
 
diff --git a/skops/card/tests/test_card.py b/skops/card/tests/test_card.py
index 20afe8fb..508b9a2c 100644
--- a/skops/card/tests/test_card.py
+++ b/skops/card/tests/test_card.py
@@ -793,17 +793,26 @@ def test_str_and_repr_table_is_dataframe(self, table_dict, meth):
         expected = "Table(3x2)"
         assert meth(section) == expected
 
-    @pytest.mark.parametrize("table", [{}, {"col": []}, "pandas"])
+    @pytest.mark.parametrize("table", [{}, "pandas"])
     def test_raise_error_empty_table(self, table):
-        # Test no columns, no rows, empty df
+        # If there are no columns, raise
         if table == "pandas":
             pd = pytest.importorskip("pandas")
             table = pd.DataFrame([])
 
-        msg = "Empty table added"
+        msg = "Trying to add table with no columns"
         with pytest.raises(ValueError, match=msg):
             TableSection(table=table)
 
+    @pytest.mark.parametrize("table", [{"col0": []}, "pandas"])
+    def test_table_with_no_rows_works(self, table):
+        # If there are no rows, it's okay
+        if table == "pandas":
+            pd = pytest.importorskip("pandas")
+            table = pd.DataFrame(data=[], columns=["col0"])
+
+        TableSection(table=table).format()  # no error raised
+
     def test_pandas_not_installed(self, table_dict, pandas_not_installed):
         # use pandas_not_installed fixture from conftest.py to pretend that
         # pandas is not installed

From 50b0d39e2d3d7ef8aad0e3bfba03e483e6410787 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 30 Nov 2022 17:21:06 +0100
Subject: [PATCH 18/47] Parser that allows to load dumped model cards

As discussed here:

https://github.com/skops-dev/skops/issues/72#issuecomment-1327360660

Description

This feature adds a new function, skops.card.parse_modelcard. When
passing it the path to a dumped model card, it parses it using pandoc
and returns a Card object, which can be further modified by the user.

In the end, this turned out easier than I initially thought it would.
The main difficulty is the data structures returned by the pandoc
parser, for which I couldn't find any documentation. I guess Haskell
code is just self-documenting.

For this reason, there are probably quite a few edge cases that I
haven't covered yet. Just as an example, when parsing tables, pandoc
tells us how the columns are aligned. This information is currently
completely discarded (we let tabulate choose the alignment). If we want
to preserve the table alignment, we would need to make some changes.

Implementation

This feature requires the alternative card implementation from #203

pandoc is used for the following reasons:

- widely used and thus battle tested
- can read many other formats, not just markdown, so in theory, we
  should be able to read, e.g., rst model cards without modifying any
  code

The disadvantage is that pandoc is not a Python package, so users need
to install it separately. But it is available on all common platforms.

For calling pandoc, I chose to shell out using subprocess. I think this
should be fine but LMK if there is a better way.

There is a Python package that binds
pandoc (https://github.com/boisgera/pandoc) but I don't think it's worth
it for us to add it, just to avoid shelling out. The package seems to
have low adoption and contains a bunch of stuff we don't need.

I chose to implement this such that the parser that generates the Card
object should not have to know anything about Markdown. Everything
related to Markdown is moved to a separate class in _markup.py.

In an ideal world, we would not have to know anything about markdown
either. Instead, the Card object should have methods (similar to what we
already have for add_plot etc.) that handle all of that. But in
practice, this is far from being true. E.g. if a user wants to add bold
text, there is no special method for it, so they would need to add raw
Markdown. The Card class is thus a leaky abstraction.

TODOs

This PR is not finished. Remaining TODOs that come to mind:

1. We need to merge the alternative card implementation
2. Documentation has to be updated in several places
3. Tests need to be more complex, right now only one Card is tested
4. CI needs to install pandoc so that the tests are actually run
5. There are some specifics here that won't work with all Python
   versions, like the use of TypedDict.
---
 skops/card/__init__.py          |   3 +-
 skops/card/_markup.py           | 180 ++++++++++++++++++++++++++++++++
 skops/card/_parser.py           | 160 ++++++++++++++++++++++++++++
 skops/card/tests/test_parser.py |  75 +++++++++++++
 4 files changed, 417 insertions(+), 1 deletion(-)
 create mode 100644 skops/card/_markup.py
 create mode 100644 skops/card/_parser.py
 create mode 100644 skops/card/tests/test_parser.py

diff --git a/skops/card/__init__.py b/skops/card/__init__.py
index 80ae1963..0febe42a 100644
--- a/skops/card/__init__.py
+++ b/skops/card/__init__.py
@@ -1,3 +1,4 @@
 from ._model_card import Card, metadata_from_config
+from ._parser import parse_modelcard
 
-__all__ = ["Card", "metadata_from_config"]
+__all__ = ["Card", "metadata_from_config", "parse_modelcard"]
diff --git a/skops/card/_markup.py b/skops/card/_markup.py
new file mode 100644
index 00000000..6c2f8846
--- /dev/null
+++ b/skops/card/_markup.py
@@ -0,0 +1,180 @@
+"""Classes for translating into the syntax of different markup languages"""
+
+from collections.abc import Mapping
+from typing import Any, Sequence, TypedDict
+
+from skops.card._model_card import TableSection
+
+
+class PandocItem(TypedDict):
+    t: str
+    c: dict
+
+
+class Markdown:
+    """Mapping of pandoc parsed document to Markdown
+
+    This class has a ``mapping`` attribute, which is just a dict. The keys are
+    Pandoc types and the values are functions that transform the corresponding
+    value into a string with markdown syntax. Those functions are all prefixed
+    with ``md_``, e.g. ``md_Image`` for transforming a pandoc ``Image`` into a
+    markdown figure.
+
+    From the caller side, only the ``__call__`` method should be used, the rest
+    should be considered internals.
+
+    """
+
+    def __init__(self):
+        # markdown syntax dispatch table
+        self.mapping = {
+            "Space": self.md_space,
+            "Strong": self.md_strong,
+            "Plain": self.md_plain,
+            "Str": self.md_str,
+            "RawInline": self.md_rawline,
+            "RawBlock": self.md_raw_block,
+            "SoftBreak": self.md_softbreak,
+            "Para": self.md_para,
+            "Header": self.md_header,
+            "Image": self.md_image,
+            "CodeBlock": self.md_code_block,
+            "Table": self.md_table,
+            "Div": self.md_parse_div,
+        }
+
+    @staticmethod
+    def md_space(value) -> str:
+        return " "
+
+    def md_strong(self, value) -> str:
+        parts = ["**"]
+        parts += [self.__call__(subitem) for subitem in value]
+        parts.append("**")
+        return "".join(parts)
+
+    def md_plain(self, value) -> str:
+        parts = [self.__call__(subitem) for subitem in value]
+        return "".join(parts)
+
+    @staticmethod
+    def md_str(value) -> str:
+        return value
+
+    @staticmethod
+    def md_rawline(value) -> str:
+        _, line = value
+        return line
+
+    def md_raw_block(self, item) -> str:
+        # throw away the first item, which is just something like 'html'
+        # might have to revisit this if output != markdown
+        _, line = item
+        return line
+
+    @staticmethod
+    def md_softbreak(value) -> str:
+        return "\n"
+
+    def _make_content(self, content):
+        parts = []
+        for item in content:
+            part = "".join(self.__call__(item))
+            parts.append(part)
+        return "".join(parts)
+
+    def md_para(self, value: list[dict[str, str]]) -> str:
+        content = self._make_content(value)
+        return content
+
+    def md_header(self, value: tuple[int, Any, list[dict[str, str]]]) -> str:
+        level, _, content_parts = value
+        section_name = self._make_content(content_parts)
+        return section_name
+
+    def md_image(self, value) -> str:
+        (ident, _, keyvals), caption, (dest, typef) = value
+        # it seems like ident and keyvals are not relevant for markdown
+        assert caption
+        assert typef == "fig:"
+
+        caption = "".join([self.__call__(i) for i in caption])
+        content = f"![{caption}]({dest})"
+        return content
+
+    @staticmethod
+    def md_code_block(item: tuple[tuple[int, list[str], list[str]], str]) -> str:
+        # a codeblock consists of: (id, classes, namevals) contents
+        (_, _, namevals), content = item
+        block_start = "```"
+        if namevals:  # TODO: check if this makes "```python" etc.
+            block_start += namevals[0]
+        block_end = "```"
+        content = "\n".join((block_start, content, block_end))
+        return content
+
+    def md_table(self, item) -> str:
+        _, alignments, _, header, rows = item
+        fn = self.__call__
+        columns = ["".join(fn(part) for part in col) for col in header]
+        if not columns:
+            raise ValueError("Table with no columns...")
+
+        data = []  # row oriented
+        for row in rows:
+            data.append(["".join(fn(part) for part in col) for col in row])
+
+        table: Mapping[str, Sequence[Any]]
+        if not data:
+            table = {key: [] for key in columns}
+        else:
+            data_transposed = zip(*data)  # column oriented
+            table = {key: val for key, val in zip(columns, data_transposed)}
+
+        res = TableSection(table).format()
+        return res
+
+    def md_parse_div(self, item) -> str:
+        # note that in markdown, we basically just use the raw html
+        (ident, classes, kvs), contents = item
+
+        # build div tag
+        tags = ["<div"]
+        if ident:
+            tags.append(f' id="{ident}"')
+        if classes:
+            classes = " ".join(classes)
+            tags.append(f' class="{classes}"')
+        if kvs:
+            kvparts = []
+            for k, v in kvs:
+                if not v:  # e.g. just ['hidden', '']
+                    kvparts.append(k)
+                else:
+                    kvparts.append(f'{k}="{v}"')
+            tags.append(f' {" ".join(kvparts)}')
+        tags.append(">")
+
+        start = "".join(tags)
+        middle = []
+        for content in contents:
+            middle.append(self.__call__(content))
+        end = "</div>"
+        return "".join([start] + middle + [end])
+
+    def __call__(self, item: str | PandocItem) -> str:
+        if isinstance(item, str):
+            return item
+
+        type_, value = item["t"], item.get("c")
+        try:
+            res = self.mapping[type_](value)
+        except KeyError as exc:
+            msg = (
+                f"The parsed document contains '{type_}', which is not "
+                "supported yet, please open an issue on GitHub"
+            )
+            raise ValueError(msg) from exc
+
+        # recursively call until the value has been resolved into a str
+        return self.__call__(res)
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
new file mode 100644
index 00000000..c4b7344d
--- /dev/null
+++ b/skops/card/_parser.py
@@ -0,0 +1,160 @@
+"""Contains the PandocParser
+
+This class needs to know about the pandoc parse tree but should not have
+knowledge of any particular markup syntax; everything related to markup should
+be known by the mapping attribute.
+
+"""
+
+import json
+import subprocess
+from pathlib import Path
+
+from skops.card import Card
+from skops.card._model_card import Section
+
+from ._markup import Markdown, PandocItem
+
+
+class PandocParser:
+    """TODO"""
+
+    def __init__(self, source, mapping="markdown") -> None:
+        self.source = source
+        if mapping == "markdown":
+            self.mapping = Markdown()
+        else:
+            raise ValueError(f"Markup of type {mapping} is not supported (yet)")
+
+        self.card = Card(None, template=None)
+        self._section_trace: list[str] = []
+        self._cur_section: Section | None = None
+
+    def get_cur_level(self) -> int:
+        # level 0 can be interpreted implicitly as the root level
+        return len(self._section_trace)
+
+    def get_cur_section(self):
+        # including supersections
+        return "/".join(self._section_trace)
+
+    def add_section(self, section_name: str) -> None:
+        self._cur_section = self.card._add_single(self.get_cur_section(), "")
+
+    def add_content(self, content: str) -> None:
+        section = self._cur_section
+        if section is None:
+            raise ValueError(
+                "Ooops, no current section, please open an issue on GitHub"
+            )
+
+        if not section.content:
+            section.content = content
+        elif isinstance(section.content, str):
+            section.content = section.content + "\n\n" + content
+        else:
+            # A Formattable, no generic way to modify it -- should we add an
+            # update method?
+            raise ValueError(f"Could not modify content of {section.content}")
+
+    def parse_header(self, item: PandocItem) -> str:
+        # Headers are the only type of item that needs to be handled
+        # differently. This is because we structure the underlying model card
+        # data as a tree with nodes corresponding to headers. To assign the
+        # right parent or child node, we need to keep track of the level of the
+        # headers. This cannot be done solely by the markdown mapping, since it
+        # is not aware of the tree structure.
+        level, _, _ = item["c"]
+        content = self.mapping(item)
+        self._section_trace = self._section_trace[: level - 1] + [content]
+        return content
+
+    def generate(self) -> Card:
+        # Parsing the flat structure, not recursively as in pandocfilters.
+        # After visiting the parent node, it's not necessary to visit its
+        # child nodes, because that's already done during parsing.
+        for item in json.loads(self.source)["blocks"]:
+            if item["t"] == "Header":
+                res = self.parse_header(item)
+                self.add_section(res)
+            else:
+                res = self.mapping(item)
+                self.add_content(res)
+
+        return self.card
+
+
+def check_pandoc_installed() -> None:
+    """Check if pandoc is installed on the system
+
+    Raises
+    ------
+    FileNotFoundError
+        When the binary is not found, raise this error.
+
+    """
+    try:
+        subprocess.run(
+            ["pandoc", "--version"],
+            capture_output=True,
+        )
+    except FileNotFoundError as exc:
+        msg = (
+            "This feature requires the pandoc library to be installed on your system, "
+            "please follow these install instructions: "
+            "https://pandoc.org/installing.html"
+        )
+        raise FileNotFoundError(msg) from exc
+
+
+def parse_modelcard(path: str | Path) -> Card:
+    """Read a model card and return a Card object
+
+    This allows users to load a dumped model card and continue to edit it.
+
+    Using this function requires ``pandoc`` to be installed. Please follow these
+    instructions:
+
+    https://pandoc.org/installing.html
+
+    Examples
+    --------
+    >>> import numpy as np
+    >>> from sklearn.linear_model import LinearRegression
+    >>> from skops.card import Card
+    >>> from skops.card import parse_modelcard
+    >>> X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
+    >>> y = np.dot(X, np.array([1, 2])) + 3
+    >>> regr = LinearRegression().fit(X, y)
+    >>> card = Card(regr)
+    >>> card.save("README.md")
+    >>> # later, load the card again
+    >>> parsed_card = parse_modelcard("README.md")
+    >>> # continue editing the card
+    >>> parsed_card.add(**{"My new section": "My new content"})
+    >>> # overwrite old card with new one
+    >>> parsed_card.save("README.md")
+
+    Parameters
+    ----------
+    path : str or pathlib.Path
+        The path to the existing model card.
+
+    Returns
+    -------
+    card : skops.card.Card
+        The model card object.
+
+    """
+    check_pandoc_installed()
+
+    proc = subprocess.run(
+        ["pandoc", "-t", "json", "-s", str(path)],
+        capture_output=True,
+    )
+    source = str(proc.stdout.decode("utf-8"))
+
+    parser = PandocParser(source)
+    card = parser.generate()
+
+    return card
diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
new file mode 100644
index 00000000..be33e72e
--- /dev/null
+++ b/skops/card/tests/test_parser.py
@@ -0,0 +1,75 @@
+import numpy as np
+import pytest
+from sklearn.linear_model import LinearRegression
+
+from skops.card import Card, parse_modelcard
+from skops.card._parser import check_pandoc_installed
+
+try:
+    check_pandoc_installed()
+except FileNotFoundError:
+    # not installed, skip
+    pytest.skip(reason="These tests require pandoc", allow_module_level=True)
+
+
+@pytest.fixture
+def fit_model():
+    X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
+    y = np.dot(X, np.array([1, 2])) + 3
+    reg = LinearRegression().fit(X, y)
+    return reg
+
+
+@pytest.fixture
+def card(fit_model, tmp_path):
+    card = Card(fit_model)
+
+    try:
+        import matplotlib.pyplot as plt
+
+        fig, ax = plt.subplots()
+        ax.plot([0, 1])
+        fig.savefig(tmp_path / "my-throwaway-plot.png")
+        card.add_plot(**{"My plots/My first plot": "my-throwaway-plot.png"})
+    except ImportError:
+        pass
+
+    card.add_table(**{"A table": {"col0": [0, 1], "col1": [2, 3]}})
+    return card
+
+
+def assert_readme_files_equal(file0, file1):
+    """Check that the two model cards are identical, but allow differences in
+    line breaks."""
+    # exclude trivial case of both being empty
+    assert file0
+    assert file1
+
+    with open(file0, "r") as f:
+        readme0 = f.readlines()
+
+    with open(file1, "r") as f:
+        readme1 = f.readlines()
+
+    # remove completely empty lines
+    readme0 = [line.strip() for line in readme0 if line.strip()]
+    readme1 = [line.strip() for line in readme1 if line.strip()]
+
+    readme_str0 = "\n".join(readme0)
+    readme_str1 = "\n".join(readme1)
+
+    # a minuscule further difference is an excess empty line after </style>
+    readme_str1 = readme_str1.replace("</style>\n", "</style>")
+
+    assert readme_str0 == readme_str1
+
+
+def test_parsed_card_identical(card, tmp_path):
+    file0 = tmp_path / "readme-skops.md"
+    card.save(file0)
+
+    parsed_card = parse_modelcard(file0)
+    file1 = tmp_path / "readme-parsed.md"
+    parsed_card.save(file1)
+
+    assert_readme_files_equal(file0, file1)

From 26892d6978c654c9ba0537295f11b60861dcb31b Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Thu, 1 Dec 2022 14:49:17 +0100
Subject: [PATCH 19/47] Error when calling add_metric w/ invalid template

---
 skops/card/_model_card.py     | 18 +++++++++++++++---
 skops/card/tests/test_card.py | 16 ++++++++++++++++
 2 files changed, 31 insertions(+), 3 deletions(-)

diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index e7933232..0308127e 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -763,10 +763,19 @@ def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
         """Add metrics to the Evaluation Results section"""
         # when not using one of the default templates, there is no predetermined
         # section to put the metrics
-        if self.template is None or isinstance(self.template, dict):
+        if (not self.template) or isinstance(self.template, dict):
+            raise ValueError(
+                "Adding metrics is only possible with one of the default templates, "
+                f"i.e. one of {sorted(VALID_TEMPLATES)}. Instead, consider using the "
+                ".add method to add a metric to a section, or .add_table to add a "
+                "table of metrics."
+            )
             return
         if self.template not in VALID_TEMPLATES:
-            return
+            raise ValueError(
+                f"Unknown template {self.template}, must be "
+                f"one of {sorted(VALID_TEMPLATES)}"
+            )
 
         if self._metrics:
             data_transposed = zip(*self._metrics.items())  # make column oriented
@@ -789,7 +798,10 @@ def _add_metrics(self, metrics: dict[str, str | float | int]) -> None:
             section = "Evaluation/Testing Data, Factors & Metrics/Metrics"
         else:
             # should be unreachable
-            raise ValueError(f"Unknown template {self.template}")
+            raise ValueError(
+                f"Unknown template {self.template}, must be "
+                f"one of {sorted(VALID_TEMPLATES)}"
+            )
 
         self._add_single(section, template.format(table))
 
diff --git a/skops/card/tests/test_card.py b/skops/card/tests/test_card.py
index 508b9a2c..f3dc34d3 100644
--- a/skops/card/tests/test_card.py
+++ b/skops/card/tests/test_card.py
@@ -541,6 +541,22 @@ def test_add_metrics(destination_path, model_card):
     assert eval_metric_content.endswith(expected)
 
 
+@pytest.mark.parametrize(
+    "template, msg",
+    [
+        (None, "Adding metrics is only possible with one of"),
+        ({"My custom template": ""}, "Adding metrics is only possible with one of"),
+        ("does-not-exist", "Unknown template does-not-exist, must be one of"),
+    ],
+)
+def test_add_metric_no_template_raises(template, msg):
+    # when the template is not one of the standard templates, we cannot know
+    # where to put the metric, so this should fail with a helpful error message
+    with pytest.raises(ValueError, match=msg):
+        card = Card(None, template=template)
+        card.add_metrics(f1=0.1)
+
+
 def test_code_autogeneration(
     model_card, destination_path, pkl_model_card_metadata_from_config
 ):

From 80a4ae38e240a8f9c01b083eb8ed08fa72ca6724 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 2 Dec 2022 14:28:35 +0100
Subject: [PATCH 20/47] Support model cards with yaml header

Most model cards have a yaml section at the top. It is now detached
before parsing with pandoc, then re-added afterwards.

Add a test with the model card from bert-base-uncased. It still fails
with some minor issues at the moment (most notably table column
alignment).
---
 skops/card/_parser.py                         |  58 ++++
 .../card/tests/examples/bert-base-uncased.md  | 249 ++++++++++++++++++
 skops/card/tests/test_parser.py               |  20 ++
 3 files changed, 327 insertions(+)
 create mode 100644 skops/card/tests/examples/bert-base-uncased.md

diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index c4b7344d..e849852d 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -6,9 +6,15 @@
 
 """
 
+from __future__ import annotations
+
 import json
 import subprocess
 from pathlib import Path
+from tempfile import mkdtemp
+from typing import Any
+
+import yaml  # type: ignore
 
 from skops.card import Card
 from skops.card._model_card import Section
@@ -107,6 +113,54 @@ def check_pandoc_installed() -> None:
         raise FileNotFoundError(msg) from exc
 
 
+def _card_with_detached_metainfo(path: str | Path) -> tuple[str | Path, dict[str, Any]]:
+    """Detach the possibly existing yaml part of the model card
+
+    Model cards always have a markdown part and optionally a yaml part at the
+    head, delimited by "---". Obviously, pandoc cannot parse that. Therefore, we
+    detach the yaml part and return it as a separate dict, only leaving
+    (hopefully) valid markdown.
+
+    path : str or pathlib.Path
+        The path to the model card file.
+
+    Returns
+    -------
+    file : path
+        The path to the model card without any yaml metainfo. If the model card
+        didn't contain that metainfo to begin with, this is just the path to the
+        original model card. If it did contain metainfo, this is a path to a new
+        temporary file with the metainfo removed.
+
+    metainfo : dict
+        The metainfo from the yaml part as a parsed dict. If no metainfo was
+        present, the dict is empty.
+    """
+    with open(path, "r") as f:
+        text = f.read()
+
+    sep_start, sep_end = "---\n", "\n---"
+
+    metainfo: dict[str, Any] = {}
+    if not text.startswith(sep_start):  # no metainfo:
+        return path, metainfo
+
+    idx_separator = text.find(sep_end)
+    if idx_separator < len(sep_start):  # separator shouldn't come earlier than this
+        return path, metainfo
+
+    # https://black.readthedocs.io/en/stable/faq.html#why-are-flake8-s-e203-and-w503-violated
+    text_clean = text[idx_separator + len(sep_end) :]  # noqa: E203
+    metainfo = yaml.safe_load(  # type: ignore
+        text[len(sep_start) : idx_separator]  # noqa: E203
+    )
+
+    file = Path(mkdtemp()) / "tmp-model-card.md"
+    with open(file, "w") as f:
+        f.write(text_clean)
+    return file, metainfo
+
+
 def parse_modelcard(path: str | Path) -> Card:
     """Read a model card and return a Card object
 
@@ -148,6 +202,8 @@ def parse_modelcard(path: str | Path) -> Card:
     """
     check_pandoc_installed()
 
+    path, metainfo = _card_with_detached_metainfo(path)
+
     proc = subprocess.run(
         ["pandoc", "-t", "json", "-s", str(path)],
         capture_output=True,
@@ -156,5 +212,7 @@ def parse_modelcard(path: str | Path) -> Card:
 
     parser = PandocParser(source)
     card = parser.generate()
+    for key, val in metainfo.items():
+        setattr(card.metadata, key, val)
 
     return card
diff --git a/skops/card/tests/examples/bert-base-uncased.md b/skops/card/tests/examples/bert-base-uncased.md
new file mode 100644
index 00000000..e762fc35
--- /dev/null
+++ b/skops/card/tests/examples/bert-base-uncased.md
@@ -0,0 +1,249 @@
+---
+language: en
+tags:
+- exbert
+license: apache-2.0
+datasets:
+- bookcorpus
+- wikipedia
+---
+
+# BERT base model (uncased)
+
+<!-- retrieved on 2022-12-02 | mod: removed trailing whitespaces -->
+
+Pretrained model on English language using a masked language modeling (MLM) objective. It was introduced in
+[this paper](https://arxiv.org/abs/1810.04805) and first released in
+[this repository](https://github.com/google-research/bert). This model is uncased: it does not make a difference
+between english and English.
+
+Disclaimer: The team releasing BERT did not write a model card for this model so this model card has been written by
+the Hugging Face team.
+
+## Model description
+
+BERT is a transformers model pretrained on a large corpus of English data in a self-supervised fashion. This means it
+was pretrained on the raw texts only, with no humans labeling them in any way (which is why it can use lots of
+publicly available data) with an automatic process to generate inputs and labels from those texts. More precisely, it
+was pretrained with two objectives:
+
+- Masked language modeling (MLM): taking a sentence, the model randomly masks 15% of the words in the input then run
+  the entire masked sentence through the model and has to predict the masked words. This is different from traditional
+  recurrent neural networks (RNNs) that usually see the words one after the other, or from autoregressive models like
+  GPT which internally masks the future tokens. It allows the model to learn a bidirectional representation of the
+  sentence.
+- Next sentence prediction (NSP): the models concatenates two masked sentences as inputs during pretraining. Sometimes
+  they correspond to sentences that were next to each other in the original text, sometimes not. The model then has to
+  predict if the two sentences were following each other or not.
+
+This way, the model learns an inner representation of the English language that can then be used to extract features
+useful for downstream tasks: if you have a dataset of labeled sentences, for instance, you can train a standard
+classifier using the features produced by the BERT model as inputs.
+
+## Model variations
+
+BERT has originally been released in base and large variations, for cased and uncased input text. The uncased models also strips out an accent markers.
+Chinese and multilingual uncased and cased versions followed shortly after.
+Modified preprocessing with whole word masking has replaced subpiece masking in a following work, with the release of two models.
+Other 24 smaller models are released afterward.
+
+The detailed release history can be found on the [google-research/bert readme](https://github.com/google-research/bert/blob/master/README.md) on github.
+
+| Model | #params | Language |
+|------------------------|--------------------------------|-------|
+| [`bert-base-uncased`](https://huggingface.co/bert-base-uncased) | 110M   | English |
+| [`bert-large-uncased`](https://huggingface.co/bert-large-uncased)              | 340M    | English | sub
+| [`bert-base-cased`](https://huggingface.co/bert-base-cased)        | 110M    | English |
+| [`bert-large-cased`](https://huggingface.co/bert-large-cased) | 340M    |  English |
+| [`bert-base-chinese`](https://huggingface.co/bert-base-chinese) | 110M    | Chinese |
+| [`bert-base-multilingual-cased`](https://huggingface.co/bert-base-multilingual-cased) | 110M | Multiple |
+| [`bert-large-uncased-whole-word-masking`](https://huggingface.co/bert-large-uncased-whole-word-masking) | 340M | English |
+| [`bert-large-cased-whole-word-masking`](https://huggingface.co/bert-large-cased-whole-word-masking) | 340M | English |
+
+## Intended uses & limitations
+
+You can use the raw model for either masked language modeling or next sentence prediction, but it's mostly intended to
+be fine-tuned on a downstream task. See the [model hub](https://huggingface.co/models?filter=bert) to look for
+fine-tuned versions of a task that interests you.
+
+Note that this model is primarily aimed at being fine-tuned on tasks that use the whole sentence (potentially masked)
+to make decisions, such as sequence classification, token classification or question answering. For tasks such as text
+generation you should look at model like GPT2.
+
+### How to use
+
+You can use this model directly with a pipeline for masked language modeling:
+
+```python
+>>> from transformers import pipeline
+>>> unmasker = pipeline('fill-mask', model='bert-base-uncased')
+>>> unmasker("Hello I'm a [MASK] model.")
+[{'sequence': "[CLS] hello i'm a fashion model. [SEP]",
+  'score': 0.1073106899857521,
+  'token': 4827,
+  'token_str': 'fashion'},
+ {'sequence': "[CLS] hello i'm a role model. [SEP]",
+  'score': 0.08774490654468536,
+  'token': 2535,
+  'token_str': 'role'},
+ {'sequence': "[CLS] hello i'm a new model. [SEP]",
+  'score': 0.05338378623127937,
+  'token': 2047,
+  'token_str': 'new'},
+ {'sequence': "[CLS] hello i'm a super model. [SEP]",
+  'score': 0.04667217284440994,
+  'token': 3565,
+  'token_str': 'super'},
+ {'sequence': "[CLS] hello i'm a fine model. [SEP]",
+  'score': 0.027095865458250046,
+  'token': 2986,
+  'token_str': 'fine'}]
+```
+
+Here is how to use this model to get the features of a given text in PyTorch:
+
+```python
+from transformers import BertTokenizer, BertModel
+tokenizer = BertTokenizer.from_pretrained('bert-base-uncased')
+model = BertModel.from_pretrained("bert-base-uncased")
+text = "Replace me by any text you'd like."
+encoded_input = tokenizer(text, return_tensors='pt')
+output = model(**encoded_input)
+```
+
+and in TensorFlow:
+
+```python
+from transformers import BertTokenizer, TFBertModel
+tokenizer = BertTokenizer.from_pretrained('bert-base-uncased')
+model = TFBertModel.from_pretrained("bert-base-uncased")
+text = "Replace me by any text you'd like."
+encoded_input = tokenizer(text, return_tensors='tf')
+output = model(encoded_input)
+```
+
+### Limitations and bias
+
+Even if the training data used for this model could be characterized as fairly neutral, this model can have biased
+predictions:
+
+```python
+>>> from transformers import pipeline
+>>> unmasker = pipeline('fill-mask', model='bert-base-uncased')
+>>> unmasker("The man worked as a [MASK].")
+[{'sequence': '[CLS] the man worked as a carpenter. [SEP]',
+  'score': 0.09747550636529922,
+  'token': 10533,
+  'token_str': 'carpenter'},
+ {'sequence': '[CLS] the man worked as a waiter. [SEP]',
+  'score': 0.0523831807076931,
+  'token': 15610,
+  'token_str': 'waiter'},
+ {'sequence': '[CLS] the man worked as a barber. [SEP]',
+  'score': 0.04962705448269844,
+  'token': 13362,
+  'token_str': 'barber'},
+ {'sequence': '[CLS] the man worked as a mechanic. [SEP]',
+  'score': 0.03788609802722931,
+  'token': 15893,
+  'token_str': 'mechanic'},
+ {'sequence': '[CLS] the man worked as a salesman. [SEP]',
+  'score': 0.037680890411138535,
+  'token': 18968,
+  'token_str': 'salesman'}]
+>>> unmasker("The woman worked as a [MASK].")
+[{'sequence': '[CLS] the woman worked as a nurse. [SEP]',
+  'score': 0.21981462836265564,
+  'token': 6821,
+  'token_str': 'nurse'},
+ {'sequence': '[CLS] the woman worked as a waitress. [SEP]',
+  'score': 0.1597415804862976,
+  'token': 13877,
+  'token_str': 'waitress'},
+ {'sequence': '[CLS] the woman worked as a maid. [SEP]',
+  'score': 0.1154729500412941,
+  'token': 10850,
+  'token_str': 'maid'},
+ {'sequence': '[CLS] the woman worked as a prostitute. [SEP]',
+  'score': 0.037968918681144714,
+  'token': 19215,
+  'token_str': 'prostitute'},
+ {'sequence': '[CLS] the woman worked as a cook. [SEP]',
+  'score': 0.03042375110089779,
+  'token': 5660,
+  'token_str': 'cook'}]
+```
+
+This bias will also affect all fine-tuned versions of this model.
+
+## Training data
+
+The BERT model was pretrained on [BookCorpus](https://yknzhu.wixsite.com/mbweb), a dataset consisting of 11,038
+unpublished books and [English Wikipedia](https://en.wikipedia.org/wiki/English_Wikipedia) (excluding lists, tables and
+headers).
+
+## Training procedure
+
+### Preprocessing
+
+The texts are lowercased and tokenized using WordPiece and a vocabulary size of 30,000. The inputs of the model are
+then of the form:
+
+```
+[CLS] Sentence A [SEP] Sentence B [SEP]
+```
+
+With probability 0.5, sentence A and sentence B correspond to two consecutive sentences in the original corpus, and in
+the other cases, it's another random sentence in the corpus. Note that what is considered a sentence here is a
+consecutive span of text usually longer than a single sentence. The only constrain is that the result with the two
+"sentences" has a combined length of less than 512 tokens.
+
+The details of the masking procedure for each sentence are the following:
+- 15% of the tokens are masked.
+- In 80% of the cases, the masked tokens are replaced by `[MASK]`.
+- In 10% of the cases, the masked tokens are replaced by a random token (different) from the one they replace.
+- In the 10% remaining cases, the masked tokens are left as is.
+
+### Pretraining
+
+The model was trained on 4 cloud TPUs in Pod configuration (16 TPU chips total) for one million steps with a batch size
+of 256. The sequence length was limited to 128 tokens for 90% of the steps and 512 for the remaining 10%. The optimizer
+used is Adam with a learning rate of 1e-4, \\(\beta_{1} = 0.9\\) and \\(\beta_{2} = 0.999\\), a weight decay of 0.01,
+learning rate warmup for 10,000 steps and linear decay of the learning rate after.
+
+## Evaluation results
+
+When fine-tuned on downstream tasks, this model achieves the following results:
+
+Glue test results:
+
+| Task | MNLI-(m/mm) | QQP  | QNLI | SST-2 | CoLA | STS-B | MRPC | RTE  | Average |
+|:----:|:-----------:|:----:|:----:|:-----:|:----:|:-----:|:----:|:----:|:-------:|
+|      | 84.6/83.4   | 71.2 | 90.5 | 93.5  | 52.1 | 85.8  | 88.9 | 66.4 | 79.6    |
+
+
+### BibTeX entry and citation info
+
+```bibtex
+@article{DBLP:journals/corr/abs-1810-04805,
+  author    = {Jacob Devlin and
+               Ming{-}Wei Chang and
+               Kenton Lee and
+               Kristina Toutanova},
+  title     = {{BERT:} Pre-training of Deep Bidirectional Transformers for Language
+               Understanding},
+  journal   = {CoRR},
+  volume    = {abs/1810.04805},
+  year      = {2018},
+  url       = {http://arxiv.org/abs/1810.04805},
+  archivePrefix = {arXiv},
+  eprint    = {1810.04805},
+  timestamp = {Tue, 30 Oct 2018 20:39:56 +0100},
+  biburl    = {https://dblp.org/rec/journals/corr/abs-1810-04805.bib},
+  bibsource = {dblp computer science bibliography, https://dblp.org}
+}
+```
+
+<a href="https://huggingface.co/exbert/?model=bert-base-uncased">
+	<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
+</a>
diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
index be33e72e..87d54d84 100644
--- a/skops/card/tests/test_parser.py
+++ b/skops/card/tests/test_parser.py
@@ -1,3 +1,6 @@
+import os
+from pathlib import Path
+
 import numpy as np
 import pytest
 from sklearn.linear_model import LinearRegression
@@ -73,3 +76,20 @@ def test_parsed_card_identical(card, tmp_path):
     parsed_card.save(file1)
 
     assert_readme_files_equal(file0, file1)
+
+
+@pytest.mark.xfail(reason="small diff, especially in tables")
+def test_bert_base_uncased(tmp_path):
+    file0 = (
+        Path(os.getcwd())
+        / "skops"
+        / "card"
+        / "tests"
+        / "examples"
+        / "bert-base-uncased.md"
+    )
+    parsed_card = parse_modelcard(file0)
+    file1 = tmp_path / "readme-parsed.md"
+    parsed_card.save(file1)
+
+    assert_readme_files_equal(file0, file1)

From 9744998d0d80d358b599a14ecc943e47f0dae326 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 2 Dec 2022 14:30:16 +0100
Subject: [PATCH 21/47] Add support for a bunch more markup

Now supports:

- Space
- Strong
- Emph
- Strikeout
- Subscript
- Superscript
- Plain
- Str
- RawInline
- RawBlock
- SoftBreak
- LineBreak
- Para
- Header
- Image
- CodeBlock
- Code
- Table
- Div
- Link
- BulletList
- Quoted
---
 skops/card/_markup.py | 80 ++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 76 insertions(+), 4 deletions(-)

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index 6c2f8846..a0425f81 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -17,7 +17,7 @@ class Markdown:
     This class has a ``mapping`` attribute, which is just a dict. The keys are
     Pandoc types and the values are functions that transform the corresponding
     value into a string with markdown syntax. Those functions are all prefixed
-    with ``md_``, e.g. ``md_Image`` for transforming a pandoc ``Image`` into a
+    with ``md_``, e.g. ``md_image`` for transforming a pandoc ``Image`` into a
     markdown figure.
 
     From the caller side, only the ``__call__`` method should be used, the rest
@@ -30,17 +30,26 @@ def __init__(self):
         self.mapping = {
             "Space": self.md_space,
             "Strong": self.md_strong,
+            "Emph": self.md_emph,
+            "Strikeout": self.md_strikeout,
+            "Subscript": self.md_subscript,
+            "Superscript": self.md_superscript,
             "Plain": self.md_plain,
             "Str": self.md_str,
             "RawInline": self.md_rawline,
             "RawBlock": self.md_raw_block,
             "SoftBreak": self.md_softbreak,
+            "LineBreak": self.md_linebreak,
             "Para": self.md_para,
             "Header": self.md_header,
             "Image": self.md_image,
             "CodeBlock": self.md_code_block,
+            "Code": self.md_code,
             "Table": self.md_table,
             "Div": self.md_parse_div,
+            "Link": self.md_link,
+            "BulletList": self.md_bullet_list,
+            "Quoted": self.md_quoted,
         }
 
     @staticmethod
@@ -53,6 +62,30 @@ def md_strong(self, value) -> str:
         parts.append("**")
         return "".join(parts)
 
+    def md_emph(self, value) -> str:
+        parts = ["_"]
+        parts += [self.__call__(subitem) for subitem in value]
+        parts.append("_")
+        return "".join(parts)
+
+    def md_strikeout(self, value) -> str:
+        parts = ["~~"]
+        parts += [self.__call__(subitem) for subitem in value]
+        parts.append("~~")
+        return "".join(parts)
+
+    def md_subscript(self, value) -> str:
+        parts = ["<sub>"]
+        parts += [self.__call__(subitem) for subitem in value]
+        parts.append("</sub>")
+        return "".join(parts)
+
+    def md_superscript(self, value) -> str:
+        parts = ["<sup>"]
+        parts += [self.__call__(subitem) for subitem in value]
+        parts.append("</sup>")
+        return "".join(parts)
+
     def md_plain(self, value) -> str:
         parts = [self.__call__(subitem) for subitem in value]
         return "".join(parts)
@@ -76,6 +109,10 @@ def md_raw_block(self, item) -> str:
     def md_softbreak(value) -> str:
         return "\n"
 
+    @staticmethod
+    def md_linebreak(value) -> str:
+        return "\n"
+
     def _make_content(self, content):
         parts = []
         for item in content:
@@ -105,14 +142,19 @@ def md_image(self, value) -> str:
     @staticmethod
     def md_code_block(item: tuple[tuple[int, list[str], list[str]], str]) -> str:
         # a codeblock consists of: (id, classes, namevals) contents
-        (_, _, namevals), content = item
+        (_, classes, _), content = item
         block_start = "```"
-        if namevals:  # TODO: check if this makes "```python" etc.
-            block_start += namevals[0]
+        if classes:
+            block_start += ", ".join(classes)
         block_end = "```"
         content = "\n".join((block_start, content, block_end))
         return content
 
+    @staticmethod
+    def md_code(item: tuple[Any, str]) -> str:
+        _, txt = item
+        return f"`{txt}`"
+
     def md_table(self, item) -> str:
         _, alignments, _, header, rows = item
         fn = self.__call__
@@ -162,6 +204,36 @@ def md_parse_div(self, item) -> str:
         end = "</div>"
         return "".join([start] + middle + [end])
 
+    def md_link(self, item) -> str:
+        _, txt, (src, _) = item
+        txt_formatted = self._make_content(txt)
+        return f"[{txt_formatted}]({src})"
+
+    def md_bullet_list(self, item) -> str:
+        parts = []
+        for subitem in item:
+            assert len(subitem) == 1
+            content = "".join(self.__call__(i) for i in subitem)
+            # indent the lines in lists if they contain line breaks
+            content = content.replace("\n", "\n  ")
+            parts.append(f"- {content}")
+        return "\n".join(parts)
+
+    def md_quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
+        quote_type, content = item
+        type_ = quote_type["t"]
+        try:
+            sym = {"DoubleQuote": '"', "SingleQuote": "'"}[type_]
+        except KeyError as exc:
+            msg = (
+                f"The parsed document contains '{type_}', which is not "
+                "supported yet, please open an issue on GitHub"
+            )
+            raise ValueError(msg) from exc
+
+        text = "".join(self.__call__(i) for i in content)
+        return f"{sym}{text}{sym}"
+
     def __call__(self, item: str | PandocItem) -> str:
         if isinstance(item, str):
             return item

From d8649411df5329746705cb6ec6f4c7cc1a714d3a Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Mon, 5 Dec 2022 16:55:22 +0100
Subject: [PATCH 22/47] Add more test cases for model card parser

I added 5 model cards from the top 10 most used models from the Hub (I
excluded cards that were too similar to one another). The tests were
rewritten so that they should now pass.

There are some limitations to the parser that result in the generated
cards not being 100% identical. Those limitations are now documented.
However, I don't believe that those limitations matter, as they make no
semantic difference but rather are stylistic or even invisible. The most
notable difference is the alignment of columns in tables.

The tests pass despite those differences because I rewrote them to
include a diff file for each model card. When the generated card is
compared to the original one, a diff is created and compared to the
checked in diff. This way, we have control over what diff we permit.

I had to exclude the folder containing the cards and diffs from the
pre-commit task "trailing-whitespace", as we need the trailing
whitespace in there.
---
 .pre-commit-config.yaml                       |   1 +
 skops/card/_markup.py                         |  16 +-
 skops/card/_parser.py                         |  35 +++-
 .../tests/examples/bert-base-uncased.md.diff  |  40 +++++
 .../tests/examples/clip-vit-large-patch14.md  | 147 +++++++++++++++
 .../examples/clip-vit-large-patch14.md.diff   |  19 ++
 skops/card/tests/examples/gpt2.md             | 168 ++++++++++++++++++
 skops/card/tests/examples/gpt2.md.diff        |  22 +++
 skops/card/tests/examples/specter.md          |  26 +++
 skops/card/tests/examples/specter.md.diff     |  11 ++
 .../examples/vit-base-patch32-224-in21k.md    |  94 ++++++++++
 .../vit-base-patch32-224-in21k.md.diff        |   5 +
 skops/card/tests/test_parser.py               |  70 ++++----
 13 files changed, 619 insertions(+), 35 deletions(-)
 create mode 100644 skops/card/tests/examples/bert-base-uncased.md.diff
 create mode 100644 skops/card/tests/examples/clip-vit-large-patch14.md
 create mode 100644 skops/card/tests/examples/clip-vit-large-patch14.md.diff
 create mode 100644 skops/card/tests/examples/gpt2.md
 create mode 100644 skops/card/tests/examples/gpt2.md.diff
 create mode 100644 skops/card/tests/examples/specter.md
 create mode 100644 skops/card/tests/examples/specter.md.diff
 create mode 100644 skops/card/tests/examples/vit-base-patch32-224-in21k.md
 create mode 100644 skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 4068292e..319d9a63 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -6,6 +6,7 @@ repos:
         exclude: .github/conda/meta.yaml
     -   id: end-of-file-fixer
     -   id: trailing-whitespace
+        exclude: skops/card/tests/examples
     -   id: check-case-conflict
     -   id: check-merge-conflict
 -   repo: https://github.com/psf/black
diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index a0425f81..9ddf1afd 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -50,6 +50,7 @@ def __init__(self):
             "Link": self.md_link,
             "BulletList": self.md_bullet_list,
             "Quoted": self.md_quoted,
+            "BlockQuote": self.md_block_quote,
         }
 
     @staticmethod
@@ -92,7 +93,8 @@ def md_plain(self, value) -> str:
 
     @staticmethod
     def md_str(value) -> str:
-        return value
+        # escape \
+        return value.replace("\\", "\\\\")
 
     @staticmethod
     def md_rawline(value) -> str:
@@ -234,6 +236,18 @@ def md_quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
         text = "".join(self.__call__(i) for i in content)
         return f"{sym}{text}{sym}"
 
+    def md_block_quote(self, item: list[PandocItem]) -> str:
+        parts = []
+        for subitem in item:
+            content = self.__call__(subitem)
+            # add quote symbolx
+            content = content.replace("\n", "\n> ")
+            parts.append(content)
+
+        # add a quote symbol to the very start
+        text = "> " + "\n> ".join(parts)
+        return text
+
     def __call__(self, item: str | PandocItem) -> str:
         if isinstance(item, str):
             return item
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index e849852d..933ea1d8 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -75,16 +75,21 @@ def parse_header(self, item: PandocItem) -> str:
         self._section_trace = self._section_trace[: level - 1] + [content]
         return content
 
+    def post_process(self, res: str) -> str:
+        # replace Latin1 space
+        res = res.replace("\xa0", " ")
+        return res
+
     def generate(self) -> Card:
         # Parsing the flat structure, not recursively as in pandocfilters.
         # After visiting the parent node, it's not necessary to visit its
         # child nodes, because that's already done during parsing.
         for item in json.loads(self.source)["blocks"]:
             if item["t"] == "Header":
-                res = self.parse_header(item)
+                res = self.post_process(self.parse_header(item))
                 self.add_section(res)
             else:
-                res = self.mapping(item)
+                res = self.post_process(self.mapping(item))
                 self.add_content(res)
 
         return self.card
@@ -189,6 +194,32 @@ def parse_modelcard(path: str | Path) -> Card:
     >>> # overwrite old card with new one
     >>> parsed_card.save("README.md")
 
+    Notes
+    -----
+    There are some **known limitations** to the parser that may result in the
+    model card generated from the parsed file not being 100% identical to the
+    original model card:
+
+    - In markdown, bold and italic text can be encoded in different fashions,
+      e.g. ``_like this_`` or ``*like this*`` for italic text. Pandoc doesn't
+      differentiate between the two. Therefore, the output may use one method
+      where the original card used the other. When rendered, the two results
+      should, however, be the same.
+    - Table alignment may be different. At the moment, skops does not make use
+      of column alignment information in tables, so that may differ.
+    - Quote symbols may differ, e.g. ``it’s`` becoming ``it's``.
+    - The number of empty lines may differ, e.g. two empty lines being
+      transformed into one empty line.
+    - Trailing whitespace is removed.
+    - Tab indentation may be removed, e.g. in raw html.
+    - The yaml part of the model card can have some non-semantic differences,
+      like omitting optional quotation marks.
+
+    For these reasons, please don't expect the output of a parsed card to be
+    100% identical to the original input. However, none of the listed changes
+    makes any _semantic_ difference. If you find that there is a semantic
+    difference in the output, please open an issue on GitHub.
+
     Parameters
     ----------
     path : str or pathlib.Path
diff --git a/skops/card/tests/examples/bert-base-uncased.md.diff b/skops/card/tests/examples/bert-base-uncased.md.diff
new file mode 100644
index 00000000..e4fb5c66
--- /dev/null
+++ b/skops/card/tests/examples/bert-base-uncased.md.diff
@@ -0,0 +1,40 @@
+--- 
++++ 
+@@ -52,10 +52,10 @@
+-| Model | #params | Language |
+-|------------------------|--------------------------------|-------|
+-| [`bert-base-uncased`](https://huggingface.co/bert-base-uncased) | 110M   | English |
+-| [`bert-large-uncased`](https://huggingface.co/bert-large-uncased)              | 340M    | English | sub
+-| [`bert-base-cased`](https://huggingface.co/bert-base-cased)        | 110M    | English |
+-| [`bert-large-cased`](https://huggingface.co/bert-large-cased) | 340M    |  English |
+-| [`bert-base-chinese`](https://huggingface.co/bert-base-chinese) | 110M    | Chinese |
+-| [`bert-base-multilingual-cased`](https://huggingface.co/bert-base-multilingual-cased) | 110M | Multiple |
+-| [`bert-large-uncased-whole-word-masking`](https://huggingface.co/bert-large-uncased-whole-word-masking) | 340M | English |
+-| [`bert-large-cased-whole-word-masking`](https://huggingface.co/bert-large-cased-whole-word-masking) | 340M | English |
++| Model                                                                                                   | #params   | Language   |
++|---------------------------------------------------------------------------------------------------------|-----------|------------|
++| [`bert-base-uncased`](https://huggingface.co/bert-base-uncased)                                         | 110M      | English    |
++| [`bert-large-uncased`](https://huggingface.co/bert-large-uncased)                                       | 340M      | English    |
++| [`bert-base-cased`](https://huggingface.co/bert-base-cased)                                             | 110M      | English    |
++| [`bert-large-cased`](https://huggingface.co/bert-large-cased)                                           | 340M      | English    |
++| [`bert-base-chinese`](https://huggingface.co/bert-base-chinese)                                         | 110M      | Chinese    |
++| [`bert-base-multilingual-cased`](https://huggingface.co/bert-base-multilingual-cased)                   | 110M      | Multiple   |
++| [`bert-large-uncased-whole-word-masking`](https://huggingface.co/bert-large-uncased-whole-word-masking) | 340M      | English    |
++| [`bert-large-cased-whole-word-masking`](https://huggingface.co/bert-large-cased-whole-word-masking)     | 340M      | English    |
+@@ -65 +65 @@
+-You can use the raw model for either masked language modeling or next sentence prediction, but it's mostly intended to
++You can use the raw model for either masked language modeling or next sentence prediction, but it’s mostly intended to
+@@ -197 +197 @@
+-the other cases, it's another random sentence in the corpus. Note that what is considered a sentence here is a
++the other cases, it’s another random sentence in the corpus. Note that what is considered a sentence here is a
+@@ -220,4 +220,3 @@
+-| Task | MNLI-(m/mm) | QQP  | QNLI | SST-2 | CoLA | STS-B | MRPC | RTE  | Average |
+-|:----:|:-----------:|:----:|:----:|:-----:|:----:|:-----:|:----:|:----:|:-------:|
+-|      | 84.6/83.4   | 71.2 | 90.5 | 93.5  | 52.1 | 85.8  | 88.9 | 66.4 | 79.6    |
+-
++| Task   | MNLI-(m/mm)   |   QQP |   QNLI |   SST-2 |   CoLA |   STS-B |   MRPC |   RTE |   Average |
++|--------|---------------|-------|--------|---------|--------|---------|--------|-------|-----------|
++|        | 84.6/83.4     |  71.2 |   90.5 |    93.5 |   52.1 |    85.8 |   88.9 |  66.4 |      79.6 |
+@@ -248 +247 @@
+-	<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
++<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
diff --git a/skops/card/tests/examples/clip-vit-large-patch14.md b/skops/card/tests/examples/clip-vit-large-patch14.md
new file mode 100644
index 00000000..cbbfa909
--- /dev/null
+++ b/skops/card/tests/examples/clip-vit-large-patch14.md
@@ -0,0 +1,147 @@
+---
+tags:
+- vision
+widget:
+- src: https://huggingface.co/datasets/mishig/sample_images/resolve/main/cat-dog-music.png
+  candidate_labels: playing music, playing sports
+  example_title: Cat & Dog
+---
+
+# Model Card: CLIP
+
+<!-- retrieved on 2022-12-05  | mod: removed trailing whitespaces -->
+
+Disclaimer: The model card is taken and modified from the official CLIP repository, it can be found [here](https://github.com/openai/CLIP/blob/main/model-card.md).
+
+## Model Details
+
+The CLIP model was developed by researchers at OpenAI to learn about what contributes to robustness in computer vision tasks. The model was also developed to test the ability of models to generalize to arbitrary image classification tasks in a zero-shot manner. It was not developed for general model deployment - to deploy models like CLIP, researchers will first need to carefully study their capabilities in relation to the specific context they’re being deployed within.
+
+### Model Date
+
+January 2021
+
+### Model Type
+
+The base model uses a ViT-L/14 Transformer architecture as an image encoder and uses a masked self-attention Transformer as a text encoder. These encoders are trained to maximize the similarity of (image, text) pairs via a contrastive loss.
+
+The original implementation had two variants: one using a ResNet image encoder and the other using a Vision Transformer. This repository has the variant with the Vision Transformer.
+
+
+### Documents
+
+- [Blog Post](https://openai.com/blog/clip/)
+- [CLIP Paper](https://arxiv.org/abs/2103.00020)
+
+
+### Use with Transformers
+
+```python
+from PIL import Image
+import requests
+
+from transformers import CLIPProcessor, CLIPModel
+
+model = CLIPModel.from_pretrained("openai/clip-vit-large-patch14")
+processor = CLIPProcessor.from_pretrained("openai/clip-vit-large-patch14")
+
+url = "http://images.cocodataset.org/val2017/000000039769.jpg"
+image = Image.open(requests.get(url, stream=True).raw)
+
+inputs = processor(text=["a photo of a cat", "a photo of a dog"], images=image, return_tensors="pt", padding=True)
+
+outputs = model(**inputs)
+logits_per_image = outputs.logits_per_image # this is the image-text similarity score
+probs = logits_per_image.softmax(dim=1) # we can take the softmax to get the label probabilities
+```
+
+
+## Model Use
+
+### Intended Use
+
+The model is intended as a research output for research communities. We hope that this model will enable researchers to better understand and explore zero-shot, arbitrary image classification. We also hope it can be used for interdisciplinary studies of the potential impact of such models - the CLIP paper includes a discussion of potential downstream impacts to provide an example for this sort of analysis.
+
+#### Primary intended uses
+
+The primary intended users of these models are AI researchers.
+
+We primarily imagine the model will be used by researchers to better understand robustness, generalization, and other capabilities, biases, and constraints of computer vision models.
+
+### Out-of-Scope Use Cases
+
+**Any** deployed use case of the model - whether commercial or not - is currently out of scope. Non-deployed use cases such as image search in a constrained environment, are also not recommended unless there is thorough in-domain testing of the model with a specific, fixed class taxonomy. This is because our safety assessment demonstrated a high need for task specific testing especially given the variability of CLIP’s performance with different class taxonomies. This makes untested and unconstrained deployment of the model in any use case currently potentially harmful.
+
+Certain use cases which would fall under the domain of surveillance and facial recognition are always out-of-scope regardless of performance of the model. This is because the use of artificial intelligence for tasks such as these can be premature currently given the lack of testing norms and checks to ensure its fair use.
+
+Since the model has not been purposefully trained in or evaluated on any languages other than English, its use should be limited to English language use cases.
+
+
+
+## Data
+
+The model was trained on publicly available image-caption data. This was done through a combination of crawling a handful of websites and using commonly-used pre-existing image datasets such as [YFCC100M](http://projects.dfki.uni-kl.de/yfcc100m/). A large portion of the data comes from our crawling of the internet. This means that the data is more representative of people and societies most connected to the internet which tend to skew towards more developed nations, and younger, male users.
+
+### Data Mission Statement
+
+Our goal with building this dataset was to test out robustness and generalizability in computer vision tasks. As a result, the focus was on gathering large quantities of data from different publicly-available internet data sources. The data was gathered in a mostly non-interventionist manner. However, we only crawled websites that had policies against excessively violent and adult images and allowed us to filter out such content. We do not intend for this dataset to be used as the basis for any commercial or deployed model and will not be releasing the dataset.
+
+
+
+## Performance and Limitations
+
+### Performance
+
+We have evaluated the performance of CLIP on a wide range of benchmarks across a variety of computer vision datasets such as OCR to texture recognition to fine-grained classification. The paper describes model performance on the following datasets:
+
+- Food101
+- CIFAR10
+- CIFAR100
+- Birdsnap
+- SUN397
+- Stanford Cars
+- FGVC Aircraft
+- VOC2007
+- DTD
+- Oxford-IIIT Pet dataset
+- Caltech101
+- Flowers102
+- MNIST
+- SVHN
+- IIIT5K
+- Hateful Memes
+- SST-2
+- UCF101
+- Kinetics700
+- Country211
+- CLEVR Counting
+- KITTI Distance
+- STL-10
+- RareAct
+- Flickr30
+- MSCOCO
+- ImageNet
+- ImageNet-A
+- ImageNet-R
+- ImageNet Sketch
+- ObjectNet (ImageNet Overlap)
+- Youtube-BB
+- ImageNet-Vid
+
+## Limitations
+
+CLIP and our analysis of it have a number of limitations. CLIP currently struggles with respect to certain tasks such as fine grained classification and counting objects. CLIP also poses issues with regards to fairness and bias which we discuss in the paper and briefly in the next section. Additionally, our approach to testing CLIP also has an important limitation- in many cases we have used linear probes to evaluate the performance of CLIP and there is evidence suggesting that linear probes can underestimate model performance.
+
+### Bias and Fairness
+
+We find that the performance of CLIP - and the specific biases it exhibits - can depend significantly on class design and the choices one makes for categories to include and exclude. We tested the risk of certain kinds of denigration with CLIP by classifying images of people from [Fairface](https://arxiv.org/abs/1908.04913) into crime-related and non-human animal categories. We found significant disparities with respect to race and gender. Additionally, we found that these disparities could shift based on how the classes were constructed. (Details captured in the Broader Impacts Section in the paper).
+
+We also tested the performance of CLIP on gender, race and age classification using the Fairface dataset (We default to using race categories as they are constructed in the Fairface dataset.) in order to assess quality of performance across different demographics. We found accuracy >96% across all races for gender classification with ‘Middle Eastern’ having the highest accuracy (98.4%) and ‘White’ having the lowest (96.5%). Additionally, CLIP averaged ~93% for racial classification and ~63% for age classification. Our use of evaluations to test for gender, race and age classification as well as denigration harms is simply to evaluate performance of the model across people and surface potential risks and not to demonstrate an endorsement/enthusiasm for such tasks.
+
+
+
+## Feedback
+
+### Where to send questions or comments about the model
+
+Please use [this Google Form](https://forms.gle/Uv7afRH5dvY34ZEs9)
diff --git a/skops/card/tests/examples/clip-vit-large-patch14.md.diff b/skops/card/tests/examples/clip-vit-large-patch14.md.diff
new file mode 100644
index 00000000..f2da254b
--- /dev/null
+++ b/skops/card/tests/examples/clip-vit-large-patch14.md.diff
@@ -0,0 +1,19 @@
+--- 
++++ 
+@@ -30 +29,0 @@
+-
+@@ -35 +33,0 @@
+-
+@@ -58 +55,0 @@
+-
+@@ -79,2 +75,0 @@
+-
+-
+@@ -88,2 +82,0 @@
+-
+-
+@@ -139,3 +132 @@
+-We also tested the performance of CLIP on gender, race and age classification using the Fairface dataset (We default to using race categories as they are constructed in the Fairface dataset.) in order to assess quality of performance across different demographics. We found accuracy >96% across all races for gender classification with ‘Middle Eastern’ having the highest accuracy (98.4%) and ‘White’ having the lowest (96.5%). Additionally, CLIP averaged ~93% for racial classification and ~63% for age classification. Our use of evaluations to test for gender, race and age classification as well as denigration harms is simply to evaluate performance of the model across people and surface potential risks and not to demonstrate an endorsement/enthusiasm for such tasks.
+-
+-
++We also tested the performance of CLIP on gender, race and age classification using the Fairface dataset (We default to using race categories as they are constructed in the Fairface dataset.) in order to assess quality of performance across different demographics. We found accuracy >96% across all races for gender classification with 'Middle Eastern' having the highest accuracy (98.4%) and 'White' having the lowest (96.5%). Additionally, CLIP averaged ~93% for racial classification and ~63% for age classification. Our use of evaluations to test for gender, race and age classification as well as denigration harms is simply to evaluate performance of the model across people and surface potential risks and not to demonstrate an endorsement/enthusiasm for such tasks.
diff --git a/skops/card/tests/examples/gpt2.md b/skops/card/tests/examples/gpt2.md
new file mode 100644
index 00000000..6481d600
--- /dev/null
+++ b/skops/card/tests/examples/gpt2.md
@@ -0,0 +1,168 @@
+---
+language: en
+tags:
+- exbert
+
+license: mit
+---
+
+# GPT-2
+
+<!-- retrieved on 2022-12-05 | mod: removed trailing whitespaces -->
+
+Test the whole generation capabilities here: https://transformer.huggingface.co/doc/gpt2-large
+
+Pretrained model on English language using a causal language modeling (CLM) objective. It was introduced in
+[this paper](https://d4mucfpksywv.cloudfront.net/better-language-models/language_models_are_unsupervised_multitask_learners.pdf)
+and first released at [this page](https://openai.com/blog/better-language-models/).
+
+Disclaimer: The team releasing GPT-2 also wrote a
+[model card](https://github.com/openai/gpt-2/blob/master/model_card.md) for their model. Content from this model card
+has been written by the Hugging Face team to complete the information they provided and give specific examples of bias.
+
+## Model description
+
+GPT-2 is a transformers model pretrained on a very large corpus of English data in a self-supervised fashion. This
+means it was pretrained on the raw texts only, with no humans labelling them in any way (which is why it can use lots
+of publicly available data) with an automatic process to generate inputs and labels from those texts. More precisely,
+it was trained to guess the next word in sentences.
+
+More precisely, inputs are sequences of continuous text of a certain length and the targets are the same sequence,
+shifted one token (word or piece of word) to the right. The model uses internally a mask-mechanism to make sure the
+predictions for the token `i` only uses the inputs from `1` to `i` but not the future tokens.
+
+This way, the model learns an inner representation of the English language that can then be used to extract features
+useful for downstream tasks. The model is best at what it was pretrained for however, which is generating texts from a
+prompt.
+
+This is the **smallest** version of GPT-2, with 124M parameters.
+
+**Related Models:** [GPT-Large](https://huggingface.co/gpt2-large), [GPT-Medium](https://huggingface.co/gpt2-medium) and [GPT-XL](https://huggingface.co/gpt2-xl)
+
+## Intended uses & limitations
+
+You can use the raw model for text generation or fine-tune it to a downstream task. See the
+[model hub](https://huggingface.co/models?filter=gpt2) to look for fine-tuned versions on a task that interests you.
+
+### How to use
+
+You can use this model directly with a pipeline for text generation. Since the generation relies on some randomness, we
+set a seed for reproducibility:
+
+```python
+>>> from transformers import pipeline, set_seed
+>>> generator = pipeline('text-generation', model='gpt2')
+>>> set_seed(42)
+>>> generator("Hello, I'm a language model,", max_length=30, num_return_sequences=5)
+
+[{'generated_text': "Hello, I'm a language model, a language for thinking, a language for expressing thoughts."},
+ {'generated_text': "Hello, I'm a language model, a compiler, a compiler library, I just want to know how I build this kind of stuff. I don"},
+ {'generated_text': "Hello, I'm a language model, and also have more than a few of your own, but I understand that they're going to need some help"},
+ {'generated_text': "Hello, I'm a language model, a system model. I want to know my language so that it might be more interesting, more user-friendly"},
+ {'generated_text': 'Hello, I\'m a language model, not a language model"\n\nThe concept of "no-tricks" comes in handy later with new'}]
+```
+
+Here is how to use this model to get the features of a given text in PyTorch:
+
+```python
+from transformers import GPT2Tokenizer, GPT2Model
+tokenizer = GPT2Tokenizer.from_pretrained('gpt2')
+model = GPT2Model.from_pretrained('gpt2')
+text = "Replace me by any text you'd like."
+encoded_input = tokenizer(text, return_tensors='pt')
+output = model(**encoded_input)
+```
+
+and in TensorFlow:
+
+```python
+from transformers import GPT2Tokenizer, TFGPT2Model
+tokenizer = GPT2Tokenizer.from_pretrained('gpt2')
+model = TFGPT2Model.from_pretrained('gpt2')
+text = "Replace me by any text you'd like."
+encoded_input = tokenizer(text, return_tensors='tf')
+output = model(encoded_input)
+```
+
+### Limitations and bias
+
+The training data used for this model has not been released as a dataset one can browse. We know it contains a lot of
+unfiltered content from the internet, which is far from neutral. As the openAI team themselves point out in their
+[model card](https://github.com/openai/gpt-2/blob/master/model_card.md#out-of-scope-use-cases):
+
+> Because large-scale language models like GPT-2 do not distinguish fact from fiction, we don’t support use-cases
+> that require the generated text to be true.
+>
+> Additionally, language models like GPT-2 reflect the biases inherent to the systems they were trained on, so we do
+> not recommend that they be deployed into systems that interact with humans > unless the deployers first carry out a
+> study of biases relevant to the intended use-case. We found no statistically significant difference in gender, race,
+> and religious bias probes between 774M and 1.5B, implying all versions of GPT-2 should be approached with similar
+> levels of caution around use cases that are sensitive to biases around human attributes.
+
+Here's an example of how the model can have biased predictions:
+
+```python
+>>> from transformers import pipeline, set_seed
+>>> generator = pipeline('text-generation', model='gpt2')
+>>> set_seed(42)
+>>> generator("The White man worked as a", max_length=10, num_return_sequences=5)
+
+[{'generated_text': 'The White man worked as a mannequin for'},
+ {'generated_text': 'The White man worked as a maniser of the'},
+ {'generated_text': 'The White man worked as a bus conductor by day'},
+ {'generated_text': 'The White man worked as a plumber at the'},
+ {'generated_text': 'The White man worked as a journalist. He had'}]
+
+>>> set_seed(42)
+>>> generator("The Black man worked as a", max_length=10, num_return_sequences=5)
+
+[{'generated_text': 'The Black man worked as a man at a restaurant'},
+ {'generated_text': 'The Black man worked as a car salesman in a'},
+ {'generated_text': 'The Black man worked as a police sergeant at the'},
+ {'generated_text': 'The Black man worked as a man-eating monster'},
+ {'generated_text': 'The Black man worked as a slave, and was'}]
+```
+
+This bias will also affect all fine-tuned versions of this model.
+
+## Training data
+
+The OpenAI team wanted to train this model on a corpus as large as possible. To build it, they scraped all the web
+pages from outbound links on Reddit which received at least 3 karma. Note that all Wikipedia pages were removed from
+this dataset, so the model was not trained on any part of Wikipedia. The resulting dataset (called WebText) weights
+40GB of texts but has not been publicly released. You can find a list of the top 1,000 domains present in WebText
+[here](https://github.com/openai/gpt-2/blob/master/domains.txt).
+
+## Training procedure
+
+### Preprocessing
+
+The texts are tokenized using a byte-level version of Byte Pair Encoding (BPE) (for unicode characters) and a
+vocabulary size of 50,257. The inputs are sequences of 1024 consecutive tokens.
+
+The larger model was trained on 256 cloud TPU v3 cores. The training duration was not disclosed, nor were the exact
+details of training.
+
+## Evaluation results
+
+The model achieves the following results without any fine-tuning (zero-shot):
+
+| Dataset  | LAMBADA | LAMBADA | CBT-CN | CBT-NE | WikiText2 | PTB    | enwiki8 | text8  | WikiText103 | 1BW   |
+|:--------:|:-------:|:-------:|:------:|:------:|:---------:|:------:|:-------:|:------:|:-----------:|:-----:|
+| (metric) | (PPL)   | (ACC)   | (ACC)  | (ACC)  | (PPL)     | (PPL)  | (BPB)   | (BPC)  | (PPL)       | (PPL) |
+|          | 35.13   | 45.99   | 87.65  | 83.4   | 29.41     | 65.85  | 1.16    | 1,17   | 37.50       | 75.20 |
+
+
+### BibTeX entry and citation info
+
+```bibtex
+@article{radford2019language,
+  title={Language Models are Unsupervised Multitask Learners},
+  author={Radford, Alec and Wu, Jeff and Child, Rewon and Luan, David and Amodei, Dario and Sutskever, Ilya},
+  year={2019}
+}
+```
+
+<a href="https://huggingface.co/exbert/?model=gpt2">
+	<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
+</a>
diff --git a/skops/card/tests/examples/gpt2.md.diff b/skops/card/tests/examples/gpt2.md.diff
new file mode 100644
index 00000000..e95bc0cb
--- /dev/null
+++ b/skops/card/tests/examples/gpt2.md.diff
@@ -0,0 +1,22 @@
+--- 
++++ 
+@@ -5 +4,0 @@
+-
+@@ -95 +93,0 @@
+->
+@@ -102 +100 @@
+-Here's an example of how the model can have biased predictions:
++Here’s an example of how the model can have biased predictions:
+@@ -150,5 +148,4 @@
+-| Dataset  | LAMBADA | LAMBADA | CBT-CN | CBT-NE | WikiText2 | PTB    | enwiki8 | text8  | WikiText103 | 1BW   |
+-|:--------:|:-------:|:-------:|:------:|:------:|:---------:|:------:|:-------:|:------:|:-----------:|:-----:|
+-| (metric) | (PPL)   | (ACC)   | (ACC)  | (ACC)  | (PPL)     | (PPL)  | (BPB)   | (BPC)  | (PPL)       | (PPL) |
+-|          | 35.13   | 45.99   | 87.65  | 83.4   | 29.41     | 65.85  | 1.16    | 1,17   | 37.50       | 75.20 |
+-
++| Dataset   | LAMBADA   | CBT-CN   | CBT-NE   | WikiText2   | PTB   | enwiki8   | text8   | WikiText103   | 1BW   |
++|-----------|-----------|----------|----------|-------------|-------|-----------|---------|---------------|-------|
++| (metric)  | (ACC)     | (ACC)    | (ACC)    | (PPL)       | (PPL) | (BPB)     | (BPC)   | (PPL)         | (PPL) |
++|           | 45.99     | 87.65    | 83.4     | 29.41       | 65.85 | 1.16      | 1,17    | 37.50         | 75.20 |
+@@ -167 +164 @@
+-	<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
++<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
diff --git a/skops/card/tests/examples/specter.md b/skops/card/tests/examples/specter.md
new file mode 100644
index 00000000..e53e77ce
--- /dev/null
+++ b/skops/card/tests/examples/specter.md
@@ -0,0 +1,26 @@
+---
+language: en
+thumbnail: "https://camo.githubusercontent.com/7d080b7a769f7fdf64ac0ebeb47b039cb50be35287e3071f9d633f0fe33e7596/68747470733a2f2f692e6962622e636f2f33544331576d472f737065637465722d6c6f676f2d63726f707065642e706e67"
+license: apache-2.0
+datasets:
+- SciDocs
+metrics:
+- F1
+- accuracy
+- map
+- ndcg
+---
+
+## SPECTER
+
+<!-- retrieved on 2022-12-05 | mod: removed trailing whitespaces -->
+
+SPECTER is a pre-trained language model to generate document-level embedding of documents. It is pre-trained on a a powerful signal of document-level relatedness: the citation graph. Unlike existing pretrained language models, SPECTER can be easily applied to downstream applications without task-specific fine-tuning.
+
+Paper: [SPECTER: Document-level Representation Learning using Citation-informed Transformers](https://arxiv.org/pdf/2004.07180.pdf)
+
+Original Repo: [Github](https://github.com/allenai/specter)
+
+Evaluation Benchmark: [SciDocs](https://github.com/allenai/scidocs)
+
+Authors: *Arman Cohan, Sergey Feldman, Iz Beltagy, Doug Downey, Daniel S. Weld*
diff --git a/skops/card/tests/examples/specter.md.diff b/skops/card/tests/examples/specter.md.diff
new file mode 100644
index 00000000..7fcfa951
--- /dev/null
+++ b/skops/card/tests/examples/specter.md.diff
@@ -0,0 +1,11 @@
+--- 
++++ 
+@@ -3 +3 @@
+-thumbnail: "https://camo.githubusercontent.com/7d080b7a769f7fdf64ac0ebeb47b039cb50be35287e3071f9d633f0fe33e7596/68747470733a2f2f692e6962622e636f2f33544331576d472f737065637465722d6c6f676f2d63726f707065642e706e67"
++thumbnail: https://camo.githubusercontent.com/7d080b7a769f7fdf64ac0ebeb47b039cb50be35287e3071f9d633f0fe33e7596/68747470733a2f2f692e6962622e636f2f33544331576d472f737065637465722d6c6f676f2d63726f707065642e706e67
+@@ -14 +14 @@
+-## SPECTER
++# SPECTER
+@@ -26 +26 @@
+-Authors: *Arman Cohan, Sergey Feldman, Iz Beltagy, Doug Downey, Daniel S. Weld*
++Authors: _Arman Cohan, Sergey Feldman, Iz Beltagy, Doug Downey, Daniel S. Weld_
diff --git a/skops/card/tests/examples/vit-base-patch32-224-in21k.md b/skops/card/tests/examples/vit-base-patch32-224-in21k.md
new file mode 100644
index 00000000..570f5916
--- /dev/null
+++ b/skops/card/tests/examples/vit-base-patch32-224-in21k.md
@@ -0,0 +1,94 @@
+---
+license: apache-2.0
+tags:
+- vision
+datasets:
+- imagenet-21k
+inference: false
+---
+
+# Vision Transformer (base-sized model)
+
+<!-- retrieved on 2022-12-05 | mod: removed trailing whitespaces, double whitespace -->
+
+Vision Transformer (ViT) model pre-trained on ImageNet-21k (14 million images, 21,843 classes) at resolution 224x224. It was introduced in the paper [An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale](https://arxiv.org/abs/2010.11929) by Dosovitskiy et al. and first released in [this repository](https://github.com/google-research/vision_transformer). However, the weights were converted from the [timm repository](https://github.com/rwightman/pytorch-image-models) by Ross Wightman, who already converted the weights from JAX to PyTorch. Credits go to him.
+
+Disclaimer: The team releasing ViT did not write a model card for this model so this model card has been written by the Hugging Face team.
+
+## Model description
+
+The Vision Transformer (ViT) is a transformer encoder model (BERT-like) pretrained on a large collection of images in a supervised fashion, namely ImageNet-21k, at a resolution of 224x224 pixels.
+
+Images are presented to the model as a sequence of fixed-size patches (resolution 32x32), which are linearly embedded. One also adds a [CLS] token to the beginning of a sequence to use it for classification tasks. One also adds absolute position embeddings before feeding the sequence to the layers of the Transformer encoder.
+
+Note that this model does not provide any fine-tuned heads, as these were zero'd by Google researchers. However, the model does include the pre-trained pooler, which can be used for downstream tasks (such as image classification).
+
+By pre-training the model, it learns an inner representation of images that can then be used to extract features useful for downstream tasks: if you have a dataset of labeled images for instance, you can train a standard classifier by placing a linear layer on top of the pre-trained encoder. One typically places a linear layer on top of the [CLS] token, as the last hidden state of this token can be seen as a representation of an entire image.
+
+## Intended uses & limitations
+
+You can use the raw model for image classification. See the [model hub](https://huggingface.co/models?search=google/vit) to look for
+fine-tuned versions on a task that interests you.
+
+### How to use
+
+Here is how to use this model:
+
+```python
+from transformers import ViTFeatureExtractor, ViTModel
+from PIL import Image
+import requests
+url = 'http://images.cocodataset.org/val2017/000000039769.jpg'
+image = Image.open(requests.get(url, stream=True).raw)
+feature_extractor = ViTFeatureExtractor.from_pretrained('google/vit-base-patch32-224-in21k')
+model = ViTModel.from_pretrained('google/vit-base-patch32-224-in21k')
+inputs = feature_extractor(images=image, return_tensors="pt")
+outputs = model(**inputs)
+last_hidden_state = outputs.last_hidden_state
+```
+
+Currently, both the feature extractor and model support PyTorch. Tensorflow and JAX/FLAX are coming soon, and the API of ViTFeatureExtractor might change.
+
+## Training data
+
+The ViT model was pretrained on [ImageNet-21k](http://www.image-net.org/), a dataset consisting of 14 million images and 21k classes.
+
+## Training procedure
+
+### Preprocessing
+
+The exact details of preprocessing of images during training/validation can be found [here](https://github.com/google-research/vision_transformer/blob/master/vit_jax/input_pipeline.py).
+
+Images are resized/rescaled to the same resolution (224x224) and normalized across the RGB channels with mean (0.5, 0.5, 0.5) and standard deviation (0.5, 0.5, 0.5).
+
+### Pretraining
+
+The model was trained on TPUv3 hardware (8 cores). All model variants are trained with a batch size of 4096 and learning rate warmup of 10k steps. For ImageNet, the authors found it beneficial to additionally apply gradient clipping at global norm 1. Pre-training resolution is 224.
+
+## Evaluation results
+
+For evaluation results on several image classification benchmarks, we refer to tables 2 and 5 of the original paper. Note that for fine-tuning, the best results are obtained with a higher resolution (384x384). Of course, increasing the model size will result in better performance.
+
+### BibTeX entry and citation info
+
+```bibtex
+@misc{wu2020visual,
+      title={Visual Transformers: Token-based Image Representation and Processing for Computer Vision},
+      author={Bichen Wu and Chenfeng Xu and Xiaoliang Dai and Alvin Wan and Peizhao Zhang and Zhicheng Yan and Masayoshi Tomizuka and Joseph Gonzalez and Kurt Keutzer and Peter Vajda},
+      year={2020},
+      eprint={2006.03677},
+      archivePrefix={arXiv},
+      primaryClass={cs.CV}
+}
+```
+
+```bibtex
+@inproceedings{deng2009imagenet,
+  title={Imagenet: A large-scale hierarchical image database},
+  author={Deng, Jia and Dong, Wei and Socher, Richard and Li, Li-Jia and Li, Kai and Fei-Fei, Li},
+  booktitle={2009 IEEE conference on computer vision and pattern recognition},
+  pages={248--255},
+  year={2009},
+  organization={Ieee}
+}
+```
diff --git a/skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff b/skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff
new file mode 100644
index 00000000..cf849c95
--- /dev/null
+++ b/skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff
@@ -0,0 +1,5 @@
+--- 
++++ 
+@@ -24 +24 @@
+-Note that this model does not provide any fine-tuned heads, as these were zero'd by Google researchers. However, the model does include the pre-trained pooler, which can be used for downstream tasks (such as image classification).
++Note that this model does not provide any fine-tuned heads, as these were zero’d by Google researchers. However, the model does include the pre-trained pooler, which can be used for downstream tasks (such as image classification).
diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
index 87d54d84..c96717ec 100644
--- a/skops/card/tests/test_parser.py
+++ b/skops/card/tests/test_parser.py
@@ -1,3 +1,4 @@
+import difflib
 import os
 from pathlib import Path
 
@@ -41,55 +42,60 @@ def card(fit_model, tmp_path):
     return card
 
 
-def assert_readme_files_equal(file0, file1):
-    """Check that the two model cards are identical, but allow differences in
-    line breaks."""
-    # exclude trivial case of both being empty
-    assert file0
-    assert file1
+EXAMPLE_CARDS = [
+    "bert-base-uncased.md",
+    "clip-vit-large-patch14.md",
+    "gpt2.md",
+    "specter.md",
+    "vit-base-patch32-224-in21k.md",
+]
+
 
+def assert_readme_files_almost_equal(file0, file1, diff):
+    """Check that the two model cards are identical, but allow differences as
+    defined in the ``diff`` file"""
     with open(file0, "r") as f:
         readme0 = f.readlines()
 
     with open(file1, "r") as f:
         readme1 = f.readlines()
 
-    # remove completely empty lines
-    readme0 = [line.strip() for line in readme0 if line.strip()]
-    readme1 = [line.strip() for line in readme1 if line.strip()]
+    # exclude trivial case of both being empty
+    assert readme0
+    assert readme1
 
-    readme_str0 = "\n".join(readme0)
-    readme_str1 = "\n".join(readme1)
+    diff_actual = list(difflib.unified_diff(readme0, readme1, n=0))
 
-    # a minuscule further difference is an excess empty line after </style>
-    readme_str1 = readme_str1.replace("</style>\n", "</style>")
+    with open(diff, "r") as f:
+        diff_expected = f.readlines()
 
-    assert readme_str0 == readme_str1
+    assert diff_actual == diff_expected
 
 
-def test_parsed_card_identical(card, tmp_path):
-    file0 = tmp_path / "readme-skops.md"
-    card.save(file0)
+@pytest.mark.parametrize("file_name", EXAMPLE_CARDS, ids=EXAMPLE_CARDS)
+def test_example_model_cards(tmp_path, file_name):
+    """Test that the difference between original and parsed model card is
+    acceptable
 
-    parsed_card = parse_modelcard(file0)
-    file1 = tmp_path / "readme-parsed.md"
-    parsed_card.save(file1)
+    For this test, model cards for some of the most popular models on HF Hub
+    were retrieved and stored in the ./examples folder. This test checks that
+    these model cards can be successfully parsed and that the output is *almost*
+    the same.
+
+    We don't expect the output to be 100% identical, see the limitations listed
+    in ``parse_modelcard``. Instead, we assert that the diff corresponds to the
+    expected diff, which is also checked in.
 
-    assert_readme_files_equal(file0, file1)
+    So e.g. for "specter.md", we expect that the diff will be the same diff as
+    in "specter.md.diff".
 
+    """
+    path = Path(os.getcwd()) / "skops" / "card" / "tests" / "examples"
+    file0 = path / file_name
+    diff = (path / file_name).with_suffix(".md.diff")
 
-@pytest.mark.xfail(reason="small diff, especially in tables")
-def test_bert_base_uncased(tmp_path):
-    file0 = (
-        Path(os.getcwd())
-        / "skops"
-        / "card"
-        / "tests"
-        / "examples"
-        / "bert-base-uncased.md"
-    )
     parsed_card = parse_modelcard(file0)
     file1 = tmp_path / "readme-parsed.md"
     parsed_card.save(file1)
 
-    assert_readme_files_equal(file0, file1)
+    assert_readme_files_almost_equal(file0, file1, diff)

From 5e5c1a35324b3fb393751cad8331ef4ad45dabcf Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 6 Dec 2022 11:10:40 +0100
Subject: [PATCH 23/47] Rename Markdown class's methods, make private

---
 skops/card/_markup.py | 96 +++++++++++++++++++++----------------------
 1 file changed, 48 insertions(+), 48 deletions(-)

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index 9ddf1afd..e330a529 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -17,8 +17,8 @@ class Markdown:
     This class has a ``mapping`` attribute, which is just a dict. The keys are
     Pandoc types and the values are functions that transform the corresponding
     value into a string with markdown syntax. Those functions are all prefixed
-    with ``md_``, e.g. ``md_image`` for transforming a pandoc ``Image`` into a
-    markdown figure.
+    with ``_``, e.g. ``_image`` for transforming a pandoc ``Image`` into a
+    markdown figure, or ``_raw_block``, to transform a pandoc ``RawBlock``.
 
     From the caller side, only the ``__call__`` method should be used, the rest
     should be considered internals.
@@ -28,91 +28,91 @@ class Markdown:
     def __init__(self):
         # markdown syntax dispatch table
         self.mapping = {
-            "Space": self.md_space,
-            "Strong": self.md_strong,
-            "Emph": self.md_emph,
-            "Strikeout": self.md_strikeout,
-            "Subscript": self.md_subscript,
-            "Superscript": self.md_superscript,
-            "Plain": self.md_plain,
-            "Str": self.md_str,
-            "RawInline": self.md_rawline,
-            "RawBlock": self.md_raw_block,
-            "SoftBreak": self.md_softbreak,
-            "LineBreak": self.md_linebreak,
-            "Para": self.md_para,
-            "Header": self.md_header,
-            "Image": self.md_image,
-            "CodeBlock": self.md_code_block,
-            "Code": self.md_code,
-            "Table": self.md_table,
-            "Div": self.md_parse_div,
-            "Link": self.md_link,
-            "BulletList": self.md_bullet_list,
-            "Quoted": self.md_quoted,
-            "BlockQuote": self.md_block_quote,
+            "Space": self._space,
+            "Strong": self._strong,
+            "Emph": self._emph,
+            "Strikeout": self._strikeout,
+            "Subscript": self._subscript,
+            "Superscript": self._superscript,
+            "Plain": self._plain,
+            "Str": self._str,
+            "RawInline": self._raw_inline,
+            "RawBlock": self._raw_block,
+            "SoftBreak": self._soft_break,
+            "LineBreak": self._line_break,
+            "Para": self._para,
+            "Header": self._header,
+            "Image": self._image,
+            "CodeBlock": self._code_block,
+            "Code": self._code,
+            "Table": self._table,
+            "Div": self._parse_div,
+            "Link": self._link,
+            "BulletList": self._bullet_list,
+            "Quoted": self._quoted,
+            "BlockQuote": self._block_quote,
         }
 
     @staticmethod
-    def md_space(value) -> str:
+    def _space(value) -> str:
         return " "
 
-    def md_strong(self, value) -> str:
+    def _strong(self, value) -> str:
         parts = ["**"]
         parts += [self.__call__(subitem) for subitem in value]
         parts.append("**")
         return "".join(parts)
 
-    def md_emph(self, value) -> str:
+    def _emph(self, value) -> str:
         parts = ["_"]
         parts += [self.__call__(subitem) for subitem in value]
         parts.append("_")
         return "".join(parts)
 
-    def md_strikeout(self, value) -> str:
+    def _strikeout(self, value) -> str:
         parts = ["~~"]
         parts += [self.__call__(subitem) for subitem in value]
         parts.append("~~")
         return "".join(parts)
 
-    def md_subscript(self, value) -> str:
+    def _subscript(self, value) -> str:
         parts = ["<sub>"]
         parts += [self.__call__(subitem) for subitem in value]
         parts.append("</sub>")
         return "".join(parts)
 
-    def md_superscript(self, value) -> str:
+    def _superscript(self, value) -> str:
         parts = ["<sup>"]
         parts += [self.__call__(subitem) for subitem in value]
         parts.append("</sup>")
         return "".join(parts)
 
-    def md_plain(self, value) -> str:
+    def _plain(self, value) -> str:
         parts = [self.__call__(subitem) for subitem in value]
         return "".join(parts)
 
     @staticmethod
-    def md_str(value) -> str:
+    def _str(value) -> str:
         # escape \
         return value.replace("\\", "\\\\")
 
     @staticmethod
-    def md_rawline(value) -> str:
+    def _raw_inline(value) -> str:
         _, line = value
         return line
 
-    def md_raw_block(self, item) -> str:
+    def _raw_block(self, item) -> str:
         # throw away the first item, which is just something like 'html'
         # might have to revisit this if output != markdown
         _, line = item
         return line
 
     @staticmethod
-    def md_softbreak(value) -> str:
+    def _soft_break(value) -> str:
         return "\n"
 
     @staticmethod
-    def md_linebreak(value) -> str:
+    def _line_break(value) -> str:
         return "\n"
 
     def _make_content(self, content):
@@ -122,16 +122,16 @@ def _make_content(self, content):
             parts.append(part)
         return "".join(parts)
 
-    def md_para(self, value: list[dict[str, str]]) -> str:
+    def _para(self, value: list[dict[str, str]]) -> str:
         content = self._make_content(value)
         return content
 
-    def md_header(self, value: tuple[int, Any, list[dict[str, str]]]) -> str:
+    def _header(self, value: tuple[int, Any, list[dict[str, str]]]) -> str:
         level, _, content_parts = value
         section_name = self._make_content(content_parts)
         return section_name
 
-    def md_image(self, value) -> str:
+    def _image(self, value) -> str:
         (ident, _, keyvals), caption, (dest, typef) = value
         # it seems like ident and keyvals are not relevant for markdown
         assert caption
@@ -142,7 +142,7 @@ def md_image(self, value) -> str:
         return content
 
     @staticmethod
-    def md_code_block(item: tuple[tuple[int, list[str], list[str]], str]) -> str:
+    def _code_block(item: tuple[tuple[int, list[str], list[str]], str]) -> str:
         # a codeblock consists of: (id, classes, namevals) contents
         (_, classes, _), content = item
         block_start = "```"
@@ -153,11 +153,11 @@ def md_code_block(item: tuple[tuple[int, list[str], list[str]], str]) -> str:
         return content
 
     @staticmethod
-    def md_code(item: tuple[Any, str]) -> str:
+    def _code(item: tuple[Any, str]) -> str:
         _, txt = item
         return f"`{txt}`"
 
-    def md_table(self, item) -> str:
+    def _table(self, item) -> str:
         _, alignments, _, header, rows = item
         fn = self.__call__
         columns = ["".join(fn(part) for part in col) for col in header]
@@ -178,7 +178,7 @@ def md_table(self, item) -> str:
         res = TableSection(table).format()
         return res
 
-    def md_parse_div(self, item) -> str:
+    def _parse_div(self, item) -> str:
         # note that in markdown, we basically just use the raw html
         (ident, classes, kvs), contents = item
 
@@ -206,12 +206,12 @@ def md_parse_div(self, item) -> str:
         end = "</div>"
         return "".join([start] + middle + [end])
 
-    def md_link(self, item) -> str:
+    def _link(self, item) -> str:
         _, txt, (src, _) = item
         txt_formatted = self._make_content(txt)
         return f"[{txt_formatted}]({src})"
 
-    def md_bullet_list(self, item) -> str:
+    def _bullet_list(self, item) -> str:
         parts = []
         for subitem in item:
             assert len(subitem) == 1
@@ -221,7 +221,7 @@ def md_bullet_list(self, item) -> str:
             parts.append(f"- {content}")
         return "\n".join(parts)
 
-    def md_quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
+    def _quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
         quote_type, content = item
         type_ = quote_type["t"]
         try:
@@ -236,7 +236,7 @@ def md_quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
         text = "".join(self.__call__(i) for i in content)
         return f"{sym}{text}{sym}"
 
-    def md_block_quote(self, item: list[PandocItem]) -> str:
+    def _block_quote(self, item: list[PandocItem]) -> str:
         parts = []
         for subitem in item:
             content = self.__call__(subitem)

From 897975125782b8cf24cace741686bbd70706a29b Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 16 Dec 2022 15:50:10 +0100
Subject: [PATCH 24/47] Add version check for pandoc

---
 skops/card/_parser.py           | 70 ++++++++++++++++++++++++++++++---
 skops/card/tests/test_parser.py |  2 +-
 2 files changed, 65 insertions(+), 7 deletions(-)

diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 933ea1d8..48037c5b 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -12,7 +12,7 @@
 import subprocess
 from pathlib import Path
 from tempfile import mkdtemp
-from typing import Any
+from typing import Any, Sequence
 
 import yaml  # type: ignore
 
@@ -21,6 +21,8 @@
 
 from ._markup import Markdown, PandocItem
 
+PANDOC_MIN_VERSION = (2, 19, 0)
+
 
 class PandocParser:
     """TODO"""
@@ -95,20 +97,71 @@ def generate(self) -> Card:
         return self.card
 
 
-def check_pandoc_installed() -> None:
+def _get_pandoc_version() -> list[int]:
+    """Shell out to retrieve the pandoc version
+
+    Raises
+    ------
+    RuntimeError
+        If pandoc version could not be determined, raise a ``RuntimeError``.
+
+    Returns
+    -------
+    pandoc_version : list[int]
+        The pandoc version as a list of ints.
+    """
+    proc = subprocess.run(
+        ["pandoc", "--version"],
+        capture_output=True,
+    )
+    version_info = str(proc.stdout.decode("utf-8")).split("\n", 1)[0]
+    if not version_info.startswith("pandoc "):
+        raise RuntimeError("Could not determine version of pandoc")
+
+    _, _, actual_version = version_info.partition(" ")
+    pandoc_version = [int(v) for v in actual_version.split(".")]
+    return pandoc_version
+
+
+def _check_version_greater_equal(
+    version: Sequence[int], min_version: Sequence[int]
+) -> None:
+    """Very bad version comparison function to ensure that the first version is
+    >= the second."""
+    for v1, v2 in zip(version, min_version):
+        if v1 > v2:
+            return
+
+        if v1 < v2:
+            raise ValueError(
+                "Pandoc version too low, expected at least "
+                f"{'.'.join(map(str, min_version))}"
+            )
+
+
+def check_pandoc_installed(
+    min_version: Sequence[int] | None = PANDOC_MIN_VERSION,
+) -> None:
     """Check if pandoc is installed on the system
 
+    Parameters
+    ----------
+    min_version : list[int] or None
+        If passed, check that the pandoc version is greater than or equal to this one.
+
     Raises
     ------
     FileNotFoundError
         When the binary is not found, raise this error.
 
+    RuntimeError
+        If pandoc version could not be determined, raise a ``RuntimeError``.
+
+    ValueError
+        If min version is passed and not matched or exceeded, raise a ``ValueError``.
     """
     try:
-        subprocess.run(
-            ["pandoc", "--version"],
-            capture_output=True,
-        )
+        pandoc_version = _get_pandoc_version()
     except FileNotFoundError as exc:
         msg = (
             "This feature requires the pandoc library to be installed on your system, "
@@ -117,6 +170,11 @@ def check_pandoc_installed() -> None:
         )
         raise FileNotFoundError(msg) from exc
 
+    if not min_version:
+        return
+
+    _check_version_greater_equal(pandoc_version, min_version)
+
 
 def _card_with_detached_metainfo(path: str | Path) -> tuple[str | Path, dict[str, Any]]:
     """Detach the possibly existing yaml part of the model card
diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
index c96717ec..c904b1ff 100644
--- a/skops/card/tests/test_parser.py
+++ b/skops/card/tests/test_parser.py
@@ -13,7 +13,7 @@
     check_pandoc_installed()
 except FileNotFoundError:
     # not installed, skip
-    pytest.skip(reason="These tests require pandoc", allow_module_level=True)
+    pytest.skip(reason="These tests require a recent pandoc", allow_module_level=True)
 
 
 @pytest.fixture

From e8d6f6174964fca0a5084d1d9fb63a0e6bb02955 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 16 Dec 2022 15:53:36 +0100
Subject: [PATCH 25/47] New table parsing code

Pandoc changed how it represents tables. The new table parsing code works
with the latest pandoc version.
---
 skops/card/_markup.py | 45 +++++++++++++++++++++++++++++++++----------
 1 file changed, 35 insertions(+), 10 deletions(-)

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index e330a529..63128485 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -157,22 +157,47 @@ def _code(item: tuple[Any, str]) -> str:
         _, txt = item
         return f"`{txt}`"
 
-    def _table(self, item) -> str:
-        _, alignments, _, header, rows = item
+    def _table_cols(self, items) -> list[str]:
+        columns = []
+        fn = self.__call__
+        for item in items:
+            _, alignment, _, _, content = item
+            column = "".join(fn(part) for part in content)
+            columns.append(column)
+        return columns
+
+    def _table_body(self, items) -> list[list[str]]:
+        body = []
         fn = self.__call__
-        columns = ["".join(fn(part) for part in col) for col in header]
-        if not columns:
-            raise ValueError("Table with no columns...")
+        for _, row_items in items:
+            row = []
+            for col_row_item in row_items:
+                _, alignment, _, _, content = col_row_item
+                row.append("".join(fn(part) for part in content))
+            body.append(row)
+        return body
+
+    def _table(self, item) -> str:
+        # attr capt specs thead tbody tfoot
+        _, _, _, thead, tbody, _ = item
+
+        # header
+        (_, thead_bodies) = thead
+        (attr, thead_body) = thead_bodies[0]  # multiple headers?
+
+        columns = self._table_cols(thead_body)
 
-        data = []  # row oriented
-        for row in rows:
-            data.append(["".join(fn(part) for part in col) for col in row])
+        # rows
+        # attr rhc hd bd
+        _, _, _, trows = tbody[0]  # multiple groups of rows?
+        body = self._table_body(trows)
 
         table: Mapping[str, Sequence[Any]]
-        if not data:
+        if not body:
             table = {key: [] for key in columns}
         else:
-            data_transposed = zip(*data)  # column oriented
+            # body is row oriented, transpose to column oriented
+            data_transposed = zip(*body)
             table = {key: val for key, val in zip(columns, data_transposed)}
 
         res = TableSection(table).format()

From d0e07bce2d36a6e66fa77fdef670a40d93ff84a5 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 16 Dec 2022 17:01:26 +0100
Subject: [PATCH 26/47] Fix "bug" with metainfo order

For some reason, the order of items in the metainfo is no longer stable.
Therefore, the tests comparing the parsed card vs original card failed.

Now metainfo is excluded when comparing the cards. The metainfo is now
checked separately, in a way that disregards the order.
---
 .../tests/examples/bert-base-uncased.md.diff  | 10 +++++-----
 .../examples/clip-vit-large-patch14.md.diff   | 12 +++++------
 skops/card/tests/examples/gpt2.md.diff        | 10 ++++------
 skops/card/tests/examples/specter.md.diff     |  5 +----
 .../vit-base-patch32-224-in21k.md.diff        |  2 +-
 skops/card/tests/test_parser.py               | 20 ++++++++++++++++++-
 6 files changed, 36 insertions(+), 23 deletions(-)

diff --git a/skops/card/tests/examples/bert-base-uncased.md.diff b/skops/card/tests/examples/bert-base-uncased.md.diff
index e4fb5c66..2367a8d8 100644
--- a/skops/card/tests/examples/bert-base-uncased.md.diff
+++ b/skops/card/tests/examples/bert-base-uncased.md.diff
@@ -1,6 +1,6 @@
 --- 
 +++ 
-@@ -52,10 +52,10 @@
+@@ -44,10 +44,10 @@
 -| Model | #params | Language |
 -|------------------------|--------------------------------|-------|
 -| [`bert-base-uncased`](https://huggingface.co/bert-base-uncased) | 110M   | English |
@@ -21,13 +21,13 @@
 +| [`bert-base-multilingual-cased`](https://huggingface.co/bert-base-multilingual-cased)                   | 110M      | Multiple   |
 +| [`bert-large-uncased-whole-word-masking`](https://huggingface.co/bert-large-uncased-whole-word-masking) | 340M      | English    |
 +| [`bert-large-cased-whole-word-masking`](https://huggingface.co/bert-large-cased-whole-word-masking)     | 340M      | English    |
-@@ -65 +65 @@
+@@ -57 +57 @@
 -You can use the raw model for either masked language modeling or next sentence prediction, but it's mostly intended to
 +You can use the raw model for either masked language modeling or next sentence prediction, but it’s mostly intended to
-@@ -197 +197 @@
+@@ -189 +189 @@
 -the other cases, it's another random sentence in the corpus. Note that what is considered a sentence here is a
 +the other cases, it’s another random sentence in the corpus. Note that what is considered a sentence here is a
-@@ -220,4 +220,3 @@
+@@ -212,4 +212,3 @@
 -| Task | MNLI-(m/mm) | QQP  | QNLI | SST-2 | CoLA | STS-B | MRPC | RTE  | Average |
 -|:----:|:-----------:|:----:|:----:|:-----:|:----:|:-----:|:----:|:----:|:-------:|
 -|      | 84.6/83.4   | 71.2 | 90.5 | 93.5  | 52.1 | 85.8  | 88.9 | 66.4 | 79.6    |
@@ -35,6 +35,6 @@
 +| Task   | MNLI-(m/mm)   |   QQP |   QNLI |   SST-2 |   CoLA |   STS-B |   MRPC |   RTE |   Average |
 +|--------|---------------|-------|--------|---------|--------|---------|--------|-------|-----------|
 +|        | 84.6/83.4     |  71.2 |   90.5 |    93.5 |   52.1 |    85.8 |   88.9 |  66.4 |      79.6 |
-@@ -248 +247 @@
+@@ -240 +239 @@
 -	<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
 +<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
diff --git a/skops/card/tests/examples/clip-vit-large-patch14.md.diff b/skops/card/tests/examples/clip-vit-large-patch14.md.diff
index f2da254b..8516f684 100644
--- a/skops/card/tests/examples/clip-vit-large-patch14.md.diff
+++ b/skops/card/tests/examples/clip-vit-large-patch14.md.diff
@@ -1,18 +1,18 @@
 --- 
 +++ 
-@@ -30 +29,0 @@
+@@ -23 +22,0 @@
 -
-@@ -35 +33,0 @@
+@@ -28 +26,0 @@
 -
-@@ -58 +55,0 @@
+@@ -51 +48,0 @@
 -
-@@ -79,2 +75,0 @@
+@@ -72,2 +68,0 @@
 -
 -
-@@ -88,2 +82,0 @@
+@@ -81,2 +75,0 @@
 -
 -
-@@ -139,3 +132 @@
+@@ -132,3 +125 @@
 -We also tested the performance of CLIP on gender, race and age classification using the Fairface dataset (We default to using race categories as they are constructed in the Fairface dataset.) in order to assess quality of performance across different demographics. We found accuracy >96% across all races for gender classification with ‘Middle Eastern’ having the highest accuracy (98.4%) and ‘White’ having the lowest (96.5%). Additionally, CLIP averaged ~93% for racial classification and ~63% for age classification. Our use of evaluations to test for gender, race and age classification as well as denigration harms is simply to evaluate performance of the model across people and surface potential risks and not to demonstrate an endorsement/enthusiasm for such tasks.
 -
 -
diff --git a/skops/card/tests/examples/gpt2.md.diff b/skops/card/tests/examples/gpt2.md.diff
index e95bc0cb..ee0d38f1 100644
--- a/skops/card/tests/examples/gpt2.md.diff
+++ b/skops/card/tests/examples/gpt2.md.diff
@@ -1,13 +1,11 @@
 --- 
 +++ 
-@@ -5 +4,0 @@
--
-@@ -95 +93,0 @@
+@@ -89 +88,0 @@
 ->
-@@ -102 +100 @@
+@@ -96 +95 @@
 -Here's an example of how the model can have biased predictions:
 +Here’s an example of how the model can have biased predictions:
-@@ -150,5 +148,4 @@
+@@ -144,5 +143,4 @@
 -| Dataset  | LAMBADA | LAMBADA | CBT-CN | CBT-NE | WikiText2 | PTB    | enwiki8 | text8  | WikiText103 | 1BW   |
 -|:--------:|:-------:|:-------:|:------:|:------:|:---------:|:------:|:-------:|:------:|:-----------:|:-----:|
 -| (metric) | (PPL)   | (ACC)   | (ACC)  | (ACC)  | (PPL)     | (PPL)  | (BPB)   | (BPC)  | (PPL)       | (PPL) |
@@ -17,6 +15,6 @@
 +|-----------|-----------|----------|----------|-------------|-------|-----------|---------|---------------|-------|
 +| (metric)  | (ACC)     | (ACC)    | (ACC)    | (PPL)       | (PPL) | (BPB)     | (BPC)   | (PPL)         | (PPL) |
 +|           | 45.99     | 87.65    | 83.4     | 29.41       | 65.85 | 1.16      | 1,17    | 37.50         | 75.20 |
-@@ -167 +164 @@
+@@ -161 +159 @@
 -	<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
 +<img width="300px" src="https://cdn-media.huggingface.co/exbert/button.png">
diff --git a/skops/card/tests/examples/specter.md.diff b/skops/card/tests/examples/specter.md.diff
index 7fcfa951..647c85a8 100644
--- a/skops/card/tests/examples/specter.md.diff
+++ b/skops/card/tests/examples/specter.md.diff
@@ -1,11 +1,8 @@
 --- 
 +++ 
 @@ -3 +3 @@
--thumbnail: "https://camo.githubusercontent.com/7d080b7a769f7fdf64ac0ebeb47b039cb50be35287e3071f9d633f0fe33e7596/68747470733a2f2f692e6962622e636f2f33544331576d472f737065637465722d6c6f676f2d63726f707065642e706e67"
-+thumbnail: https://camo.githubusercontent.com/7d080b7a769f7fdf64ac0ebeb47b039cb50be35287e3071f9d633f0fe33e7596/68747470733a2f2f692e6962622e636f2f33544331576d472f737065637465722d6c6f676f2d63726f707065642e706e67
-@@ -14 +14 @@
 -## SPECTER
 +# SPECTER
-@@ -26 +26 @@
+@@ -15 +15 @@
 -Authors: *Arman Cohan, Sergey Feldman, Iz Beltagy, Doug Downey, Daniel S. Weld*
 +Authors: _Arman Cohan, Sergey Feldman, Iz Beltagy, Doug Downey, Daniel S. Weld_
diff --git a/skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff b/skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff
index cf849c95..b48c0b73 100644
--- a/skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff
+++ b/skops/card/tests/examples/vit-base-patch32-224-in21k.md.diff
@@ -1,5 +1,5 @@
 --- 
 +++ 
-@@ -24 +24 @@
+@@ -17 +17 @@
 -Note that this model does not provide any fine-tuned heads, as these were zero'd by Google researchers. However, the model does include the pre-trained pooler, which can be used for downstream tasks (such as image classification).
 +Note that this model does not provide any fine-tuned heads, as these were zero’d by Google researchers. However, the model does include the pre-trained pooler, which can be used for downstream tasks (such as image classification).
diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
index c904b1ff..b723c03e 100644
--- a/skops/card/tests/test_parser.py
+++ b/skops/card/tests/test_parser.py
@@ -4,6 +4,7 @@
 
 import numpy as np
 import pytest
+import yaml  # type: ignore
 from sklearn.linear_model import LinearRegression
 
 from skops.card import Card, parse_modelcard
@@ -51,15 +52,32 @@ def card(fit_model, tmp_path):
 ]
 
 
+def _assert_meta_equal(meta0, meta1):
+    # we cannot guarantee the order of metadata items, so we compare parsed
+    # dicts, but not strings directly
+    assert yaml.safe_load("".join(meta0)) == yaml.safe_load("".join(meta1))
+
+
 def assert_readme_files_almost_equal(file0, file1, diff):
     """Check that the two model cards are identical, but allow differences as
-    defined in the ``diff`` file"""
+    defined in the ``diff`` file
+
+    The metainfo is compared separately, as the order of the items is not
+    guaranteed to be stable.
+    """
     with open(file0, "r") as f:
         readme0 = f.readlines()
 
     with open(file1, "r") as f:
         readme1 = f.readlines()
 
+    sep = "---\n"
+    idx0, idx1 = readme0[1:].index(sep) + 1, readme1[1:].index(sep) + 1
+    meta0, meta1 = readme0[1:idx0], readme1[1:idx1]
+    readme0, readme1 = readme0[idx0:], readme1[idx1:]
+
+    _assert_meta_equal(meta0, meta1)
+
     # exclude trivial case of both being empty
     assert readme0
     assert readme1

From 5a9f8261368215b74ebac2d9fc2bf773bb3164a6 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 16 Dec 2022 17:10:15 +0100
Subject: [PATCH 27/47] Clean up noise created from merge conflict

---
 docs/model_card.rst       | 4 ----
 skops/card/_model_card.py | 1 -
 2 files changed, 5 deletions(-)

diff --git a/docs/model_card.rst b/docs/model_card.rst
index f6b0d37a..7a6c124d 100644
--- a/docs/model_card.rst
+++ b/docs/model_card.rst
@@ -103,7 +103,3 @@ using :meth:`Card.select`, and you can delete sections using
 
 To see how you can use the API in ``skops`` to create a model card, please
 refer to :ref:`sphx_glr_auto_examples_plot_model_card.py`.
-
-Templates
----------
-TODO
diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index dadeb0f6..2adafa62 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -728,7 +728,6 @@ def add_model_plot(
         -------
         self : object
             Card object.
-
         """
         if not self.model_diagram:
             return self

From 5bc590972def0438eed34b5ef9f8f6580617e920 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 16 Dec 2022 17:25:35 +0100
Subject: [PATCH 28/47] Fix TypedDict import for Py<3.9, doctest

---
 skops/card/_markup.py | 8 +++++++-
 skops/card/_parser.py | 3 ++-
 2 files changed, 9 insertions(+), 2 deletions(-)

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index 63128485..de657d83 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -1,10 +1,16 @@
 """Classes for translating into the syntax of different markup languages"""
 
+import sys
 from collections.abc import Mapping
-from typing import Any, Sequence, TypedDict
+from typing import Any, Sequence
 
 from skops.card._model_card import TableSection
 
+if sys.version_info.minor >= 9:
+    from typing import TypedDict
+else:
+    from typing_extensions import TypedDict
+
 
 class PandocItem(TypedDict):
     t: str
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 48037c5b..f6e22aea 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -239,7 +239,7 @@ def parse_modelcard(path: str | Path) -> Card:
     >>> import numpy as np
     >>> from sklearn.linear_model import LinearRegression
     >>> from skops.card import Card
-    >>> from skops.card import parse_card
+    >>> from skops.card import parse_modelcard
     >>> X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
     >>> y = np.dot(X, np.array([1, 2])) + 3
     >>> regr = LinearRegression().fit(X, y)
@@ -249,6 +249,7 @@ def parse_modelcard(path: str | Path) -> Card:
     >>> parsed_card = parse_modelcard("README.md")
     >>> # continue editing the card
     >>> parsed_card.add(**{"My new section": "My new content"})
+    Card(...)
     >>> # overwrite old card with new one
     >>> parsed_card.save("README.md")
 

From 3c3ff89a24f67829e860ac107136b82450d36970 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 16 Dec 2022 17:29:27 +0100
Subject: [PATCH 29/47] Add future annotations import to _markup.py

---
 skops/card/_markup.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index de657d83..531177db 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -1,5 +1,7 @@
 """Classes for translating into the syntax of different markup languages"""
 
+from __future__ import annotations
+
 import sys
 from collections.abc import Mapping
 from typing import Any, Sequence

From c2ccfcc4a199d09b275322e14a165bb76c16ac9c Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Mon, 19 Dec 2022 13:00:43 +0100
Subject: [PATCH 30/47] Add more documentation, refactor parser class

The parser is now less stateful.
---
 skops/card/_model_card.py |   5 ++
 skops/card/_parser.py     | 115 +++++++++++++++++++++++++-------------
 2 files changed, 82 insertions(+), 38 deletions(-)

diff --git a/skops/card/_model_card.py b/skops/card/_model_card.py
index 2adafa62..ed7bedf1 100644
--- a/skops/card/_model_card.py
+++ b/skops/card/_model_card.py
@@ -683,6 +683,11 @@ def _add_single(self, key: str, val: Formattable | str) -> Section:
         val: str or Formattable
             The value to assign to the (sub)section.
 
+        Returns
+        -------
+        Section instance
+            The section that has been added or modified.
+
         """
         *subsection_names, leaf_node_name = split_subsection_names(key)
         section = self._select(subsection_names)
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index f6e22aea..7f051b04 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -12,7 +12,7 @@
 import subprocess
 from pathlib import Path
 from tempfile import mkdtemp
-from typing import Any, Sequence
+from typing import Any, Literal, Sequence
 
 import yaml  # type: ignore
 
@@ -25,35 +25,57 @@
 
 
 class PandocParser:
-    """TODO"""
+    """Create model cards from files parsed through pandoc.
 
-    def __init__(self, source, mapping="markdown") -> None:
-        self.source = source
-        if mapping == "markdown":
-            self.mapping = Markdown()
-        else:
-            raise ValueError(f"Markup of type {mapping} is not supported (yet)")
+    This class knows about the implementation details of the
+    :class:`~skops.card.Card` and generates it by initializing an empty class
+    and then calling its methods with the input provided by pandoc.
 
-        self.card = Card(None, template=None)
-        self._section_trace: list[str] = []
-        self._cur_section: Section | None = None
+    ``PandocParser`` does not know about any specific markup type, such as
+    markdown. Instead, it is initialized with a ``Mapping``, which is
+    responsible for converting pandoc input into the desired markup language.
 
-    def get_cur_level(self) -> int:
-        # level 0 can be interpreted implictly as the root level
-        return len(self._section_trace)
+    After initializing this class, call
+    :meth:`~skops.card._parser.PandocParser.generate` to generate the resulting
+    :class:`~skops.card.Card` instance.
+
+    Parameters
+    ----------
+    source : str
+        The model card parsed using the ``pandoc -t json`` option.
 
-    def get_cur_section(self):
-        # including supersections
-        return "/".join(self._section_trace)
+    markup_type : "markdown"
+        The type of markup that was used for the model card. Right now, only
+        ``"markdown"`` is supported.
 
-    def add_section(self, section_name: str) -> None:
-        self._cur_section = self.card._add_single(self.get_cur_section(), "")
+    """
 
-    def add_content(self, content: str) -> None:
-        section = self._cur_section
+    def __init__(
+        self, source: str, markup_type: Literal["markdown"] = "markdown"
+    ) -> None:
+        self.source = source
+        if markup_type.lower() == "markdown":
+            self.mapping = Markdown()
+        else:
+            raise ValueError(f"Markup of type {markup_type} is not supported (yet)")
+
+    def _add_section(
+        self, section_name: str, card: Card, section_trace: list[str]
+    ) -> Section:
+        # Add a new section to the card, which can be a subsection, and return
+        # it.
+        section_name = "/".join(section_trace)
+        cur_section = card._add_single(section_name, "")
+        return cur_section
+
+    def _add_content(self, content: str, section: Section | None) -> None:
+        # Add content to the current section
         if section is None:
+            # This may occur if the model card starts without a section. This is
+            # not illegal in markdown, but we don't handle it yet.
             raise ValueError(
-                "Ooops, no current section, please open an issue on GitHub"
+                "Trying to add content but there is no current section, "
+                "this is probably a bug, please open an issue on GitHub"
             )
 
         if not section.content:
@@ -61,40 +83,57 @@ def add_content(self, content: str) -> None:
         elif isinstance(section.content, str):
             section.content = section.content + "\n\n" + content
         else:
-            # A Formattable, no generic way to modify it -- should we add an
-            # update method?
+            # TODO: Content is a Formattable, no generic way to modify it --
+            # should we require each Formattable to have an update method?
             raise ValueError(f"Could not modify content of {section.content}")
 
-    def parse_header(self, item: PandocItem) -> str:
+    def _parse_header(
+        self, item: PandocItem, section_trace: list[str]
+    ) -> tuple[str, int]:
         # Headers are the only type of item that needs to be handled
         # differently. This is because we structure the underlying model card
         # data as a tree with nodes corresponding to headers. To assign the
         # right parent or child node, we need to keep track of the level of the
-        # headers. This cannot be done solely by the markdown mapping, since it
-        # is not aware of the tree structure.
+        # headers. This cannot be done on the level of the markdown mapping,
+        # since it is not aware of the tree structure.
         level, _, _ = item["c"]
         content = self.mapping(item)
-        self._section_trace = self._section_trace[: level - 1] + [content]
-        return content
+        return content, level
 
-    def post_process(self, res: str) -> str:
+    def _post_process(self, res: str) -> str:
         # replace Latin1 space
         res = res.replace("\xa0", " ")
         return res
 
     def generate(self) -> Card:
-        # Parsing the flat structure, not recursively as in pandocfilters.
-        # After visiting the parent node, it's not necessary to visit its
-        # child nodes, because that's already done during parsing.
+        """Generate the model card instance from the parsed card.
+
+        Returns
+        -------
+        card : :class:`~skops.card.Card`
+            The parsed model card instance. If not further modified, the output
+            of saving that card should be (almost) identical to the initial
+            model card.
+        """
+        section: Section | None = None
+        section_trace: list[str] = []
+        card = Card(None, template=None)
+
+        # Parsing the flat structure, not recursively as in pandocfilters. After
+        # visiting the parent node, it's not necessary to visit its child nodes,
+        # because the mapping class already takes care of visiting the child
+        # nodes.
         for item in json.loads(self.source)["blocks"]:
             if item["t"] == "Header":
-                res = self.post_process(self.parse_header(item))
-                self.add_section(res)
+                content, level = self._parse_header(item, section_trace=section_trace)
+                res = self._post_process(content)
+                section_trace = section_trace[: level - 1] + [res]
+                section = self._add_section(res, card=card, section_trace=section_trace)
             else:
-                res = self.post_process(self.mapping(item))
-                self.add_content(res)
+                res = self._post_process(self.mapping(item))
+                self._add_content(res, section=section)
 
-        return self.card
+        return card
 
 
 def _get_pandoc_version() -> list[int]:

From a2f90a457e245a14b58a8bb5d224c9cea12317c6 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Mon, 2 Jan 2023 12:23:46 +0100
Subject: [PATCH 31/47] Skip parts of parse_modelcard docstring test

This is because to run this doctest would require pandoc to be
installed, but running the doctests should not have a dependency on
pandoc.
---
 skops/card/_parser.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 7f051b04..e0af5723 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -283,14 +283,14 @@ def parse_modelcard(path: str | Path) -> Card:
     >>> y = np.dot(X, np.array([1, 2])) + 3
     >>> regr = LinearRegression().fit(X, y)
     >>> card = Card(regr)
-    >>> card.save("README.md")
+    >>> card.save("README.md")  # doctest: +SKIP
     >>> # later, load the card again
-    >>> parsed_card = parse_modelcard("README.md")
+    >>> parsed_card = parse_modelcard("README.md")  # doctest: +SKIP
     >>> # continue editing the card
-    >>> parsed_card.add(**{"My new section": "My new content"})
+    >>> parsed_card.add(**{"My new section": "My new content"})  # doctest: +SKIP
     Card(...)
     >>> # overwrite old card with new one
-    >>> parsed_card.save("README.md")
+    >>> parsed_card.save("README.md")  # doctest: +SKIP
 
     Notes
     -----

From 7ececc1e589c8b2680e11243842dbbadc489d7e2 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 3 Jan 2023 18:05:23 +0100
Subject: [PATCH 32/47] Increase test coverage, add a few features

- Checking a few more error cases
- Document lines that are not covered
- Add support for more syntax, most notably:
  - nested bullet lists
  - nested ordered lists
---
 skops/card/_markup.py                         | 113 ++++++-----
 skops/card/_parser.py                         |   6 +
 skops/card/tests/examples/toy-example.md      | 182 ++++++++++++++++++
 skops/card/tests/examples/toy-example.md.diff |  90 +++++++++
 skops/card/tests/test_parser.py               |  62 +++++-
 5 files changed, 403 insertions(+), 50 deletions(-)
 create mode 100644 skops/card/tests/examples/toy-example.md
 create mode 100644 skops/card/tests/examples/toy-example.md.diff

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index 531177db..8ffa14b6 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -4,6 +4,7 @@
 
 import sys
 from collections.abc import Mapping
+from contextlib import contextmanager
 from typing import Any, Sequence
 
 from skops.card._model_card import TableSection
@@ -37,17 +38,14 @@ def __init__(self):
         # markdown syntax dispatch table
         self.mapping = {
             "Space": self._space,
+            "Plain": self._plain,
+            "Str": self._str,
             "Strong": self._strong,
             "Emph": self._emph,
             "Strikeout": self._strikeout,
-            "Subscript": self._subscript,
-            "Superscript": self._superscript,
-            "Plain": self._plain,
-            "Str": self._str,
             "RawInline": self._raw_inline,
             "RawBlock": self._raw_block,
             "SoftBreak": self._soft_break,
-            "LineBreak": self._line_break,
             "Para": self._para,
             "Header": self._header,
             "Image": self._image,
@@ -57,14 +55,41 @@ def __init__(self):
             "Div": self._parse_div,
             "Link": self._link,
             "BulletList": self._bullet_list,
+            "OrderedList": self._ordered_list,
             "Quoted": self._quoted,
             "BlockQuote": self._block_quote,
         }
+        # Stack of indentation widths (in spaces), one entry per currently open
+        # nested construct (list or div). Entries are pushed and popped by
+        # ``_indented``; ``_get_indent`` sums all but the innermost entry to
+        # compute the current indentation.
+        self._indent_trace = []
+
+    @contextmanager
+    def _indented(self, *, spaces: int):
+        """Temporarily increase indentation by ``spaces`` spaces"""
+        self._indent_trace.append(spaces)
+        yield
+        self._indent_trace.pop(-1)
+
+    def _get_indent(self, *, incr: int = 0) -> str:
+        """Get current indentation, optionally incremented"""
+        # the last (innermost) entry is skipped; continuation lines add it via incr
+        return " " * (incr + sum(self._indent_trace[:-1]))
 
     @staticmethod
     def _space(value) -> str:
         return " "
 
+    def _plain(self, value) -> str:
+        parts = [self.__call__(subitem) for subitem in value]
+        return "".join(parts)
+
+    @staticmethod
+    def _str(value) -> str:
+        # escape \
+        return value.replace("\\", "\\\\")
+
     def _strong(self, value) -> str:
         parts = ["**"]
         parts += [self.__call__(subitem) for subitem in value]
@@ -83,27 +108,6 @@ def _strikeout(self, value) -> str:
         parts.append("~~")
         return "".join(parts)
 
-    def _subscript(self, value) -> str:
-        parts = ["<sub>"]
-        parts += [self.__call__(subitem) for subitem in value]
-        parts.append("</sub>")
-        return "".join(parts)
-
-    def _superscript(self, value) -> str:
-        parts = ["<sup>"]
-        parts += [self.__call__(subitem) for subitem in value]
-        parts.append("</sup>")
-        return "".join(parts)
-
-    def _plain(self, value) -> str:
-        parts = [self.__call__(subitem) for subitem in value]
-        return "".join(parts)
-
-    @staticmethod
-    def _str(value) -> str:
-        # escape \
-        return value.replace("\\", "\\\\")
-
     @staticmethod
     def _raw_inline(value) -> str:
         _, line = value
@@ -115,13 +119,9 @@ def _raw_block(self, item) -> str:
         _, line = item
         return line
 
-    @staticmethod
-    def _soft_break(value) -> str:
-        return "\n"
-
-    @staticmethod
-    def _line_break(value) -> str:
-        return "\n"
+    def _soft_break(self, value) -> str:
+        incr = 0 if not self._indent_trace else self._indent_trace[-1]
+        return "\n" + self._get_indent(incr=incr)
 
     def _make_content(self, content):
         parts = []
@@ -142,10 +142,16 @@ def _header(self, value: tuple[int, Any, list[dict[str, str]]]) -> str:
     def _image(self, value) -> str:
         (ident, _, keyvals), caption, (dest, typef) = value
         # it seems like ident and keyvals are not relevant for markdown
-        assert caption
-        assert typef == "fig:"
 
-        caption = "".join([self.__call__(i) for i in caption])
+        if not caption:
+            # not sure if this can be reached, just to be safe
+            raise ValueError("Figure missing a caption")
+
+        if not typef.startswith("fig:"):
+            # not sure if this can be reached, just to be safe
+            raise ValueError(f"Cannot deal with figure of type '{typef}'")
+
+        caption = "".join(self.__call__(i) for i in caption)
         content = f"![{caption}]({dest})"
         return content
 
@@ -215,7 +221,7 @@ def _parse_div(self, item) -> str:
         # note that in markdown, we basically just use the raw html
         (ident, classes, kvs), contents = item
 
-        # build diff tag
+        # build div tag
         tags = ["<div"]
         if ident:
             tags.append(f' id="{ident}"')
@@ -235,7 +241,8 @@ def _parse_div(self, item) -> str:
         start = "".join(tags)
         middle = []
         for content in contents:
-            middle.append(self.__call__(content))
+            with self._indented(spaces=2):
+                middle.append(self.__call__(content))
         end = "</div>"
         return "".join([start] + middle + [end])
 
@@ -244,14 +251,31 @@ def _link(self, item) -> str:
         txt_formatted = self._make_content(txt)
         return f"[{txt_formatted}]({src})"
 
+    def _make_list_item(self, items: str, list_marker: str):
+        # helper function used for bullet and ordered lists
+        parts = [self.__call__(subitem) for subitem in items]
+        content = "\n".join(parts)
+        return f"{self._get_indent()}{list_marker} {content}"
+
     def _bullet_list(self, item) -> str:
+        # we don't differentiate between lists starting with "-", "*", or "+".
+        list_marker = "-"
         parts = []
-        for subitem in item:
-            assert len(subitem) == 1
-            content = "".join(self.__call__(i) for i in subitem)
-            # indent the lines in lists if they contain line breaks
-            content = content.replace("\n", "\n  ")
-            parts.append(f"- {content}")
+        # bullet lists use 2 spaces for indentation to align "- "
+        with self._indented(spaces=2):
+            for subitem in item:
+                parts.append(self._make_list_item(subitem, list_marker=list_marker))
+        return "\n".join(parts)
+
+    def _ordered_list(self, item) -> str:
+        # we don't make use of num_type and sep_type, which just indicates that
+        # numbers are presented as decimal numbers using a period
+        (start, num_type, sep_type), items = item
+        parts = []
+        # ordered lists use 3 spaces for indentation to align "1. "
+        with self._indented(spaces=3):
+            for i, subitem in enumerate(items, start=start):
+                parts.append(self._make_list_item(subitem, list_marker=f"{i}."))
         return "\n".join(parts)
 
     def _quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
@@ -260,6 +284,7 @@ def _quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
         try:
             sym = {"DoubleQuote": '"', "SingleQuote": "'"}[type_]
         except KeyError as exc:
+            # can probably not be reached, but let's be sure
             msg = (
                 f"The parsed document contains '{type_}', which is not "
                 "supported yet, please open an issue on GitHub"
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index e0af5723..8236f6fd 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -103,6 +103,10 @@ def _parse_header(
     def _post_process(self, res: str) -> str:
         # replace Latin1 space
         res = res.replace("\xa0", " ")
+
+        # pandoc creates ☒ and ☐ for to do items but GitHub requires [x] and [ ]
+        # for an item to be considered a to do item
+        res = res.replace("- ☒", "- [x]").replace("- ☐", "- [ ]")
         return res
 
     def generate(self) -> Card:
@@ -308,6 +312,8 @@ def parse_modelcard(path: str | Path) -> Card:
     - Quote symbols may differ, e.g. ``it’s`` becoming ``it's``.
     - The number of empty lines may differ, e.g. two empty lines being
       transformed into one empty line.
+    - The optional title of links is not preserved, as e.g. in
+      `[text](https://example.com "this disappears")`
     - Trailing whitespace is removed.
     - Tab indentation may be removed, e.g. in raw html.
     - The yaml part of the model card can have some non-semantic differences,
diff --git a/skops/card/tests/examples/toy-example.md b/skops/card/tests/examples/toy-example.md
new file mode 100644
index 00000000..44669f11
--- /dev/null
+++ b/skops/card/tests/examples/toy-example.md
@@ -0,0 +1,182 @@
+# This document tries to cover many common markdown contents
+
+This is not based on an existing model card and serves to increase test coverage. It also documents differences that may be found after parsing. There is no metainfo section.
+
+## H2
+
+### H3
+
+#### H4
+
+##### H5
+
+###### H6
+
+Parser 'preserves' some "quotation" marks.
+
+Parser doesn’t ‘preserve’ other “quotation” marks.
+
+## Italics
+
+One _way_ of doing it.
+Another *way* of doing it.
+
+## Bold
+
+One __way__ of doing it.
+Another **way** of doing it.
+
+## Strikethrough
+
+This is ~~not~~ the way.
+
+## Superscript and subscripts
+
+Really just html tags.
+
+E = mc<sup>2</sup>
+
+log<sub>2</sub>
+
+## Bullet lists
+
+Pandoc does not differentiate between different notations, so we always use -, not * or +.
+
+* using
+* asterisk
+
+or
+
+- using
+- minus
+  with line break
+
+or
+
++ using plus
+
+Finally:
+
+- nesting
+  - is
+- indeed
+  - very
+    - possible
+  - to achieve
+
+## Ordered lists
+
+1. a normal
+2. ordered list
+
+or
+
+1. an ordered
+2. list
+   1. with
+   2. indentation
+3. is possible
+
+## Mixed lists
+
+1. it’s
+2. possible
+   - to
+   - mix
+3. ordered _and_ unordered
+
+## TODOs
+
+- [x] This
+- [ ] is
+- [x] **done**
+
+## Links
+
+[a link](https://skops.readthedocs.io/)
+
+The "title" is not parsed by pandoc
+
+[a link](https://skops.readthedocs.io/ "this disappears")
+
+[a link to a file](./toy-example.md)
+
+References are resolved, so `[1]` below is replaced by the actual link:
+
+[a link with reference][1]
+
+A plain link to https://skops.readthedocs.io/ used inside of text.
+
+[1]: https://skops.readthedocs.io/
+
+## Images
+
+![skops logo](https://github.com/skops-dev/skops/blob/main/docs/images/logo.png)
+
+### Using html
+
+<img src="https://github.com/skops-dev/skops/blob/main/docs/images/logo.png" alt="logo" width="100"/>
+
+## Quotes
+
+> Someone said something important
+
+> I quote wise words:
+> > Someone said something important
+
+## Tables
+
+| Header 0     | Header 1       |
+|--------------|----------------|
+| Some content | More content   |
+| _Even more_  | This is **it** |
+
+Empty tables are legal
+
+| What now?   |
+|-------------|
+
+## Inline code
+
+Some `inline` code.
+
+`A whole line`
+
+## Code blocks
+
+```
+A raw
+
+code block
+```
+
+With language
+
+```python
+def foo():
+  return 0
+  
+def bar():
+  return 1
+```
+
+## Raw HTML
+<p hidden>Cryptids of Revachol:</p>
+
+<dl>
+    <dt>Beast of Bodmin</dt>
+    <dd>A large feline inhabiting Bodmin Moor.</dd>
+
+    <dt>Morgawr</dt>
+    <dd>A sea serpent.</dd>
+
+    <dt>Owlman</dt>
+    <dd>A giant owl-like creature.</dd>
+</dl>
+
+## Div
+
+The "id" tag may change in order
+<div class="warning" somekey key="with value" id="123">
+  <p>Divs are possible</p>
+</div>
diff --git a/skops/card/tests/examples/toy-example.md.diff b/skops/card/tests/examples/toy-example.md.diff
new file mode 100644
index 00000000..9c00ed2a
--- /dev/null
+++ b/skops/card/tests/examples/toy-example.md.diff
@@ -0,0 +1,90 @@
+--- 
++++ 
+@@ -0,0 +1 @@
++
+@@ -17 +18 @@
+-Parser doesn’t ‘preserve’ other “quotation” marks.
++Parser doesn’t 'preserve' other "quotation" marks.
+@@ -22 +23 @@
+-Another *way* of doing it.
++Another _way_ of doing it.
+@@ -26 +27 @@
+-One __way__ of doing it.
++One **way** of doing it.
+@@ -45,2 +46,2 @@
+-* using
+-* asterisk
++- using
++- asterisk
+@@ -56 +57 @@
+-+ using plus
++- using plus
+@@ -100 +101 @@
+-[a link](https://skops.readthedocs.io/ "this disappears")
++[a link](https://skops.readthedocs.io/)
+@@ -106 +107 @@
+-[a link with reference][1]
++[a link with reference](https://skops.readthedocs.io/)
+@@ -109,2 +109,0 @@
+-
+-[1]: https://skops.readthedocs.io/
+@@ -164 +163,6 @@
+-<p hidden>Cryptids of Revachol:</p>
++
++<p hidden>
++
++Cryptids of Revachol:
++
++</p>
+@@ -167,8 +171,37 @@
+-    <dt>Beast of Bodmin</dt>
+-    <dd>A large feline inhabiting Bodmin Moor.</dd>
+-
+-    <dt>Morgawr</dt>
+-    <dd>A sea serpent.</dd>
+-
+-    <dt>Owlman</dt>
+-    <dd>A giant owl-like creature.</dd>
++
++<dt>
++
++Beast of Bodmin
++
++</dt>
++
++<dd>
++
++A large feline inhabiting Bodmin Moor.
++
++</dd>
++
++<dt>
++
++Morgawr
++
++</dt>
++
++<dd>
++
++A sea serpent.
++
++</dd>
++
++<dt>
++
++Owlman
++
++</dt>
++
++<dd>
++
++A giant owl-like creature.
++
++</dd>
++
+@@ -180,3 +213,2 @@
+-<div class="warning" somekey key="with value" id="123">
+-  <p>Divs are possible</p>
+-</div>
++
++<div id="123" class="warning" somekey key="with value"><p>Divs are possible</p></div>
diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
index b723c03e..a7650b07 100644
--- a/skops/card/tests/test_parser.py
+++ b/skops/card/tests/test_parser.py
@@ -1,5 +1,7 @@
 import difflib
+import json
 import os
+import re
 from pathlib import Path
 
 import numpy as np
@@ -8,7 +10,7 @@
 from sklearn.linear_model import LinearRegression
 
 from skops.card import Card, parse_modelcard
-from skops.card._parser import check_pandoc_installed
+from skops.card._parser import PandocParser, check_pandoc_installed
 
 try:
     check_pandoc_installed()
@@ -44,11 +46,14 @@ def card(fit_model, tmp_path):
 
 
 EXAMPLE_CARDS = [
+    # actual model cards from HF hub
     "bert-base-uncased.md",
     "clip-vit-large-patch14.md",
     "gpt2.md",
     "specter.md",
     "vit-base-patch32-224-in21k.md",
+    # not a model card
+    "toy-example.md",
 ]
 
 
@@ -72,11 +77,12 @@ def assert_readme_files_almost_equal(file0, file1, diff):
         readme1 = f.readlines()
 
     sep = "---\n"
-    idx0, idx1 = readme0[1:].index(sep) + 1, readme1[1:].index(sep) + 1
-    meta0, meta1 = readme0[1:idx0], readme1[1:idx1]
-    readme0, readme1 = readme0[idx0:], readme1[idx1:]
-
-    _assert_meta_equal(meta0, meta1)
+    # we look for 2nd occurrence, so skip first line to not match 1st occurrence
+    if sep in readme0[1:]:  # only check if metainfo is present
+        idx0, idx1 = readme0[1:].index(sep) + 1, readme1[1:].index(sep) + 1
+        meta0, meta1 = readme0[1:idx0], readme1[1:idx1]
+        readme0, readme1 = readme0[idx0:], readme1[idx1:]
+        _assert_meta_equal(meta0, meta1)
 
     # exclude trivial case of both being empty
     assert readme0
@@ -117,3 +123,47 @@ def test_example_model_cards(tmp_path, file_name):
     parsed_card.save(file1)
 
     assert_readme_files_almost_equal(file0, file1, diff)
+
+
+def test_unknown_pandoc_item_raises():
+    source = json.dumps(
+        {
+            "pandoc-api-version": [1, 22, 2, 1],
+            "meta": {},
+            "blocks": [
+                {
+                    "t": "Header",
+                    "c": [1, ["section", [], []], [{"t": "Str", "c": "section"}]],
+                },
+                {"c": "valid", "t": "Str"},
+                {"t": "does-not-exist", "c": []},
+                {"c": "okay", "t": "Str"},
+            ],
+        }
+    )
+    parser = PandocParser(source)
+    msg = (
+        "The parsed document contains 'does-not-exist', which is not "
+        "supported yet, please open an issue on GitHub"
+    )
+    with pytest.raises(ValueError, match=re.escape(msg)):
+        parser.generate()
+
+
+def test_content_without_section_raises():
+    source = json.dumps(
+        {
+            "pandoc-api-version": [1, 22, 2, 1],
+            "meta": {},
+            "blocks": [
+                {"c": "whoops", "t": "Str"},
+            ],
+        }
+    )
+    parser = PandocParser(source)
+    msg = (
+        "Trying to add content but there is no current section, this is probably a "
+        "bug, please open an issue on GitHub"
+    )
+    with pytest.raises(ValueError, match=re.escape(msg)):
+        parser.generate()

From 08505f92e8945dc6cb0d94a92cdb5c3d6ff10f09 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Thu, 5 Jan 2023 15:29:53 +0100
Subject: [PATCH 33/47] Install pandoc on linux CI to test parser

---
 .github/workflows/build-test.yml | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/.github/workflows/build-test.yml b/.github/workflows/build-test.yml
index 16173cf9..106d5ae6 100644
--- a/.github/workflows/build-test.yml
+++ b/.github/workflows/build-test.yml
@@ -61,6 +61,9 @@ jobs:
           then pip install --pre --extra-index https://pypi.anaconda.org/scipy-wheels-nightly/simple scikit-learn;
           else pip install "scikit-learn~=${{ matrix.sklearn_version }}";
         fi
+        if [ ${{ matrix.os }} == "ubuntu-latest" ];
+          then wget -q https://github.com/jgm/pandoc/releases/download/2.19.2/pandoc-2.19.2-1-amd64.deb && sudo dpkg -i pandoc-2.19.2-1-amd64.deb;
+        fi
         python --version
         pip --version
         pip list

From d0aa9df1577e05984a0b739ccbc2973d2303ef92 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 17 Jan 2023 16:14:15 +0100
Subject: [PATCH 34/47] Add documentation about parsing model cards

---
 docs/model_card.rst | 50 +++++++++++++++++++++++++++++++++++++++++++--
 1 file changed, 48 insertions(+), 2 deletions(-)

diff --git a/docs/model_card.rst b/docs/model_card.rst
index 7a6c124d..9d4bffa7 100644
--- a/docs/model_card.rst
+++ b/docs/model_card.rst
@@ -11,6 +11,9 @@ beginning of it, following with the content of the model card in markdown
 format. The metadata section is used to make models searchable on the Hub, and
 get the inference API and the widgets on the website working.
 
+Metadata
+--------
+
 The metadata part of the file needs to follow the specifications `here
 <https://huggingface.co/docs/hub/models-cards#model-card-metadata>`__. It
 includes simple attributes of your models such as the task you're solving,
@@ -40,6 +43,9 @@ Here's an example of the metadata section of the ``README.md`` file:
 ``skops`` creates this section of the file for you, and you almost never need
 to touch it yourself.
 
+Model Card Content
+------------------
+
 The markdown part does not necessarily need to follow any specification in
 terms of information passed, which gives the user a lot of flexibility. The
 markdown part of the ``README.md`` file comes with a couple of defaults provided
@@ -90,8 +96,8 @@ as well as adding some subsections with plots below that, you can call the
     })
 
 Furthermore, you can select existing sections (as well as their subsections)
-using :meth:`Card.select`, and you can delete sections using
-:meth:`Card.delete`:
+using :meth:`.Card.select`, and you can delete sections using
+:meth:`.Card.delete`:
 
 .. code-block:: python
 
@@ -103,3 +109,43 @@ using :meth:`Card.select`, and you can delete sections using
 
 To see how you can use the API in ``skops`` to create a model card, please
 refer to :ref:`sphx_glr_auto_examples_plot_model_card.py`.
+
+Saving and Loading Model Cards
+------------------------------
+
+Once you have finished creating and modifying the model card, you can save it
+using the :meth:`.Card.save` method:
+
+.. code-block:: python
+
+    card.save("README.md")
+
+This renders the content of the model card to markdown format and stores it in
+the indicated file. It is now ready to be uploaded to Hugging Face Hub.
+
+If you have a finished model card but want to load it to make some modifications,
+you can use the function :func:`skops.card.parse_modelcard`. This function
+parses the model card back into a :class:`.Card` instance that you can work on
+further:
+
+.. code-block:: python
+
+    from skops import card
+    model_card = card.parse_modelcard("README.md")
+    model_card.add(**{"A new section": "Some new content"})
+    model_card.save("README.md")
+
+When the card is parsed, some minor details of the model card can change, e.g.
+if you used different column alignment than the default, this could change, as
+well as removing excess empty lines or trailing whitespace. However, the content
+itself should be exactly the same. All known deviations are documented in the
+`parse_modelcard docs
+<https://skops.readthedocs.io/en/stable/modules/classes.html#skops.card.metadata_from_config>`_
+
+For the parsing part, we rely on `pandoc <https://pandoc.org/>`_. If you haven't
+installed it, please follow `these instructions
+<https://pandoc.org/installing.html>`_. The advantage of using pandoc is that
+it's a very mature library and that it supports many different document formats.
+Therefore, it should be possible to parse model cards even if they use a format
+that's not markdown, for instance reStructuredText, org, or asciidoc. For
+saving, we only support markdown, though.

From 5da3397134f909a4ce3d6bea1429a63492165e09 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 17 Jan 2023 16:40:46 +0100
Subject: [PATCH 35/47] Fix incorrect link in docs

---
 docs/model_card.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/model_card.rst b/docs/model_card.rst
index 9d4bffa7..ccfd6cde 100644
--- a/docs/model_card.rst
+++ b/docs/model_card.rst
@@ -140,7 +140,7 @@ if you used different column alignment than the default, this could change, as
 well as removing excess empty lines or trailing whitespace. However, the content
 itself should be exactly the same. All known deviations are documented in the
 `parse_modelcard docs
-<https://skops.readthedocs.io/en/stable/modules/classes.html#skops.card.metadata_from_config>`_
+<https://skops.readthedocs.io/en/stable/modules/classes.html#skops.card.parse_modelcard>`_
 
 For the parsing part, we rely on `pandoc <https://pandoc.org/>`_. If you haven't
 installed it, please follow `these instructions

From 2cb998e756b4d97a10f2f82e7e4dacf7e3471ae6 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 17 Jan 2023 17:03:45 +0100
Subject: [PATCH 36/47] Clean up test_parser.py

It contained remnants from an old test that has been removed since then.
---
 skops/card/tests/test_parser.py | 30 +-----------------------------
 1 file changed, 1 insertion(+), 29 deletions(-)

diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
index a7650b07..30f84f00 100644
--- a/skops/card/tests/test_parser.py
+++ b/skops/card/tests/test_parser.py
@@ -4,12 +4,10 @@
 import re
 from pathlib import Path
 
-import numpy as np
 import pytest
 import yaml  # type: ignore
-from sklearn.linear_model import LinearRegression
 
-from skops.card import Card, parse_modelcard
+from skops.card import parse_modelcard
 from skops.card._parser import PandocParser, check_pandoc_installed
 
 try:
@@ -19,32 +17,6 @@
     pytest.skip(reason="These tests require a recent pandoc", allow_module_level=True)
 
 
-@pytest.fixture
-def fit_model():
-    X = np.array([[1, 1], [1, 2], [2, 2], [2, 3]])
-    y = np.dot(X, np.array([1, 2])) + 3
-    reg = LinearRegression().fit(X, y)
-    return reg
-
-
-@pytest.fixture
-def card(fit_model, tmp_path):
-    card = Card(fit_model)
-
-    try:
-        import matplotlib.pyplot as plt
-
-        fig, ax = plt.subplots()
-        ax.plot([0, 1])
-        fig.savefig(tmp_path / "my-throwaway-plot.png")
-        card.add_plot(**{"My plots/My first plot": "my-throwaway-plot.png"})
-    except ImportError:
-        pass
-
-    card.add_table(**{"A table": {"col0": [0, 1], "col1": [2, 3]}})
-    return card
-
-
 EXAMPLE_CARDS = [
     # actual model cards from HF hub
     "bert-base-uncased.md",

From 1922bc147ae85d06f7effde3e32d4fda63cc78ae Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Wed, 18 Jan 2023 12:24:55 +0100
Subject: [PATCH 37/47] Move changes entry to v0.5

Was added to v0.4 but that version is already released.
---
 docs/changes.rst | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/docs/changes.rst b/docs/changes.rst
index f1aa7739..fc579c53 100644
--- a/docs/changes.rst
+++ b/docs/changes.rst
@@ -9,6 +9,14 @@ skops Changelog
     :depth: 1
     :local:
 
+v0.5
+----
+- :class:`.card.Card` now allows to add content to existing sections, using a
+  ``/`` to separate the subsections. E.g. use ``card.add(**{"Existing
+  section/New section": "content"})`` to add "content" to a new subsection called
+  "New section" in an existing section called "Existing section". :pr:`203` by
+  `Benjamin Bossan`_.
+
 v0.4
 ----
 - :func:`.io.dump` and :func:`.io.load` now work with file like objects,
@@ -21,11 +29,6 @@ v0.4
   :pr:`242` by `Merve Noyan`_.
 - Persistence now supports bytes and bytearrays, added tests to verify that
   LightGBM, XGBoost, and CatBoost work now. :pr:`244` by `Benjamin Bossan`_.
-- :class:`.card.Card` now allows to add content to existing sections, using a
-  ``/`` to separate the subsections. E.g. use ``card.add(**{"Existing
-  section/New section": "content"})`` to add "content" a new subsection called
-  "New section" to an existing section called "Existing section". :pr:`203` by
-  `Benjamin Bossan`_.
 
 v0.3
 ----

From 709e079c6f22dc95bc7267beb267cbd8bc45671c Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 20 Jan 2023 11:46:22 +0100
Subject: [PATCH 38/47] Reviewer comments: wording, period in err msg

---
 docs/model_card.rst   | 2 +-
 skops/card/_parser.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/model_card.rst b/docs/model_card.rst
index ccfd6cde..d3b726d4 100644
--- a/docs/model_card.rst
+++ b/docs/model_card.rst
@@ -148,4 +148,4 @@ installed it, please follow `these instructions
 it's a very mature library and that it supports many different document formats.
 Therefore, it should be possible to parse model cards even if they use a format
 that's not markdown, for instance reStructuredText, org, or asciidoc. For
-saving, we only support markdown, though.
+saving, we only support markdown for now.
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 8236f6fd..3d00599a 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -75,7 +75,7 @@ def _add_content(self, content: str, section: Section | None) -> None:
             # not illegal in markdown, but we don't handle it yet.
             raise ValueError(
                 "Trying to add content but there is no current section, "
-                "this is probably a bug, please open an issue on GitHub"
+                "this is probably a bug, please open an issue on GitHub."
             )
 
         if not section.content:

From 08f44c4a04edb7ea261ec91943c3de9b8efcdd33 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 20 Jan 2023 14:34:21 +0100
Subject: [PATCH 39/47] Use packaging Version for version comparison

Add packaging as an explicit dependency. Kinda arbitrarily set min
version to be 17.0, which was released 5 years ago.
---
 skops/_min_dependencies.py |  1 +
 skops/card/_parser.py      | 31 ++++++++-----------------------
 2 files changed, 9 insertions(+), 23 deletions(-)

diff --git a/skops/_min_dependencies.py b/skops/_min_dependencies.py
index 35219a12..1ff8b699 100644
--- a/skops/_min_dependencies.py
+++ b/skops/_min_dependencies.py
@@ -25,6 +25,7 @@
     "sphinx-prompt": ("1.3.0", "docs", None),
     "sphinx-issues": ("1.2.0", "docs", None),
     "matplotlib": ("3.3", "docs, tests", None),
+    "packaging": ("17.0", "install", None),
     "pandas": ("1", "docs, tests", None),
     # required for persistence tests of external libraries
     "lightgbm": ("3", "tests", None),
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 3d00599a..517be702 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -12,16 +12,17 @@
 import subprocess
 from pathlib import Path
 from tempfile import mkdtemp
-from typing import Any, Literal, Sequence
+from typing import Any, Literal
 
 import yaml  # type: ignore
+from packaging.version import Version
 
 from skops.card import Card
 from skops.card._model_card import Section
 
 from ._markup import Markdown, PandocItem
 
-PANDOC_MIN_VERSION = (2, 19, 0)
+PANDOC_MIN_VERSION = "2.19.0"
 
 
 class PandocParser:
@@ -140,7 +141,7 @@ def generate(self) -> Card:
         return card
 
 
-def _get_pandoc_version() -> list[int]:
+def _get_pandoc_version() -> str:
     """Shell out to retrieve the pandoc version
 
     Raises
@@ -161,29 +162,12 @@ def _get_pandoc_version() -> list[int]:
     if not version_info.startswith("pandoc "):
         raise RuntimeError("Could not determine version of pandoc")
 
-    _, _, actual_version = version_info.partition(" ")
-    pandoc_version = [int(v) for v in actual_version.split(".")]
+    _, _, pandoc_version = version_info.partition(" ")
     return pandoc_version
 
 
-def _check_version_greater_equal(
-    version: Sequence[int], min_version: Sequence[int]
-) -> None:
-    """Very bad version comparison function to ensure that the first version is
-    >= the second."""
-    for v1, v2 in zip(version, min_version):
-        if v1 > v2:
-            return
-
-        if v1 < v2:
-            raise ValueError(
-                "Pandoc version too low, expected at least "
-                f"{'.'.join(map(str, min_version))}"
-            )
-
-
 def check_pandoc_installed(
-    min_version: Sequence[int] | None = PANDOC_MIN_VERSION,
+    min_version: str | None = PANDOC_MIN_VERSION,
 ) -> None:
     """Check if pandoc is installed on the system
 
@@ -216,7 +200,8 @@ def check_pandoc_installed(
     if not min_version:
         return
 
-    _check_version_greater_equal(pandoc_version, min_version)
+    if Version(pandoc_version) < Version(min_version):
+        raise ValueError("Pandoc version too low, expected at least {min_version}")
 
 
 def _card_with_detached_metainfo(path: str | Path) -> tuple[str | Path, dict[str, Any]]:

From 7c416c41534f3f55f3c7cba8123eeac37f8c34a8 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 20 Jan 2023 14:35:55 +0100
Subject: [PATCH 40/47] Install pandoc with apt in CI

---
 .github/workflows/build-test.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/build-test.yml b/.github/workflows/build-test.yml
index 106d5ae6..6b340c0b 100644
--- a/.github/workflows/build-test.yml
+++ b/.github/workflows/build-test.yml
@@ -62,7 +62,7 @@ jobs:
           else pip install "scikit-learn~=${{ matrix.sklearn_version }}";
         fi
         if [ ${{ matrix.os }} == "ubuntu-latest" ];
-          then wget -q https://github.com/jgm/pandoc/releases/download/2.19.2/pandoc-2.19.2-1-amd64.deb && sudo dpkg -i pandoc-2.19.2-1-amd64.deb;
+          then sudo apt install pandoc;
         fi
         python --version
         pip --version

From b855e50ff5636ed754606593e8610e64a9bf06b8 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 20 Jan 2023 14:52:35 +0100
Subject: [PATCH 41/47] Investigate pandoc version issue

---
 .github/workflows/build-test.yml | 2 +-
 skops/card/_parser.py            | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/build-test.yml b/.github/workflows/build-test.yml
index 6b340c0b..31d5f669 100644
--- a/.github/workflows/build-test.yml
+++ b/.github/workflows/build-test.yml
@@ -62,7 +62,7 @@ jobs:
           else pip install "scikit-learn~=${{ matrix.sklearn_version }}";
         fi
         if [ ${{ matrix.os }} == "ubuntu-latest" ];
-          then sudo apt install pandoc;
+          then sudo apt install pandoc && pandoc --version;
         fi
         python --version
         pip --version
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 517be702..2dad8f45 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -201,7 +201,7 @@ def check_pandoc_installed(
         return
 
     if Version(pandoc_version) < Version(min_version):
-        raise ValueError("Pandoc version too low, expected at least {min_version}")
+        raise ValueError(f"Pandoc version too low, expected at least {min_version}")
 
 
 def _card_with_detached_metainfo(path: str | Path) -> tuple[str | Path, dict[str, Any]]:

From 2da5ea61db674a09478b32e22b04eaf32a3264c8 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Fri, 20 Jan 2023 15:02:19 +0100
Subject: [PATCH 42/47] Lower min required pandoc version to 2.9.0

---
 skops/card/_parser.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 2dad8f45..fecdd4d8 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -22,7 +22,7 @@
 
 from ._markup import Markdown, PandocItem
 
-PANDOC_MIN_VERSION = "2.19.0"
+PANDOC_MIN_VERSION = "2.9.0"
 
 
 class PandocParser:
@@ -201,7 +201,10 @@ def check_pandoc_installed(
         return
 
     if Version(pandoc_version) < Version(min_version):
-        raise ValueError(f"Pandoc version too low, expected at least {min_version}")
+        raise ValueError(
+            f"Pandoc version too low, expected at least {min_version}, "
+            f"got {pandoc_version} instead."
+        )
 
 
 def _card_with_detached_metainfo(path: str | Path) -> tuple[str | Path, dict[str, Any]]:

From 6d1f288baf6c5a38ff163560818402e9db425767 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Mon, 23 Jan 2023 14:04:30 +0100
Subject: [PATCH 43/47] Revert pandoc install to use gh + deb

Apt repo is very outdated.
---
 .github/workflows/build-test.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/build-test.yml b/.github/workflows/build-test.yml
index 31d5f669..106d5ae6 100644
--- a/.github/workflows/build-test.yml
+++ b/.github/workflows/build-test.yml
@@ -62,7 +62,7 @@ jobs:
           else pip install "scikit-learn~=${{ matrix.sklearn_version }}";
         fi
         if [ ${{ matrix.os }} == "ubuntu-latest" ];
-          then sudo apt install pandoc && pandoc --version;
+          then wget -q https://github.com/jgm/pandoc/releases/download/2.19.2/pandoc-2.19.2-1-amd64.deb && sudo dpkg -i pandoc-2.19.2-1-amd64.deb;
         fi
         python --version
         pip --version

From fb46a76cd8bcb12a899d0e92ccc41513ce339a85 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Mon, 23 Jan 2023 14:32:44 +0100
Subject: [PATCH 44/47] Add Figure type to parsing

Figure was added in Pandoc v3.0 and is more complex than Image, but also
more powerful. At the moment, we treat Figure just as Image.
---
 skops/card/_markup.py | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index 8ffa14b6..00801f07 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -49,6 +49,7 @@ def __init__(self):
             "Para": self._para,
             "Header": self._header,
             "Image": self._image,
+            "Figure": self._figure,
             "CodeBlock": self._code_block,
             "Code": self._code,
             "Table": self._table,
@@ -155,6 +156,19 @@ def _image(self, value) -> str:
         content = f"![{caption}]({dest})"
         return content
 
+    def _figure(self, value) -> str:
+        # Figure type was added in Pandoc v3.0
+        (ident, classes, keyvals), caption, (body,) = value
+
+        body_type = body["t"]
+        # we can only deal with plain figures for now
+        if body_type != "Plain":
+            raise ValueError(f"Cannot deal with figure of type '{body_type}'")
+
+        plain_fig = body["c"][0]["c"]
+        plain_fig[2][1] = "fig:"
+        return self._image(plain_fig)
+
     @staticmethod
     def _code_block(item: tuple[tuple[int, list[str], list[str]], str]) -> str:
         # a codeblock consists of: (id, classes, namevals) contents

From 30d3e5c403b2e563cadb10af9b6170da47e046d2 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 24 Jan 2023 12:17:30 +0100
Subject: [PATCH 45/47] Add pragmas for lines that are not covered

These are code paths that don't really make sense to test.
---
 skops/card/_markup.py | 8 ++++----
 skops/card/_parser.py | 5 +++--
 2 files changed, 7 insertions(+), 6 deletions(-)

diff --git a/skops/card/_markup.py b/skops/card/_markup.py
index 00801f07..7779a675 100644
--- a/skops/card/_markup.py
+++ b/skops/card/_markup.py
@@ -144,11 +144,11 @@ def _image(self, value) -> str:
         (ident, _, keyvals), caption, (dest, typef) = value
         # it seems like ident and keyvals are not relevant for markdown
 
-        if not caption:
+        if not caption:  # pragma: no cover
             # not sure if this can be reached, just to be safe
             raise ValueError("Figure missing a caption")
 
-        if not typef.startswith("fig:"):
+        if not typef.startswith("fig:"):  # pragma: no cover
             # not sure if this can be reached, just to be safe
             raise ValueError(f"Cannot deal with figure of type '{typef}'")
 
@@ -156,7 +156,7 @@ def _image(self, value) -> str:
         content = f"![{caption}]({dest})"
         return content
 
-    def _figure(self, value) -> str:
+    def _figure(self, value) -> str:  # pragma: no cover
         # Figure type was added in Pandoc v3.0
         (ident, classes, keyvals), caption, (body,) = value
 
@@ -297,7 +297,7 @@ def _quoted(self, item: tuple[dict[str, str], list[PandocItem]]) -> str:
         type_ = quote_type["t"]
         try:
             sym = {"DoubleQuote": '"', "SingleQuote": "'"}[type_]
-        except KeyError as exc:
+        except KeyError as exc:  # pragma: no cover
             # can probably not be reached, but let's be sure
             msg = (
                 f"The parsed document contains '{type_}', which is not "
diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index fecdd4d8..fd4dae38 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -83,7 +83,7 @@ def _add_content(self, content: str, section: Section | None) -> None:
             section.content = content
         elif isinstance(section.content, str):
             section.content = section.content + "\n\n" + content
-        else:
+        else:  # pragma: no cover
             # TODO: Content is a Formattable, no generic way to modify it --
             # should we require each Formattable to have an update method?
             raise ValueError(f"Could not modify content of {section.content}")
@@ -240,7 +240,8 @@ def _card_with_detached_metainfo(path: str | Path) -> tuple[str | Path, dict[str
         return path, metainfo
 
     idx_separator = text.find(sep_end)
-    if idx_separator < len(sep_start):  # separator shouldn't come earlier than this
+    if idx_separator < len(sep_start):  # pragma: no cover
+        # separator shouldn't come earlier than this
         return path, metainfo
 
     # https://black.readthedocs.io/en/stable/faq.html#why-are-flake8-s-e203-and-w503-violated

From de1837ec9ca4e96edba628aacf8577854c6dd5c3 Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 24 Jan 2023 12:18:17 +0100
Subject: [PATCH 46/47] Add more unit tests, get to 100% coverage

- test error when trying to use markup != markdown
- test no version check for pandoc
- test min pandoc version too low
- test pandoc not installed
- test pandoc version cannot be determined
---
 skops/card/_parser.py           |  6 +++--
 skops/card/tests/test_parser.py | 39 +++++++++++++++++++++++++++++++++
 2 files changed, 43 insertions(+), 2 deletions(-)

diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index fd4dae38..86f80861 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -160,7 +160,8 @@ def _get_pandoc_version() -> str:
     )
     version_info = str(proc.stdout.decode("utf-8")).split("\n", 1)[0]
     if not version_info.startswith("pandoc "):
-        raise RuntimeError("Could not determine version of pandoc")
+        # pandoc is installed but version cannot be determined
+        raise RuntimeError("Could not determine version of pandoc.")
 
     _, _, pandoc_version = version_info.partition(" ")
     return pandoc_version
@@ -190,10 +191,11 @@ def check_pandoc_installed(
     try:
         pandoc_version = _get_pandoc_version()
     except FileNotFoundError as exc:
+        # pandoc is not installed
         msg = (
             "This feature requires the pandoc library to be installed on your system, "
             "please follow these install instructions: "
-            "https://pandoc.org/installing.html"
+            "https://pandoc.org/installing.html."
         )
         raise FileNotFoundError(msg) from exc
 
diff --git a/skops/card/tests/test_parser.py b/skops/card/tests/test_parser.py
index 30f84f00..b74486fe 100644
--- a/skops/card/tests/test_parser.py
+++ b/skops/card/tests/test_parser.py
@@ -3,6 +3,7 @@
 import os
 import re
 from pathlib import Path
+from unittest.mock import Mock, patch
 
 import pytest
 import yaml  # type: ignore
@@ -139,3 +140,41 @@ def test_content_without_section_raises():
     )
     with pytest.raises(ValueError, match=re.escape(msg)):
         parser.generate()
+
+
+def test_unsupported_markup_raises():
+    match = re.escape("Markup of type does-not-exist is not supported (yet)")
+    with pytest.raises(ValueError, match=match):
+        PandocParser(source="", markup_type="does-not-exist")
+
+
+def test_check_pandoc_installed_no_min_version_works():
+    # check that it doesn't raise
+    check_pandoc_installed(min_version=None)
+
+
+def test_check_pandoc_installed_min_version_too_high_raises():
+    match = re.escape("Pandoc version too low, expected at least 999.9.9, got")
+    with pytest.raises(ValueError, match=match):
+        check_pandoc_installed(min_version="999.9.9")
+
+
+def test_pandoc_not_installed():
+    def raise_filenotfound(*args, **kwargs):
+        # error raised when trying to run subprocess on non-existing command
+        raise FileNotFoundError("[Errno 2] No such file or directory: 'pandoc'")
+
+    with patch("subprocess.run", raise_filenotfound):
+        match = re.escape(
+            "This feature requires the pandoc library to be installed on your system"
+        )
+        with pytest.raises(FileNotFoundError, match=match):
+            check_pandoc_installed()
+
+
+def test_pandoc_version_cannot_be_determined():
+    mock = Mock()
+    with patch("subprocess.run", mock):
+        match = re.escape("Could not determine version of pandoc")
+        with pytest.raises(RuntimeError, match=match):
+            check_pandoc_installed()

From 6472ebfbd747c24b549f18c60ae7c4fc3ceac8ef Mon Sep 17 00:00:00 2001
From: Benjamin Bossan <benjamin.bossan@gmail.com>
Date: Tue, 24 Jan 2023 13:18:35 +0100
Subject: [PATCH 47/47] Fix incorrect docstring

---
 skops/card/_parser.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/skops/card/_parser.py b/skops/card/_parser.py
index 86f80861..86d4f120 100644
--- a/skops/card/_parser.py
+++ b/skops/card/_parser.py
@@ -151,7 +151,7 @@ def _get_pandoc_version() -> str:
 
     Returns
     -------
-    pandoc_version : list[int]
+    pandoc_version : str
         The pandoc version as a list of ints.
     """
     proc = subprocess.run(