From 57c20d2638a116df64489c60258606b6707c049f Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Wed, 6 Dec 2023 20:48:41 +0100 Subject: [PATCH 1/6] fix: updated docs --- docs/evaluation/utils.py | 11 +- docs/performance_ner.ipynb | 654 ++++++++++++++++++------------------- 2 files changed, 318 insertions(+), 347 deletions(-) diff --git a/docs/evaluation/utils.py b/docs/evaluation/utils.py index 99b8b548..7de29704 100644 --- a/docs/evaluation/utils.py +++ b/docs/evaluation/utils.py @@ -6,13 +6,12 @@ import numpy as np import pandas as pd import spacy +from evaluation.datasets import datasets from spacy.language import Language from spacy.scorer import Scorer from spacy.tokens import Doc from spacy.training import Example -from evaluation.datasets import datasets - def bootstrap( examples: List[Example], @@ -74,7 +73,13 @@ def compute_mean_and_ci(scores: List[Dict[str, Any]]) -> Dict[str, Any]: "MISC": "Misc.", } - labels = {label for score in scores for label in score["ents_per_type"]} + def get_ents_per_type(score): + x = score["ents_per_type"] + if x is None: + return [] + return x + + labels = {label for score in scores for label in get_ents_per_type(score)} for label in labels: label_f = [ diff --git a/docs/performance_ner.ipynb b/docs/performance_ner.ipynb index a3ba0659..2a13d263 100644 --- a/docs/performance_ner.ipynb +++ b/docs/performance_ner.ipynb @@ -86,7 +86,7 @@ }, { "cell_type": "code", - "execution_count": 24, + "execution_count": 2, "metadata": { "tags": [ "remove-input" @@ -140,7 +140,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 3, "metadata": { "tags": [ "remove-cell" @@ -154,7 +154,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 4, "metadata": { "tags": [ "remove-cell" @@ -178,7 +178,7 @@ "dane (test): Loading prediction for da_core_news_md-3.5.0\n", "dane (test): Loading prediction for da_core_news_sm-3.5.0\n", "dane (test): Loading prediction for openai/gpt-3.5-turbo (02/05/23)\n", - "dane (test): Running openai/gpt-4 (02/05/23)\n" + "dane (test): Loading prediction for openai/gpt-4 (02/05/23)\n" ] } ], @@ -191,7 +191,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 5, "metadata": { "tags": [ "remove-cell" @@ -220,7 +220,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 6, "metadata": { "tags": [ "remove-cell" @@ -282,7 +282,7 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 7, "metadata": { "tags": [ "remove-cell" @@ -300,7 +300,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 8, "metadata": { "tags": [ "remove-input" @@ -311,140 +311,140 @@ "data": { "text/html": [ "\n", - "\n", + "
\n", " \n", " \n", " \n", - " \n", - " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", "
F1 score with 95% confidence interval calculated using bootstrapping with 500 samples.

| Models | Average | Location | Person | Organization | Misc. |
|---|---|---|---|---|---|
| da_dacy_large_trf-0.2.0 | 85.4 (81.2, 88.9) | 89.5 (84.0, 94.7) | 92.6 (89.0, 95.4) | 79.0 (72.5, 84.6) | 79.0 (70.8, 86.0) |
| da_dacy_medium_trf-0.2.0 | 84.9 (81.0, 88.5) | 86.8 (81.2, 92.3) | 92.7 (89.2, 95.6) | 78.7 (71.8, 85.0) | 78.7 (70.6, 86.1) |
| da_dacy_small_trf-0.2.0 | 82.7 (79.3, 85.9) | 84.2 (78.3, 89.8) | 92.2 (88.5, 95.1) | 75.9 (69.3, 81.7) | 75.7 (68.8, 81.8) |
| saattrupdan/nbailab-base-ner-scandi | 86.3 (82.4, 89.7) | 88.6 (83.0, 93.3) | 95.1 (92.4, 97.8) | 80.3 (73.6, 85.8) | 78.6 (69.4, 86.0) |
| alexandrainst/da-ner-base | 70.7 (66.2, 75.2) | 84.8 (77.8, 91.0) | 90.3 (86.3, 93.9) | 64.7 (57.0, 71.3) | |
| da_core_news_trf-3.5.0 | 79.0 (75.1, 82.3) | 82.1 (75.5, 88.5) | 91.6 (88.2, 94.5) | 68.0 (61.0, 75.2) | 69.0 (61.1, 77.3) |
| da_core_news_lg-3.5.0 | 74.6 (70.8, 78.1) | 81.6 (75.3, 88.2) | 85.5 (81.1, 89.9) | 62.7 (54.8, 70.3) | 64.4 (55.9, 72.8) |
| da_core_news_md-3.5.0 | 71.2 (66.9, 75.2) | 76.8 (69.9, 83.6) | 82.6 (77.8, 87.0) | 58.2 (49.6, 66.7) | 61.8 (52.6, 70.6) |
| da_core_news_sm-3.5.0 | 64.4 (59.7, 68.5) | 61.6 (52.2, 69.9) | 80.1 (74.9, 85.1) | 49.0 (39.0, 57.5) | 58.4 (49.8, 67.1) |
| openai/gpt-3.5-turbo (02/05/23) | 57.5 (52.3, 62.2) | 50.7 (41.9, 59.2) | 81.9 (76.8, 86.5) | 55.7 (47.1, 63.7) | |
| openai/gpt-4 (02/05/23) | 70.1 (66.0, 74.3) | 78.9 (71.5, 85.7) | 85.3 (80.4, 89.5) | 72.0 (65.4, 78.5) | |
\n" ], "text/plain": [ - "" + "" ] }, - "execution_count": 6, + "execution_count": 8, "metadata": {}, "output_type": "execute_result" } @@ -524,26 +524,39 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 9, "metadata": { "tags": [ "remove-cell" ] }, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "functools.partial(, model='gpt-4')" + ] + }, + "execution_count": 9, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "from functools import partial\n", "from evaluation.models import openai_model_loader_fine_ner\n", "MODELS_ = MODELS.copy()\n", "MODELS_[\"openai/gpt-3.5-turbo (02/05/23)\"] = partial(openai_model_loader_fine_ner, model=\"gpt-3.5-turbo\")\n", "MODELS_[\"openai/gpt-4 (02/05/23)\"] = partial(openai_model_loader_fine_ner, model=\"gpt-4\")\n", - "MODELS.pop(\"openai/gpt-3.5-turbo (02/05/23)\")\n", - "MODELS.pop(\"openai/gpt-4 (02/05/23)\")\n" + "\n", + "# don't test openai models on DANSK\n", + "MODELS_.pop(\"openai/gpt-3.5-turbo (02/05/23)\")\n", + "MODELS_.pop(\"openai/gpt-4 (02/05/23)\")\n" ] }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 10, "metadata": { "tags": [ "remove-cell" @@ -589,81 +602,7 @@ "dansk (test): Loading prediction for da_core_news_md-3.5.0\n", "dansk (train): Loading prediction for da_core_news_sm-3.5.0\n", "dansk (dev): Loading prediction for da_core_news_sm-3.5.0\n", - "dansk (test): Loading prediction for da_core_news_sm-3.5.0\n", - "dansk (test): Running openai/gpt-3.5-turbo (02/05/23)\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "Found cached dataset parquet (/Users/au561649/.cache/huggingface/datasets/chcaa___parquet/chcaa--DANSK-8622a47955f5c4cb/0.0.0/2a3b91fbd88a2c90d1dbbb32b460cf621d31bd5b05b934492fdef7d8d6f236ec)\n", - "Found cached dataset parquet (/Users/au561649/.cache/huggingface/datasets/chcaa___parquet/chcaa--DANSK-8622a47955f5c4cb/0.0.0/2a3b91fbd88a2c90d1dbbb32b460cf621d31bd5b05b934492fdef7d8d6f236ec)\n", - "Found cached dataset parquet (/Users/au561649/.cache/huggingface/datasets/chcaa___parquet/chcaa--DANSK-8622a47955f5c4cb/0.0.0/2a3b91fbd88a2c90d1dbbb32b460cf621d31bd5b05b934492fdef7d8d6f236ec)\n" - ] - }, - { - "name": "stdout", - "output_type": "stream", - "text": [ - "dansk (test): Running openai/gpt-4 (02/05/23)\n" - ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "Found cached dataset parquet (/Users/au561649/.cache/huggingface/datasets/chcaa___parquet/chcaa--DANSK-8622a47955f5c4cb/0.0.0/2a3b91fbd88a2c90d1dbbb32b460cf621d31bd5b05b934492fdef7d8d6f236ec)\n", - "Found cached dataset parquet (/Users/au561649/.cache/huggingface/datasets/chcaa___parquet/chcaa--DANSK-8622a47955f5c4cb/0.0.0/2a3b91fbd88a2c90d1dbbb32b460cf621d31bd5b05b934492fdef7d8d6f236ec)\n", - "Found cached dataset parquet (/Users/au561649/.cache/huggingface/datasets/chcaa___parquet/chcaa--DANSK-8622a47955f5c4cb/0.0.0/2a3b91fbd88a2c90d1dbbb32b460cf621d31bd5b05b934492fdef7d8d6f236ec)\n" - ] - }, - { - "ename": "ConnectionError", - "evalue": "HTTPSConnectionPool(host='api.openai.com', port=443): Max retries exceeded with url: /v1/chat/completions (Caused by NameResolutionError(\": Failed to resolve 'api.openai.com' ([Errno 8] nodename nor servname provided, or not known)\"))", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mgaierror\u001b[0m Traceback (most recent call last)", - "File 
[... intermediate traceback frames omitted: the request issued by spacy_llm's OpenAI backend via requests/urllib3 failed because the host 'api.openai.com' could not be resolved ...]
}\n\u001b[1;32m 588\u001b[0m send_kwargs\u001b[39m.\u001b[39mupdate(settings)\n\u001b[0;32m--> 589\u001b[0m resp \u001b[39m=\u001b[39m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49msend(prep, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49msend_kwargs)\n\u001b[1;32m 591\u001b[0m \u001b[39mreturn\u001b[39;00m resp\n", - "File \u001b[0;32m~/.virtualenvs/dacy/lib/python3.10/site-packages/requests/sessions.py:703\u001b[0m, in \u001b[0;36mSession.send\u001b[0;34m(self, request, **kwargs)\u001b[0m\n\u001b[1;32m 700\u001b[0m start \u001b[39m=\u001b[39m preferred_clock()\n\u001b[1;32m 702\u001b[0m \u001b[39m# Send the request\u001b[39;00m\n\u001b[0;32m--> 703\u001b[0m r \u001b[39m=\u001b[39m adapter\u001b[39m.\u001b[39;49msend(request, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m 705\u001b[0m \u001b[39m# Total elapsed time of the request (approximately)\u001b[39;00m\n\u001b[1;32m 706\u001b[0m elapsed \u001b[39m=\u001b[39m preferred_clock() \u001b[39m-\u001b[39m start\n", - "File \u001b[0;32m~/.virtualenvs/dacy/lib/python3.10/site-packages/requests/adapters.py:519\u001b[0m, in \u001b[0;36mHTTPAdapter.send\u001b[0;34m(self, request, stream, timeout, verify, cert, proxies)\u001b[0m\n\u001b[1;32m 515\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39misinstance\u001b[39m(e\u001b[39m.\u001b[39mreason, _SSLError):\n\u001b[1;32m 516\u001b[0m \u001b[39m# This branch is for urllib3 v1.22 and later.\u001b[39;00m\n\u001b[1;32m 517\u001b[0m \u001b[39mraise\u001b[39;00m SSLError(e, request\u001b[39m=\u001b[39mrequest)\n\u001b[0;32m--> 519\u001b[0m \u001b[39mraise\u001b[39;00m \u001b[39mConnectionError\u001b[39;00m(e, request\u001b[39m=\u001b[39mrequest)\n\u001b[1;32m 521\u001b[0m \u001b[39mexcept\u001b[39;00m ClosedPoolError \u001b[39mas\u001b[39;00m e:\n\u001b[1;32m 522\u001b[0m \u001b[39mraise\u001b[39;00m \u001b[39mConnectionError\u001b[39;00m(e, request\u001b[39m=\u001b[39mrequest)\n", - "\u001b[0;31mConnectionError\u001b[0m: HTTPSConnectionPool(host='api.openai.com', port=443): Max retries exceeded with url: /v1/chat/completions (Caused by NameResolutionError(\": Failed to resolve 'api.openai.com' ([Errno 8] nodename nor servname provided, or not known)\"))" + "dansk (test): Loading prediction for da_core_news_sm-3.5.0\n" ] } ], @@ -682,52 +621,13 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 11, "metadata": { "tags": [ "remove-cell" ] }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n", - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n", - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. 
Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n", - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n", - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n", - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n", - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n", - "huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...\n", - "To disable this warning, you can either:\n", - "\t- Avoid using `tokenizers` before the fork if possible\n", - "\t- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)\n" - ] - } - ], + "outputs": [], "source": [ "with Pool(8) as p:\n", " tables = p.starmap(\n", @@ -738,7 +638,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 12, "metadata": { "tags": [ "remove-cell" @@ -808,7 +708,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 13, "metadata": { "tags": [ "remove-input" @@ -820,23 +720,23 @@ "text/html": [ "\n", "\n", - "
\n", + "
\n", "" ], "text/plain": [ "alt.LayerChart(...)" ] }, - "execution_count": 10, + "execution_count": 13, "metadata": {}, "output_type": "execute_result" } @@ -901,7 +801,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 14, "metadata": { "tags": [ "remove-cell" @@ -935,7 +835,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 15, "metadata": { "tags": [ "remove-cell" @@ -963,7 +863,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 16, "metadata": { "tags": [ "remove-input" @@ -974,165 +874,165 @@ "data": { "text/html": [ "\n", - "\n", + "
\n", " \n", " \n", " \n", " \n", " \n", - " \n", + " \n", " \n", " \n", " \n", " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", " \n", " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", - " \n", - " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", + " \n", + " \n", " \n", " \n", "
F1 score with 95% confidence interval calculated using bootstrapping with 100 samples (fine-grained models).

| | | Large 0.1.0 | Medium 0.1.0 | Small 0.1.0 |
|---|---|---|---|---|
| Entities | Event | 43.5 (27.0, 56.0) | 64.2 (50.0, 79.4) | 46.1 (27.8, 62.4) |
| | Facility | 69.8 (54.3, 84.4) | 72.3 (56.2, 84.6) | 55.5 (36.2, 70.5) |
| | GPE | 90.6 (87.2, 93.1) | 88.0 (82.7, 92.1) | 79.6 (73.0, 84.6) |
| | Language | 74.5 (60.0, 83.3) | 51.9 (23.3, 100.0) | 45.9 (13.3, 93.3) |
| | Law | 54.2 (38.1, 72.5) | 59.3 (37.4, 77.3) | 57.6 (39.6, 75.1) |
| | Location | 75.3 (66.9, 83.8) | 72.5 (62.1, 80.8) | 65.6 (55.4, 74.1) |
| | NORP | 84.8 (76.9, 90.8) | 78.2 (68.6, 85.8) | 73.3 (62.9, 81.5) |
| | Ordinal | 37.8 (22.5, 51.2) | 68.7 (49.1, 82.6) | 68.5 (47.6, 83.1) |
| | Organization | 79.5 (74.9, 83.1) | 80.5 (78.1, 84.2) | 79.1 (75.7, 82.3) |
| | Person | 85.9 (82.7, 88.8) | 84.8 (80.6, 88.2) | 86.8 (83.2, 90.1) |
| | Product | 62.4 (53.9, 72.0) | 62.6 (53.9, 71.6) | 59.5 (48.9, 67.9) |
| | Work of Art | 39.3 (25.5, 50.3) | 58.4 (48.7, 69.1) | 46.6 (36.2, 56.9) |
| Non-Entities | Cardinal | 87.0 (82.8, 90.3) | 80.5 (77.0, 84.4) | 89.2 (86.0, 91.7) |
| | Date | 77.3 (71.6, 81.8) | 77.6 (72.8, 82.2) | 78.8 (73.9, 83.4) |
| | Money | 99.3 (97.9, 100.0) | 98.6 (97.2, 100.0) | 95.2 (90.0, 98.2) |
| | Percent | 100.0 (100.0, 100.0) | 100.0 (100.0, 100.0) | 100.0 (100.0, 100.0) |
| | Quantity | 78.6 (59.8, 93.8) | 76.9 (63.9, 89.9) | 71.3 (50.0, 91.1) |
| | Time | 90.9 (83.8, 96.7) | 85.1 (74.0, 93.7) | 83.4 (68.0, 95.6) |
| Average | | 80.1 (78.2, 81.9) | 79.7 (77.7, 81.5) | 78.4 (76.3, 80.4) |
\n" ], "text/plain": [ - "" + "" ] }, - "execution_count": 13, + "execution_count": 16, "metadata": {}, "output_type": "execute_result" } @@ -1197,7 +1097,7 @@ }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 17, "metadata": { "tags": [ "remove-cell" @@ -1210,7 +1110,7 @@ }, { "cell_type": "code", - "execution_count": 15, + "execution_count": 18, "metadata": { "tags": [ "remove-cell" @@ -1229,7 +1129,7 @@ }, { "cell_type": "code", - "execution_count": 16, + "execution_count": 19, "metadata": { "tags": [ "remove-cell" @@ -1244,7 +1144,7 @@ }, { "cell_type": "code", - "execution_count": 17, + "execution_count": 20, "metadata": { "tags": [ "remove-input" @@ -1256,23 +1156,23 @@ "text/html": [ "\n", "\n", - "
\n", + "
\n", "" ], "text/plain": [ "alt.LayerChart(...)" ] }, - "execution_count": 17, + "execution_count": 20, "metadata": {}, "output_type": "execute_result" } @@ -1396,7 +1296,7 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 21, "metadata": { "tags": [ "remove-cell" @@ -1409,7 +1309,7 @@ }, { "cell_type": "code", - "execution_count": 19, + "execution_count": 26, "metadata": { "tags": [ "remove-cell" @@ -1419,11 +1319,11 @@ "source": [ "tables = []\n", "for mdl_name in dansk:\n", - " if \"fine_grained\" in mdl_name:\n", - " continue\n", + " # if \"fine_grained\" in mdl_name:\n", + " # continue\n", " examples = dansk[mdl_name][\"test\"][\"examples\"]\n", - " examples += dansk[mdl_name][\"dev\"][\"examples\"]\n", - " examples += dansk[mdl_name][\"train\"][\"examples\"]\n", + " # examples += dansk[mdl_name][\"dev\"][\"examples\"]\n", + " # examples += dansk[mdl_name][\"train\"][\"examples\"]\n", "\n", " \n", " examples = convert_to_conll_2003(examples)\n", @@ -1435,7 +1335,7 @@ }, { "cell_type": "code", - "execution_count": 20, + "execution_count": 27, "metadata": { "tags": [ "remove-cell" @@ -1450,7 +1350,7 @@ }, { "cell_type": "code", - "execution_count": 21, + "execution_count": 28, "metadata": { "tags": [ "remove-input" @@ -1462,23 +1362,23 @@ "text/html": [ "\n", "\n", - "
\n", + "
\n", "" ], "text/plain": [ "alt.LayerChart(...)" ] }, - "execution_count": 21, + "execution_count": 28, "metadata": {}, "output_type": "execute_result" } @@ -1594,6 +1494,72 @@ "chart" ] }, + { + "cell_type": "code", + "execution_count": 29, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\\begin{tabular}{lllll}\n", + "\\toprule\n", + " & Average F1 & Person F1 & Organization F1 & Location F1 \\\\\n", + "Model & & & & \\\\\n", + "\\midrule\n", + "da\\_dacy\\_large\\_trf-0.2.0 & 0.67 (0.63, 0.71) & 0.69 (0.62, 0.76) & 0.54 (0.47, 0.60) & 0.81 (0.76, 0.86) \\\\\n", + "da\\_dacy\\_medium\\_trf-0.2.0 & 0.56 (0.51, 0.61) & 0.60 (0.52, 0.67) & 0.42 (0.34, 0.52) & 0.70 (0.63, 0.76) \\\\\n", + "da\\_dacy\\_small\\_trf-0.2.0 & 0.57 (0.52, 0.62) & 0.66 (0.57, 0.74) & 0.41 (0.35, 0.48) & 0.70 (0.65, 0.75) \\\\\n", + "da\\_dacy\\_large\\_ner\\_fine\\_grained-0.1.0 & 0.85 (0.81, 0.88) & 0.86 (0.80, 0.90) & 0.79 (0.73, 0.85) & 0.93 (0.89, 0.96) \\\\\n", + "da\\_dacy\\_medium\\_ner\\_fine\\_grained-0.1.0 & 0.85 (0.81, 0.88) & 0.85 (0.79, 0.90) & 0.80 (0.76, 0.85) & 0.91 (0.86, 0.96) \\\\\n", + "da\\_dacy\\_small\\_ner\\_fine\\_grained-0.1.0 & 0.83 (0.8, 0.86) & 0.87 (0.82, 0.92) & 0.79 (0.74, 0.83) & 0.85 (0.78, 0.92) \\\\\n", + "saattrupdan/nbailab-base-ner-scandi & 0.64 (0.6, 0.68) & 0.66 (0.57, 0.72) & 0.52 (0.45, 0.59) & 0.75 (0.69, 0.81) \\\\\n", + "alexandrainst/da-ner-base & 0.67 (0.63, 0.73) & 0.70 (0.61, 0.76) & 0.55 (0.47, 0.63) & 0.77 (0.71, 0.83) \\\\\n", + "da\\_core\\_news\\_trf-3.5.0 & 0.6 (0.55, 0.65) & 0.63 (0.55, 0.71) & 0.44 (0.35, 0.52) & 0.74 (0.68, 0.79) \\\\\n", + "da\\_core\\_news\\_lg-3.5.0 & 0.54 (0.48, 0.59) & 0.57 (0.47, 0.65) & 0.39 (0.32, 0.46) & 0.67 (0.59, 0.76) \\\\\n", + "da\\_core\\_news\\_md-3.5.0 & 0.52 (0.46, 0.57) & 0.60 (0.51, 0.68) & 0.34 (0.28, 0.41) & 0.67 (0.59, 0.74) \\\\\n", + "da\\_core\\_news\\_sm-3.5.0 & 0.34 (0.29, 0.39) & 0.34 (0.26, 0.42) & 0.22 (0.17, 0.30) & 0.48 (0.39, 0.56) \\\\\n", + "\\bottomrule\n", + "\\end{tabular}\n", + "\n" + ] + } + ], + "source": [ + "# add ci to average\n", + "\n", + "df = tables\n", + "df = df[df[\"Domain\"] != \"dannet\"] # type: ignore\n", + "df = df[df[\"Domain\"].notnull()]\n", + "\n", + "df[\"Average F1\"] = df[\"Average\"].round(2).astype(str) + \" (\" + df[\"Average Lower CI\"].round(2).astype(str) + \", \" + df[\"Average Upper CI\"].round(2).astype(str) + \")\"\n", + "\n", + "df.drop([\"Average Lower CI\", \"Average Upper CI\"], axis=1, inplace=True)\n", + "df.drop([\"Number of docs\", \"Average\"], axis=1, inplace=True)\n", + "\n", + "\n", + "# filter all but average\n", + "df = df[df[\"Domain\"] == \"All\"]\n", + "df.drop([\"Domain\"], axis=1, inplace=True)\n", + "df.set_index(\"Model\", inplace=True)\n", + "df\n", + "\n", + "# convert to latex using styler\n", + "style = df.style.format_index(escape=\"latex\", axis=1).format_index(\n", + " escape=\"latex\", axis=0\n", + ")\n", + "\n", + "# print latex\n", + "latex = style.to_latex(\n", + " hrules=True,\n", + " convert_css=True,\n", + " )\n", + "\n", + "print(latex)\n", + "\n" + ] + }, { "attachments": {}, "cell_type": "markdown", From 6e0f04f73f7c4581f8a3922807e2558e6a873743 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Wed, 6 Dec 2023 20:50:42 +0100 Subject: [PATCH 2/6] Update cruft reference --- .cruft.json | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.cruft.json b/.cruft.json index 0aba82e7..a732c277 100644 --- a/.cruft.json +++ b/.cruft.json @@ -1,5 +1,5 @@ { - 
"template": "https://github.com/MartinBernstorff/swift-python-cookiecutter", + "template": "https://github.com/KennethEnevoldsen/swift-python-cookiecutter", "commit": "7fdb02999e8596c525377c208ca902645d134f97", "checkout": null, "context": { @@ -16,8 +16,8 @@ "_copy_without_render": [ "*.github" ], - "_template": "https://github.com/MartinBernstorff/swift-python-cookiecutter" + "_template": "https://github.com/KennethEnevoldsen/swift-python-cookiecutter" } }, "directory": null -} +} \ No newline at end of file From 6cbeb42270bf6c8d97af36352465decc2b0a718d Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Wed, 6 Dec 2023 21:04:17 +0100 Subject: [PATCH 3/6] Updated cruft template --- .cookiecutter.json | 1 - .cruft.json | 5 +- .github/dependabot.yml | 16 - .github/workflows/check_for_rej.yml | 27 -- .github/workflows/cruft.yml | 66 ---- .github/workflows/dependabot_automerge.yml | 30 -- .github/workflows/lint.yml | 28 ++ .github/workflows/pre-commit.yml | 79 ---- .github/workflows/static_type_checks.yml | 71 +--- .github/workflows/tests.yml | 44 +-- .pre-commit-config.yaml | 31 -- CONTRIBUTING.md | 27 +- README.md | 4 +- makefile | 39 ++ pyproject.toml | 43 +-- tasks.py | 427 --------------------- training/main/requirements.txt | 3 - 17 files changed, 102 insertions(+), 839 deletions(-) delete mode 100644 .github/dependabot.yml delete mode 100644 .github/workflows/check_for_rej.yml delete mode 100644 .github/workflows/cruft.yml delete mode 100644 .github/workflows/dependabot_automerge.yml create mode 100644 .github/workflows/lint.yml delete mode 100644 .github/workflows/pre-commit.yml delete mode 100644 .pre-commit-config.yaml create mode 100644 makefile delete mode 100644 tasks.py diff --git a/.cookiecutter.json b/.cookiecutter.json index 2665f074..9d03ac9f 100644 --- a/.cookiecutter.json +++ b/.cookiecutter.json @@ -8,7 +8,6 @@ "email": "kennethcenevoldsen@gmail.com", "friendly_name": "DaCy", "github_user": "centre-for-humanities-computing", - "license": "MIT", "package_name": "dacy", "project_name": "dacy", "version": "2.4.2" diff --git a/.cruft.json b/.cruft.json index a732c277..a14abc9a 100644 --- a/.cruft.json +++ b/.cruft.json @@ -1,6 +1,6 @@ { "template": "https://github.com/KennethEnevoldsen/swift-python-cookiecutter", - "commit": "7fdb02999e8596c525377c208ca902645d134f97", + "commit": "e96eb05162a0e45a8ad5aa446c72229372e79cdb", "checkout": null, "context": { "cookiecutter": { @@ -12,7 +12,6 @@ "github_user": "centre-for-humanities-computing", "version": "2.4.2", "copyright_year": "2023", - "license": "MIT", "_copy_without_render": [ "*.github" ], @@ -20,4 +19,4 @@ } }, "directory": null -} \ No newline at end of file +} diff --git a/.github/dependabot.yml b/.github/dependabot.yml deleted file mode 100644 index ee72a897..00000000 --- a/.github/dependabot.yml +++ /dev/null @@ -1,16 +0,0 @@ -# Configuration: https://dependabot.com/docs/config-file/ -# Docs: https://docs.github.com/en/github/administering-a-repository/keeping-your-dependencies-updated-automatically - -version: 2 -updates: - - package-ecosystem: "pip" # See documentation for possible values - directory: "/" # Location of package manifests - schedule: - interval: "weekly" - day: "monday" - time: "13:00" - timezone: "Europe/Copenhagen" - open-pull-requests-limit: 20 - commit-message: - prefix: "deps:" - include: "scope" diff --git a/.github/workflows/check_for_rej.yml b/.github/workflows/check_for_rej.yml deleted file mode 100644 index ed200fcc..00000000 --- a/.github/workflows/check_for_rej.yml +++ /dev/null @@ 
-1,27 +0,0 @@ -# .rej files occur when cruft update could not merge two files. -# They need to be handled, but are easy to miss if there's no CI -name: Check for .rej files - -on: - pull_request: - types: [opened, synchronize] - -jobs: - check-for-rej-files: - runs-on: ubuntu-latest - - steps: - - name: Checkout code - uses: actions/checkout@v2 - - - name: Check for .rej files - run: | - files=`find . -type f -name "*.rej"` - count=`echo $files | grep -o "\.rej" | wc -l` - if [[ $count != 0 ]]; then - echo "Found .rej files in the repository." - echo $files | - exit 1 - else - echo "No .rej files found in the repository." - fi diff --git a/.github/workflows/cruft.yml b/.github/workflows/cruft.yml deleted file mode 100644 index 714de363..00000000 --- a/.github/workflows/cruft.yml +++ /dev/null @@ -1,66 +0,0 @@ -name: Cruft Check - -on: - pull_request: - branches: - - main - -jobs: - cruft-check: - runs-on: ubuntu-latest - permissions: - pull-requests: write - - steps: - # Avoid infinite loop where main - # Feature PR -> cruft check from main -> - # Cruft update PR -> cruft check from main -> - # Cruft update PR ... - - name: Check if pull request is from a fork - run: | - if [ "${{ github.event.pull_request.head.repo.fork }}" = "true" ]; then - echo "Pull request is from a fork and does not have permissions for PR creation. Exiting gracefully." - exit 0 - elif [ "${{github.event.pull_request.title}}" == "ci - update cruft" ]; then - echo "Pull request is already a cruft update. Exiting gracefully." - exit 0 - else - echo "Pull request is not from a fork, continuing." - fi - - - name: Checkout code - uses: actions/checkout@v3 - with: - ref: main - - - name: Setup Python - uses: actions/setup-python@v4 - with: - python-version: "3.9" - - - name: Install Cruft - run: pip install cruft - - - name: Update cruft - id: cruft_check - run: | - cruft_output=$(cruft update --skip-apply-ask) - if echo "$cruft_output" | grep -q "Good work!"; then - echo "$cruft_output" - echo "cruft_updated=true" >> $GITHUB_OUTPUT - else - echo "$cruft_output" - echo "cruft_updated=false" >> $GITHUB_OUTPUT - fi - - - name: Create Pull Request - uses: peter-evans/create-pull-request@v4 - if: ${{ steps.cruft_check.outputs.cruft_updated == 'true' && github.event.pull_request.title != 'ci - update cruft' }} - continue-on-error: true - with: - title: "ci - update cruft" - branch: "update-cruft" - body: "🌲 Cruft updates" - token: ${{ secrets.PAT }} - commit-message: "ci: update cruft" - labels: "dependencies" # This makes the PR exempt from the stale bot diff --git a/.github/workflows/dependabot_automerge.yml b/.github/workflows/dependabot_automerge.yml deleted file mode 100644 index 22d2ecd7..00000000 --- a/.github/workflows/dependabot_automerge.yml +++ /dev/null @@ -1,30 +0,0 @@ -# GitHub action to automerge dependabot PRs. Only merges if tests passes the -# branch protections in the repository settings. 
-# You can set branch protections in the repository under Settings > Branches > Add rule -name: automerge-bot-prs - -on: pull_request - -permissions: - contents: write - pull-requests: write - -jobs: - dependabot-automerge: - runs-on: ubuntu-latest - # if actor is dependabot or pre-commit-ci[bot] then run - if: ${{ github.actor == 'dependabot[bot]' }} - - steps: - # Checkout action is required for token to persist - - name: Enable auto-merge for Dependabot PRs - run: gh pr merge --auto --merge "$PR_URL" # Use Github CLI to merge automatically the PR - env: - PR_URL: ${{github.event.pull_request.html_url}} - GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} - - - name: Auto approve dependabot PRs - if: ${{ github.actor == 'dependabot[bot]' }} - uses: hmarr/auto-approve-action@v3.1.0 - with: - github-token: ${{ secrets.GITHUB_TOKEN }} diff --git a/.github/workflows/lint.yml b/.github/workflows/lint.yml new file mode 100644 index 00000000..d27e4d45 --- /dev/null +++ b/.github/workflows/lint.yml @@ -0,0 +1,28 @@ +# GitHub action to run linting + +name: run-pre-commit + +on: + pull_request: + branches: [main] + push: + branches: [main] + +jobs: + pre-commit: + runs-on: ubuntu-latest + steps: + - uses: actions/checkout@v3 + + - uses: actions/setup-python@v4 + with: + python-version: "3.9" + cache: "pip" + + - name: Install pre-commit + run: make install + + - name: Lint + id: lint + run: | + make lint diff --git a/.github/workflows/pre-commit.yml b/.github/workflows/pre-commit.yml deleted file mode 100644 index 79671c4a..00000000 --- a/.github/workflows/pre-commit.yml +++ /dev/null @@ -1,79 +0,0 @@ -# GitHub action to check if pre-commit has been run. Runs from .pre-commit-config.yaml, where the pre-commit actions are. - -name: run-pre-commit - -on: - pull_request: - branches: [main] - push: - branches: [main] - -jobs: - pre-commit: - permissions: - pull-requests: write - concurrency: - group: "${{ github.workflow }} @ ${{ github.ref }}" - cancel-in-progress: true - if: ${{ github.actor != 'dependabot[bot]' }} - runs-on: ubuntu-latest - steps: - - uses: actions/checkout@v3 - with: - repository: ${{ github.event.pull_request.head.repo.full_name }} - ref: ${{ github.event.pull_request.head.ref }} - token: ${{ secrets.PAT }} - - - uses: actions/setup-python@v4 - with: - python-version: "3.9" - - - name: Install pre-commit - run: pip install pre-commit - - - name: Run pre-commit - id: pre_commit - continue-on-error: true - run: | - if pre-commit run --color always --all-files; then - echo "Pre-commit check passed" - echo "pre_commit_failed=0" >> $GITHUB_OUTPUT - else - echo "Pre-commit check failed" - echo "pre_commit_failed=1" >> $GITHUB_OUTPUT - exit 1 - fi - - # Have this step before commit in case the PR is from a fork. In this case, we want the - # add-pr-comment to fail, because it makes it means that the contributer is directed here, - # and are given the informative error message, instead of directed to a "could not commit error message". - - uses: mshick/add-pr-comment@v2 - if: ${{ steps.pre_commit.outputs.pre_commit_failed == 1 && github.event_name == 'pull_request' }} - id: add_comment - with: - message: | - Looks like some formatting rules failed. - - ✨ The action has attempted automatic fixes ✨ - - If any were succesful, they were committed to the branch. - We suggest using `git pull --rebase` to apply them locally. 
- - If some errors could not be fixed automatically, you can: - - 🏎️ Get results locally by running `pre-commit run --all-files` - 🕵️ Examine the results in the `Run pre-commit` section of this workflow `pre-commit` - - We also recommend setting up the `ruff` and `black` extensions to auto-format on save in your chosen editor. - - - name: Commit formatting - if: ${{ steps.pre_commit.outputs.pre_commit_failed == 1 && github.event_name == 'pull_request' }} - run: | - git config user.name github-actions - git config user.email github-actions@github.com - git commit -am "style: linting" - git push --no-verify - - - name: Fail workflow - if: ${{ steps.pre_commit.outputs.pre_commit_failed == 1 && github.event_name == 'pull_request' }} - run: exit 1 diff --git a/.github/workflows/static_type_checks.yml b/.github/workflows/static_type_checks.yml index a1baa9c2..04faedde 100644 --- a/.github/workflows/static_type_checks.yml +++ b/.github/workflows/static_type_checks.yml @@ -1,6 +1,3 @@ -# We do not include static_type_checks as a pre-commit hook because pre-commit hooks -# are installed in their own virtual environment, so static_type_checks cannot -# use stubs from imports name: static_type_checks on: @@ -12,11 +9,6 @@ on: jobs: static_type_checks: runs-on: ubuntu-latest - permissions: - pull-requests: write - concurrency: - group: "${{ github.workflow }} @ ${{ github.ref }}" - cancel-in-progress: true strategy: matrix: os: [ubuntu-latest] @@ -24,74 +16,19 @@ jobs: steps: - uses: actions/checkout@v3 - - name: Cache tox - uses: actions/cache@v3.2.6 - id: cache_tox - with: - path: | - .tox - key: ${{ runner.os }}-${{ matrix.python-version }}-static-type-checks - - name: Set up Python uses: actions/setup-python@v4 id: setup_python with: python-version: ${{ matrix.python-version}} + cache: pip - name: Install dependencies shell: bash run: | - pip install invoke tox pyright + make install - name: Run static type checker - id: pyright - continue-on-error: true - run: | - if inv static-type-checks; then - echo "pyright check passed" - echo "pyright_failed=0" >> $GITHUB_OUTPUT - else - echo "pyright check failed" - echo "pyright_failed=1" >> $GITHUB_OUTPUT - fi - - - name: Find Comment - uses: peter-evans/find-comment@v2 - id: find_comment - if: ${{github.event_name == 'pull_request'}} - continue-on-error: true - with: - issue-number: ${{ github.event.pull_request.number }} - comment-author: "github-actions[bot]" - body-includes: ✨ Looks like pyright failed ✨ - - - uses: mshick/add-pr-comment@v2 - if: ${{ steps.pyright.outputs.pyright_failed == 1 && github.event_name == 'pull_request'}} - id: add_comment - with: - message: | - ✨ Looks like pyright failed ✨ - - If you want to fix this, we recommend doing it locally by either: - - a) Enabling pyright in VSCode and going through the errors in the problems tab - - `VSCode settings > Python > Analysis: Type checking mode > "basic"` - - b) Debugging via the command line - - 1. Installing pyright, which is included in the dev dependencies: `pip install -e ".[dev]"` - 2. Diagnosing the errors by running `pyright .` - - - uses: mshick/add-pr-comment@v2 - if: ${{ steps.pyright.outputs.pyright_failed == 0 && steps.find_comment.outputs.comment-id != '' && github.event_name == 'pull_request'}} - with: - message-id: ${{ steps.find_comment.outputs.comment-id }} - message: | - 🌟 pyright succeeds! 
🌟 - - - name: Show pyright output - id: fail_run - if: ${{steps.pyright.outputs.pyright_failed == 1}} + shell: bash run: | - inv static-type-checks # Rerunning pyright isn't optimal computationally, but typically takes no more than a couple of seconds, and this ensures that the errors are in the failing step + make static-type-checks diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 8931ad8d..3a1814c5 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -1,6 +1,7 @@ -# This workflow will install Python dependencies, run pytests and run notebooks -# then it will in python 3.9 (ubuntu-latest) create a badge with the coverage -# and add it to the PR. This badge will be updated if the PR is updated. +# This workflow will: +# 1) install Python dependencies +# 2) run make test + name: Tests on: @@ -30,15 +31,6 @@ jobs: steps: - uses: actions/checkout@v3 - - - name: Cache tox - uses: actions/cache@v3.2.6 - id: cache_tox - with: - path: | - .tox - key: ${{ runner.os }}-${{ matrix.python-version }}-tests-1 - - name: Set up Python uses: actions/setup-python@v4 with: @@ -48,31 +40,9 @@ jobs: - name: Install dependencies shell: bash run: | - pip install invoke tox + make install - - name: Run and write pytest + - name: Run tests shell: bash run: | - # Specifying two sets of "--pytest-args" is required for invoke to parse it as a list - export DACY_CACHE_DIR=/tmp/dacy_cache - inv test --pytest-args="--durations=0" --pytest-args="--junitxml=pytest.xml --cov-report=term-missing --cov=src/" - - - - name: Test report on failures - uses: EnricoMi/publish-unit-test-result-action@v2 - id: test_report_with_annotations - if: ${{ matrix.os == 'ubuntu-latest' && matrix.python-version == '3.9' && github.actor != 'dependabot[bot]' && github.event_name == 'pull_request' && (success() || failure()) }} # Do not run for dependabot, run whether tests failed or succeeded - with: - comment_mode: "failures" - files: | - pytest.xml - - - name: Pytest coverage comment - id: coverage-comment - uses: MishaKav/pytest-coverage-comment@main - if: ${{ matrix.os == 'ubuntu-latest' && matrix.python-version == '3.9' && github.actor != 'dependabot[bot]' && github.event_name == 'pull_request' && (success() || failure()) }} - with: - create-new-comment: false - report-only-changed-files: false - pytest-coverage-path: pytest-coverage.txt - junitxml-path: ./pytest.xml + make test \ No newline at end of file diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml deleted file mode 100644 index b9887b16..00000000 --- a/.pre-commit-config.yaml +++ /dev/null @@ -1,31 +0,0 @@ -default_stages: [commit] - -repos: - - repo: https://github.com/psf/black - rev: 23.3.0 - hooks: - - id: black - - - repo: https://github.com/charliermarsh/ruff-pre-commit - rev: v0.0.265 - hooks: - - id: ruff - args: - [ - "--extend-select", - "F401", - "--extend-select", - "F841", - "--fix", - "--exit-non-zero-on-fix", - ] - - - repo: https://github.com/pre-commit/pre-commit-hooks - rev: v4.4.0 - hooks: - - id: check-yaml - - - repo: https://github.com/repo-helper/pyproject-parser - rev: v0.9.0b2 - hooks: - - id: check-pyproject diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index 8b65d3ab..7237cfe6 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -11,7 +11,7 @@ Here is a list of important resources for contributors: - [Issue Tracker] - [Code of Conduct] -[mit license]: https://opensource.org/licenses/MIT +[Apache-2.0 license]: https://opensource.org/license/apache-2-0/ [source code]: 
https://github.com/centre-for-humanities-computing/dacy [documentation]: https://dacy.readthedocs.io/ [issue tracker]: https://github.com/centre-for-humanities-computing/dacy/issues @@ -37,24 +37,22 @@ Request features on the [Issue Tracker]. ## How to set up your development environment -Install the package with development requirements: +To install all the development dependencies, you can use the [make] command: ```console -$ pip install -e ."[dev,tests]" +$ make install ``` + ## How to test the project Run the full test suite: ```console -$ pytest +$ make test ``` -Unit tests are located in the _tests_ directory, -and are written using the [pytest] testing framework. - -[pytest]: https://pytest.readthedocs.io/ +Unit tests are located in the _tests_ directory. ## How to submit changes @@ -62,23 +60,24 @@ Open a [pull request] to submit changes to this project. Your pull request needs to meet the following guidelines for acceptance: -- The Nox test suite must pass without errors and warnings. -- Include unit tests. This project maintains 100% code coverage. +- The test suite should ideally pass without errors and warnings. +- Ideally add tests for your changes. - If your changes add functionality, update the documentation accordingly. Feel free to submit early, though—we can always iterate on this. -To run linting and code formatting checks before committing your change, you can install pre-commit as a Git hook by running the following command: +To run linting and code formatting checks before committing your change, you can run the following [make] command: ```console -$ nox --session=pre-commit -- install +$ make lint ``` -It is recommended to open an issue before starting work on anything. +It is recommended to open an issue before starting work on any major changes. This will allow a chance to talk it over with the owners and validate your approach. [pull request]: https://github.com/centre-for-humanities-computing/dacy/pulls +[make]: https://makefiletutorial.com -[code of conduct]: CODE_OF_CONDUCT.md +[code of conduct]: CODE_OF_CONDUCT.md \ No newline at end of file diff --git a/README.md b/README.md index 85e5896e..8744f1ef 100644 --- a/README.md +++ b/README.md @@ -4,14 +4,14 @@ [![PyPI](https://img.shields.io/pypi/v/dacy.svg)][pypi status] [![pip downloads](https://img.shields.io/pypi/dm/dacy.svg)](https://pypi.org/project/dacy/) [![Python Version](https://img.shields.io/pypi/pyversions/dacy)][pypi status] -[![Black](https://img.shields.io/badge/code%20style-black-000000.svg)][black] +[![Ruff](https://img.shields.io/endpoint?url=https://raw.githubusercontent.com/astral-sh/ruff/main/assets/badge/v2.json)]([ruff]) [![documentation](https://github.com/centre-for-humanities-computing/dacy/actions/workflows/documentation.yml/badge.svg)][documentation] [![Tests](https://github.com/centre-for-humanities-computing/dacy/actions/workflows/tests.yml/badge.svg)][tests] [pypi status]: https://pypi.org/project/dacy/ [documentation]: https://centre-for-humanities-computing.github.io/DaCy/ [tests]: https://github.com/centre-for-humanities-computing/dacy/actions?workflow=Tests -[black]: https://github.com/psf/black +[ruff]: https://github.com/astral-sh/ruff diff --git a/makefile b/makefile new file mode 100644 index 00000000..e94def5b --- /dev/null +++ b/makefile @@ -0,0 +1,39 @@ +install: + @echo "--- 🚀 Installing project ---" + pip install -e ".[dev, docs, tests]" + +static-type-check: + @echo "--- 🔍 Running static type check ---" + pyright . 
+ +lint: + @echo "--- 🧹 Running linters ---" + pyproject-parser check pyproject.toml # check pyproject.toml + ruff format . # running ruff formatting + ruff . --fix # running ruff linting + +test: + @echo "--- 🧪 Running tests ---" + pytest tests/ + +pr: + @echo "--- 🚀 Running PR checks ---" + make lint + make static-type-check + make test + @echo "Ready to make a PR" + +build-docs: + @echo "--- 📚 Building docs ---" + @echo "Builds the docs and puts them in the 'site' folder" + mkdocs build + +view-docs: + @echo "--- 👀 Viewing docs ---" + mkdocs serve + +update-from-template: + @echo "--- 🔄 Updating from template ---" + @echo "This will update the project from the template, make sure to resolve any .rej files" + cruft update + diff --git a/pyproject.toml b/pyproject.toml index 3370978d..818c224e 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -50,11 +50,9 @@ name = "Apache License 2.0" [project.optional-dependencies] dev = [ "cruft>=2.0.0", - "pyright==1.1.305", - "pyright-polite>=0.0.1", - "pre-commit>=2.20.0", + "pyright==1.1.328", "ruff>=0.0.262", - "black[jupyter]>=23.3.0", + "pyproject-parser[cli, readme]>=0.9.1", ] tests = ["pytest>=7.1.2", "pytest-cov>=3.0.0", "pytest-instafail>=0.4.2"] docs = [ @@ -112,6 +110,7 @@ exclude = [".*venv*", ".tox"] pythonPlatform = "Darwin" [tool.ruff] +extend-include = ["*.ipynb"] # Enable pycodestyle (`E`) and Pyflakes (`F`) codes by default. select = [ "A", @@ -150,6 +149,7 @@ ignore = [ "F841", "RET504", "ANN202", + "COM812", ] ignore-init-module-imports = true # Allow autofix for all enabled rules (when `--fix`) is provided. @@ -190,6 +190,8 @@ exclude = [ dummy-variable-rgx = "^(_+|(_+[a-zA-Z0-9_]*[a-zA-Z0-9]+?))$" target-version = "py38" +tool.ruff.lint.pydocstyle] +convention = "google" [tool.ruff.flake8-annotations] mypy-init-return = true suppress-none-returning = true @@ -206,35 +208,4 @@ version_toml = ["pyproject.toml:project.version"] build_command = "python -m pip install build; python -m build" [tool.setuptools] -include-package-data = true - - -[tool.tox] -legacy_tox_ini = """ -[tox] -envlist = py{39,310} - -[testenv] -description: run unit tests -extras = tests -use_develop = true -commands = - pytest {posargs:test} - -[testenv:type] -allowlist_externals = pyright -description: run type checks -extras = tests, dev -basepython = py39 # Setting these explicitly avoid recreating env if your shell is set to a different version -use_develop = true -commands = - pyright src/ - -[testenv:docs] -description: build docs -extras = docs -basepython = py39 # Setting these explicitly avoid recreating env if your shell is set to a different version -use_develop = true -commands = - sphinx-build -b html docs docs/_build/html -""" +include-package-data = true \ No newline at end of file diff --git a/tasks.py b/tasks.py deleted file mode 100644 index 20b84722..00000000 --- a/tasks.py +++ /dev/null @@ -1,427 +0,0 @@ -""" -This project uses Invoke (pyinvoke.org) for task management. -Install it via: - -``` -pip install invoke -``` - -And then run: - -``` -inv --list -``` - -If you do not wish to use invoke you can simply delete this file. 
-""" - - -import platform -import re -import shutil -from pathlib import Path -from typing import List, Optional - -from invoke import Context, Result, task - -# Extract supported python versions from the pyproject.toml classifiers key -SUPPORTED_PYTHON_VERSIONS = [ - line.split("::")[-1].strip().replace('"', "").replace(",", "") - for line in Path("pyproject.toml").read_text().splitlines() - if "Programming Language :: Python ::" in line -] - -NOT_WINDOWS = platform.system() != "Windows" - - -def echo_header(msg: str): - print(f"\n--- {msg} ---") - - -class MsgType: - # Emojis have to be encoded as bytes to not break the terminal on Windows - @property - def DOING(self) -> str: - return b"\xf0\x9f\xa4\x96".decode() if NOT_WINDOWS else "DOING:" - - @property - def GOOD(self) -> str: - return b"\xe2\x9c\x85".decode() if NOT_WINDOWS else "DONE:" - - @property - def FAIL(self) -> str: - return b"\xf0\x9f\x9a\xa8".decode() if NOT_WINDOWS else "FAILED:" - - @property - def WARN(self) -> str: - return b"\xf0\x9f\x9a\xa7".decode() if NOT_WINDOWS else "WARNING:" - - @property - def SYNC(self) -> str: - return b"\xf0\x9f\x9a\x82".decode() if NOT_WINDOWS else "SYNCING:" - - @property - def PY(self) -> str: - return b"\xf0\x9f\x90\x8d".decode() if NOT_WINDOWS else "" - - @property - def CLEAN(self) -> str: - return b"\xf0\x9f\xa7\xb9".decode() if NOT_WINDOWS else "CLEANING:" - - @property - def TEST(self) -> str: - return b"\xf0\x9f\xa7\xaa".decode() if NOT_WINDOWS else "TESTING:" - - @property - def COMMUNICATE(self) -> str: - return b"\xf0\x9f\x93\xa3".decode() if NOT_WINDOWS else "COMMUNICATING:" - - @property - def EXAMINE(self) -> str: - return b"\xf0\x9f\x94\x8d".decode() if NOT_WINDOWS else "VIEWING:" - - -msg_type = MsgType() - - -def git_init(c: Context, branch: str = "main"): - """Initialize a git repository if it does not exist yet.""" - # If no .git directory exits - if not Path(".git").exists(): - echo_header(f"{msg_type.DOING} Initializing Git repository") - c.run(f"git init -b {branch}") - c.run("git add .") - c.run("git commit -m 'Init'") - print(f"{msg_type.GOOD} Git repository initialized") - else: - print(f"{msg_type.GOOD} Git repository already initialized") - - -def setup_venv( - c: Context, - python_path: str, - venv_name: Optional[str] = None, -) -> str: - """Create a virtual environment if it does not exist yet. - - Args: - c: The invoke context. - python_path: The python executable to use. - venv_name: The name of the virtual environment. Defaults to ".venv". 
- """ - if venv_name is None: - venv_name = ".venv" - - if not Path(venv_name).exists(): - echo_header( - f"{msg_type.DOING} Creating virtual environment using {msg_type.PY}:{python_path}", - ) - c.run(f"{python_path} -m venv {venv_name}") - print(f"{msg_type.GOOD} Virtual environment created") - else: - print(f"{msg_type.GOOD} Virtual environment already exists") - return venv_name - - -def _add_commit(c: Context, msg: Optional[str] = None): - print(f"{msg_type.DOING} Adding and committing changes") - c.run("git add .") - - if msg is None: - msg = input("Commit message: ") - - c.run(f'git commit -m "{msg}"', pty=NOT_WINDOWS, hide=True) - print(f"{msg_type.GOOD} Changes added and committed") - - -def is_uncommitted_changes(c: Context) -> bool: - git_status_result: Result = c.run( - "git status --porcelain", - pty=NOT_WINDOWS, - hide=True, - ) - - uncommitted_changes = git_status_result.stdout != "" - return uncommitted_changes - - -def add_and_commit(c: Context, msg: Optional[str] = None): - """Add and commit all changes.""" - if is_uncommitted_changes(c): - uncommitted_changes_descr = c.run( - "git status --porcelain", - pty=NOT_WINDOWS, - hide=True, - ).stdout - - echo_header( - f"{msg_type.WARN} Uncommitted changes detected", - ) - - for line in uncommitted_changes_descr.splitlines(): - print(f" {line.strip()}") - print("\n") - _add_commit(c, msg=msg) - - -def branch_exists_on_remote(c: Context) -> bool: - branch_name = Path(".git/HEAD").read_text().split("/")[-1].strip() - - branch_exists_result: Result = c.run( - f"git ls-remote --heads origin {branch_name}", - hide=True, - ) - - return branch_name in branch_exists_result.stdout - - -def update_branch(c: Context): - echo_header(f"{msg_type.SYNC} Syncing branch with remote") - - if not branch_exists_on_remote(c): - c.run("git push --set-upstream origin HEAD") - else: - print("Pulling") - c.run("git pull") - print("Pushing") - c.run("git push") - - -def create_pr(c: Context): - c.run( - "gh pr create --web", - pty=NOT_WINDOWS, - ) - - -def update_pr(c: Context): - echo_header(f"{msg_type.COMMUNICATE} Syncing PR") - # Get current branch name - branch_name = Path(".git/HEAD").read_text().split("/")[-1].strip() - pr_result: Result = c.run( - "gh pr list --state OPEN", - pty=False, - hide=True, - ) - - if branch_name not in pr_result.stdout: - create_pr(c) - else: - open_web = input("Open in browser? [y/n] ") - if "y" in open_web.lower(): - c.run("gh pr view --web", pty=NOT_WINDOWS) - - -def exit_if_error_in_stdout(result: Result): - # Find N remaining using regex - - if "error" in result.stdout: - errors_remaining = re.findall(r"\d+(?=( remaining))", result.stdout)[ - 0 - ] # testing - if errors_remaining != "0": - exit(0) - - -def pre_commit(c: Context, auto_fix: bool): - """Run pre-commit checks.""" - - # Essential to have a clean working directory before pre-commit to avoid committing - # heterogenous files under a "style: linting" commit - if is_uncommitted_changes(c): - print( - f"{msg_type.WARN} Your git working directory is not clean. 
Stash or commit before running pre-commit.", - ) - exit(1) - - echo_header(f"{msg_type.CLEAN} Running pre-commit checks") - pre_commit_cmd = "pre-commit run --all-files" - result = c.run(pre_commit_cmd, pty=NOT_WINDOWS, warn=True) - - exit_if_error_in_stdout(result) - - if ("fixed" in result.stdout or "reformatted" in result.stdout) and auto_fix: - _add_commit(c, msg="style: Auto-fixes from pre-commit") - - print(f"{msg_type.DOING} Fixed errors, re-running pre-commit checks") - second_result = c.run(pre_commit_cmd, pty=NOT_WINDOWS, warn=True) - exit_if_error_in_stdout(second_result) - else: - if result.return_code != 0: - print(f"{msg_type.FAIL} Pre-commit checks failed") - exit(1) - - -@task -def static_type_checks(c: Context): - echo_header(f"{msg_type.CLEAN} Running static type checks") - c.run("tox -e type", pty=NOT_WINDOWS) - - -@task -def install( - c: Context, - pip_args: str = "", - msg: bool = True, - venv_path: Optional[str] = None, -): - """Install the project in editable mode using pip install""" - if msg: - echo_header(f"{msg_type.DOING} Installing project") - - extras = ".[dev,tests,docs]" if NOT_WINDOWS else ".[dev,tests,docs]" - install_cmd = f"pip install -e {extras} {pip_args}" - - if venv_path is not None and NOT_WINDOWS: - with c.prefix(f"source {venv_path}/bin/activate"): - c.run(install_cmd) - return - - c.run(install_cmd) - - -def get_python_path(preferred_version: str) -> Optional[str]: - """Get path to python executable.""" - preferred_version_path = shutil.which(f"python{preferred_version}") - - if preferred_version_path is not None: - return preferred_version_path - - print( - f"{msg_type.WARN}: python{preferred_version} not found, continuing with default python version", - ) - return shutil.which("python") - - -@task -def setup(c: Context, python_path: Optional[str] = None): - """Confirm that a git repo exists and setup a virtual environment. - - Args: - c: Invoke context - python_path: Path to the python executable to use for the virtual environment. Uses the return value of `which python` if not provided. - """ - git_init(c) - - if python_path is None: - # get path to python executable - python_path = get_python_path(preferred_version="3.9") - if not python_path: - print(f"{msg_type.FAIL} Python executable not found") - exit(1) - venv_name = setup_venv(c, python_path=python_path) - - install(c, pip_args="--upgrade", msg=False, venv_path=venv_name) - - if venv_name is not None: - print( - f"{msg_type.DOING} Activate your virtual environment by running: \n\n\t\t source {venv_name}/bin/activate \n", - ) - - -@task -def update(c: Context): - """Update dependencies.""" - echo_header(f"{msg_type.DOING} Updating project") - install(c, pip_args="--upgrade", msg=False) - - -@task(iterable="pytest_args") -def test( - c: Context, - python_versions: List[str] = (SUPPORTED_PYTHON_VERSIONS[0],), # type: ignore - pytest_args: List[str] = [], # noqa -): - """Run tests""" - # Invoke requires lists as type hints, but does not support lists as default arguments. - # Hence this super weird type hint and default argument for the python_versions arg. 
- echo_header(f"{msg_type.TEST} Running tests") - - python_version_strings = [f"py{v.replace('.', '')}" for v in python_versions] - python_version_arg_string = ",".join(python_version_strings) - - if not pytest_args: - pytest_args = [ - "tests", - "-rfE", - "--failed-first", - "-p no:cov", - "--disable-warnings", - "-q", - ] - - pytest_arg_str = " ".join(pytest_args) - - test_result: Result = c.run( - f"tox -e {python_version_arg_string} -- {pytest_arg_str}", - warn=True, - pty=NOT_WINDOWS, - ) - - # If "failed" in the pytest results - failed_tests = [line for line in test_result.stdout if line.startswith("FAILED")] - - if len(failed_tests) > 0: - print("\n\n\n") - echo_header("Failed tests") - print("\n\n\n") - echo_header("Failed tests") - - for line in failed_tests: - # Remove from start of line until /test_ - line_sans_prefix = line[line.find("test_") :] - - # Keep only that after :: - line_sans_suffix = line_sans_prefix[line_sans_prefix.find("::") + 2 :] - print(f"FAILED {msg_type.FAIL} #{line_sans_suffix} ") - - if test_result.return_code != 0: - exit(test_result.return_code) - - -def test_for_rej(): - # Get all paths in current directory or subdirectories that end in .rej - rej_files = list(Path(".").rglob("*.rej")) - - if len(rej_files) > 0: - print(f"\n{msg_type.FAIL} Found .rej files leftover from cruft update.\n") - for file in rej_files: - print(f" /{file}") - print("\nResolve the conflicts and try again. \n") - exit(1) - - -@task -def lint(c: Context, auto_fix: bool = False): - """Lint the project.""" - test_for_rej() - pre_commit(c=c, auto_fix=auto_fix) - static_type_checks(c) - - -@task -def pr(c: Context, auto_fix: bool = False): - """Run all checks and update the PR.""" - add_and_commit(c) - lint(c, auto_fix=auto_fix) - test(c, python_versions=SUPPORTED_PYTHON_VERSIONS) - update_branch(c) - update_pr(c) - - -@task -def docs(c: Context, view: bool = False, view_only: bool = False): - """ - Build and view docs. If neither build or view are specified, both are run. 
- """ - if not view_only: - echo_header(f"{msg_type.DOING}: Building docs") - c.run("tox -e docs") - - if view or view_only: - echo_header(f"{msg_type.EXAMINE}: Opening docs in browser") - # check the OS and open the docs in the browser - if platform.system() == "Windows": - c.run("start docs/_build/html/index.html") - else: - c.run("open docs/_build/html/index.html") diff --git a/training/main/requirements.txt b/training/main/requirements.txt index ae058fa2..a44d4e36 100644 --- a/training/main/requirements.txt +++ b/training/main/requirements.txt @@ -14,6 +14,3 @@ wandb >= 0.14.2 # for dataset handling conllu>=4.5.2 wikidata>=0.7.0 - -# style -black>=23.3.0 \ No newline at end of file From ee7e318ee49f5a020d2225c4111e27802a655e06 Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Wed, 6 Dec 2023 21:09:53 +0100 Subject: [PATCH 4/6] lint: ran ruff --- docs/performance_ner.ipynb | 114 +++++++++++++++++--------- docs/tutorials/basic.ipynb | 24 +++--- docs/tutorials/hate-speech.ipynb | 9 +- docs/tutorials/robustness.ipynb | 7 +- docs/tutorials/sentiment.ipynb | 16 ++-- docs/tutorials/textdescriptives.ipynb | 9 +- makefile | 1 - pyproject.toml | 10 +-- 8 files changed, 117 insertions(+), 73 deletions(-) diff --git a/docs/performance_ner.ipynb b/docs/performance_ner.ipynb index 2a13d263..5424eb85 100644 --- a/docs/performance_ner.ipynb +++ b/docs/performance_ner.ipynb @@ -186,7 +186,7 @@ "dane = {}\n", "for mdl_name, model_getter in MODELS.items():\n", " mdl_results = apply_models(mdl_name, model_getter, dataset=\"dane\", splits=[\"test\"])\n", - " dane[mdl_name] = mdl_results[\"test\"]\n" + " dane[mdl_name] = mdl_results[\"test\"]" ] }, { @@ -214,8 +214,7 @@ " for ent in ents:\n", " ent.label_ = mapping[ent.label_]\n", "\n", - " e.x.ents = ents\n", - " " + " e.x.ents = ents" ] }, { @@ -231,6 +230,7 @@ "import pandas as pd\n", "from evaluation.utils import create_dataframe\n", "\n", + "\n", "def highlight_max(s: pd.Series) -> list:\n", " \"\"\"Highlight the maximum in a Series with bold text.\"\"\"\n", " # convert to str for comparison\n", @@ -291,10 +291,15 @@ "outputs": [], "source": [ "from multiprocessing import Pool\n", + "\n", "with Pool(8) as p:\n", " tables = p.starmap(\n", " create_dataframe,\n", - " [(dane[mdl][\"examples\"], mdl, 1, 500) for mdl in dane if \"fine_grained\" not in mdl],\n", + " [\n", + " (dane[mdl][\"examples\"], mdl, 1, 500)\n", + " for mdl in dane\n", + " if \"fine_grained\" not in mdl\n", + " ],\n", " )" ] }, @@ -545,13 +550,18 @@ "source": [ "from functools import partial\n", "from evaluation.models import openai_model_loader_fine_ner\n", + "\n", "MODELS_ = MODELS.copy()\n", - "MODELS_[\"openai/gpt-3.5-turbo (02/05/23)\"] = partial(openai_model_loader_fine_ner, model=\"gpt-3.5-turbo\")\n", - "MODELS_[\"openai/gpt-4 (02/05/23)\"] = partial(openai_model_loader_fine_ner, model=\"gpt-4\")\n", + "MODELS_[\"openai/gpt-3.5-turbo (02/05/23)\"] = partial(\n", + " openai_model_loader_fine_ner, model=\"gpt-3.5-turbo\"\n", + ")\n", + "MODELS_[\"openai/gpt-4 (02/05/23)\"] = partial(\n", + " openai_model_loader_fine_ner, model=\"gpt-4\"\n", + ")\n", "\n", "# don't test openai models on DANSK\n", "MODELS_.pop(\"openai/gpt-3.5-turbo (02/05/23)\")\n", - "MODELS_.pop(\"openai/gpt-4 (02/05/23)\")\n" + "MODELS_.pop(\"openai/gpt-4 (02/05/23)\")" ] }, { @@ -610,12 +620,10 @@ "dansk = {}\n", "for mdl_name, model_getter in MODELS_.items():\n", " if \"openai\" in mdl_name:\n", - " splits=[\"test\"]\n", + " splits = [\"test\"]\n", " else:\n", - " splits=[\"train\", \"dev\", 
\"test\"]\n", - " mdl_results = apply_models(\n", - " mdl_name, model_getter, dataset=\"dansk\", splits=splits\n", - " )\n", + " splits = [\"train\", \"dev\", \"test\"]\n", + " mdl_results = apply_models(mdl_name, model_getter, dataset=\"dansk\", splits=splits)\n", " dansk[mdl_name] = mdl_results" ] }, @@ -632,8 +640,12 @@ "with Pool(8) as p:\n", " tables = p.starmap(\n", " create_dataframe,\n", - " [(dansk[mdl][\"test\"][\"examples\"], mdl, 1, 100, 2000) for mdl in dansk if \"fine_grained\" in mdl],\n", - " )\n" + " [\n", + " (dansk[mdl][\"test\"][\"examples\"], mdl, 1, 100, 2000)\n", + " for mdl in dansk\n", + " if \"fine_grained\" in mdl\n", + " ],\n", + " )" ] }, { @@ -1123,8 +1135,13 @@ " if \"fine_grained\" not in mdl_name:\n", " continue\n", "\n", - " table = evaluate_generalization(examples=dansk[mdl_name][\"test\"][\"examples\"], mdl_name=mdl_name, n_rep=100, n_samples=1000)\n", - " tables.append(table)\n" + " table = evaluate_generalization(\n", + " examples=dansk[mdl_name][\"test\"][\"examples\"],\n", + " mdl_name=mdl_name,\n", + " n_rep=100,\n", + " n_samples=1000,\n", + " )\n", + " tables.append(table)" ] }, { @@ -1325,9 +1342,14 @@ " # examples += dansk[mdl_name][\"dev\"][\"examples\"]\n", " # examples += dansk[mdl_name][\"train\"][\"examples\"]\n", "\n", - " \n", " examples = convert_to_conll_2003(examples)\n", - " table = evaluate_generalization(mdl_name, examples, n_rep=100, n_samples=1000, create_row_fn=create_row_conll2003)\n", + " table = evaluate_generalization(\n", + " mdl_name,\n", + " examples,\n", + " n_rep=100,\n", + " n_samples=1000,\n", + " create_row_fn=create_row_conll2003,\n", + " )\n", " tables.append(table)\n", "\n", "tables = pd.concat(tables, axis=0)" @@ -1344,7 +1366,7 @@ "outputs": [], "source": [ "df = tables\n", - "df = df[df[\"Domain\"] != \"dannet\"] # type: ignore\n", + "df = df[df[\"Domain\"] != \"dannet\"] # type: ignore\n", "df = df[df[\"Domain\"].notnull()]" ] }, @@ -1486,7 +1508,8 @@ "chart = base + error_bars\n", "\n", "chart = chart.add_params(selection, param_checkbox).properties(\n", - " width=400, height=300,\n", + " width=400,\n", + " height=300,\n", " title=\"Generalization to Unseen Domains\",\n", ")\n", "\n", @@ -1530,10 +1553,17 @@ "# add ci to average\n", "\n", "df = tables\n", - "df = df[df[\"Domain\"] != \"dannet\"] # type: ignore\n", + "df = df[df[\"Domain\"] != \"dannet\"] # type: ignore\n", "df = df[df[\"Domain\"].notnull()]\n", "\n", - "df[\"Average F1\"] = df[\"Average\"].round(2).astype(str) + \" (\" + df[\"Average Lower CI\"].round(2).astype(str) + \", \" + df[\"Average Upper CI\"].round(2).astype(str) + \")\"\n", + "df[\"Average F1\"] = (\n", + " df[\"Average\"].round(2).astype(str)\n", + " + \" (\"\n", + " + df[\"Average Lower CI\"].round(2).astype(str)\n", + " + \", \"\n", + " + df[\"Average Upper CI\"].round(2).astype(str)\n", + " + \")\"\n", + ")\n", "\n", "df.drop([\"Average Lower CI\", \"Average Upper CI\"], axis=1, inplace=True)\n", "df.drop([\"Number of docs\", \"Average\"], axis=1, inplace=True)\n", @@ -1552,12 +1582,11 @@ "\n", "# print latex\n", "latex = style.to_latex(\n", - " hrules=True,\n", - " convert_css=True,\n", - " )\n", + " hrules=True,\n", + " convert_css=True,\n", + ")\n", "\n", - "print(latex)\n", - "\n" + "print(latex)" ] }, { @@ -1637,6 +1666,8 @@ "outputs": [], "source": [ "from collections import defaultdict\n", + "\n", + "\n", "def augmentation_specific_examples(examples):\n", " aug_group = defaultdict(list)\n", " for example in examples:\n", @@ -1678,7 +1709,7 @@ "\n", " aug_group = 
augmentation_specific_examples(examples)\n", " for aug_name, _examples in aug_group.items():\n", - " _examples = convert_to_conll_2003(_examples) # also removes misc.\n", + " _examples = convert_to_conll_2003(_examples) # also removes misc.\n", " table = create_dataframe(_examples, mdl, n_rep=100, n_samples=1000)\n", " table[\"Augmentation\"] = aug_name\n", " tables.append(table)" @@ -1694,7 +1725,7 @@ }, "outputs": [], "source": [ - "df = pd.concat(tables)\n" + "df = pd.concat(tables)" ] }, { @@ -1709,7 +1740,6 @@ "source": [ "# create the table\n", "def create_table(df, model_order: list[str], baseline=df_average):\n", - "\n", " table_df = df[[\"Models\", \"Augmentation\", \"Average\"]]\n", "\n", " table_df = table_df.pivot(index=\"Models\", columns=\"Augmentation\", values=\"Average\")\n", @@ -1722,7 +1752,6 @@ " # order the columns\n", " table_df = table_df[[\"Baseline\"] + list(table_df.columns[:-1])]\n", "\n", - "\n", " # create augmentation superheader\n", "\n", " aug_superheader = [(\"\", \"Baseline\")]\n", @@ -1736,7 +1765,9 @@ " s = s.apply(underline_second_max, axis=0, subset=df.columns[1:])\n", "\n", " # Add a caption\n", - " s = s.set_caption(\"F1 score for each augmentation with 95% confidence interval calculated over 100 repetitions\")\n", + " s = s.set_caption(\n", + " \"F1 score for each augmentation with 95% confidence interval calculated over 100 repetitions\"\n", + " )\n", "\n", " # Center the header and left align the model names\n", " s = s.set_properties(subset=df.columns[1:], **{\"text-align\": \"right\"})\n", @@ -1753,8 +1784,7 @@ " s = s.hide(axis=\"index\")\n", " # smaller font\n", " s = s.set_table_attributes('style=\"font-size: 0.65em\"')\n", - " return s\n", - "\n" + " return s" ] }, { @@ -1996,7 +2026,7 @@ "\n", " aug_group = augmentation_specific_examples(examples)\n", " for aug_name, _examples in aug_group.items():\n", - " _examples = convert_to_conll_2003(_examples) # also removes misc.\n", + " _examples = convert_to_conll_2003(_examples) # also removes misc.\n", " table = create_dataframe(_examples, mdl, n_rep=100, n_samples=1000)\n", " table[\"Augmentation\"] = aug_name\n", " tables.append(table)" @@ -2226,7 +2256,9 @@ " examples = dane[mdl_name][\"examples\"]\n", " n_words = sum(len(e.y) for e in examples)\n", " wps = n_words / total_time\n", - " rows.append({\"Model\": mdl_name, \"Words per second\": wps, \"Total time (sec)\": total_time})\n", + " rows.append(\n", + " {\"Model\": mdl_name, \"Words per second\": wps, \"Total time (sec)\": total_time}\n", + " )\n", "\n", "speed = pd.DataFrame(rows)" ] @@ -2347,21 +2379,25 @@ " is_min = s == s.min()\n", " return [\"font-weight: bold\" if v else \"\" for v in is_min]\n", "\n", + "\n", "def highlight_max(s):\n", " \"\"\"highlight the minimum in a series with bold\"\"\"\n", " is_max = s == s.max()\n", " return [\"font-weight: bold\" if v else \"\" for v in is_max]\n", "\n", - "style= style.apply(highlight_min, axis=0, subset=[\"Total time (sec)\"])\n", + "\n", + "style = style.apply(highlight_min, axis=0, subset=[\"Total time (sec)\"])\n", "style = style.apply(highlight_max, axis=0, subset=[\"Words per second\"])\n", "\n", - "style = style.set_properties(subset=[\"Words per second\", \"Total time (sec)\"], **{\"text-align\": \"right\"})\n", + "style = style.set_properties(\n", + " subset=[\"Words per second\", \"Total time (sec)\"], **{\"text-align\": \"right\"}\n", + ")\n", "# set decimal places\n", "style = style.format({\"Words per second\": \"{:.1f}\", \"Total time (sec)\": \"{:.2f}\"})\n", "\n", "style 
= style.hide(axis=\"index\")\n", "style = style.set_properties(subset=[\"Model\"], **{\"text-align\": \"left\"})\n", - "style\n" + "style" ] }, { diff --git a/docs/tutorials/basic.ipynb b/docs/tutorials/basic.ipynb index e3076941..01568b5f 100644 --- a/docs/tutorials/basic.ipynb +++ b/docs/tutorials/basic.ipynb @@ -46,6 +46,7 @@ ], "source": [ "import dacy\n", + "\n", "for model in dacy.models():\n", " print(model)" ] @@ -352,20 +353,18 @@ "metadata": {}, "outputs": [], "source": [ - "\n", "displacy.render(doc, style=\"ent\")\n", "\n", "\n", - "client = Client() # start wikidata client\n", + "client = Client() # start wikidata client\n", "for entity in doc.ents:\n", " print(entity, \":\", entity.kb_id_)\n", "\n", " # print the short description derived from wikidata\n", - " wikidata_entry = client.get(entity.kb_id_, load=True)\n", + " wikidata_entry = client.get(entity.kb_id_, load=True)\n", " print(wikidata_entry.description.get(\"en\"))\n", " print(wikidata_entry.description.get(\"da\"))\n", - " print(\" \")\n", - " \n" + " print(\" \")" ] }, { @@ -443,7 +442,7 @@ "# add the ner component from the state-of-the-art fine-grained model\n", "nlp.add_pipe(\"dacy/ner-fine-grained\", config={\"size\": \"small\"})\n", "# or if you only want to do just NER\n", - "# nlp = dacy.load(\"da_dacy_small_ner_fine_grained-0.1.0\")\n" + "# nlp = dacy.load(\"da_dacy_small_ner_fine_grained-0.1.0\")" ] }, { @@ -485,7 +484,9 @@ } ], "source": [ - "doc = nlp(\"Denne model samt 3 andre blev trænet d. 7. marts af Center for Humantities Computing i Aarhus kommune\")\n", + "doc = nlp(\n", + " \"Denne model samt 3 andre blev trænet d. 7. marts af Center for Humantities Computing i Aarhus kommune\"\n", + ")\n", "\n", "displacy.render(doc, style=\"ent\")" ] @@ -535,8 +536,7 @@ "source": [ "print(\"Token POS-tag\")\n", "for token in doc:\n", - " print(f\"{token}:\\t {token.pos_}\")\n", - "\n" + " print(f\"{token}:\\t {token.pos_}\")" ] }, { @@ -713,7 +713,9 @@ } ], "source": [ - "doc = nlp(\"Sætnings segmentering er en vigtig del af sprogprocessering - Det kan bl.a. benyttes til at opdele lange tekster i mindre bidder uden at miste meningen i hvert sætning.\")\n", + "doc = nlp(\n", + " \"Sætnings segmentering er en vigtig del af sprogprocessering - Det kan bl.a. benyttes til at opdele lange tekster i mindre bidder uden at miste meningen i hvert sætning.\"\n", + ")\n", "\n", "for sent in doc.sents:\n", " print(sent)" @@ -839,7 +841,7 @@ "text = \"Den 4. november 2020 fik minkavler Henning Christensen og hele familien et chok. Efter et pressemøde, fik han at vide at alle mink i Danmark skulle aflives. 
Dermed fik han fjernet hans livsgrundlag\"\n", "doc = nlp(text)\n", "print(\"Coreference clusters:\")\n", - "print(doc.spans)\n" + "print(doc.spans)" ] }, { diff --git a/docs/tutorials/hate-speech.ipynb b/docs/tutorials/hate-speech.ipynb index 22c1bf0f..01260862 100644 --- a/docs/tutorials/hate-speech.ipynb +++ b/docs/tutorials/hate-speech.ipynb @@ -82,7 +82,7 @@ "import dacy\n", "import spacy\n", "\n", - "nlp = spacy.blank(\"da\") # create an empty pipeline\n", + "nlp = spacy.blank(\"da\") # create an empty pipeline\n", "\n", "# add the hate speech models\n", "nlp.add_pipe(\"dacy/hatespeech_detection\")\n", @@ -118,10 +118,7 @@ } ], "source": [ - "texts = [\n", - " \"senile gamle idiot\", \n", - " \"hej har du haft en god dag\"\n", - "]\n", + "texts = [\"senile gamle idiot\", \"hej har du haft en god dag\"]\n", "\n", "# apply the pipeline\n", "docs = nlp.pipe(texts)\n", @@ -131,7 +128,7 @@ " print(doc._.is_offensive)\n", " # print type of hate-speech if it is hate-speech\n", " if doc._.is_offensive == \"offensive\":\n", - " print(\"\\t\", doc._.hate_speech_type)\n" + " print(\"\\t\", doc._.hate_speech_type)" ] } ], diff --git a/docs/tutorials/robustness.ipynb b/docs/tutorials/robustness.ipynb index 4832141d..30d48e3e 100644 --- a/docs/tutorials/robustness.ipynb +++ b/docs/tutorials/robustness.ipynb @@ -360,13 +360,16 @@ } ], "source": [ - "\n", "lower_aug = create_lower_casing_augmenter(level=1)\n", "female_name_dict = female_names()\n", "# Augmenter that replaces names with random Danish female names. Keep the format of the name as is (force_pattern_size=False)\n", "# but replace the name with one of the two defined patterns\n", "\n", - "patterns = [[\"firstname\"], [\"firstname\", \"lastname\"], [\"firstname\", \"firstname\", \"lastname\"]]\n", + "patterns = [\n", + " [\"firstname\"],\n", + " [\"firstname\", \"lastname\"],\n", + " [\"firstname\", \"firstname\", \"lastname\"],\n", + "]\n", "female_aug = create_per_replace_augmenter_v1(female_name_dict, patterns, level=0.1)\n", "\n", "spacy_aug = score(\n", diff --git a/docs/tutorials/sentiment.ipynb b/docs/tutorials/sentiment.ipynb index cdeadef5..a680afe7 100644 --- a/docs/tutorials/sentiment.ipynb +++ b/docs/tutorials/sentiment.ipynb @@ -79,7 +79,7 @@ "import dacy\n", "import spacy\n", "\n", - "nlp = spacy.blank(\"da\") # an empty spacy pipeline\n", + "nlp = spacy.blank(\"da\") # an empty spacy pipeline\n", "# could also be a dacy pipeline, e.g. nlp = dacy.load(\"large\")\n", "nlp.add_pipe(\"dacy/subjectivity\")" ] @@ -159,7 +159,7 @@ } ], "source": [ - "nlp = spacy.blank(\"da\") # an empty spacy pipeline\n", + "nlp = spacy.blank(\"da\") # an empty spacy pipeline\n", "# could also be a dacy pipeline, e.g. nlp = dacy.load(\"large\")\n", "nlp.add_pipe(\"dacy/polarity\")" ] @@ -256,10 +256,10 @@ } ], "source": [ - "nlp = spacy.blank(\"da\") # an empty spacy pipeline\n", + "nlp = spacy.blank(\"da\") # an empty spacy pipeline\n", "# could also be a dacy pipeline, e.g. nlp = dacy.load(\"large\")\n", - "nlp.add_pipe(\"dacy/emotionally_laden\") # for emotianal/non-emotional\n", - "nlp.add_pipe(\"dacy/emotion\") # for type of emotion" + "nlp.add_pipe(\"dacy/emotionally_laden\") # for emotianal/non-emotional\n", + "nlp.add_pipe(\"dacy/emotion\") # for type of emotion" ] }, { @@ -298,7 +298,7 @@ " \"Ej den bil er såå flot\",\n", " \"Fuck det er bare så FUCKING træls!\",\n", " \"Har i set at Tesla har landet en raket på månen? 
Det er vildt!!\",\n", - " \"der er et træ i haven\"\n", + " \"der er et træ i haven\",\n", "]\n", "\n", "docs = nlp.pipe(texts)\n", @@ -393,7 +393,9 @@ ], "source": [ "for token in doc:\n", - " print(f\"{token._.polarity} | Valence: {token._.valence} | Negation: {token._.is_negation}\")" + " print(\n", + " f\"{token._.polarity} | Valence: {token._.valence} | Negation: {token._.is_negation}\"\n", + " )" ] }, { diff --git a/docs/tutorials/textdescriptives.ipynb b/docs/tutorials/textdescriptives.ipynb index 6090b3ea..0892c5c3 100644 --- a/docs/tutorials/textdescriptives.ipynb +++ b/docs/tutorials/textdescriptives.ipynb @@ -183,7 +183,8 @@ ], "source": [ "import dacy\n", - "nlp = dacy.load(\"small\") # load the latest version of the small model\n", + "\n", + "nlp = dacy.load(\"small\") # load the latest version of the small model\n", "\n", "nlp.add_pipe(\"textdescriptives/readability\")\n", "nlp.add_pipe(\"textdescriptives/dependency_distance\")" @@ -230,6 +231,7 @@ ], "source": [ "import textdescriptives as td\n", + "\n", "# extract the metrics as a dataframe\n", "metrics = td.extract_df(doc, include_text=False)" ] @@ -523,6 +525,7 @@ ], "source": [ "import seaborn as sns\n", + "\n", "sns.boxplot(x=\"label\", y=\"lix\", data=df)" ] }, @@ -563,7 +566,9 @@ "# encode the label as a boolean\n", "df[\"is_ham\"] = df[\"label\"] == \"ham\"\n", "# compute the correlation between all metrics and the label\n", - "metrics_correlations = metrics.corrwith(df[\"is_ham\"]).sort_values(key=abs, ascending=False)\n", + "metrics_correlations = metrics.corrwith(df[\"is_ham\"]).sort_values(\n", + " key=abs, ascending=False\n", + ")\n", "metrics_correlations[:10]" ] }, diff --git a/makefile b/makefile index e94def5b..c10f5b5e 100644 --- a/makefile +++ b/makefile @@ -8,7 +8,6 @@ static-type-check: lint: @echo "--- 🧹 Running linters ---" - pyproject-parser check pyproject.toml # check pyproject.toml ruff format . # running ruff formatting ruff . 
--fix # running ruff linting diff --git a/pyproject.toml b/pyproject.toml index 818c224e..0627c5e2 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -50,9 +50,8 @@ name = "Apache License 2.0" [project.optional-dependencies] dev = [ "cruft>=2.0.0", - "pyright==1.1.328", - "ruff>=0.0.262", - "pyproject-parser[cli, readme]>=0.9.1", + "pyright>=1.1.328", + "ruff>=0.0.270", ] tests = ["pytest>=7.1.2", "pytest-cov>=3.0.0", "pytest-instafail>=0.4.2"] docs = [ @@ -190,8 +189,9 @@ exclude = [ dummy-variable-rgx = "^(_+|(_+[a-zA-Z0-9_]*[a-zA-Z0-9]+?))$" target-version = "py38" -tool.ruff.lint.pydocstyle] +[tool.ruff.lint.pydocstyle] convention = "google" + [tool.ruff.flake8-annotations] mypy-init-return = true suppress-none-returning = true @@ -208,4 +208,4 @@ version_toml = ["pyproject.toml:project.version"] build_command = "python -m pip install build; python -m build" [tool.setuptools] -include-package-data = true \ No newline at end of file +include-package-data = true From cac4d92fc50569f5658dfae2039584c1c5ddbbff Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Wed, 6 Dec 2023 21:17:59 +0100 Subject: [PATCH 5/6] changed type checker to pyright --- makefile | 2 +- pyproject.toml | 2 +- src/dacy/datasets/dane.py | 8 ++++---- src/dacy/datasets/names.py | 14 +++++++------- src/dacy/download.py | 12 ++++++------ src/dacy/hate_speech/wrapped_models.py | 10 +++++----- src/dacy/load.py | 4 ++-- src/dacy/ner/fine_grained.py | 6 +++--- src/dacy/score/input_length.py | 6 +++--- src/dacy/score/score.py | 10 +++++----- src/dacy/sentiment/wrapped_models.py | 10 +++++----- 11 files changed, 42 insertions(+), 42 deletions(-) diff --git a/makefile b/makefile index c10f5b5e..d662f628 100644 --- a/makefile +++ b/makefile @@ -4,7 +4,7 @@ install: static-type-check: @echo "--- 🔍 Running static type check ---" - pyright . + pyright src/ lint: @echo "--- 🧹 Running linters ---" diff --git a/pyproject.toml b/pyproject.toml index 0627c5e2..0c62e71b 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -50,7 +50,7 @@ name = "Apache License 2.0" [project.optional-dependencies] dev = [ "cruft>=2.0.0", - "pyright>=1.1.328", + "pyright>=1.1.339", "ruff>=0.0.270", ] tests = ["pytest>=7.1.2", "pytest-cov>=3.0.0", "pytest-instafail>=0.4.2"] diff --git a/src/dacy/datasets/dane.py b/src/dacy/datasets/dane.py index d3dfb3c6..e1332aae 100644 --- a/src/dacy/datasets/dane.py +++ b/src/dacy/datasets/dane.py @@ -14,13 +14,13 @@ def dane( # noqa - save_path: Optional[PathLike] = None, - splits: List[str] = ["train", "dev", "test"], # noqa + save_path: Optional[PathLike] = None, # type: ignore + splits: List[str] = ["train", "dev", "test"], # noqa # type: ignore redownload: bool = False, n_sents: int = 1, open_unverified_connection: bool = False, **kwargs, # noqa -) -> Union[List[Corpus], Corpus]: +) -> Union[List[Corpus], Corpus]: # type: ignore """Reads the DaNE dataset as a spacy Corpus. 
Args: @@ -110,5 +110,5 @@ def dane( # noqa for split in splits: corpora.append(Corpus(save_path / paths[split])) # type: ignore if len(corpora) == 1: - return corpora[0] + return corpora[0] # type: ignore return corpora diff --git a/src/dacy/datasets/names.py b/src/dacy/datasets/names.py index 8c0f716a..06365ae4 100644 --- a/src/dacy/datasets/names.py +++ b/src/dacy/datasets/names.py @@ -8,10 +8,10 @@ def load_names( min_count: int = 0, - ethnicity: Optional[str] = None, - gender: Optional[str] = None, + ethnicity: Optional[str] = None, # type: ignore + gender: Optional[str] = None, # type: ignore min_prop_gender: float = 0, -) -> Dict[str, List[str]]: +) -> Dict[str, List[str]]: # type: ignore """Loads the names lookup table. Danish are from Danmarks statistik (2021). Muslim names are from Meldgaard (2005), https://nors.ku.dk/publikationer/webpublikationer/muslimske_fornavne/. @@ -64,7 +64,7 @@ def load_names( } -def muslim_names() -> Dict[str, List[str]]: +def muslim_names() -> Dict[str, List[str]]: # type: ignore """Returns a dictionary of Muslim names. Returns: @@ -81,7 +81,7 @@ def muslim_names() -> Dict[str, List[str]]: return load_names(ethnicity="muslim") -def danish_names() -> Dict[str, List[str]]: +def danish_names() -> Dict[str, List[str]]: # type: ignore """Returns a dictionary of Danish names. Returns: @@ -98,7 +98,7 @@ def danish_names() -> Dict[str, List[str]]: return load_names(ethnicity="danish") -def female_names() -> Dict[str, List[str]]: +def female_names() -> Dict[str, List[str]]: # type: ignore """Returns a dictionary of Danish female names. Returns: @@ -114,7 +114,7 @@ def female_names() -> Dict[str, List[str]]: return load_names(ethnicity="danish", gender="female", min_prop_gender=0.5) -def male_names() -> Dict[str, List[str]]: +def male_names() -> Dict[str, List[str]]: # type: ignore """Returns a dictionary of Danish male names. 
Returns: diff --git a/src/dacy/download.py b/src/dacy/download.py index b602101a..45f98323 100644 --- a/src/dacy/download.py +++ b/src/dacy/download.py @@ -4,7 +4,7 @@ from pathlib import Path from spacy.util import get_installed_models -from tqdm import tqdm +from tqdm import tqdm # type: ignore DACY_DEFAULT_PATH = Path.home() / ".dacy" @@ -40,10 +40,10 @@ def get_latest_version(model: str) -> str: versions = [mdl.split("-")[-1] for mdl in models_url if mdl.startswith(model)] versions = sorted( versions, - key=lambda s: [int(u) for u in s.split(".")], + key=lambda s: [int(u) for u in s.split(".")], # type: ignore reverse=True, ) - return versions[0] + return versions[0] # type: ignore def models() -> list[str]: @@ -69,7 +69,7 @@ def download_url(url: str, output_path: str) -> None: unit="B", unit_scale=True, miniters=1, - desc=url.split("/")[-1], + desc=url.split("/")[-1], # type: ignore ) as t: urllib.request.urlretrieve(url, filename=output_path, reporthook=t.update_to) @@ -104,7 +104,7 @@ def download_model( if model in {"small", "medium", "large"}: latest_version = get_latest_version(model) model = f"da_dacy_{model}_trf-{latest_version}" - mdl_version = model.split("-")[-1] + mdl_version = model.split("-")[-1] # type: ignore if model not in models_url: raise ValueError( @@ -112,7 +112,7 @@ def download_model( + " list of all models", ) - mdl = model.split("-")[0] + mdl = model.split("-")[0] # type: ignore if mdl in get_installed_models() and not force and version(mdl) == mdl_version: return mdl install(models_url[model]) diff --git a/src/dacy/hate_speech/wrapped_models.py b/src/dacy/hate_speech/wrapped_models.py index b4818437..86383ea0 100644 --- a/src/dacy/hate_speech/wrapped_models.py +++ b/src/dacy/hate_speech/wrapped_models.py @@ -76,11 +76,11 @@ def make_offensive_transformer( nlp: Language, name: str, model: Model[List[Doc], FullTransformerBatch], - set_extra_annotations: Callable[[List[Doc], FullTransformerBatch], None], + set_extra_annotations: Callable[[List[Doc], FullTransformerBatch], None], # type: ignore max_batch_items: int, doc_extension_trf_data: str, doc_extension_prediction: str, - labels: List[str], + labels: List[str], # type: ignore ) -> SequenceClassificationTransformer: if not Doc.has_extension("is_offensive"): warn( @@ -107,11 +107,11 @@ def make_offensive_transformer( # offensive if Doc.has_extension("is_offensive"): - def label_getter(doc) -> Optional[str]: # noqa + def label_getter(doc) -> Optional[str]: # noqa # type: ignore if doc._.is_offensive == "offensive": - prob = getattr(doc._, f"{doc_extension_prediction}_prob") + prob = getattr(doc._, f"{doc_extension_prediction}_prob") # type: ignore if prob["prob"] is not None: - return labels[int(prob["prob"].argmax())] + return labels[int(prob["prob"].argmax())] # type: ignore return doc._.is_offensive Doc.set_extension(doc_extension_prediction, getter=label_getter, force=True) diff --git a/src/dacy/load.py b/src/dacy/load.py index 3e25c99f..52cedb6e 100644 --- a/src/dacy/load.py +++ b/src/dacy/load.py @@ -12,7 +12,7 @@ def load( model: str, force: bool = False, - **kwargs: Any, + **kwargs: Any, # type: ignore ) -> Language: """Load a DaCy model as a SpaCy text processing pipeline. If the model is not downloaded it will also download the model. @@ -38,7 +38,7 @@ def load( return spacy.load(path, **kwargs) -def where_is_my_dacy(verbose: bool = True) -> Union[str, Path]: +def where_is_my_dacy(verbose: bool = True) -> Union[str, Path]: # type: ignore """Returns a path to where DaCy models are located. 
The default the model location can be configured with the environmental variable `DACY_CACHE_DIR`. diff --git a/src/dacy/ner/fine_grained.py b/src/dacy/ner/fine_grained.py index 049c62d7..8ff01252 100644 --- a/src/dacy/ner/fine_grained.py +++ b/src/dacy/ner/fine_grained.py @@ -18,10 +18,10 @@ def create_finegrained_ner_component( nlp: Language, name: str, - size: Literal["small", "medium", "large"], + size: Literal["small", "medium", "large"], # type: ignore transformer_name: str, - version: Optional[str], -) -> Callable[[Doc], Doc]: + version: Optional[str], # type: ignore +) -> Callable[[Doc], Doc]: # type: ignore """Create a fine grained NER component using the dacy models. Args: diff --git a/src/dacy/score/input_length.py b/src/dacy/score/input_length.py index 78eb68fe..32007a70 100644 --- a/src/dacy/score/input_length.py +++ b/src/dacy/score/input_length.py @@ -10,11 +10,11 @@ def n_sents_score( - n_sents: Union[int, List[int]], - apply_fn: Callable, + n_sents: Union[int, List[int]], # type: ignore + apply_fn: Callable, # type: ignore dataset: str = "dane", split: str = "test", - score_fn: List[Union[str, Callable]] = ["token", "pos", "ents", "dep"], # noqa + score_fn: List[Union[str, Callable]] = ["token", "pos", "ents", "dep"], # noqa # type: ignore verbose: bool = True, **kwargs, # noqa ) -> pd.DataFrame: diff --git a/src/dacy/score/score.py b/src/dacy/score/score.py index cb0913cc..634de5cb 100644 --- a/src/dacy/score/score.py +++ b/src/dacy/score/score.py @@ -3,7 +3,7 @@ from copy import copy from functools import partial -from time import time +from time import time # type: ignore from typing import Callable, Iterable import pandas as pd @@ -17,7 +17,7 @@ from ..utils import flatten_dict -def no_misc_getter(doc: Doc, attr: str) -> Iterable[Span]: +def no_misc_getter(doc: Doc, attr: str) -> Iterable[Span]: # type: ignore """A utility getter for scoring entities without including MISC. 
Args: @@ -27,7 +27,7 @@ def no_misc_getter(doc: Doc, attr: str) -> Iterable[Span]: Returns: Iterable[Span] """ - spans = getattr(doc, attr) + spans = getattr(doc, attr) # type: ignore for span in spans: if span.label_ == "MISC": continue @@ -35,7 +35,7 @@ def no_misc_getter(doc: Doc, attr: str) -> Iterable[Span]: def dep_getter(token, attr): # noqa - dep = getattr(token, attr) + dep = getattr(token, attr) # type: ignore dep = token.vocab.strings.as_string(dep).lower() return dep @@ -149,7 +149,7 @@ def __score(augmenter): # noqa: ANN001 corpus_ = copy(corpus) corpus_.augmenter = augmenter scores_ls = [] - for _i in range(k): + for _i in range(k): # type: ignore s = time() examples = apply_fn(corpus_(nlp)) # type: ignore speed = time() - s diff --git a/src/dacy/sentiment/wrapped_models.py b/src/dacy/sentiment/wrapped_models.py index a4cae25a..5e8ada9e 100644 --- a/src/dacy/sentiment/wrapped_models.py +++ b/src/dacy/sentiment/wrapped_models.py @@ -133,11 +133,11 @@ def make_emotion_transformer( nlp: Language, name: str, model: Model[List[Doc], FullTransformerBatch], - set_extra_annotations: Callable[[List[Doc], FullTransformerBatch], None], + set_extra_annotations: Callable[[List[Doc], FullTransformerBatch], None], # type: ignore max_batch_items: int, doc_extension_trf_data: str, doc_extension_prediction: str, - labels: List[str], + labels: List[str], # type: ignore ) -> SequenceClassificationTransformer: if not Doc.has_extension("dacy/emotionally_laden"): warn( @@ -164,11 +164,11 @@ def make_emotion_transformer( # an emotion if Doc.has_extension("dacy/emotionally_laden"): - def label_getter(doc) -> Optional[str]: # noqa: ANN001 + def label_getter(doc) -> Optional[str]: # noqa: ANN001 # type: ignore if doc._.emotionally_laden == "emotional": - prob = getattr(doc._, f"{doc_extension_prediction}_prob") + prob = getattr(doc._, f"{doc_extension_prediction}_prob") # type: ignore if prob["prob"] is not None: - return labels[int(prob["prob"].argmax())] + return labels[int(prob["prob"].argmax())] # type: ignore return doc._.emotionally_laden Doc.set_extension(doc_extension_prediction, getter=label_getter, force=True) From 72afda1c2eccfb1b3b17887cc3e2c5bc97e2c0fc Mon Sep 17 00:00:00 2001 From: Kenneth Enevoldsen Date: Wed, 6 Dec 2023 21:25:10 +0100 Subject: [PATCH 6/6] ci: fix misspelled cmmand --- .github/workflows/static_type_checks.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/static_type_checks.yml b/.github/workflows/static_type_checks.yml index 04faedde..9975945a 100644 --- a/.github/workflows/static_type_checks.yml +++ b/.github/workflows/static_type_checks.yml @@ -31,4 +31,4 @@ jobs: - name: Run static type checker shell: bash run: | - make static-type-checks + make static-type-check