From aba4367b49750089e4e4122415a77cac43bd97bc Mon Sep 17 00:00:00 2001
From: Dirk Roorda <text.annotation@icloud.com>
Date: Thu, 9 Dec 2021 16:09:13 +0100
Subject: [PATCH] better metadata

---
 programs/phono.ipynb     | 610 ++++++++++++++++++++-------------------
 programs/phono.py        | 319 ++++++++++----------
 tf/2021/otext@phono.tf   |   6 +-
 tf/2021/phono.tf         |   7 +-
 tf/2021/phono_trailer.tf |   7 +-
 yaml/generic.yaml        |   3 +
 yaml/phono.yaml          |   5 +
 7 files changed, 486 insertions(+), 471 deletions(-)
 create mode 100644 yaml/generic.yaml
 create mode 100644 yaml/phono.yaml

diff --git a/programs/phono.ipynb b/programs/phono.ipynb
index bb23fe6..cc27d32 100644
--- a/programs/phono.ipynb
+++ b/programs/phono.ipynb
@@ -316,9 +316,11 @@
     "import os\n",
     "import collections\n",
     "import re\n",
+    "import yaml\n",
     "import utils\n",
     "from tf.fabric import Fabric\n",
-    "from tf.writing.transcription import Transcription"
+    "from tf.writing.transcription import Transcription\n",
+    "from tf.core.helpers import formatMeta"
    ]
   },
   {
@@ -334,7 +336,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -348,7 +350,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 3,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -383,7 +385,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -394,7 +396,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -403,7 +405,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -413,7 +415,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 7,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -436,7 +438,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 8,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -463,7 +465,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 9,
    "metadata": {},
    "outputs": [
     {
@@ -473,10 +475,10 @@
       "..............................................................................................\n",
       ".       0.00s Load the existing TF dataset                                                   .\n",
       "..............................................................................................\n",
-      "This is Text-Fabric 8.5.13\n",
+      "This is Text-Fabric 9.1.7\n",
       "Api reference : https://annotation.github.io/text-fabric/tf/cheatsheet.html\n",
       "\n",
-      "88 features found and 0 ignored\n"
+      "114 features found and 0 ignored\n"
      ]
     }
    ],
@@ -487,14 +489,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 10,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -505,7 +500,7 @@
      "text": [
       "  0.00s loading features ...\n",
       "   |     0.00s Dataset without structure sections in otext:no structure functions in the T-API\n",
-      "  4.38s All features loaded/computed - for details use loadLog()\n"
+      "    10s All features loaded/computed - for details use TF.isLoaded()\n"
      ]
     },
     {
@@ -525,7 +520,7 @@
        " ('Text', 'text', ('T Text',))]"
       ]
      },
-     "execution_count": 6,
+     "execution_count": 10,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -572,7 +567,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 11,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -593,7 +588,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 12,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -616,7 +611,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 13,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -637,7 +632,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 14,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -672,7 +667,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 15,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -682,7 +677,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 16,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -705,7 +700,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 17,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -741,7 +736,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 18,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -750,7 +745,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 19,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -796,7 +791,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 20,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -841,7 +836,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 21,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -913,7 +908,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 22,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -948,7 +943,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 23,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -958,7 +953,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 24,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -983,7 +978,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 25,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -994,7 +989,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 26,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1007,7 +1002,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 27,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1020,7 +1015,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 10,
+   "execution_count": 28,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1124,7 +1119,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 29,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1135,7 +1130,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 30,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1147,7 +1142,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 31,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1160,7 +1155,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 32,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1171,7 +1166,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 33,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1193,7 +1188,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 11,
+   "execution_count": 34,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1241,7 +1236,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 35,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1250,7 +1245,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 36,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1260,7 +1255,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 37,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1271,7 +1266,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 12,
+   "execution_count": 38,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1301,7 +1296,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 39,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1319,7 +1314,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 40,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1329,7 +1324,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 41,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1340,7 +1335,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 42,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1353,7 +1348,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 43,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1363,7 +1358,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 44,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1373,7 +1368,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 45,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1395,7 +1390,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 46,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1405,7 +1400,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 47,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1414,7 +1409,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 13,
+   "execution_count": 48,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1435,7 +1430,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 49,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1444,7 +1439,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
+   "execution_count": 50,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1545,7 +1540,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
+   "execution_count": 51,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1557,7 +1552,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 52,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1567,7 +1562,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 53,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1579,7 +1574,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 54,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1590,7 +1585,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 55,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1600,7 +1595,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 56,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1619,7 +1614,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 57,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1628,7 +1623,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 58,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1638,7 +1633,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 59,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1654,7 +1649,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 60,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1665,7 +1660,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 61,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1688,7 +1683,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 62,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1697,7 +1692,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 63,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1729,7 +1724,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
+   "execution_count": 64,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1817,7 +1812,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 65,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1850,7 +1845,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 66,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1861,7 +1856,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 67,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1871,7 +1866,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 68,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1881,7 +1876,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 69,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1891,7 +1886,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 70,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1907,7 +1902,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 71,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1917,7 +1912,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 72,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1927,7 +1922,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 17,
+   "execution_count": 73,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -1948,7 +1943,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 18,
+   "execution_count": 74,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1958,7 +1953,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 75,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1970,7 +1965,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 76,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1980,7 +1975,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 77,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -1991,7 +1986,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 78,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2002,7 +1997,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 79,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2012,7 +2007,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 80,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2022,7 +2017,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 81,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2069,7 +2064,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 82,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2087,7 +2082,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 19,
+   "execution_count": 83,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2127,7 +2122,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 84,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2136,7 +2131,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 20,
+   "execution_count": 85,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2173,7 +2168,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 86,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2182,7 +2177,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 87,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2209,7 +2204,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 88,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2222,7 +2217,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 21,
+   "execution_count": 89,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2251,7 +2246,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 22,
+   "execution_count": 90,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2263,13 +2258,6 @@
     "]"
    ]
   },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
   {
    "cell_type": "markdown",
    "metadata": {
@@ -2286,7 +2274,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 23,
+   "execution_count": 91,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2428,14 +2416,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 24,
+   "execution_count": 92,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2535,14 +2516,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 25,
+   "execution_count": 93,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2625,7 +2599,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 26,
+   "execution_count": 94,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2722,7 +2696,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 95,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2737,7 +2711,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 96,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2752,7 +2726,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 27,
+   "execution_count": 97,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2781,7 +2755,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 98,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2791,7 +2765,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 99,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2803,7 +2777,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 100,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2813,7 +2787,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 101,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2833,7 +2807,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 102,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -2856,7 +2830,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 28,
+   "execution_count": 103,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2909,9 +2883,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 104,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "|         11s \tLooking for non-verb qamets\n"
+     ]
+    }
+   ],
    "source": [
     "# find lexemes which have an occurrence with a qamets (except verbs)\n",
     "utils.caption(0, \"\\tLooking for non-verb qamets\")\n",
@@ -2921,7 +2903,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 29,
+   "execution_count": 105,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2930,8 +2912,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "|         48s \tLooking for non-verb qamets\n",
-      "|         50s \t4058 lexemes and 13452 unique occurrences\n"
+      "|         13s \t4056 lexemes and 13451 unique occurrences\n"
      ]
     }
    ],
@@ -2968,7 +2949,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 30,
+   "execution_count": 106,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -2977,8 +2958,8 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "|         55s \tFiltering lexemes with varied occurrences\n",
-      "|         56s \t161 interesting lexemes with 1704 unique occurrences\n"
+      "|         13s \tFiltering lexemes with varied occurrences\n",
+      "|         13s \t161 interesting lexemes with 1704 unique occurrences\n"
      ]
     }
    ],
@@ -3029,7 +3010,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 107,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -3047,7 +3028,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 108,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -3094,7 +3075,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 109,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -3110,7 +3091,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 31,
+   "execution_count": 110,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -3143,7 +3124,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 32,
+   "execution_count": 111,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -3152,14 +3133,14 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "|      1m 07s \tGuessing between gadol and qatan\n",
+      "|         13s \tGuessing between gadol and qatan\n",
       "\tJM/: Override for syllable 1: ā becomes o\n",
       "\tBJT/: Override for syllable 1: o becomes ā\n",
       "\tJWMM: Override for syllable 2:  becomes ā\n",
       "\tJHWNTN/: Override for syllable 2:  becomes ā\n",
       "\tJRB<M/: No override needed for syllable 1 which is ā\n",
-      "|      1m 07s \t107 lexemes with modified occurrences (224)\n",
-      "|      1m 07s \t0 patterns with conflicts\n"
+      "|         13s \t107 lexemes with modified occurrences (224)\n",
+      "|         13s \t0 patterns with conflicts\n"
      ]
     }
    ],
@@ -3220,7 +3201,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 112,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -3230,16 +3211,26 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 113,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "..............................................................................................\n",
+      ".         13s Generating data in two ways ...                                                .\n",
+      "..............................................................................................\n"
+     ]
+    }
+   ],
    "source": [
     "utils.caption(4, \"Generating data in two ways ... \")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 114,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -3249,9 +3240,39 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 115,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "|         14s \t 1000 verses 13316 62 0 21\n",
+      "|         16s \t 2000 verses 27407 123 2 79\n",
+      "|         17s \t 3000 verses 40963 174 5 125\n",
+      "|         18s \t 4000 verses 54143 242 8 143\n",
+      "|         19s \t 5000 verses 67151 308 13 171\n",
+      "|         20s \t 6000 verses 82448 394 15 196\n",
+      "|         22s \t 7000 verses 97551 457 17 254\n",
+      "|         23s \t 8000 verses 113748 529 18 287\n",
+      "|         24s \t 9000 verses 129602 573 20 327\n",
+      "|         26s \t10000 verses 146217 624 20 438\n",
+      "|         27s \t11000 verses 159809 749 20 487\n",
+      "|         28s \t12000 verses 174192 891 24 524\n",
+      "|         30s \t13000 verses 190555 1018 28 576\n",
+      "|         31s \t14000 verses 205104 1168 32 622\n",
+      "|         32s \t15000 verses 218610 1290 33 728\n",
+      "|         33s \t16000 verses 227944 1336 39 777\n",
+      "|         34s \t17000 verses 235635 1379 48 827\n",
+      "|         35s \t18000 verses 243258 1396 51 866\n",
+      "|         35s \t19000 verses 250709 1429 59 906\n",
+      "|         36s \t20000 verses 260118 1470 60 960\n",
+      "|         38s \t21000 verses 275083 1533 63 979\n",
+      "|         39s \t22000 verses 286442 1590 65 1007\n",
+      "|         40s \t23000 verses 301302 1645 66 1075\n"
+     ]
+    }
+   ],
    "source": [
     "stats = collections.Counter()\n",
     "nv = 0\n",
@@ -3281,7 +3302,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 33,
+   "execution_count": 116,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -3290,62 +3311,36 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "..............................................................................................\n",
-      ".      1m 15s Generating data in two ways ...                                                .\n",
-      "..............................................................................................\n",
-      "|      1m 16s \t 1000 verses 13315 62 0 21\n",
-      "|      1m 17s \t 2000 verses 27406 123 2 79\n",
-      "|      1m 19s \t 3000 verses 40962 174 5 125\n",
-      "|      1m 20s \t 4000 verses 54142 242 8 143\n",
-      "|      1m 21s \t 5000 verses 67150 308 13 171\n",
-      "|      1m 22s \t 6000 verses 82446 394 15 196\n",
-      "|      1m 24s \t 7000 verses 97549 457 17 254\n",
-      "|      1m 25s \t 8000 verses 113746 529 18 287\n",
-      "|      1m 26s \t 9000 verses 129600 573 20 327\n",
-      "|      1m 28s \t10000 verses 146215 624 20 438\n",
-      "|      1m 29s \t11000 verses 159807 749 20 487\n",
-      "|      1m 30s \t12000 verses 174191 891 24 524\n",
-      "|      1m 31s \t13000 verses 190554 1018 28 576\n",
-      "|      1m 33s \t14000 verses 205103 1168 32 622\n",
-      "|      1m 34s \t15000 verses 218609 1290 33 728\n",
-      "|      1m 35s \t16000 verses 227943 1336 39 777\n",
-      "|      1m 35s \t17000 verses 235633 1379 48 827\n",
-      "|      1m 36s \t18000 verses 243256 1396 51 866\n",
-      "|      1m 36s \t19000 verses 250708 1429 59 906\n",
-      "|      1m 37s \t20000 verses 260117 1470 60 960\n",
-      "|      1m 38s \t21000 verses 275084 1533 63 979\n",
-      "|      1m 39s \t22000 verses 286443 1590 65 1007\n",
-      "|      1m 41s \t23000 verses 301301 1645 66 1075\n",
-      "|      1m 41s \t23213 verses done 304799 1650 66 1081\n",
-      "|      1m 41s \t  270185 accents\n",
-      "|      1m 41s \t    9004 cleanup\n",
-      "|      1m 41s \t   45234 dagesh_forte\n",
-      "|      1m 41s \t   21509 dagesh_forte_lene\n",
-      "|      1m 41s \t   59611 dagesh_lene\n",
-      "|      1m 41s \t   16321 default_accent\n",
-      "|      1m 41s \t     969 fixit\n",
-      "|      1m 41s \t    2658 furtive_patah\n",
-      "|      1m 41s \t   28195 last_ml\n",
-      "|      1m 41s \t    2201 mappiq_heh\n",
-      "|      1m 41s \t   93897 mobile_schwa1\n",
-      "|      1m 41s \t    2255 mobile_schwa2\n",
-      "|      1m 41s \t     179 mobile_schwa3\n",
-      "|      1m 41s \t    7702 mobile_schwa4\n",
-      "|      1m 41s \t   25496 punct\n",
-      "|      1m 41s \t   25504 punctuation\n",
-      "|      1m 41s \t      66 qamets_prs_suppress_qatan\n",
-      "|      1m 41s \t    5257 qamets_qatan1\n",
-      "|      1m 41s \t     243 qamets_qatan2\n",
-      "|      1m 41s \t    1791 qamets_qatan3\n",
-      "|      1m 41s \t      28 qamets_qatan4a\n",
-      "|      1m 41s \t     256 qamets_qatan4b\n",
-      "|      1m 41s \t     209 qamets_qatan5\n",
-      "|      1m 41s \t    1081 qamets_qatan_corrections\n",
-      "|      1m 41s \t    1650 qamets_verb_suppress_qatan\n",
-      "|      1m 41s \t      12 rafe\n",
-      "|      1m 41s \t   21098 silent_aleph\n",
-      "|      1m 41s \t  304799 total\n",
-      "|      1m 41s \t  304795 trim\n"
+      "|         40s \t23213 verses done 304800 1650 66 1081\n",
+      "|         40s \t  270191 accents\n",
+      "|         40s \t    9006 cleanup\n",
+      "|         40s \t   45235 dagesh_forte\n",
+      "|         40s \t   21511 dagesh_forte_lene\n",
+      "|         40s \t   59612 dagesh_lene\n",
+      "|         40s \t   16322 default_accent\n",
+      "|         40s \t     968 fixit\n",
+      "|         40s \t    2658 furtive_patah\n",
+      "|         40s \t   28195 last_ml\n",
+      "|         40s \t    2201 mappiq_heh\n",
+      "|         40s \t   93898 mobile_schwa1\n",
+      "|         40s \t    2255 mobile_schwa2\n",
+      "|         40s \t     179 mobile_schwa3\n",
+      "|         40s \t    7702 mobile_schwa4\n",
+      "|         40s \t   25498 punct\n",
+      "|         40s \t   25498 punctuation\n",
+      "|         40s \t      66 qamets_prs_suppress_qatan\n",
+      "|         40s \t    5257 qamets_qatan1\n",
+      "|         40s \t     243 qamets_qatan2\n",
+      "|         40s \t    1791 qamets_qatan3\n",
+      "|         40s \t      28 qamets_qatan4a\n",
+      "|         40s \t     256 qamets_qatan4b\n",
+      "|         40s \t     209 qamets_qatan5\n",
+      "|         40s \t    1081 qamets_qatan_corrections\n",
+      "|         40s \t    1650 qamets_verb_suppress_qatan\n",
+      "|         40s \t      12 rafe\n",
+      "|         40s \t   21098 silent_aleph\n",
+      "|         40s \t  304800 total\n",
+      "|         40s \t  304796 trim\n"
      ]
     }
    ],
@@ -3379,9 +3374,19 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 117,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "|         40s 304800 items in phono\n",
+      "    40s Reading word\n",
+      "|         41s \t23213 lines\n"
+     ]
+    }
+   ],
    "source": [
     "utils.caption(0, \"{} items in phono\".format(len(phono_file)))\n",
     "word_test = []\n",
@@ -3397,7 +3402,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 35,
+   "execution_count": 118,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -3406,10 +3411,7 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "|      2m 22s 304799 items in phono\n",
-      " 2m 16s Reading word\n",
-      "|      2m 22s \t23213 lines\n",
-      "|      2m 22s \tOK: phono text and word info are CONSISTENT\n"
+      "|         41s \tOK: phono text and word info are CONSISTENT\n"
      ]
     }
    ],
@@ -3439,7 +3441,25 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 36,
+   "execution_count": 122,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "genericMetaPath = f\"{thisRepo}/yaml/generic.yaml\"\n",
+    "phonoMetaPath = f\"{thisRepo}/yaml/phono.yaml\"\n",
+    "# read as UTF-8 explicitly instead of relying on the platform default encoding\n",
+    "with open(genericMetaPath, encoding=\"utf-8\") as fh:\n",
+    "    genericMeta = yaml.load(fh, Loader=yaml.FullLoader)\n",
+    "    genericMeta[\"version\"] = VERSION\n",
+    "with open(phonoMetaPath, encoding=\"utf-8\") as fh:\n",
+    "    phonoMeta = formatMeta(yaml.load(fh, Loader=yaml.FullLoader))\n",
+    "# the empty-string key carries the generic metadata, the other keys are per feature\n",
+    "metaData = {\"\": genericMeta, **phonoMeta}"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 124,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -3449,7 +3469,7 @@
      "output_type": "stream",
      "text": [
       "..............................................................................................\n",
-      ".      2m 29s Writing TF phono features                                                      .\n",
+      ".      3m 09s Writing TF phono features                                                      .\n",
       "..............................................................................................\n"
      ]
     },
@@ -3459,7 +3479,7 @@
        "True"
       ]
      },
-     "execution_count": 36,
+     "execution_count": 124,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -3471,22 +3491,14 @@
     "    phono_trailer=dict(((ln[0], ln[2]) for ln in word_file if ln[0] is not None)),\n",
     ")\n",
     "edgeFeatures = {}\n",
-    "provenance = dict(\n",
-    "    source=\"Phono Notebook applied to BHSA Data\",\n",
-    "    coreData=\"BHSA\",\n",
-    "    coreVersion=VERSION,\n",
-    "    author=\"BHSA Data: Constantijn Sikkel; Phono Notebook: Dirk Roorda\",\n",
-    ")\n",
-    "metaData = {\n",
-    "    \"\": provenance,\n",
-    "    \"otext@phono\": {\n",
-    "        \"about\": \"Provides phonetic transcriptions to Hebrew Words\",\n",
-    "        \"see\": \"https://github.com/ETCBC/phono\",\n",
-    "        \"fmt:text-phono-full\": \"{phono}{phono_trailer}\",\n",
-    "    },\n",
-    "    \"phono\": dict(valueType=\"str\"),\n",
-    "    \"phono_trailer\": dict(valueType=\"str\"),\n",
+    "metaData[\"otext@phono\"] = {\n",
+    "    \"about\": \"Provides phonetic transcriptions to Hebrew Words\",\n",
+    "    \"see\": \"https://github.com/ETCBC/phono\",\n",
+    "    \"fmt:text-phono-full\": \"{phono}{phono_trailer}\",\n",
     "}\n",
+    "metaData[\"phono\"][\"valueType\"] = \"str\"\n",
+    "metaData[\"phono_trailer\"][\"valueType\"] = \"str\"\n",
+    "\n",
     "TF = Fabric(locations=thisTempTf, silent=True)\n",
     "TF.save(nodeFeatures=nodeFeatures, edgeFeatures=edgeFeatures, metaData=metaData)"
    ]
@@ -3504,7 +3516,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 37,
+   "execution_count": 125,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -3514,14 +3526,14 @@
      "output_type": "stream",
      "text": [
       "..............................................................................................\n",
-      ".      2m 34s Check differences with previous version                                        .\n",
+      ".      6m 08s Check differences with previous version                                        .\n",
       "..............................................................................................\n",
-      "|      2m 34s \t2 features to add\n",
-      "|      2m 34s \t\tphono\n",
-      "|      2m 34s \t\tphono_trailer\n",
-      "|      2m 34s \tno features to delete\n",
-      "|      2m 34s \t0 features in common\n",
-      "|      2m 34s Done\n"
+      "|      6m 08s \tno features to add\n",
+      "|      6m 08s \tno features to delete\n",
+      "|      6m 08s \t2 features in common\n",
+      "|      6m 08s phono                     ... no changes\n",
+      "|      6m 08s phono_trailer             ... no changes\n",
+      "|      6m 08s Done\n"
      ]
     }
    ],
@@ -3542,7 +3554,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 38,
+   "execution_count": 126,
    "metadata": {
     "lines_to_next_cell": 2
    },
@@ -3552,7 +3564,7 @@
      "output_type": "stream",
      "text": [
       "..............................................................................................\n",
-      ".      2m 38s Deliver data set to /Users/dirk/github/etcbc/phono/tf/2021                     .\n",
+      ".      6m 11s Deliver data set to /Users/werk/github/etcbc/phono/tf/2021                     .\n",
       "..............................................................................................\n"
      ]
     }
@@ -3572,34 +3584,41 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 127,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "..............................................................................................\n",
+      ".      6m 14s Load and compile the new TF features                                           .\n",
+      "..............................................................................................\n"
+     ]
+    }
+   ],
    "source": [
     "utils.caption(4, \"Load and compile the new TF features\")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 39,
+   "execution_count": 128,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "..............................................................................................\n",
-      ".      2m 41s Load and compile the new TF features                                           .\n",
-      "..............................................................................................\n",
-      "This is Text-Fabric 8.5.13\n",
+      "This is Text-Fabric 9.1.7\n",
       "Api reference : https://annotation.github.io/text-fabric/tf/cheatsheet.html\n",
       "\n",
-      "91 features found and 0 ignored\n",
+      "117 features found and 0 ignored\n",
       "  0.00s loading features ...\n",
       "   |     0.00s Dataset without structure sections in otext:no structure functions in the T-API\n",
-      "   |     0.65s T phono_trailer        from ~/github/etcbc/phono/tf/2021\n",
-      "   |     1.22s T phono                from ~/github/etcbc/phono/tf/2021\n",
-      "  5.79s All features loaded/computed - for details use loadLog()\n"
+      "   |     1.01s T phono                from ~/github/etcbc/phono/tf/2021\n",
+      "   |     0.60s T phono_trailer        from ~/github/etcbc/phono/tf/2021\n",
+      "    15s All features loaded/computed - for details use TF.isLoaded()\n"
      ]
     },
     {
@@ -3619,7 +3638,7 @@
        " ('Text', 'text', ('T Text',))]"
       ]
      },
-     "execution_count": 39,
+     "execution_count": 128,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -3632,48 +3651,34 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": []
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 129,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "..............................................................................................\n",
+      ".      6m 33s Basic tests                                                                    .\n",
+      "..............................................................................................\n"
+     ]
+    }
+   ],
    "source": [
     "utils.caption(4, \"Basic tests\")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 130,
    "metadata": {},
-   "outputs": [],
-   "source": [
-    "utils.caption(4, \"First verses in phonetic transcription\")\n",
-    "for v in F.otype.s(\"verse\")[0:10]:\n",
-    "    utils.caption(0, \"{} {}:{}\".format(*T.sectionFromNode(v)), continuation=True)\n",
-    "    utils.caption(0, T.text(L.d(v, \"word\"), fmt=\"text-phono-full\"), continuation=True)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 40,
-   "metadata": {
-    "lines_to_next_cell": 2
-   },
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
       "..............................................................................................\n",
-      ".      2m 56s Basic tests                                                                    .\n",
-      "..............................................................................................\n",
-      "..............................................................................................\n",
-      ".      2m 56s First verses in phonetc transcription                                          .\n",
+      ".      6m 36s First verses in phonetic transcription                                         .\n",
       "..............................................................................................\n",
       "Genesis 1:1\n",
       "bᵊrēšˌîṯ bārˈā ʔᵉlōhˈîm ʔˌēṯ haššāmˌayim wᵊʔˌēṯ hāʔˈāreṣ . \n",
@@ -3694,9 +3699,30 @@
       "Genesis 1:9\n",
       "wayyˈōmer ʔᵉlōhˈîm yiqqāwˌû hammˈayim mittˈaḥaṯ haššāmˈayim ʔel-māqˈôm ʔeḥˈāḏ wᵊṯērāʔˌeh hayyabbāšˈā wˈayᵊhî-ḵˈēn . \n",
       "Genesis 1:10\n",
-      "wayyiqrˌā ʔᵉlōhˈîm layyabbāšˌā ʔˈereṣ ûlᵊmiqwˌē hammˌayim qārˈā yammˈîm wayyˌar ʔᵉlōhˌîm kî-ṭˈôv . \n",
+      "wayyiqrˌā ʔᵉlōhˈîm layyabbāšˌā ʔˈereṣ ûlᵊmiqwˌē hammˌayim qārˈā yammˈîm wayyˌar ʔᵉlōhˌîm kî-ṭˈôv . \n"
+     ]
+    }
+   ],
+   "source": [
+    "utils.caption(4, \"First verses in phonetic transcription\")\n",
+    "for v in F.otype.s(\"verse\")[0:10]:\n",
+    "    utils.caption(0, \"{} {}:{}\".format(*T.sectionFromNode(v)), continuation=True)\n",
+    "    utils.caption(0, T.text(L.d(v, \"word\"), fmt=\"text-phono-full\"), continuation=True)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 131,
+   "metadata": {
+    "lines_to_next_cell": 2
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
       "..............................................................................................\n",
-      ".      2m 56s First verse in all formats                                                     .\n",
+      ".      6m 41s First verse in all formats                                                     .\n",
       "..............................................................................................\n",
       "lex-orig-full\n",
       "\tבְּ רֵאשִׁית בָּרָא אֱלֹה אֵת הַ שָּׁמַי וְ אֵת הָ אָרֶץ \n",
@@ -4892,7 +4918,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.9.5"
+   "version": "3.10.0"
   },
   "widgets": {
    "application/vnd.jupyter.widget-state+json": {
diff --git a/programs/phono.py b/programs/phono.py
index 7491cab..30285e1 100644
--- a/programs/phono.py
+++ b/programs/phono.py
@@ -290,16 +290,18 @@
 import os
 import collections
 import re
+import yaml
 import utils
 from tf.fabric import Fabric
 from tf.writing.transcription import Transcription
+from tf.core.helpers import formatMeta
 
 
 # # Pipeline
 # See [operation](https://github.com/ETCBC/pipeline/blob/master/README.md#operation)
 # for how to run this script in the pipeline.
 
-# In[ ]:
+# In[2]:
 
 
 if "SCRIPT" not in locals():
@@ -310,7 +312,7 @@
     VERSION = "2021"
 
 
-# In[2]:
+# In[3]:
 
 
 def stop(good=False):
@@ -328,7 +330,7 @@ def stop(good=False):
 # The conversion is executed in an environment of directories, so that sources, temp files and
 # results are in convenient places and do not have to be shifted around.
 
-# In[ ]:
+# In[4]:
 
 
 repoBase = os.path.expanduser("~/github/etcbc")
@@ -336,20 +338,20 @@ def stop(good=False):
 thisRepo = "{}/{}".format(repoBase, NAME)
 
 
-# In[ ]:
+# In[5]:
 
 
 coreTf = "{}/tf/{}".format(coreRepo, VERSION)
 
 
-# In[ ]:
+# In[6]:
 
 
 thisTemp = "{}/_temp/{}".format(thisRepo, VERSION)
 thisTempTf = "{}/tf".format(thisTemp)
 
 
-# In[3]:
+# In[7]:
 
 
 thisTf = "{}/tf/{}".format(thisRepo, VERSION)
@@ -360,7 +362,7 @@ def stop(good=False):
 # Check whether this conversion is needed in the first place.
 # Only when run as a script.
 
-# In[4]:
+# In[8]:
 
 
 if SCRIPT:
@@ -375,20 +377,14 @@ def stop(good=False):
 
 # # Load the TF data
 
-# In[5]:
+# In[9]:
 
 
 utils.caption(4, "Load the existing TF dataset")
 TF = Fabric(locations=coreTf, modules=[""])
 
 
-# In[ ]:
-
-
-
-
-
-# In[6]:
+# In[10]:
 
 
 api = TF.load(
@@ -413,7 +409,7 @@ def stop(good=False):
 
 # ## Patterns
 
-# In[ ]:
+# In[11]:
 
 
 # punctuation
@@ -431,7 +427,7 @@ def stop(good=False):
 )
 
 
-# In[ ]:
+# In[12]:
 
 
 split_punctuation = re.compile(
@@ -451,7 +447,7 @@ def stop(good=False):
 )
 
 
-# In[ ]:
+# In[13]:
 
 
 start_punct = re.compile(
@@ -469,7 +465,7 @@ def stop(good=False):
 )
 
 
-# In[ ]:
+# In[14]:
 
 
 noorigspace = re.compile(
@@ -496,14 +492,14 @@ def stop(good=False):
 # So: set_pet to be used before phono(), in get_orig, but only if get_orig is
 # used for phono().
 
-# In[ ]:
+# In[15]:
 
 
 set_pet_pattern = re.compile(r"((?:0[05])?)(_[SNP])+\Z")
 tetra_lex = "JHWH/"
 
 
-# In[7]:
+# In[16]:
 
 
 def set_pet_pattern_repl(match):
@@ -514,7 +510,7 @@ def set_pet_pattern_repl(match):
 
 # ## Actions
 
-# In[ ]:
+# In[17]:
 
 
 def get_orig(w, punct=True, set_pet=False, tetra=True, give_ketiv=False):
@@ -542,13 +538,13 @@ def get_orig(w, punct=True, set_pet=False, tetra=True, give_ketiv=False):
 # it turns out that too much is happening with accents, so I will "normalize" the accents for the
 # sake of looking up
 
-# In[ ]:
+# In[18]:
 
 
 digit = re.compile("[0-9]+")
 
 
-# In[ ]:
+# In[19]:
 
 
 def find_w(passage, orig, debug=False):
@@ -591,7 +587,7 @@ def find_w(passage, orig, debug=False):
     return results
 
 
-# In[8]:
+# In[20]:
 
 
 # partition a list of nodes into chunks
@@ -624,7 +620,7 @@ def partition_w(wnodes):
 # 
 # This is especially important for, but not only for, the BGDKPT letters.
 
-# In[ ]:
+# In[21]:
 
 
 specials = (
@@ -693,7 +689,7 @@ def partition_w(wnodes):
 )
 
 
-# In[9]:
+# In[22]:
 
 
 specials2 = (
@@ -716,14 +712,14 @@ def partition_w(wnodes):
 # 
 # The ``sound_dict`` is the resulting (ordered) mapping of all source characters to "phonetic" characters.
 
-# In[ ]:
+# In[23]:
 
 
 dagesh_lenes = {"b.", "g.", "d.", "k.", "p.", "t."}
 dagesh_lene_dict = dict()
 
 
-# In[ ]:
+# In[24]:
 
 
 irrelevant_accents = (
@@ -745,7 +741,7 @@ def partition_w(wnodes):
 )
 
 
-# In[ ]:
+# In[25]:
 
 
 known_accents = {
@@ -753,7 +749,7 @@ def partition_w(wnodes):
 }
 
 
-# In[ ]:
+# In[26]:
 
 
 primary_accents = {
@@ -763,7 +759,7 @@ def partition_w(wnodes):
 sound_dict2 = collections.OrderedDict()
 
 
-# In[ ]:
+# In[27]:
 
 
 for (sym, let, glyph) in specials:
@@ -773,7 +769,7 @@ def partition_w(wnodes):
         sound_dict[sym] = glyph
 
 
-# In[10]:
+# In[28]:
 
 
 for (sym, let, glyph) in specials2:
@@ -860,7 +856,7 @@ def partition_w(wnodes):
 # vowel1 is for before, vowel2 is for after, both are usable in look-behind conditions
 # vowel matches purely vowels of variable length, and is not usable in look-behind conditions
 
-# In[ ]:
+# In[29]:
 
 
 vowel1 = r"(?:(?::[ea@])|(?:w\.)|(?:[i;]j)|(?:ow)|(?:.[%@\^;aeiIou`]))"
@@ -868,7 +864,7 @@ def partition_w(wnodes):
 vowel = r"(?:(?::[ea@])|(?:w\.)|(?:[i;]j)|(?:ow)|(?:[%@\^;aeiIou`]))"
 
 
-# In[ ]:
+# In[30]:
 
 
 # lvowel are long vowels only (including compositions)
@@ -877,7 +873,7 @@ def partition_w(wnodes):
 svowel = r"(?:(?::[ea@])|(?:[%@\^;aeiIou`]))"
 
 
-# In[ ]:
+# In[31]:
 
 
 gadol = sound_dict["@"]
@@ -887,7 +883,7 @@ def partition_w(wnodes):
 e_like = {":", ":e", ";", ";j", "e", "i", "ij"}
 
 
-# In[ ]:
+# In[32]:
 
 
 # complex i/w vowel: the composite vowels with waw and yod, after translation
@@ -895,7 +891,7 @@ def partition_w(wnodes):
 complex_w_vowel = "".join(sound_dict[s] for s in {"ow"})
 
 
-# In[ ]:
+# In[33]:
 
 
 # consonants
@@ -909,7 +905,7 @@ def partition_w(wnodes):
 
 # accents
 
-# In[11]:
+# In[34]:
 
 
 acc = "[ˈˌ]"  # primary and secundary accent
@@ -935,20 +931,20 @@ def partition_w(wnodes):
 
 # rafe
 
-# In[ ]:
+# In[35]:
 
 
 rafe = re.compile(r"({b})\.,".format(b=bgdkpt))
 
 
-# In[ ]:
+# In[36]:
 
 
 def rafe_repl(match):
     return match.group(1)
 
 
-# In[ ]:
+# In[37]:
 
 
 # furtive patah
@@ -956,7 +952,7 @@ def rafe_repl(match):
 furtive_patah = re.compile(r"([x<]|(?:h\.))(?:[/!]?)a(?=\Z|[ &-])")
 
 
-# In[12]:
+# In[38]:
 
 
 def furtive_patah_repl(match):
@@ -969,7 +965,7 @@ def furtive_patah_repl(match):
 
 # explicit accents
 
-# In[ ]:
+# In[39]:
 
 
 # lets assume that any cantillation mark or accent indicates that the vowel is stressed
@@ -984,14 +980,14 @@ def furtive_patah_repl(match):
 condense_accents = re.compile("({v})([!/]+)".format(v=vowel))
 
 
-# In[ ]:
+# In[40]:
 
 
 def sep_accent_repl(match):
     return "~" + match.group(1)
 
 
-# In[ ]:
+# In[41]:
 
 
 def condense_accents_repl(match):
@@ -999,7 +995,7 @@ def condense_accents_repl(match):
     return accent + match.group(1)
 
 
-# In[ ]:
+# In[42]:
 
 
 # implicit accents
@@ -1009,21 +1005,21 @@ def condense_accents_repl(match):
 strip_accents = re.compile(r"[0-9*]")
 
 
-# In[ ]:
+# In[43]:
 
 
 # wrong last accents
 last_accent = re.compile(r"[/!]+(?=[ ]|\Z)")
 
 
-# In[ ]:
+# In[44]:
 
 
 def default_accent_repl(match):
     return "/" + match.group(1)
 
 
-# In[ ]:
+# In[45]:
 
 
 def punctuation_accent_repl(match):
@@ -1037,20 +1033,20 @@ def punctuation_accent_repl(match):
 # specials2 specify how punctuation (sof pasuq, paseq, interword setumah-petuhah are
 # translated).
 
-# In[ ]:
+# In[46]:
 
 
 phono_sep = re.compile("(.*?)([ {}]*)".format("".join(x[2] for x in specials2)))
 multiple_space = re.compile("  +")
 
 
-# In[ ]:
+# In[47]:
 
 
 verse_end_phono = re.compile(r"(\. *)\Z")
 
 
-# In[13]:
+# In[48]:
 
 
 def verse_end_phono_repl(match):
@@ -1059,13 +1055,13 @@ def verse_end_phono_repl(match):
 
 # ### Actions
 
-# In[ ]:
+# In[49]:
 
 
 stats = collections.Counter()
 
 
-# In[14]:
+# In[50]:
 
 
 def doaccents(orig, debug=False, count=False):
@@ -1149,7 +1145,7 @@ def doaccents(orig, debug=False, count=False):
 # qamets qatan
 # NB: all patterns stipulate that the qamets (@) in question is unaccented
 
-# In[15]:
+# In[51]:
 
 
 # near end of word:
@@ -1158,14 +1154,14 @@ def doaccents(orig, debug=False, count=False):
 )
 
 
-# In[ ]:
+# In[52]:
 
 
 # before dagesh forte:
 qamets_qatan2 = re.compile(r"(?<={c})(\.?)@(?={c}\.)".format(c=cons))
 
 
-# In[ ]:
+# In[53]:
 
 
 # if the following consonant is BGDKFT and does not have dagesh, the @ is in an open syllable:
@@ -1174,7 +1170,7 @@ def doaccents(orig, debug=False, count=False):
 )
 
 
-# In[ ]:
+# In[54]:
 
 
 # assimilation of qamets with following composite schwa of type (chatef qamets),
@@ -1182,14 +1178,14 @@ def doaccents(orig, debug=False, count=False):
 qamets_qatan4a = re.compile(r"(?<={p})(\.?[!/]?)@(?=-{c}:@)".format(p=prep, c=cons))
 
 
-# In[ ]:
+# In[55]:
 
 
 #     or word-internal
 qamets_qatan4b = re.compile(r"(?<={c})(\.?[!/]?)@(?={c}:@)".format(c=cons))
 
 
-# In[ ]:
+# In[56]:
 
 
 # before an other qamets qatan, provided the syllable is unaccented
@@ -1200,20 +1196,20 @@ def doaccents(orig, debug=False, count=False):
 # This pattern will be applied only on words that do have a non-empty pronominal suffix
 # The pattern will spot the qamets qatan in front of the last consonant, if there is such a qatan
 
-# In[ ]:
+# In[57]:
 
 
 qamets_qatan_prs = re.compile(r"\^(?=[0-9]*{c}\.?[/!]?(?:[ &-]|\Z))".format(c=cons))
 
 
-# In[ ]:
+# In[58]:
 
 
 def qamets_qatan_repl(match):
     return match.group(1) + "^"
 
 
-# In[ ]:
+# In[59]:
 
 
 # there are exceptions to the heuristic of interpreting qamets by voting between occurrences
@@ -1226,7 +1222,7 @@ def qamets_qatan_repl(match):
 """
 
 
-# In[ ]:
+# In[60]:
 
 
 xxx = """
@@ -1234,7 +1230,7 @@ def qamets_qatan_repl(match):
 """
 
 
-# In[ ]:
+# In[61]:
 
 
 # there are unaccented conjugated verb forms that must not be subjected to qamets-qatan transformation
@@ -1254,13 +1250,13 @@ def qamets_qatan_repl(match):
 }
 
 
-# In[ ]:
+# In[62]:
 
 
 qamets_qatan_verb_x |= qqv_experimental
 
 
-# In[ ]:
+# In[63]:
 
 
 def qamets_qatan_verb_x_repl(match):
@@ -1273,7 +1269,7 @@ def qamets_qatan_verb_x_repl(match):
 # Here is the function that carries out rule based qamets qatan detection, without going into
 # verb paradigms and exceptions. It is the first go at it.
 
-# In[16]:
+# In[64]:
 
 
 def doplainqamets(word, accentless=False, debug=False, count=False):
@@ -1349,7 +1345,7 @@ def doplainqamets(word, accentless=False, debug=False, count=False):
 # As to rule 4, there are cases where the schwa in question is also followed by a final consonant with schwa.
 # In those cases it seems that the schwa in question is silent.
 
-# In[ ]:
+# In[65]:
 
 
 # mobile schwa
@@ -1379,7 +1375,7 @@ def doplainqamets(word, accentless=False, debug=False, count=False):
 )
 
 
-# In[ ]:
+# In[66]:
 
 
 mobile_schwa2 = re.compile(
@@ -1387,28 +1383,28 @@ def doplainqamets(word, accentless=False, debug=False, count=False):
 )  # before BGDKPT letter without dagesh
 
 
-# In[ ]:
+# In[67]:
 
 
 # second last consonant with schwa when last consonsoant also has schwa
 mobile_schwa3 = re.compile(r"[%:](?={c}\.?{a}?[%:](?:[ &]|\Z))".format(a=acc, c=cons))
 
 
-# In[ ]:
+# In[68]:
 
 
 # all schwas and the end of the word are quiescens, only if the words are not glued together
 mobile_schwa4 = re.compile(r"[%:](?=[ &]|\Z)")
 
 
-# In[ ]:
+# In[69]:
 
 
 def mobile_schwa1_repl(match):
     return match.group(1) + "%"
 
 
-# In[ ]:
+# In[70]:
 
 
 # dagesh
@@ -1421,21 +1417,21 @@ def mobile_schwa1_repl(match):
 dages_lene = re.compile(r"({b})\.".format(b=bgdkpt))
 
 
-# In[ ]:
+# In[71]:
 
 
 def dages_forte_lene_repl(match):
     return match.group(1) + (dagesh_lene_dict[match.group(2)] * 2)
 
 
-# In[ ]:
+# In[72]:
 
 
 def dages_lene_repl(match):
     return dagesh_lene_dict[match.group(1)]
 
 
-# In[17]:
+# In[73]:
 
 
 def dages_forte_repl(match):
@@ -1444,14 +1440,14 @@ def dages_forte_repl(match):
 
 # ## Mater lectionis and final fixes
 
-# In[18]:
+# In[74]:
 
 
 # silent aleph
 silent_aleph = re.compile("(?<=[^ &-])>(?!(?:[/!]|{v}))".format(v=vowel))
 
 
-# In[ ]:
+# In[75]:
 
 
 # final mater lectionis
@@ -1460,14 +1456,14 @@ def dages_forte_repl(match):
 last_ml_jw = re.compile(r"jw(?=[ &-]|\Z)")
 
 
-# In[ ]:
+# In[76]:
 
 
 # mappiq heh
 mappiq_heh = re.compile(r"h\.")
 
 
-# In[ ]:
+# In[77]:
 
 
 fixit_i = re.compile(r"([{v}])\.".format(v=complex_i_vowel))
@@ -1475,7 +1471,7 @@ def dages_forte_repl(match):
 fixit = re.compile(r"(.)\.")
 
 
-# In[ ]:
+# In[78]:
 
 
 split_sep = re.compile(
@@ -1483,21 +1479,21 @@ def dages_forte_repl(match):
 )  # to split the result in the phono part and the interword part
 
 
-# In[ ]:
+# In[79]:
 
 
 def fixit_repl(match):
     return match.group(1) * 2
 
 
-# In[ ]:
+# In[80]:
 
 
 def fixit_i_repl(match):
     return match.group(1) + "j"
 
 
-# In[ ]:
+# In[81]:
 
 
 def fixit_w_repl(match):
@@ -1525,7 +1521,7 @@ def fixit_w_repl(match):
 # 
 # The ``phono()`` function that carries out the complete transliteration, looks by default in ``qamets_corrections``, but this can be overridden. These corrections will not be carried out for the special verb cases.
 
-# In[ ]:
+# In[82]:
 
 
 qamets_corrections = {}  # list of translits that must be corrected
@@ -1533,7 +1529,7 @@ def fixit_w_repl(match):
 
 # apply correction instructions to a word
 
-# In[19]:
+# In[83]:
 
 
 def apply_corr(wordq, corr):
@@ -1561,13 +1557,13 @@ def apply_corr(wordq, corr):
 # 
 # We need concise, normalized values for the lexical features.
 
-# In[ ]:
+# In[84]:
 
 
 undefs = {"NA", "unknown", "n/a", "absent"}
 
 
-# In[20]:
+# In[85]:
 
 
 png = dict(
@@ -1592,13 +1588,13 @@ def apply_corr(wordq, corr):
 # 
 # We need a label for lexical information such as part of speech, person, number, gender.
 
-# In[ ]:
+# In[86]:
 
 
 declensed = {"subs", "nmpr", "adjv", "prps", "prde", "prin"}
 
 
-# In[ ]:
+# In[87]:
 
 
 def get_lex_info(w):
@@ -1622,7 +1618,7 @@ def get_lex_info(w):
     return lex_info
 
 
-# In[ ]:
+# In[88]:
 
 
 def get_decl(lex_info):
@@ -1632,7 +1628,7 @@ def get_decl(lex_info):
     return lex_info if len(parts) == 1 else parts[0]
 
 
-# In[21]:
+# In[89]:
 
 
 def get_prs(lex_info):
@@ -1649,7 +1645,7 @@ def get_prs(lex_info):
 # 
 # ## Phono parts
 
-# In[22]:
+# In[90]:
 
 
 interesting_stats = [
@@ -1660,12 +1656,6 @@ def get_prs(lex_info):
 ]
 
 
-# In[ ]:
-
-
-
-
-
 # if suppress_in_verb, phono will suppress qatan interpretation in certain verb paradigmatic forms
 # if suppress_in_prs, phono will suppress qatan interpreation in pronominal suffixes
 # if correct is 1, phono will apply individual corrections
@@ -1673,7 +1663,7 @@ def get_prs(lex_info):
 # if correct is -1, phono will stop just before applying the qamets qatan corrections and return
 # the intermediate result
 
-# In[23]:
+# In[91]:
 
 
 def phono_qamets(
@@ -1812,13 +1802,7 @@ def phono_qamets(
     return (result, False)
 
 
-# In[ ]:
-
-
-
-
-
-# In[24]:
+# In[92]:
 
 
 def phono_patterns(result, debug, count, dout):
@@ -1915,13 +1899,7 @@ def phono_patterns(result, debug, count, dout):
     return result
 
 
-# In[ ]:
-
-
-
-
-
-# In[25]:
+# In[93]:
 
 
 def phono_symbols(ws, result, debug, count, dout):
@@ -1992,7 +1970,7 @@ def phono_symbols(ws, result, debug, count, dout):
 # ## Phono whole
 # Here the rule fabrics are woven together, exceptions invoked.
 
-# In[26]:
+# In[94]:
 
 
 def phono(
@@ -2072,7 +2050,7 @@ def phono(
 # to the number of consonants found in the paradigmatic material.
 # This is rather crude, but it will do.
 
-# In[ ]:
+# In[95]:
 
 
 # we need the number of letters in a defined value of a morpho feature
@@ -2084,7 +2062,7 @@ def len_suffix(v):
     return len(v.replace("=", "").replace("W", "").replace("J", ""))
 
 
-# In[ ]:
+# In[96]:
 
 
 # we need a function that return 1 for plural/dual subs/adj and for fem adj
@@ -2096,7 +2074,7 @@ def len_ending(sp, n, g):
     return 0
 
 
-# In[27]:
+# In[97]:
 
 
 # return the number of consonants in the suffixes
@@ -2113,14 +2091,14 @@ def len_morpho(w):
 # 
 # Next, we reduce the vowel skeleton to a skeleton pattern. We are not interested in all vowels, only in whether the vowel is a qamets (gadol or qatan), A-like, O-like, or other (which we dub E-like).
 
-# In[ ]:
+# In[98]:
 
 
 # the qamets gadol/qatan skeleton
 qamets_qatan_skel = re.compile("([^@^])")
 
 
-# In[ ]:
+# In[99]:
 
 
 # the vowel skeleton where the qamets gadol/qatan are preserved as @ and ^
@@ -2129,14 +2107,14 @@ def len_morpho(w):
 silent_alef_start = re.compile(r"([ &-]|\A)>([!/]?(?:[^!/.:;@^aeiou]|\Z))")
 
 
-# In[ ]:
+# In[100]:
 
 
 def silent_alef_start_repl(match):
     return match.group(1) + "E" + match.group(2)
 
 
-# In[ ]:
+# In[101]:
 
 
 qamets_qatan_fullskel = re.compile(
@@ -2153,7 +2131,7 @@ def silent_alef_start_repl(match):
 )
 
 
-# In[ ]:
+# In[102]:
 
 
 def qamets_qatan_fullskel_repl(match):
@@ -2173,7 +2151,7 @@ def qamets_qatan_fullskel_repl(match):
     return ""
 
 
-# In[28]:
+# In[103]:
 
 
 def get_full_skel(w, debug=False):
@@ -2209,7 +2187,7 @@ def get_full_skel(w, debug=False):
 # 
 # ### All candidates
 
-# In[ ]:
+# In[104]:
 
 
 # find lexemes which have an occurrence with a qamets (except verbs)
@@ -2218,7 +2196,7 @@ def get_full_skel(w, debug=False):
 qq_lex = collections.defaultdict(lambda: [])
 
 
-# In[29]:
+# In[105]:
 
 
 for w in F.otype.s("word"):
@@ -2244,7 +2222,7 @@ def get_full_skel(w, debug=False):
 
 # ### Filtering interesting candidates
 
-# In[30]:
+# In[106]:
 
 
 utils.caption(0, "\tFiltering lexemes with varied occurrences")
@@ -2284,7 +2262,7 @@ def get_full_skel(w, debug=False):
 
 # ### Guess the qamets
 
-# In[ ]:
+# In[107]:
 
 
 qamets_qatan_xc = dict(
@@ -2299,7 +2277,7 @@ def get_full_skel(w, debug=False):
         qamets_qatan_xcompiled[lex][pos] = ins
 
 
-# In[ ]:
+# In[108]:
 
 
 def compile_occs(lex, occs):
@@ -2343,7 +2321,7 @@ def compile_occs(lex, occs):
     return occs_compiled
 
 
-# In[ ]:
+# In[109]:
 
 
 def guess_qq(occ, occs_compiled, debug=False):
@@ -2356,7 +2334,7 @@ def guess_qq(occ, occs_compiled, debug=False):
     return guess
 
 
-# In[31]:
+# In[110]:
 
 
 def get_corr(fullskel, guess, debug=False):
@@ -2377,7 +2355,7 @@ def get_corr(fullskel, guess, debug=False):
 
 # ### Carrying out the guess work
 
-# In[32]:
+# In[111]:
 
 
 utils.caption(0, "\tGuessing between gadol and qatan")
@@ -2427,27 +2405,27 @@ def get_corr(fullskel, guess, debug=False):
 
 # # Generate phonological data
 
-# In[ ]:
+# In[112]:
 
 
 def stats_prog():
     return " ".join(str(stats.get(stat, 0)) for stat in interesting_stats)
 
 
-# In[ ]:
+# In[113]:
 
 
 utils.caption(4, "Generating data in two ways ... ")
 
 
-# In[ ]:
+# In[114]:
 
 
 phono_file = []
 word_file = []
 
 
-# In[ ]:
+# In[115]:
 
 
 stats = collections.Counter()
@@ -2476,7 +2454,7 @@ def stats_prog():
         word_file.append((None, "", "+"))
 
 
-# In[33]:
+# In[116]:
 
 
 utils.caption(0, "\t{:>5} verses done {}".format(nv, stats_prog()))
@@ -2499,7 +2477,7 @@ def stats_prog():
 # 
 # They should be consistent.
 
-# In[ ]:
+# In[117]:
 
 
 utils.caption(0, "{} items in phono".format(len(phono_file)))
@@ -2514,7 +2492,7 @@ def stats_prog():
 utils.caption(0, "\t{} lines".format(i))
 
 
-# In[35]:
+# In[118]:
 
 
 phono_text = "".join(phono_file)
@@ -2533,7 +2511,22 @@ def stats_prog():
 # We also generate a config feature `otext@phono`, which will be picked up by Text-Fabric automatically.
 # In it we define the phonetic *format*, so that Text-Fabric has can output text in phonetic representation.
 
-# In[36]:
+# In[122]:
+
+
+genericMetaPath = f"{thisRepo}/yaml/generic.yaml"
+phonoMetaPath = f"{thisRepo}/yaml/phono.yaml"
+# read as UTF-8 explicitly instead of relying on the platform default encoding
+with open(genericMetaPath, encoding="utf-8") as fh:
+    genericMeta = yaml.load(fh, Loader=yaml.FullLoader)
+    genericMeta["version"] = VERSION
+with open(phonoMetaPath, encoding="utf-8") as fh:
+    phonoMeta = formatMeta(yaml.load(fh, Loader=yaml.FullLoader))
+# the empty-string key carries the generic metadata, the other keys are per feature
+metaData = {"": genericMeta, **phonoMeta}
+
+
+# In[124]:
 
 
 utils.caption(4, "Writing TF phono features")
@@ -2542,22 +2535,14 @@ def stats_prog():
     phono_trailer=dict(((ln[0], ln[2]) for ln in word_file if ln[0] is not None)),
 )
 edgeFeatures = {}
-provenance = dict(
-    source="Phono Notebook applied to BHSA Data",
-    coreData="BHSA",
-    coreVersion=VERSION,
-    author="BHSA Data: Constantijn Sikkel; Phono Notebook: Dirk Roorda",
-)
-metaData = {
-    "": provenance,
-    "otext@phono": {
-        "about": "Provides phonetic transcriptions to Hebrew Words",
-        "see": "https://github.com/ETCBC/phono",
-        "fmt:text-phono-full": "{phono}{phono_trailer}",
-    },
-    "phono": dict(valueType="str"),
-    "phono_trailer": dict(valueType="str"),
+metaData["otext@phono"] = {
+    "about": "Provides phonetic transcriptions to Hebrew Words",
+    "see": "https://github.com/ETCBC/phono",
+    "fmt:text-phono-full": "{phono}{phono_trailer}",
 }
+metaData["phono"]["valueType"] = "str"
+metaData["phono_trailer"]["valueType"] = "str"
+
 TF = Fabric(locations=thisTempTf, silent=True)
 TF.save(nodeFeatures=nodeFeatures, edgeFeatures=edgeFeatures, metaData=metaData)
 
@@ -2566,7 +2551,7 @@ def stats_prog():
 # 
 # Check differences with previous versions.
 
-# In[37]:
+# In[125]:
 
 
 utils.checkDiffs(thisTempTf, thisTf, only=set(nodeFeatures))
@@ -2576,7 +2561,7 @@ def stats_prog():
 # 
 # Copy the new TF features from the temporary location where they have been created to their final destination.
 
-# In[38]:
+# In[126]:
 
 
 utils.deliverDataset(thisTempTf, thisTf)
@@ -2584,13 +2569,13 @@ def stats_prog():
 
 # # Compile TF
 
-# In[ ]:
+# In[127]:
 
 
 utils.caption(4, "Load and compile the new TF features")
 
 
-# In[39]:
+# In[128]:
 
 
 TF = Fabric(locations=[coreTf, thisTf], modules=[""])
@@ -2598,19 +2583,13 @@ def stats_prog():
 api.makeAvailableIn(globals())
 
 
-# In[ ]:
-
-
-
-
-
-# In[ ]:
+# In[129]:
 
 
 utils.caption(4, "Basic tests")
 
 
-# In[ ]:
+# In[130]:
 
 
 utils.caption(4, "First verses in phonetic transcription")
@@ -2619,7 +2598,7 @@ def stats_prog():
     utils.caption(0, T.text(L.d(v, "word"), fmt="text-phono-full"), continuation=True)
 
 
-# In[40]:
+# In[131]:
 
 
 utils.caption(4, "First verse in all formats")
diff --git a/tf/2021/otext@phono.tf b/tf/2021/otext@phono.tf
index 55670dd..f46f484 100644
--- a/tf/2021/otext@phono.tf
+++ b/tf/2021/otext@phono.tf
@@ -2,10 +2,10 @@
 @about=Provides phonetic transcriptions to Hebrew Words
 @author=BHSA Data: Constantijn Sikkel; Phono Notebook: Dirk Roorda
 @coreData=BHSA
-@coreVersion=2021
 @fmt:text-phono-full={phono}{phono_trailer}
+@provenance=computed by the phono notebook, see https://github.com/ETCBC/phono
 @see=https://github.com/ETCBC/phono
-@source=Phono Notebook applied to BHSA Data
+@version=2021
 @writtenBy=Text-Fabric
-@dateWritten=2021-11-30T15:33:30Z
+@dateWritten=2021-12-09T14:25:56Z
 
diff --git a/tf/2021/phono.tf b/tf/2021/phono.tf
index 1bc3559..9a4d907 100644
--- a/tf/2021/phono.tf
+++ b/tf/2021/phono.tf
@@ -1,11 +1,12 @@
 @node
 @author=BHSA Data: Constantijn Sikkel; Phono Notebook: Dirk Roorda
 @coreData=BHSA
-@coreVersion=2021
-@source=Phono Notebook applied to BHSA Data
+@description=🆗 phonological transcription (bᵊ rēšˌîṯ bārˈā ʔᵉlōhˈîm)
+@provenance=computed by the phono notebook, see https://github.com/ETCBC/phono
 @valueType=str
+@version=2021
 @writtenBy=Text-Fabric
-@dateWritten=2021-11-30T15:33:29Z
+@dateWritten=2021-12-09T14:25:55Z
 
 bᵊ
 rēšˌîṯ
diff --git a/tf/2021/phono_trailer.tf b/tf/2021/phono_trailer.tf
index a39cd6d..a42b4a3 100644
--- a/tf/2021/phono_trailer.tf
+++ b/tf/2021/phono_trailer.tf
@@ -1,11 +1,12 @@
 @node
 @author=BHSA Data: Constantijn Sikkel; Phono Notebook: Dirk Roorda
 @coreData=BHSA
-@coreVersion=2021
-@source=Phono Notebook applied to BHSA Data
+@description=🆗 interword material in phonological transcription
+@provenance=computed by the phono notebook, see https://github.com/ETCBC/phono
 @valueType=str
+@version=2021
 @writtenBy=Text-Fabric
-@dateWritten=2021-11-30T15:33:29Z
+@dateWritten=2021-12-09T14:25:55Z
 
 
  
diff --git a/yaml/generic.yaml b/yaml/generic.yaml
new file mode 100644
index 0000000..ae01558
--- /dev/null
+++ b/yaml/generic.yaml
@@ -0,0 +1,3 @@
+provenance: computed by the phono notebook, see https://github.com/ETCBC/phono
+coreData: BHSA
+author: "BHSA Data: Constantijn Sikkel; Phono Notebook: Dirk Roorda"
diff --git a/yaml/phono.yaml b/yaml/phono.yaml
new file mode 100644
index 0000000..12c9fd4
--- /dev/null
+++ b/yaml/phono.yaml
@@ -0,0 +1,5 @@
+phono:
+  desc: 🆗 phonological transcription
+  eg: bᵊ rēšˌîṯ bārˈā ʔᵉlōhˈîm
+phono_trailer:
+  desc: 🆗 interword material in phonological transcription