From 7ab27486ebd55973c34d972e1132e2b746448993 Mon Sep 17 00:00:00 2001 From: tonyjurg Date: Wed, 10 Jul 2024 14:56:41 +0200 Subject: [PATCH] update to v0.5.2 --- CreateFeatureDoc.ipynb | 344 ++- results/after.md | 16 +- results/appositioncontainer.md | 20 +- results/articular.md | 32 +- results/before.md | 16 +- results/book.md | 76 +- results/bookshort.md | 68 +- results/case.md | 16 +- results/chapter.md | 16 +- results/clauseType.md | 16 +- results/cls.md | 28 +- results/cltype.md | 16 +- results/criticalsign.md | 16 +- results/crule.md | 16 +- results/degree.md | 16 +- results/discontinuous.md | 16 +- results/domain.md | 16 +- results/featuresbydatatype.md | 32 +- results/featuresbyname.md | 68 + results/featuresbynodetype.md | 100 +- results/featuresbytype.md | 24 +- results/frame.md | 8 +- results/framespec.md | 16 +- results/function.md | 28 +- results/gender.md | 16 +- results/gloss.md | 58 +- results/id.md | 16 +- results/junction.md | 31 +- results/lang.md | 8 +- results/lemma.md | 16 +- results/lemmatranslit.md | 16 +- results/ln.md | 16 +- results/mood.md | 16 +- results/morph.md | 16 +- results/nodeId.md | 20 +- results/normalized.md | 16 +- results/note.md | 16 +- results/num.md | 92 +- results/number.md | 16 +- results/oslots.md | 4 +- results/otype.md | 4 +- results/parent.md | 36 +- results/person.md | 34 +- results/punctuation.md | 16 +- results/ref.md | 16 +- results/referent.md | 16 +- results/rela.md | 16 +- results/role.md | 57 +- results/rule.md | 56 +- results/sibling.md | 96 - results/sp.md | 16 +- results/strong.md | 16 +- results/subjref.md | 8 +- results/subjrefspec.md | 16 +- results/tense.md | 16 +- results/text.md | 16 +- results/trans.md | 16 +- results/translit.md | 16 +- results/typ.md | 26 +- results/{type.md => typems.md} | 45 +- results/unaccent.md | 16 +- results/unicode.md | 16 +- results/variant.md | 16 +- results/verse.md | 12 +- results/voice.md | 16 +- tools/determineDeltaBetweenVersions.ipynb | 2286 +++++++++++++++++++ 
tools/versionMapping.ipynb | 2432 +++++++++++++++++++++ 67 files changed, 5934 insertions(+), 791 deletions(-) create mode 100644 results/featuresbyname.md delete mode 100644 results/sibling.md rename results/{type.md => typems.md} (62%) create mode 100644 tools/determineDeltaBetweenVersions.ipynb create mode 100644 tools/versionMapping.ipynb diff --git a/CreateFeatureDoc.ipynb b/CreateFeatureDoc.ipynb index e698c9b..342f4cf 100644 --- a/CreateFeatureDoc.ipynb +++ b/CreateFeatureDoc.ipynb @@ -22,8 +22,8 @@ "metadata": {}, "outputs": [], "source": [ - "scriptVersion=\"0.5.1\"\n", - "scriptDate=\"June 16, 2024\"" + "scriptVersion=\"0.5.2\"\n", + "scriptDate=\"July 10, 2024\"" ] }, { @@ -126,7 +126,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 3, "id": "177f91d0-0baf-45eb-8450-dcce0e6b4b86", "metadata": { "slideshow": { @@ -142,7 +142,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 5, "id": "20a63ffb-0b5d-4586-bce3-bcb39a84273d", "metadata": { "slideshow": { @@ -160,7 +160,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 7, "id": "1f2d822d-b47a-4766-8226-8157799740c0", "metadata": { "scrolled": true, @@ -197,7 +197,7 @@ { "data": { "text/html": [ - "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7" + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.9" ], "text/plain": [ "" @@ -211,7 +211,7 @@ "text/html": [ "\n", " TF: TF API 12.4.4, saulocantanhede/tfgreek2/app v3, Search Reference
\n", - " Data: saulocantanhede - tfgreek2 0.5.7, Character table, Feature docs
\n", + " Data: saulocantanhede - tfgreek2 0.5.9, Character table, Feature docs
\n", "
Node types\n", "\n", " \n", @@ -244,9 +244,9 @@ "\n", "\n", " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", "\n", "\n", "\n", @@ -258,9 +258,9 @@ "\n", "\n", " \n", - " \n", - " \n", - " \n", + " \n", + " \n", + " \n", "\n", "\n", "\n", @@ -298,7 +298,7 @@ "\n", "
\n", "
\n", - "after\n", + "after\n", "
\n", "
str
\n", "\n", @@ -308,7 +308,7 @@ "\n", "
\n", " \n", "
int
\n", "\n", @@ -318,7 +318,7 @@ "\n", "
\n", "
\n", - "articular\n", + "articular\n", "
\n", "
int
\n", "\n", @@ -328,7 +328,7 @@ "\n", "
\n", "
\n", - "before\n", + "before\n", "
\n", "
str
\n", "\n", @@ -338,7 +338,7 @@ "\n", "
\n", "
\n", - "book\n", + "book\n", "
\n", "
str
\n", "\n", @@ -348,7 +348,7 @@ "\n", "
\n", "
\n", - "bookshort\n", + "bookshort\n", "
\n", "
str
\n", "\n", @@ -358,7 +358,7 @@ "\n", "
\n", "
\n", - "case\n", + "case\n", "
\n", "
str
\n", "\n", @@ -368,7 +368,7 @@ "\n", "
\n", "
\n", - "chapter\n", + "chapter\n", "
\n", "
int
\n", "\n", @@ -378,7 +378,7 @@ "\n", "
\n", "
\n", - "clausetype\n", + "clausetype\n", "
\n", "
str
\n", "\n", @@ -388,7 +388,7 @@ "\n", "
\n", "
\n", - "cls\n", + "cls\n", "
\n", "
str
\n", "\n", @@ -398,7 +398,7 @@ "\n", "
\n", "
\n", - "cltype\n", + "cltype\n", "
\n", "
str
\n", "\n", @@ -408,7 +408,7 @@ "\n", "
\n", "
\n", - "criticalsign\n", + "criticalsign\n", "
\n", "
str
\n", "\n", @@ -418,7 +418,7 @@ "\n", "
\n", "
\n", - "crule\n", + "crule\n", "
\n", "
str
\n", "\n", @@ -428,7 +428,7 @@ "\n", "
\n", "
\n", - "degree\n", + "degree\n", "
\n", "
str
\n", "\n", @@ -438,7 +438,7 @@ "\n", "
\n", "
\n", - "discontinuous\n", + "discontinuous\n", "
\n", "
int
\n", "\n", @@ -448,7 +448,7 @@ "\n", "
\n", "
\n", - "domain\n", + "domain\n", "
\n", "
str
\n", "\n", @@ -458,7 +458,7 @@ "\n", "
\n", "
\n", - "framespec\n", + "framespec\n", "
\n", "
str
\n", "\n", @@ -468,7 +468,7 @@ "\n", "
\n", "
\n", - "function\n", + "function\n", "
\n", "
str
\n", "\n", @@ -478,7 +478,7 @@ "\n", "
\n", "
\n", - "gender\n", + "gender\n", "
\n", "
str
\n", "\n", @@ -488,17 +488,17 @@ "\n", "
\n", "
\n", - "gloss\n", + "gloss\n", "
\n", "
str
\n", "\n", - " short translation\n", + " English gloss (BGVB)\n", "\n", "
\n", "\n", "
\n", "
\n", - "id\n", + "id\n", "
\n", "
str
\n", "\n", @@ -508,7 +508,7 @@ "\n", "
\n", "
\n", - "junction\n", + "junction\n", "
\n", "
str
\n", "\n", @@ -518,7 +518,7 @@ "\n", "
\n", "
\n", - "lang\n", + "lang\n", "
\n", "
str
\n", "\n", @@ -528,7 +528,7 @@ "\n", "
\n", "
\n", - "lemma\n", + "lemma\n", "
\n", "
str
\n", "\n", @@ -538,7 +538,7 @@ "\n", "
\n", "
\n", - "lemmatranslit\n", + "lemmatranslit\n", "
\n", "
str
\n", "\n", @@ -548,7 +548,7 @@ "\n", "
\n", "
\n", - "ln\n", + "ln\n", "
\n", "
str
\n", "\n", @@ -558,7 +558,7 @@ "\n", "
\n", "
\n", - "mood\n", + "mood\n", "
\n", "
str
\n", "\n", @@ -568,7 +568,7 @@ "\n", "
\n", "
\n", - "morph\n", + "morph\n", "
\n", "
str
\n", "\n", @@ -578,17 +578,17 @@ "\n", "
\n", "
\n", - "nodeid\n", + "nodeid\n", "
\n", - "
int
\n", + "
str
\n", "\n", - " node id (as in the XML source data\n", + " node id (as in the XML source data)\n", "\n", "
\n", "\n", "
\n", "
\n", - "normalized\n", + "normalized\n", "
\n", "
str
\n", "\n", @@ -598,7 +598,7 @@ "\n", "
\n", "
\n", - "note\n", + "note\n", "
\n", "
str
\n", "\n", @@ -608,7 +608,7 @@ "\n", "
\n", "
\n", - "num\n", + "num\n", "
\n", "
int
\n", "\n", @@ -618,7 +618,7 @@ "\n", "
\n", "
\n", - "number\n", + "number\n", "
\n", "
str
\n", "\n", @@ -628,7 +628,7 @@ "\n", "
\n", "
\n", - "otype\n", + "otype\n", "
\n", "
str
\n", "\n", @@ -638,7 +638,7 @@ "\n", "
\n", "
\n", - "person\n", + "person\n", "
\n", "
str
\n", "\n", @@ -648,7 +648,7 @@ "\n", "
\n", "
\n", - "punctuation\n", + "punctuation\n", "
\n", "
str
\n", "\n", @@ -658,7 +658,7 @@ "\n", "
\n", "
\n", - "ref\n", + "ref\n", "
\n", "
str
\n", "\n", @@ -668,7 +668,7 @@ "\n", "
\n", "
\n", - "referent\n", + "referent\n", "
\n", "
str
\n", "\n", @@ -678,7 +678,7 @@ "\n", "
\n", "
\n", - "rela\n", + "rela\n", "
\n", "
str
\n", "\n", @@ -688,7 +688,7 @@ "\n", "
\n", "
\n", - "role\n", + "role\n", "
\n", "
str
\n", "\n", @@ -698,7 +698,7 @@ "\n", "
\n", "
\n", - "rule\n", + "rule\n", "
\n", "
str
\n", "\n", @@ -708,7 +708,7 @@ "\n", "
\n", "
\n", - "sp\n", + "sp\n", "
\n", "
str
\n", "\n", @@ -718,7 +718,7 @@ "\n", "
\n", "
\n", - "strong\n", + "strong\n", "
\n", "
int
\n", "\n", @@ -728,7 +728,7 @@ "\n", "
\n", "
\n", - "subjrefspec\n", + "subjrefspec\n", "
\n", "
str
\n", "\n", @@ -738,7 +738,7 @@ "\n", "
\n", "
\n", - "tense\n", + "tense\n", "
\n", "
str
\n", "\n", @@ -748,7 +748,7 @@ "\n", "
\n", "
\n", - "text\n", + "text\n", "
\n", "
str
\n", "\n", @@ -758,7 +758,7 @@ "\n", "
\n", "
\n", - "trans\n", + "trans\n", "
\n", "
str
\n", "\n", @@ -768,7 +768,7 @@ "\n", "
\n", "
\n", - "translit\n", + "translit\n", "
\n", "
str
\n", "\n", @@ -778,17 +778,17 @@ "\n", "
\n", "
\n", - "typ\n", + "typ\n", "
\n", "
str
\n", "\n", - " this is XML attribute typ\n", + " syntactical type (on sentence, group, clause or phrase)\n", "\n", "
\n", "\n", "
\n", "
\n", - "type\n", + "typems\n", "
\n", "
str
\n", "\n", @@ -798,7 +798,7 @@ "\n", "
\n", "
\n", - "unaccent\n", + "unaccent\n", "
\n", "
str
\n", "\n", @@ -808,7 +808,7 @@ "\n", "
\n", "
\n", - "unicode\n", + "unicode\n", "
\n", "
str
\n", "\n", @@ -818,7 +818,7 @@ "\n", "
\n", "
\n", - "variant\n", + "variant\n", "
\n", "
str
\n", "\n", @@ -828,7 +828,7 @@ "\n", "
\n", "
\n", - "verse\n", + "verse\n", "
\n", "
int
\n", "\n", @@ -838,7 +838,7 @@ "\n", "
\n", "
\n", - "voice\n", + "voice\n", "
\n", "
str
\n", "\n", @@ -848,7 +848,7 @@ "\n", "
\n", "
\n", - "frame\n", + "frame\n", "
\n", "
str
\n", "\n", @@ -858,7 +858,7 @@ "\n", "
\n", "
\n", - "oslots\n", + "oslots\n", "
\n", "
none
\n", "\n", @@ -868,7 +868,7 @@ "\n", "
\n", "
\n", - "parent\n", + "parent\n", "
\n", "
none
\n", "\n", @@ -878,17 +878,7 @@ "\n", "
\n", "
\n", - "sibling\n", - "
\n", - "
int
\n", - "\n", - " this is XML attribute sibling\n", - "\n", - "
\n", - "\n", - "
\n", - "
\n", - "subjref\n", + "subjref\n", "
\n", "
none
\n", "\n", @@ -899,7 +889,7 @@ "
\n", "\n", "\n", - " Settings:
specified
  1. apiVersion: 3
  2. appName: saulocantanhede/tfgreek2
  3. appPath:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/app
  4. commit: 352af50c8ce86edd8a0e2d58519453a8f53ee084
  5. css: ''
  6. dataDisplay:
    • excludedFeatures: []
    • noneValues:
      • none
      • unknown
      • no value
      • NA
    • sectionSep1:
    • sectionSep2: :
    • textFormat: text-orig-full
  7. docs:
    • docBase: https://github.com/saulocantanhede/tfgreek2/tree/main/docs
    • docPage: about
    • docRoot: https://github.com/saulocantanhede/tfgreek2
    • featureBase:https://github.com/saulocantanhede/tfgreek2/tree/main/docs/features/<feature>.md
    • featurePage: README
  8. interfaceDefaults: {fmt: text-orig-full}
  9. isCompatible: True
  10. local: local
  11. localDir:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/_temp
  12. provenanceSpec:
    • branch: main
    • corpus: Nestle 1904 Greek New Testament
    • doi: 10.5281/zenodo.notyet
    • moduleSpecs: []
    • org: saulocantanhede
    • relative: /tf
    • repo: tfgreek2
    • repro: tfgreek2
    • version: 0.5.7
    • webBase: https://learner.bible/text/show_text/nestle1904/
    • webHint: Show this on the website
    • webLang: en
    • webUrl:https://learner.bible/text/show_text/nestle1904/<1>/<2>/<3>
    • webUrlLex: {webBase}/word?version={version}&id=<lid>
  13. release: 0.5.7
  14. typeDisplay:
    • clause:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {cls} {role} {junction}
      • style: ''
    • group:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • phrase:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • sentence:
      • label: {typ} {function} {rela} \\\\ {role} {rule}
      • style: ''
    • subphrase:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • verse:
      • condense: True
      • label: {book} {chapter}:{verse}
      • style: ''
    • wg:
      • condense: True
      • label: {type} {role} {rule} {junction}
      • style: ''
    • word:
      • features:
        • lemma
        • sp
      • featuresBare: [gloss]
  15. writing: grc
\n" + " Settings:
specified
  1. apiVersion: 3
  2. appName: saulocantanhede/tfgreek2
  3. appPath:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/app
  4. commit: 352af50c8ce86edd8a0e2d58519453a8f53ee084
  5. css: ''
  6. dataDisplay:
    • excludedFeatures: []
    • noneValues:
      • none
      • unknown
      • no value
      • NA
    • sectionSep1:
    • sectionSep2: :
    • textFormat: text-orig-full
  7. docs:
    • docBase: https://github.com/saulocantanhede/tfgreek2/tree/main/docs
    • docPage: about
    • docRoot: https://github.com/saulocantanhede/tfgreek2
    • featureBase:https://github.com/saulocantanhede/tfgreek2/tree/main/docs/features/<feature>.md
    • featurePage: README
  8. interfaceDefaults: {fmt: text-orig-full}
  9. isCompatible: True
  10. local: local
  11. localDir:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/_temp
  12. provenanceSpec:
    • branch: main
    • corpus: Nestle 1904 Greek New Testament
    • doi: 10.5281/zenodo.notyet
    • moduleSpecs: []
    • org: saulocantanhede
    • relative: /tf
    • repo: tfgreek2
    • repro: tfgreek2
    • version: 0.5.9
    • webBase: https://learner.bible/text/show_text/nestle1904/
    • webHint: Show this on the website
    • webLang: en
    • webUrl:https://learner.bible/text/show_text/nestle1904/<1>/<2>/<3>
    • webUrlLex: {webBase}/word?version={version}&id=<lid>
  13. release: 0.5.7
  14. typeDisplay:
    • clause:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {cls} {role} {junction}
      • style: ''
    • group:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • phrase:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • sentence:
      • label: {typ} {function} {rela} \\\\ {role} {rule}
      • style: ''
    • subphrase:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • verse:
      • condense: True
      • label: {book} {chapter}:{verse}
      • style: ''
    • wg:
      • condense: True
      • label: {type} {role} {rule} {junction}
      • style: ''
    • word:
      • features:
        • lemma
        • sp
      • featuresBare: [gloss]
  15. writing: grc
\n" ], "text/plain": [ "" @@ -908,6 +898,20 @@ "metadata": {}, "output_type": "display_data" }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "App config error(s) in group:\n", + "\tlabel: feature type not loaded\n", + "App config error(s) in phrase:\n", + "\tlabel: feature type not loaded\n", + "App config error(s) in subphrase:\n", + "\tlabel: feature type not loaded\n", + "App config error(s) in wg:\n", + "\tlabel: feature type not loaded\n" + ] + }, { "data": { "text/html": [ @@ -1574,7 +1578,7 @@ ], "source": [ "# load the app and data\n", - "A = use (\"saulocantanhede/tfgreek2\", version=\"0.5.7\", hoist=globals())" + "A = use (\"saulocantanhede/tfgreek2\", version=\"0.5.9\", hoist=globals())" ] }, { @@ -1596,9 +1600,17 @@ "##### [Back to TOC](#TOC)" ] }, + { + "cell_type": "markdown", + "id": "1cfcb88c-ccfd-4326-8faf-e6324e742295", + "metadata": {}, + "source": [ + "Note: the first two lines were changed to reflect this tf version" + ] + }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 9, "id": "00f1d619-7481-4a79-b044-15addc2ad979", "metadata": { "tags": [] @@ -1606,11 +1618,11 @@ "outputs": [], "source": [ "# If the following variable is set, it will be used as title for all pages. 
It is intended to the describe the dataset in one line\n", - "customPageTitleMD=\"N1904 Greek New Testament [saulocantanhede/tfgreek2 - 0.5.7](https://github.com/saulocantanhede/tfgreek2)\"\n", - "customPageTitleHTML=\"N1904 Greek New Testament saulocantanhede/tfgreek2 - 0.5.7\"\n", + "customPageTitleMD=\"N1904 Greek New Testament [saulocantanhede/tfgreek2 - 0.5.9](https://github.com/saulocantanhede/tfgreek2)\"\n", + "customPageTitleHTML=\"N1904 Greek New Testament saulocantanhede/tfgreek2 - 0.5.9\"\n", "\n", "# Specify the location to store the resulting files, relative to the location of this notebook (without a trailing slash).\n", - "resultLocation = \"results\"\n", + "resultLocation = \"\" # store in the same dir\n", "\n", "# Type of output format ('html' for HTML, 'md' for Mark Down, or 'both' for both HTML and Mark Down)\n", "typeOutput='md'\n", @@ -1625,8 +1637,6 @@ "verbose=False\n", "\n", "\n", - "\n", - "\n", "# Create the footers for MD and HTML, include today's date\n", "from datetime import datetime\n", "today = datetime.today()\n", @@ -1654,7 +1664,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 11, "id": "e2fd353b-f615-4954-917e-65e61ff8a3d8", "metadata": { "tags": [] @@ -1666,8 +1676,8 @@ "text": [ "Gathering generic details\n", "Analyzing Node Features: .......................................................\n", - "Analyzing Edge Features: .....\n", - "Finished in 16.41 seconds.\n" + "Analyzing Edge Features: ....\n", + "Finished in 15.53 seconds.\n" ] } ], @@ -1734,12 +1744,27 @@ " if not (featureType == 'Node' and feature == 'otype') and not (featureType == 'Edge' and feature == 'oslots'):\n", " for nodeType in F.otype.all:\n", " frequencyLists = featureMethod(feature).freqList(nodeType)\n", + " \n", + " # Calculate the total frequency\n", + " if not isinstance(frequencyLists, int):\n", + " frequencyTotal = sum(freq for _, freq in frequencyLists)\n", + " else:\n", + " frequencyTotal = frequencyLists\n", + " \n", + " # 
Calculate the number of entries\n", + " if not isinstance(frequencyLists, int):\n", + " numberOfEntries = len(frequencyLists)\n", + " else:\n", + " numberOfEntries = 1 if frequencyLists != 0 else 0\n", + " # Check the length of the frequency table\n", + " truncated = True if numberOfEntries > tableLimit else False\n", + " \n", " if not isinstance(frequencyLists, int):\n", " if len(frequencyLists)!=0:\n", - " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 'freq': frequencyLists[:tableLimit]}\n", + " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 'freq': frequencyLists[:tableLimit], 'total': frequencyTotal, 'truncated': truncated}\n", " elif isinstance(frequencyLists, int):\n", " if frequencyLists != 0:\n", - " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 'freq': [(\"Link\", frequencyLists)]}\n", + " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 'freq': [(\"Link\", frequencyLists)], 'total': frequencyTotal, 'truncated': truncated}\n", "\n", " # Add processed feature data to the main dictionary\n", " featureDict[feature] = {'name': feature, 'descr': featureDescription, 'type': featureType, 'datatype': dataType, 'freqlist': featureFrequencyDict}\n", @@ -1805,6 +1830,19 @@ " processFeature(edgeFeature, 'Edge', Es)\n", " if verbose: print(f'\\nFeature {edgeFeature} = {featureDict[edgeFeature]}\\n') # Print feature data if verbose\n", "\n", + "########################################################\n", + "# Sorting feature dictionary #\n", + "########################################################\n", + "\n", + "# Sort the feature dictionary alphabetically by keys\n", + "sortedFeatureDict = {k: featureDict[k] for k in sorted(featureDict)}\n", + "\n", + "# Print the sorted feature dictionary if verbose\n", + "if verbose:\n", + " print(\"\\nSorted Feature Dictionary:\")\n", + " for key, value in sortedFeatureDict.items():\n", + " print(f\"Feature {key} = {value}\")\n", + " \n", "print(f'\\nFinished in {time.time() - overallTime:.2f} 
seconds.')" ] }, @@ -1831,7 +1869,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 12, "id": "c4b5e148-c336-4d95-a238-5fe79fa9525c", "metadata": { "tags": [] @@ -1841,7 +1879,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "Finished in 0.06 seconds (written 60 md files to directory C:\\Users\\tonyj\\OneDrive\\Documents\\GitHub\\Doc4TF\\results)\n" + "Finished in 0.06 seconds (written 59 md files to directory C:\\Users\\tonyj\\OneDrive\\Documents\\GitHub\\tfgreek2\\docs\\doc4TF\\version_0_5_9\\)\n" ] } ], @@ -1856,7 +1894,7 @@ "pathFull = os.getcwd() + '\\\\'\n", "\n", "# Iterating over each feature in the feature dictionary\n", - "for featureName, featureData in featureDict.items():\n", + "for featureName, featureData in sortedFeatureDict.items():\n", " # Extracting various properties of each feature\n", " featureDescription = featureData.get('descr')\n", " featureType = featureData.get('type')\n", @@ -1884,6 +1922,17 @@ " tableListHTML += f'
'\n", " tableListMD += f'{handleSpace}|{item[1]}\\n'\n", " tableListHTML += f'
sentence1970313.82198801117.20100
clause308147.17160425068.36258
{handleSpace}{item[1]}
\\n'\n", + " \n", + " # Add total of featuredata for this node type\n", + " total=frequencyData.get(node).get('total')\n", + " truncated=frequencyData.get(node).get('truncated')\n", + " # Correct handling of the truncated condition in both HTML and Markdown\n", + " if truncated:\n", + " truncatedNote = ' Note: table truncated.'\n", + " else:\n", + " truncatedNote = ''\n", + " tableListHTML += f'

Total frequency of feature: {total}.{truncatedNote}

'\n", + " tableListMD += f'\\nTotal frequency of feature: {total}.{truncatedNote}\\n '\n", "\n", " # Creating info blocks for HTML and Markdown\n", " infoBlockHTML = f'
Data typeFeature typeAvailable for nodes
{featureDataType}{featureType}{nodeListHTML}
'\n", @@ -1935,7 +1984,7 @@ }, { "cell_type": "code", - "execution_count": 8, + "execution_count": 13, "id": "bb568470-a2ed-446b-86c9-e298fb4bc6b3", "metadata": { "tags": [] @@ -1945,7 +1994,7 @@ "name": "stdout", "output_type": "stream", "text": [ - "Finished in 0.01 seconds (written 3 md files to directory C:\\Users\\tonyj\\OneDrive\\Documents\\GitHub\\Doc4TF\\results)\n" + "Finished in 0.01 seconds (written 4 md files to directory C:\\Users\\tonyj\\OneDrive\\Documents\\GitHub\\tfgreek2\\docs\\doc4TF\\version_0_5_9\\)\n" ] } ], @@ -2012,7 +2061,7 @@ "typeFeatureList = []\n", "dataTypeFeatureList = []\n", "\n", - "for featureName, featureData in featureDict.items():\n", + "for featureName, featureData in sortedFeatureDict.items():\n", " typeFeatureList.append((featureName,featureData.get('type')))\n", " dataTypeFeatureList.append((featureName,featureData.get('datatype')))\n", " for node in featureData.get('freqlist'):\n", @@ -2022,15 +2071,15 @@ "# Create the page with overview per node type (e.g. word) #\n", "###########################################################\n", " \n", - "pageMD=f'{pageTitleMD}\\n# Overview features per nodetype\\n'\n", - "pageHTML=f'{htmlStyle}

{pageTitleHTML}

\\n

Overview features per nodetype

'\n", + "pageMD=f'{pageTitleMD}\\n# Overview features by node type\\nOverview by [name](featuresbyname.md), [data type](featuresbydatatype.md), or [feature type](featuresbytype.md).\\n'\n", + "pageHTML=f'{htmlStyle}

{pageTitleHTML}

\\n

Overview features by node type

Overview by name, data type, or feature type.

'\n", "\n", "# Sort the list alphabetically based on the second item of each tuple (featureName)\n", "nodeFeatureList = sorted(nodeFeatureList, key=lambda x: x[1])\n", "# Iterate over node types\n", "for NodeType in F.otype.all:\n", - " NodeItemTextMD=f'## {NodeType}\\n\\nFeature|Featuretype|Datatype|Description|Examples\\n---|---|---|---|---\\n' \n", - " NodeItemTextHTML=f'

{NodeType}

\\n\\n' \n", + " NodeItemTextMD=f'## {NodeType}\\n\\nFeature|Feature type|Data type|Description|Examples\\n---|---|---|---|---\\n' \n", + " NodeItemTextHTML=f'

{NodeType}

\\n
FeatureFeaturetypeDatatypeDescriptionExamples
\\n' \n", " for node, feature in nodeFeatureList:\n", " if node == NodeType: \n", " featureData=featureDict[feature]\n", @@ -2059,8 +2108,8 @@ "# Create the page with overview per data type (string or integer) #\n", "####################################################################\n", "\n", - "pageMD=f'{pageTitleMD}\\n# Overview features per datatype\\n'\n", - "pageHTML=f'{htmlStyle}

{pageTitleHTML}

\\n

Overview features per datatype'\n", + "pageMD=f'{pageTitleMD}\\n# Overview features by data type\\nOverview by [name](featuresbyname.md), [node type](featuresbynodetype.md), or [feature type](featuresbytype.md).\\n'\n", + "pageHTML=f'{htmlStyle}

{pageTitleHTML}

\\n

Overview features by data type\\n

Overview by name, node type, feature type

'\n", "\n", "# Sort the list alphabetically based on the second item of each tuple (featureName)\n", "dataTypeFeatureList = sorted(dataTypeFeatureList, key=lambda x: x[1])\n", @@ -2068,13 +2117,13 @@ "DataItemTextMD=DataItemTextHTML=''\n", "for DataType in ('Integer','String'):\n", " DataItemTextMD=f'## {DataType}\\n\\nFeature|Featuretype|Available on nodes|Description|Examples\\n---|---|---|---|---\\n' \n", - " DataItemTextHTML=f'

{DataType}

\\n
FeatureFeature typeData typeDescriptionExamples
\\n' \n", + " DataItemTextHTML=f'

{DataType}

\\n
FeatureFeaturetypeAvailable on nodesDescriptionExamples
\\n' \n", " for feature, featureDataType in dataTypeFeatureList: \n", " if featureDataType == DataType: \n", " featureDescription=featureDict[feature].get('descr') \n", " featureType=featureDict[feature].get('type') \n", " nodeListMD=nodeListHTML=''\n", - " for thisNode in featureDict[feature]['freqlist']:\n", + " for thisNode in sortedFeatureDict[feature]['freqlist']:\n", " nodeListMD+=f'[`{thisNode}`](featuresbynodetype.md#{thisNode}) '\n", " nodeListHTML+=f'{thisNode} '\n", " DataItemTextMD+=f\"[`{feature}`]({feature}.md#readme)|[`{featureType}`](featuresbytype.md#{featureType.lower()})|{nodeListMD}|{featureDescription}|{exampleData(feature)}\\n\"\n", @@ -2100,20 +2149,20 @@ "# Create the page with overview per feature type (edge or node) #\n", "##################################################################\n", "\n", - "pageMD=f'{pageTitleMD}\\n# Overview features per type\\n'\n", - "pageHTML=f'{htmlStyle}

{pageTitleHTML}

\\n

Overview features per type'\n", + "pageMD=f'{pageTitleMD}\\n# Overview features by feature type\\nOverview by [name](featuresbyname.md), [node type](featuresbynodetype.md), or [data type](featuresbydatatype.md).\\n'\n", + "pageHTML=f'{htmlStyle}

{pageTitleHTML}

\\n

Overview features by feature type\\n

Overview by name, node type, or data type

'\n", "\n", "# Sort the list alphabetically based on the second item of each tuple (nodetype)\n", "typeFeatureList = sorted(typeFeatureList, key=lambda x: x[1])\n", "for featureType in ('Node','Edge'):\n", " ItemTextMD=f'## {featureType}\\n\\nFeature|Datatype|Available on nodes|Description|Examples\\n---|---|---|---|---\\n' \n", - " ItemTextHTML=f'

{featureType}

\\n
FeatureFeature typeAvailable on nodesDescriptionExamples
\\n' \n", + " ItemTextHTML=f'

{featureType}

\\n
FeatureDatatypeAvailable on nodesDescriptionExamples
\\n' \n", " for thisFeature, thisFeatureType in typeFeatureList: \n", " if featureType == thisFeatureType:\n", " featureDescription=featureDict[thisFeature].get('descr')\n", " featureDataType=featureDict[thisFeature].get('datatype')\n", " nodeListMD=nodeListHTML=''\n", - " for thisNode in featureDict[thisFeature]['freqlist']:\n", + " for thisNode in sortedFeatureDict[thisFeature]['freqlist']:\n", " nodeListMD+=f'[`{thisNode}`](featuresbynodetype.md#{thisNode}) '\n", " nodeListHTML+=f'{thisNode} '\n", " ItemTextMD+=f\"[`{thisFeature}`]({thisFeature}.md#readme)|[`{featureDataType}`](featuresbydatatype.md#{featureDataType.lower()})|{nodeListMD}|{featureDescription}|{exampleData(thisFeature)}\\n\"\n", @@ -2133,6 +2182,54 @@ "if typeOutput in ('html','both'):\n", " fileNameHTML = os.path.join(resultLocation, \"featuresbytype.htm\")\n", " writeToFile(fileNameHTML, pageHTML, 'html', verbose)\n", + "\n", + "\n", + "####################################################################\n", + "# Create the page with an alphabetical overview of features #\n", + "####################################################################\n", + "\n", + "pageMD=f'{pageTitleMD}\\n# Overview features by name (alphabetical)\\nOverview by [node type](featuresbynodetype.md), [feature type](featuresbytype.md), or [data type](featuresbydatatype.md).\\n'\n", + "pageHTML=f'{htmlStyle}

{pageTitleHTML}

\\n

Overview features by name (alphabetical)\\n

Overview by node type, feature type, or data type

'\n", + "\n", + "# Initialize Markdown and HTML strings\n", + "DataItemTextMD = '\\nFeature|Feature type|Data type|Available on nodes|Description|Examples\\n---|---|---|---|---|---\\n' \n", + "DataItemTextHTML = '

FeatureData typeAvailable on nodesDescriptionExamples
\\n'\n", + "\n", + "\n", + "# Loop through the sorted dictionary\n", + "for featureKey in sortedFeatureDict:\n", + " featureDetails = sortedFeatureDict[featureKey]\n", + " feature = featureDetails.get('name')\n", + " featureDescription = featureDetails.get('descr')\n", + " featureType = featureDetails.get('type')\n", + " featureDataType = featureDetails.get('datatype')\n", + " \n", + " nodeListMD = nodeListHTML = ''\n", + " for thisNode in featureDetails['freqlist']:\n", + " nodeListMD += f'[`{thisNode}`](featuresbynodetype.md#{thisNode}) '\n", + " nodeListHTML += f'{thisNode} '\n", + " \n", + " DataItemTextMD += f\"[`{feature}`]({feature}.md#readme)|[`{featureType}`](featuresbytype.md#{featureType.lower()})|[`{featureDataType}`](featuresbydatatype.md#{featureDataType.lower()})|{nodeListMD}|{featureDescription}|{exampleData(feature)}\\n\"\n", + " DataItemTextHTML += f\"\\n\"\n", + "\n", + "# Close the HTML table\n", + "DataItemTextHTML += \"
FeatureFeature typeData typeAvailable on nodesDescriptionExamples
{feature}{featureType}{featureDataType}{nodeListHTML}{featureDescription}{exampleData(feature)}
\\n\"\n", + "\n", + "pageMD+=DataItemTextMD\n", + "pageHTML+=DataItemTextHTML\n", + "\n", + "pageHTML+=f'{footerHTML}'\n", + "pageMD+=f'{footerMD}'\n", + " \n", + " \n", + "# Write to file by calling common function\n", + "if typeOutput in ('md','both'):\n", + " fileNameMD = os.path.join(resultLocation, \"featuresbyname.md\")\n", + " writeToFile(fileNameMD, pageMD, 'md', verbose)\n", + "\n", + "if typeOutput in ('html','both'):\n", + " fileNameHTML = os.path.join(resultLocation, \"featuresbyname.htm\")\n", + " writeToFile(fileNameHTML, pageHTML, 'html', verbose)\n", " \n", "\n", "# Reporting the number of files created\n", @@ -2156,10 +2253,15 @@ "id": "23b5ae25-4032-4b1a-8a77-c8eb35f1afbc", "metadata": {}, "source": [ - "Minor changes with version [0.5](https://github.com/tonyjurg/Doc4TF/blob/main/previous_versions/CreateFeatureDoc(0_5).ipynb)):\n", - "\n", - " - Additional notes on install requirements added May 26, 2024.\n", - " - Fixed bug [#18: incorrectly use of HTML page title for MD title](https://github.com/tonyjurg/Doc4TF/issues/18)\n", + "Changes with version [0.5.1](https://github.com/tonyjurg/Doc4TF/blob/main/previous_versions/CreateFeatureDoc(0_5_1).ipynb):\n", + " - Fixed alphabetic sorting; bug [#19](https://github.com/tonyjurg/Doc4TF/issues/19) (No alphabetic sorting of edge and node features)\n", + " - Added an alphabetic index page; enhancement [#15](https://github.com/tonyjurg/Doc4TF/issues/15) (Alphabetic index page)\n", + " - Add total number of feature values and indication when a table is truncated; partial enhancement [#7](https://github.com/tonyjurg/Doc4TF/issues/7) \n", + " \n", + "Minor changes with version [0.5](https://github.com/tonyjurg/Doc4TF/blob/main/previous_versions/CreateFeatureDoc(0_5).ipynb):\n", + "\n", + " * Additional notes on install requirements added May 26, 2024.\n", + " * Fixed bug [#18: incorrectly use of HTML page title for MD title](https://github.com/tonyjurg/Doc4TF/issues/18)\n", " \n", "Changes to previous major 
version ([0.4](https://github.com/tonyjurg/Doc4TF/blob/main/previous_versions/CreateFeatureDoc(0_4).ipynb)):\n", "\n", diff --git a/results/after.md b/results/after.md index 9b9018d..6b0b30b 100644 --- a/results/after.md +++ b/results/after.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: after Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ space|37661 —|3 ,)|2 ·—|2 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- space|119261 @@ -32,7 +34,9 @@ space|119261 ).|6 .]]|4 ·—|4 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- space|119261 @@ -45,6 +49,8 @@ space|119261 ).|6 .]]|4 ·—|4 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/appositioncontainer.md b/results/appositioncontainer.md index 2c37871..8bc390c 100644 --- a/results/appositioncontainer.md +++ b/results/appositioncontainer.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: appositioncontainer Data type|Feature type|Available for nodes ---|---|--- @@ -10,18 +10,26 @@ Data type|Feature type|Available for nodes Value|Occurences ---|--- 1|62 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 62. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- 1|1908 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 1908. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- 1|715 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 715. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 1|1846 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 1846. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/articular.md b/results/articular.md index 758f43d..cf92806 100644 --- a/results/articular.md +++ b/results/articular.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: articular Data type|Feature type|Available for nodes ---|---|--- @@ -9,27 +9,39 @@ Data type|Feature type|Available for nodes ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences ---|--- -1|2558 -### Frequency for nodetype [group](featuresbynodetype.md#group) +1|229 + +Total frequency of feature: 229. + ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- 1|181 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 181. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -1|1057 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) +1|3386 + +Total frequency of feature: 3386. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- 1|28772 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 28772. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- 1|13079 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 13079. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 1|24976 - -Created on Jun. 
16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 24976. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/before.md b/results/before.md index 5738300..f32ee4c 100644 --- a/results/before.md +++ b/results/before.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: before Data type|Feature type|Available for nodes ---|---|--- @@ -12,20 +12,26 @@ Value|Occurences —|8 (|6 [[|2 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 16. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- —|16 (|10 [[|7 [|1 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 34. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- —|16 (|10 [[|7 [|1 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 34. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/book.md b/results/book.md index 4230a15..217b050 100644 --- a/results/book.md +++ b/results/book.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: book Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ II_Corinthians|1 II_John|1 II_Peter|1 II_Thessalonians|1 -### Frequency for nodetype [chapter](featuresbynodetype.md#chapter) + +Total frequency of feature: 27. Note: table truncated. + ### Frequency for nodetype [chapter](featuresbynodetype.md#chapter) Value|Occurences ---|--- Acts|28 @@ -32,7 +34,9 @@ Mark|16 Romans|16 Hebrews|13 II_Corinthians|13 -### Frequency for nodetype [verse](featuresbynodetype.md#verse) + +Total frequency of feature: 260. Note: table truncated. + ### Frequency for nodetype [verse](featuresbynodetype.md#verse) Value|Occurences ---|--- Luke|1149 @@ -45,20 +49,24 @@ Romans|432 Revelation|405 Hebrews|303 II_Corinthians|256 -### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) + +Total frequency of feature: 7944. Note: table truncated. + ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences ---|--- -Luke|2833 -Matthew|2636 -John|2626 -Acts|2245 -Mark|1750 -I_Corinthians|1242 -Revelation|1183 -Romans|1036 -II_Corinthians|721 -Hebrews|612 -### Frequency for nodetype [group](featuresbynodetype.md#group) +Luke|1150 +Matthew|1118 +John|1027 +Acts|878 +Mark|723 +I_Corinthians|519 +Revelation|462 +Romans|460 +II_Corinthians|249 +Hebrews|241 + +Total frequency of feature: 7939. Note: table truncated. 
+ ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- Acts|1288 @@ -71,20 +79,24 @@ I_Corinthians|431 Romans|362 Hebrews|325 II_Corinthians|222 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 8945. Note: table truncated. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -Luke|4880 -Matthew|4364 -Acts|4237 -John|3699 -Mark|2860 -Revelation|1803 -I_Corinthians|1487 -Romans|1401 -Hebrews|1040 -II_Corinthians|909 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) +Luke|6563 +Matthew|5882 +Acts|5604 +John|5298 +Mark|3887 +Revelation|2524 +I_Corinthians|2210 +Romans|1977 +Hebrews|1411 +II_Corinthians|1381 + +Total frequency of feature: 42506. Note: table truncated. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- Luke|8945 @@ -97,7 +109,9 @@ I_Corinthians|3160 Romans|2799 Hebrews|1977 II_Corinthians|1852 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 59390. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- Luke|19456 @@ -110,6 +124,8 @@ Romans|7100 I_Corinthians|6820 Hebrews|4955 II_Corinthians|4469 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/bookshort.md b/results/bookshort.md index 69f5e57..08bf26f 100644 --- a/results/bookshort.md +++ b/results/bookshort.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: bookshort Data type|Feature type|Available for nodes ---|---|--- @@ -19,20 +19,24 @@ Value|Occurences 2PE|1 2TH|1 2TI|1 -### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) + +Total frequency of feature: 27. Note: table truncated. + ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences ---|--- -LUK|2833 -MAT|2636 -JHN|2626 -ACT|2245 -MRK|1750 -1CO|1242 -REV|1183 -ROM|1036 -2CO|721 -HEB|612 -### Frequency for nodetype [group](featuresbynodetype.md#group) +LUK|1150 +MAT|1118 +JHN|1027 +ACT|878 +MRK|723 +1CO|519 +REV|462 +ROM|460 +2CO|249 +HEB|241 + +Total frequency of feature: 7939. Note: table truncated. + ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- ACT|1288 @@ -45,20 +49,24 @@ MRK|753 ROM|362 HEB|325 2CO|222 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 8945. Note: table truncated. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -LUK|4880 -MAT|4364 -ACT|4237 -JHN|3699 -MRK|2860 -REV|1803 -1CO|1487 -ROM|1401 -HEB|1040 -2CO|909 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) +LUK|6563 +MAT|5882 +ACT|5604 +JHN|5298 +MRK|3887 +REV|2524 +1CO|2210 +ROM|1977 +HEB|1411 +2CO|1381 + +Total frequency of feature: 42506. Note: table truncated. 
+ ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- LUK|8945 @@ -71,7 +79,9 @@ REV|3895 ROM|2799 HEB|1977 2CO|1852 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 59390. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- LUK|19456 @@ -84,6 +94,8 @@ ROM|7100 1CO|6820 HEB|4955 2CO|4469 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/case.md b/results/case.md index 0b085a1..02ffd5e 100644 --- a/results/case.md +++ b/results/case.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: case Data type|Feature type|Available for nodes ---|---|--- @@ -14,7 +14,9 @@ accusative|6170 dative|3265 genitive|1408 vocative|1 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 20453. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- nominative|24197 @@ -22,7 +24,9 @@ accusative|23031 genitive|19515 dative|12126 vocative|649 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 79518. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- nominative|24197 @@ -30,6 +34,8 @@ accusative|23031 genitive|19515 dative|12126 vocative|649 - -Created on Jun. 
16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 79518. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/chapter.md b/results/chapter.md index c1e2ba6..a0fe61c 100644 --- a/results/chapter.md +++ b/results/chapter.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: chapter Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences 8|10 9|10 10|10 -### Frequency for nodetype [verse](featuresbynodetype.md#verse) + +Total frequency of feature: 260. Note: table truncated. + ### Frequency for nodetype [verse](featuresbynodetype.md#verse) Value|Occurences ---|--- 1|691 @@ -32,7 +34,9 @@ Value|Occurences 9|356 7|354 10|348 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 7944. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 1|11685 @@ -45,6 +49,8 @@ Value|Occurences 7|6321 11|6242 12|6213 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/clauseType.md b/results/clauseType.md index 357270f..cdf1ba7 100644 --- a/results/clauseType.md +++ b/results/clauseType.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: clausetype Data type|Feature type|Available for nodes ---|---|--- @@ -10,14 +10,20 @@ clause type Value|Occurences ---|--- nominalized|59 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 59. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- nominalized|5237 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 5237. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- nominalized|5296 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 5296. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/cls.md b/results/cls.md index 6aeada3..9f66c74 100644 --- a/results/cls.md +++ b/results/cls.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: cls Data type|Feature type|Available for nodes ---|---|--- @@ -10,11 +10,15 @@ this is XML attribute cls Value|Occurences ---|--- cl|1476 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 1476. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- cl|28676 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 28676. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- np|30911 @@ -26,7 +30,9 @@ advp|166 adv|7 nump|7 conj|1 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 72788. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- verb|27355 @@ -39,7 +45,9 @@ adj|2304 det|257 advp|154 ptcl|87 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 66851. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- np|30911 @@ -52,7 +60,9 @@ pp|11169 prep|10914 adj|8452 adv|6154 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 180415. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- noun|28455 @@ -65,6 +75,8 @@ adj|8452 adv|6147 ptcl|773 num|476 - -Created on Jun. 
16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/cltype.md b/results/cltype.md index 267b117..4ca63be 100644 --- a/results/cltype.md +++ b/results/cltype.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: cltype Data type|Feature type|Available for nodes ---|---|--- @@ -12,18 +12,24 @@ Value|Occurences Verbless|77 VerbElided|47 Minor|1 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 125. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- VerbElided|1003 Verbless|884 Minor|831 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 2718. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- VerbElided|1050 Verbless|961 Minor|832 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 2843. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/criticalsign.md b/results/criticalsign.md index 62b5bc9..c4fdf1a 100644 --- a/results/criticalsign.md +++ b/results/criticalsign.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: criticalsign Data type|Feature type|Available for nodes ---|---|--- @@ -14,7 +14,9 @@ Value|Occurences (|6 ]]|3 [[|2 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 30. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- —|25 @@ -24,7 +26,9 @@ Value|Occurences ]]|7 [|1 ]|1 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 63. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- —|25 @@ -34,6 +38,8 @@ Value|Occurences ]]|7 [|1 ]|1 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 63. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/crule.md b/results/crule.md index ab9e491..88381c4 100644 --- a/results/crule.md +++ b/results/crule.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: crule Data type|Feature type|Available for nodes ---|---|--- @@ -11,16 +11,22 @@ Value|Occurences ---|--- ClCl|619 ClCl2|219 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 838. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- ClCl|3689 ClCl2|1031 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 4720. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- ClCl|4308 ClCl2|1250 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 5558. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/degree.md b/results/degree.md index fb5ecfc..03a4d7a 100644 --- a/results/degree.md +++ b/results/degree.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: degree Data type|Feature type|Available for nodes ---|---|--- @@ -11,16 +11,22 @@ Value|Occurences ---|--- comparative|119 superlative|32 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 151. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- comparative|313 superlative|200 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 513. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- comparative|313 superlative|200 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 513. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/discontinuous.md b/results/discontinuous.md index 001c720..c4614d5 100644 --- a/results/discontinuous.md +++ b/results/discontinuous.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: discontinuous Data type|Feature type|Available for nodes ---|---|--- @@ -10,14 +10,20 @@ Data type|Feature type|Available for nodes Value|Occurences ---|--- 1|645 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 645. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 1|6034 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 6034. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 1|6034 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 6034. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/domain.md b/results/domain.md index 956f06b..3fb842c 100644 --- a/results/domain.md +++ b/results/domain.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: domain Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences 092006|822 067002|790 024001|686 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 43153. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 092004|26129 @@ -32,7 +34,9 @@ Value|Occurences 069002|1857 092001|1845 089023|1780 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 126879. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 092004|26129 @@ -45,6 +49,8 @@ Value|Occurences 069002|1857 092001|1845 089023|1780 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 126879. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/featuresbydatatype.md b/results/featuresbydatatype.md index 2f7f409..38bfda5 100644 --- a/results/featuresbydatatype.md +++ b/results/featuresbydatatype.md @@ -1,5 +1,6 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) -# Overview features per datatype +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) +# Overview features by data type +Overview by [name](featuresbyname.md), [node type](featuresbynodetype.md), or [feature type](featuresbytype.md). ## Integer Feature|Featuretype|Available on nodes|Description|Examples @@ -8,11 +9,9 @@ Feature|Featuretype|Available on nodes|Description|Examples [`articular`](articular.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |1 if the sentence, group, clause, phrase or wg has an article|`1` [`chapter`](chapter.md#readme)|[`Node`](featuresbytype.md#node)|[`chapter`](featuresbynodetype.md#chapter) [`verse`](featuresbynodetype.md#verse) [`word`](featuresbynodetype.md#word) |chapter number, from ref attribute in xml|`1` `2` `3` `4` [`discontinuous`](discontinuous.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |1 if the word is out of sequence in the xml|`1` -[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |node id (as in 
the XML source data|`400040070010120` `400040100010070` `400050030010120` `400050040010060` [`num`](num.md#readme)|[`Node`](featuresbytype.md#node)|[`book`](featuresbynodetype.md#book) [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`strong`](strong.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |strong number|`846` `3004` `1510` `4771` [`verse`](verse.md#readme)|[`Node`](featuresbytype.md#node)|[`verse`](featuresbynodetype.md#verse) [`word`](featuresbynodetype.md#word) |verse number, from ref attribute in xml|`1` `2` `3` `4` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#edge)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute sibling|`1` `2` `3` `4` ## String Feature|Featuretype|Available on nodes|Description|Examples @@ -29,45 +28,46 @@ Feature|Featuretype|Available on nodes|Description|Examples [`crule`](crule.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |clause rule (from xml attribute Rule)|`ClCl` `ClCl2` [`degree`](degree.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) 
[`word`](featuresbynodetype.md#word) |grammatical degree|`comparative` `superlative` [`domain`](domain.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |domain|`092004` `033006` `013001` `069002` +[`frame`](frame.md#readme)|[`Edge`](featuresbytype.md#edge)|[`word`](featuresbynodetype.md#word) |frame|`A0` `A1` `A2` `AA2` [`framespec`](framespec.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute framespec|`A0:n00000000000` `A1:n00000000000` `A0:n47010001004` `A0:n46003022002` [`function`](function.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` [`gender`](gender.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical gender|`masculine` `neuter` `feminine` -[`gloss`](gloss.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |short translation|`not` `you` `is` `Him` +[`gloss`](gloss.md#readme)|[`Node`](featuresbytype.md#node)|[`word`](featuresbynodetype.md#word) |English gloss (BGVB)|`the` `and, also, likewise` `he, she, it, himself, herself, itself; even, very; same` `you` [`id`](id.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) 
|xml id|`n40001002001` `n40001002002` `n40001002005` `n40001002007` -[`junction`](junction.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |type of junction|`coordinate` `subordinate` +[`junction`](junction.md#readme)|[`Node`](featuresbytype.md#node)|[`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |type of junction|`coordinate` `subordinate` [`lang`](lang.md#readme)|[`Node`](featuresbytype.md#node)|[`book`](featuresbynodetype.md#book) |language the text is in|`el` [`lemma`](lemma.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |lexical lemma|`αὐτός` `λέγω` `εἰμί` `σύ` [`lemmatranslit`](lemmatranslit.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |transliteration of the word lemma|`autos` `lego` `eimi` `su` [`ln`](ln.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |ln|`92.11` `33.69` `69.3` `92.1` [`mood`](mood.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |verbal mood|`indicative` `participle` `infinitive` `subjunctive` [`morph`](morph.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological code|`V-PAI-3S` `ADV` `PRT-N` `V-2AAI-3S` 
+[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |node id (as in the XML source data)|`400040070010120` `400040100010070` `400050030010120` `400050040010060` [`normalized`](normalized.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |lemma normalized|`αὐτόν` `μή` `αὐτῷ` `οὐκ` [`note`](note.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |annotation of linguistic nature|`discontinuous discourse` [`number`](number.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical number|`singular` `plural` +[`oslots`](oslots.md#readme)|[`Edge`](featuresbytype.md#edge)||No feature description|No values [`otype`](otype.md#readme)|[`Node`](featuresbytype.md#node)||No feature description|No values -[`person`](person.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical person|`third` `second` `first` +[`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#edge)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |parent relationship between words|`Link` +[`person`](person.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) 
|grammatical person|`p3` `p2` `p1` [`punctuation`](punctuation.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute punctuation|` ` `,` `.` `·` [`ref`](ref.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |biblical reference with word counting|`1CO 10:1!1` `1CO 10:1!15` `1CO 10:1!17` `1CO 10:1!2` [`referent`](referent.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |number of referent|`n40005001015` `n43014023002` `n43013023006 n43013037003 n43014005003 n43014008003 n43014022003` `n43017001003` [`rela`](rela.md#readme)|[`Node`](featuresbytype.md#node)|[`wg`](featuresbynodetype.md#wg) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute rela|`Appo` -[`role`](role.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` +[`role`](role.md#readme)|[`Node`](featuresbytype.md#node)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) 
[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |role|`o` `s` `p` `adv` +[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` [`sp`](sp.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |part-of-speach|`verb` `pron` `advb` `subs` +[`subjref`](subjref.md#readme)|[`Edge`](featuresbytype.md#edge)|[`word`](featuresbynodetype.md#word) |number of subject referent|`Link` [`subjrefspec`](subjrefspec.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute subjrefspec|`n46003022002` `n66001009002` `n45001001001` `n47010001004` [`tense`](tense.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |verbal tense|`aorist` `present` `future` `imperfect` [`text`](text.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |the text of a word|`αὐτῷ` `μὴ` `οὐκ` `εἶπεν` [`trans`](trans.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |translation of the word surface text according to the Berean Interlinear Bible|`not` `you` `is` `Him` 
[`translit`](translit.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |transliteration of the word surface text|`me` `estin` `auton` `auto` -[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#node)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |this is XML attribute typ|`conjuncted` `apposition` -[`type`](type.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#node)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#node)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` [`unaccent`](unaccent.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) 
[`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |word in unicode characters without accents and diacritical markers|`εστιν` `αυτον` `μη` `αυτω` [`unicode`](unicode.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |word in unicode characters plus material after it|`μὴ` `οὐκ` `αὐτῷ` `εἶπεν` [`variant`](variant.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute variant|`2` `1` [`voice`](voice.md#readme)|[`Node`](featuresbytype.md#node)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |verbal voice|`active` `passive` `middle` `middlepassive` -[`frame`](frame.md#readme)|[`Edge`](featuresbytype.md#edge)|[`word`](featuresbynodetype.md#word) |frame|`A0` `A1` `A2` `AA2` -[`oslots`](oslots.md#readme)|[`Edge`](featuresbytype.md#edge)||No feature description|No values -[`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#edge)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |parent relationship between words|`Link` -[`subjref`](subjref.md#readme)|[`Edge`](featuresbytype.md#edge)|[`word`](featuresbynodetype.md#word) |number of subject referent|`Link` -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/featuresbyname.md b/results/featuresbyname.md new file mode 100644 index 0000000..0c9128a --- /dev/null +++ b/results/featuresbyname.md @@ -0,0 +1,68 @@ +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) +# Overview features by name (alphabetical) +Overview by [node type](featuresbynodetype.md), [feature type](featuresbytype.md), or [data type](featuresbydatatype.md). + +Feature|Feature type|Data type|Available on nodes|Description|Examples +---|---|---|---|---|--- +[`after`](after.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |material after the end of the word|` ` `,` `.` `·` +[`appositioncontainer`](appositioncontainer.md#readme)|[`Node`](featuresbytype.md#node)|[`Integer`](featuresbydatatype.md#integer)|[`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |1 if it is an apposition container|`1` +[`articular`](articular.md#readme)|[`Node`](featuresbytype.md#node)|[`Integer`](featuresbydatatype.md#integer)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |1 if the sentence, group, clause, phrase or wg has an article|`1` +[`before`](before.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML 
attribute before|`—` `(` `[[` +[`book`](book.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`book`](featuresbynodetype.md#book) [`chapter`](featuresbynodetype.md#chapter) [`verse`](featuresbynodetype.md#verse) [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`word`](featuresbynodetype.md#word) |book name (full name)|`Acts` `Colossians` `Ephesians` `Galatians` +[`bookshort`](bookshort.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`book`](featuresbynodetype.md#book) [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`word`](featuresbynodetype.md#word) |book name (abbreviated) from ref attribute in xml|`1CO` `1JN` `1PE` `1TH` +[`case`](case.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical case|`nominative` `accusative` `dative` `genitive` +[`chapter`](chapter.md#readme)|[`Node`](featuresbytype.md#node)|[`Integer`](featuresbydatatype.md#integer)|[`chapter`](featuresbynodetype.md#chapter) [`verse`](featuresbynodetype.md#verse) [`word`](featuresbynodetype.md#word) |chapter number, from ref attribute in xml|`1` `2` `3` `4` +[`clausetype`](clausetype.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |clause type|`nominalized` +[`cls`](cls.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) 
[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute cls|`cl` +[`cltype`](cltype.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |clause type|`Verbless` `VerbElided` `Minor` +[`criticalsign`](criticalsign.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute criticalsign|`—` `)` `(` `]]` +[`crule`](crule.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |clause rule (from xml attribute Rule)|`ClCl` `ClCl2` +[`degree`](degree.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical degree|`comparative` `superlative` +[`discontinuous`](discontinuous.md#readme)|[`Node`](featuresbytype.md#node)|[`Integer`](featuresbydatatype.md#integer)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |1 if the word is out of sequence in the xml|`1` +[`domain`](domain.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |domain|`092004` `033006` `013001` `069002` +[`frame`](frame.md#readme)|[`Edge`](featuresbytype.md#edge)|[`String`](featuresbydatatype.md#string)|[`word`](featuresbynodetype.md#word) |frame|`A0` `A1` `A2` 
`AA2` +[`framespec`](framespec.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute framespec|`A0:n00000000000` `A1:n00000000000` `A0:n47010001004` `A0:n46003022002` +[`function`](function.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` +[`gender`](gender.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical gender|`masculine` `neuter` `feminine` +[`gloss`](gloss.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`word`](featuresbynodetype.md#word) |English gloss (BGVB)|`the` `and, also, likewise` `he, she, it, himself, herself, itself; even, very; same` `you` +[`id`](id.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |xml id|`n40001002001` `n40001002002` `n40001002005` `n40001002007` +[`junction`](junction.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |type of junction|`coordinate` `subordinate` 
+[`lang`](lang.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`book`](featuresbynodetype.md#book) |language the text is in|`el` +[`lemma`](lemma.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |lexical lemma|`αὐτός` `λέγω` `εἰμί` `σύ` +[`lemmatranslit`](lemmatranslit.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |transliteration of the word lemma|`autos` `lego` `eimi` `su` +[`ln`](ln.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |ln|`92.11` `33.69` `69.3` `92.1` +[`mood`](mood.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |verbal mood|`indicative` `participle` `infinitive` `subjunctive` +[`morph`](morph.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological code|`V-PAI-3S` `ADV` `PRT-N` `V-2AAI-3S` +[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |node id (as in the XML source data)|`400040070010120` `400040100010070` `400050030010120` `400050040010060` 
+[`normalized`](normalized.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |lemma normalized|`αὐτόν` `μή` `αὐτῷ` `οὐκ` +[`note`](note.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |annotation of linguistic nature|`discontinuous discourse` +[`num`](num.md#readme)|[`Node`](featuresbytype.md#node)|[`Integer`](featuresbydatatype.md#integer)|[`book`](featuresbynodetype.md#book) [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` +[`number`](number.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical number|`singular` `plural` +[`oslots`](oslots.md#readme)|[`Edge`](featuresbytype.md#edge)|[`String`](featuresbydatatype.md#string)||No feature description|No values +[`otype`](otype.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)||No feature description|No values +[`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#edge)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) 
[`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |parent relationship between words|`Link` +[`person`](person.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical person|`p3` `p2` `p1` +[`punctuation`](punctuation.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute punctuation|` ` `,` `.` `·` +[`ref`](ref.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |biblical reference with word counting|`1CO 10:1!1` `1CO 10:1!15` `1CO 10:1!17` `1CO 10:1!2` +[`referent`](referent.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |number of referent|`n40005001015` `n43014023002` `n43013023006 n43013037003 n43014005003 n43014008003 n43014022003` `n43017001003` +[`rela`](rela.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`wg`](featuresbynodetype.md#wg) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute rela|`Appo` +[`role`](role.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |role|`o` `s` `p` `adv` 
+[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` +[`sp`](sp.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |part-of-speech|`verb` `pron` `advb` `subs` +[`strong`](strong.md#readme)|[`Node`](featuresbytype.md#node)|[`Integer`](featuresbydatatype.md#integer)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |strong number|`846` `3004` `1510` `4771` +[`subjref`](subjref.md#readme)|[`Edge`](featuresbytype.md#edge)|[`String`](featuresbydatatype.md#string)|[`word`](featuresbynodetype.md#word) |number of subject referent|`Link` +[`subjrefspec`](subjrefspec.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute subjrefspec|`n46003022002` `n66001009002` `n45001001001` `n47010001004` +[`tense`](tense.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |verbal tense|`aorist` `present` `future` `imperfect` +[`text`](text.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |the text of a word|`αὐτῷ` `μὴ` `οὐκ` `εἶπεν`
+[`trans`](trans.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |translation of the word surface text according to the Berean Interlinear Bible|`not` `you` `is` `Him` +[`translit`](translit.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |transliteration of the word surface text|`me` `estin` `auton` `auto` +[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` +[`unaccent`](unaccent.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |word in unicode characters without accents and diacritical markers|`εστιν` `αυτον` `μη` `αυτω` +[`unicode`](unicode.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) 
[`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |word in unicode characters plus material after it|`μὴ` `οὐκ` `αὐτῷ` `εἶπεν` +[`variant`](variant.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute variant|`2` `1` +[`verse`](verse.md#readme)|[`Node`](featuresbytype.md#node)|[`Integer`](featuresbydatatype.md#integer)|[`verse`](featuresbynodetype.md#verse) [`word`](featuresbynodetype.md#word) |verse number, from ref attribute in xml|`1` `2` `3` `4` +[`voice`](voice.md#readme)|[`Node`](featuresbytype.md#node)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |verbal voice|`active` `passive` `middle` `middlepassive` + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/featuresbynodetype.md b/results/featuresbynodetype.md index d420e59..fb0e316 100644 --- a/results/featuresbynodetype.md +++ b/results/featuresbynodetype.md @@ -1,8 +1,9 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) -# Overview features per nodetype +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) +# Overview features by node type +Overview by [name](featuresbyname.md), [data type](featuresbydatatype.md), or [feature type](featuresbytype.md). 
## book -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`book`](book.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|book name (full name)|`Acts` `Colossians` `Ephesians` `Galatians` [`bookshort`](bookshort.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|book name (abbreviated) from ref attribute in xml|`1CO` `1JN` `1PE` `1TH` @@ -10,20 +11,20 @@ Feature|Featuretype|Datatype|Description|Examples [`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` ## chapter -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`book`](book.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|book name (full name)|`Acts` `Colossians` `Ephesians` `Galatians` [`chapter`](chapter.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|chapter number, from ref attribute in xml|`1` `2` `3` `4` ## verse -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`book`](book.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|book name (full name)|`Acts` `Colossians` `Ephesians` `Galatians` [`chapter`](chapter.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|chapter number, from ref attribute in xml|`1` `2` `3` `4` [`verse`](verse.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|verse number, from ref attribute in xml|`1` `2` `3` `4` ## sentence -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data 
type|Description|Examples ---|---|---|---|--- [`articular`](articular.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if the sentence, group, clause, phrase or wg has an article|`1` [`book`](book.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|book name (full name)|`Acts` `Colossians` `Ephesians` `Galatians` @@ -33,31 +34,27 @@ Feature|Featuretype|Datatype|Description|Examples [`cltype`](cltype.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|clause type|`Verbless` `VerbElided` `Minor` [`crule`](crule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|clause rule (from xml attribute Rule)|`ClCl` `ClCl2` [`function`](function.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` -[`junction`](junction.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|type of junction|`coordinate` `subordinate` -[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|node id (as in the XML source data|`400040070010120` `400040100010070` `400050030010120` `400050040010060` +[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|node id (as in the XML source data)|`400040070010120` `400040100010070` `400050030010120` `400050040010060` [`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|parent relationship between words|`Link` 
-[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`Integer`](featuresbydatatype.md#Integer)|this is XML attribute sibling|`1` `2` `3` `4` -[`type`](type.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` ## group -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`articular`](articular.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if the sentence, group, clause, phrase or wg has an article|`1` [`book`](book.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|book name (full name)|`Acts` `Colossians` `Ephesians` `Galatians` [`bookshort`](bookshort.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|book name (abbreviated) from ref attribute in xml|`1CO` `1JN` `1PE` `1TH` [`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` 
[`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|parent relationship between words|`Link` -[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`Integer`](featuresbydatatype.md#Integer)|this is XML attribute sibling|`1` `2` `3` `4` -[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute typ|`conjuncted` `apposition` -[`type`](type.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`o` `s` `p` `adv` +[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` +[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` ## clause -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`appositioncontainer`](appositioncontainer.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if it is an apposition container|`1` 
[`articular`](articular.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if the sentence, group, clause, phrase or wg has an article|`1` @@ -69,17 +66,16 @@ Feature|Featuretype|Datatype|Description|Examples [`crule`](crule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|clause rule (from xml attribute Rule)|`ClCl` `ClCl2` [`function`](function.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` [`junction`](junction.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|type of junction|`coordinate` `subordinate` -[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|node id (as in the XML source data|`400040070010120` `400040100010070` `400050030010120` `400050040010060` +[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|node id (as in the XML source data)|`400040070010120` `400040100010070` `400050030010120` `400050040010060` [`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|parent relationship between words|`Link` -[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`Integer`](featuresbydatatype.md#Integer)|this is XML attribute sibling|`1` `2` `3` 
`4` -[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute typ|`conjuncted` `apposition` -[`type`](type.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`o` `s` `p` `adv` +[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` +[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` ## wg -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`appositioncontainer`](appositioncontainer.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if it is an apposition container|`1` [`articular`](articular.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if the sentence, group, clause, phrase or wg has an article|`1` @@ -91,18 +87,17 @@ Feature|Featuretype|Datatype|Description|Examples [`crule`](crule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|clause rule (from xml attribute Rule)|`ClCl` `ClCl2` [`function`](function.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` 
[`junction`](junction.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|type of junction|`coordinate` `subordinate` -[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|node id (as in the XML source data|`400040070010120` `400040100010070` `400050030010120` `400050040010060` +[`nodeid`](nodeid.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|node id (as in the XML source data)|`400040070010120` `400040100010070` `400050030010120` `400050040010060` [`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|parent relationship between words|`Link` [`rela`](rela.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute rela|`Appo` -[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`Integer`](featuresbydatatype.md#Integer)|this is XML attribute sibling|`1` `2` `3` `4` -[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute typ|`conjuncted` `apposition` -[`type`](type.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` 
+[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`o` `s` `p` `adv` +[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` +[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` ## phrase -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`after`](after.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|material after the end of the word|` ` `,` `.` `·` [`appositioncontainer`](appositioncontainer.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if it is an apposition container|`1` @@ -117,7 +112,6 @@ Feature|Featuretype|Datatype|Description|Examples [`framespec`](framespec.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute framespec|`A0:n00000000000` `A1:n00000000000` `A0:n47010001004` `A0:n46003022002` [`function`](function.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` [`gender`](gender.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical gender|`masculine` `neuter` `feminine` -[`gloss`](gloss.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|short translation|`not` `you` `is` `Him` 
[`id`](id.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|xml id|`n40001002001` `n40001002002` `n40001002005` `n40001002007` [`junction`](junction.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|type of junction|`coordinate` `subordinate` [`lemma`](lemma.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|lexical lemma|`αὐτός` `λέγω` `εἰμί` `σύ` @@ -130,13 +124,12 @@ Feature|Featuretype|Datatype|Description|Examples [`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`number`](number.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical number|`singular` `plural` [`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|parent relationship between words|`Link` -[`person`](person.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical person|`third` `second` `first` +[`person`](person.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical person|`p3` `p2` `p1` [`punctuation`](punctuation.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute punctuation|` ` `,` `.` `·` [`ref`](ref.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|biblical reference with word counting|`1CO 10:1!1` `1CO 10:1!15` `1CO 10:1!17` `1CO 10:1!2` [`referent`](referent.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|number of referent|`n40005001015` `n43014023002` `n43013023006 n43013037003 n43014005003 n43014008003 n43014022003` `n43017001003` 
-[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`Integer`](featuresbydatatype.md#Integer)|this is XML attribute sibling|`1` `2` `3` `4` +[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`o` `s` `p` `adv` +[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` [`sp`](sp.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|part-of-speach|`verb` `pron` `advb` `subs` [`strong`](strong.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|strong number|`846` `3004` `1510` `4771` [`subjrefspec`](subjrefspec.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute subjrefspec|`n46003022002` `n66001009002` `n45001001001` `n47010001004` @@ -144,15 +137,15 @@ Feature|Featuretype|Datatype|Description|Examples [`text`](text.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|the text of a word|`αὐτῷ` `μὴ` `οὐκ` `εἶπεν` [`trans`](trans.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|translation of the word surface text according to the Berean Interlinear Bible|`not` `you` `is` `Him` [`translit`](translit.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|transliteration of the word surface text|`me` `estin` `auton` `auto` -[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute typ|`conjuncted` `apposition` 
-[`type`](type.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` [`unaccent`](unaccent.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|word in unicode characters without accents and diacritical markers|`εστιν` `αυτον` `μη` `αυτω` [`unicode`](unicode.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|word in unicode characters plus material after it|`μὴ` `οὐκ` `αὐτῷ` `εἶπεν` [`variant`](variant.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute variant|`2` `1` [`voice`](voice.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|verbal voice|`active` `passive` `middle` `middlepassive` ## subphrase -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`after`](after.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|material after the end of the word|` ` `,` `.` `·` [`appositioncontainer`](appositioncontainer.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|1 if it is an apposition container|`1` @@ -167,7 +160,6 @@ Feature|Featuretype|Datatype|Description|Examples [`framespec`](framespec.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute 
framespec|`A0:n00000000000` `A1:n00000000000` `A0:n47010001004` `A0:n46003022002` [`function`](function.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` [`gender`](gender.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical gender|`masculine` `neuter` `feminine` -[`gloss`](gloss.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|short translation|`not` `you` `is` `Him` [`id`](id.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|xml id|`n40001002001` `n40001002002` `n40001002005` `n40001002007` [`junction`](junction.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|type of junction|`coordinate` `subordinate` [`lemma`](lemma.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|lexical lemma|`αὐτός` `λέγω` `εἰμί` `σύ` @@ -180,14 +172,13 @@ Feature|Featuretype|Datatype|Description|Examples [`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`number`](number.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical number|`singular` `plural` [`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|parent relationship between words|`Link` -[`person`](person.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical person|`third` `second` `first` +[`person`](person.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical person|`p3` `p2` `p1` 
[`punctuation`](punctuation.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute punctuation|` ` `,` `.` `·` [`ref`](ref.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|biblical reference with word counting|`1CO 10:1!1` `1CO 10:1!15` `1CO 10:1!17` `1CO 10:1!2` [`referent`](referent.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|number of referent|`n40005001015` `n43014023002` `n43013023006 n43013037003 n43014005003 n43014008003 n43014022003` `n43017001003` [`rela`](rela.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute rela|`Appo` -[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`Integer`](featuresbydatatype.md#Integer)|this is XML attribute sibling|`1` `2` `3` `4` +[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`o` `s` `p` `adv` +[`rule`](rule.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` [`sp`](sp.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|part-of-speach|`verb` `pron` `advb` `subs` [`strong`](strong.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|strong number|`846` `3004` `1510` `4771` [`subjrefspec`](subjrefspec.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute subjrefspec|`n46003022002` `n66001009002` `n45001001001` `n47010001004` @@ -195,15 +186,15 @@ Feature|Featuretype|Datatype|Description|Examples 
[`text`](text.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|the text of a word|`αὐτῷ` `μὴ` `οὐκ` `εἶπεν` [`trans`](trans.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|translation of the word surface text according to the Berean Interlinear Bible|`not` `you` `is` `Him` [`translit`](translit.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|transliteration of the word surface text|`me` `estin` `auton` `auto` -[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute typ|`conjuncted` `apposition` -[`type`](type.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`typ`](typ.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` [`unaccent`](unaccent.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|word in unicode characters without accents and diacritical markers|`εστιν` `αυτον` `μη` `αυτω` [`unicode`](unicode.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|word in unicode characters plus material after it|`μὴ` `οὐκ` `αὐτῷ` `εἶπεν` [`variant`](variant.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute variant|`2` `1` [`voice`](voice.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|verbal voice|`active` `passive` `middle` 
`middlepassive` ## word -Feature|Featuretype|Datatype|Description|Examples +Feature|Feature type|Data type|Description|Examples ---|---|---|---|--- [`after`](after.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|material after the end of the word|` ` `,` `.` `·` [`before`](before.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute before|`—` `(` `[[` @@ -220,7 +211,7 @@ Feature|Featuretype|Datatype|Description|Examples [`framespec`](framespec.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute framespec|`A0:n00000000000` `A1:n00000000000` `A0:n47010001004` `A0:n46003022002` [`function`](function.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` [`gender`](gender.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical gender|`masculine` `neuter` `feminine` -[`gloss`](gloss.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|short translation|`not` `you` `is` `Him` +[`gloss`](gloss.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|English gloss (BGVB)|`the` `and, also, likewise` `he, she, it, himself, herself, itself; even, very; same` `you` [`id`](id.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|xml id|`n40001002001` `n40001002002` `n40001002005` `n40001002007` [`lemma`](lemma.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|lexical lemma|`αὐτός` `λέγω` `εἰμί` `σύ` [`lemmatranslit`](lemmatranslit.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|transliteration of the word lemma|`autos` `lego` `eimi` `su` @@ -232,13 +223,12 @@ Feature|Featuretype|Datatype|Description|Examples 
[`num`](num.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`number`](number.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical number|`singular` `plural` [`parent`](parent.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|parent relationship between words|`Link` -[`person`](person.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical person|`third` `second` `first` +[`person`](person.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|grammatical person|`p3` `p2` `p1` [`punctuation`](punctuation.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute punctuation|` ` `,` `.` `·` [`ref`](ref.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|biblical reference with word counting|`1CO 10:1!1` `1CO 10:1!15` `1CO 10:1!17` `1CO 10:1!2` [`referent`](referent.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|number of referent|`n40005001015` `n43014023002` `n43013023006 n43013037003 n43014005003 n43014008003 n43014022003` `n43017001003` [`rela`](rela.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute rela|`Appo` -[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`adv` `o` `s` `apposition` -[`sibling`](sibling.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`Integer`](featuresbydatatype.md#Integer)|this is XML attribute sibling|`1` `2` `3` `4` +[`role`](role.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|role|`o` `s` `p` `adv` 
[`sp`](sp.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|part-of-speach|`verb` `pron` `advb` `subs` [`strong`](strong.md#readme)|[`Node`](featuresbytype.md#Node)|[`Integer`](featuresbydatatype.md#Integer)|strong number|`846` `3004` `1510` `4771` [`subjref`](subjref.md#readme)|[`Edge`](featuresbytype.md#Edge)|[`String`](featuresbydatatype.md#String)|number of subject referent|`Link` @@ -247,7 +237,7 @@ Feature|Featuretype|Datatype|Description|Examples [`text`](text.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|the text of a word|`αὐτῷ` `μὴ` `οὐκ` `εἶπεν` [`trans`](trans.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|translation of the word surface text according to the Berean Interlinear Bible|`not` `you` `is` `Him` [`translit`](translit.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|transliteration of the word surface text|`me` `estin` `auton` `auto` -[`type`](type.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`typems`](typems.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` [`unaccent`](unaccent.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|word in unicode characters without accents and diacritical markers|`εστιν` `αυτον` `μη` `αυτω` [`unicode`](unicode.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|word in unicode characters plus material after it|`μὴ` `οὐκ` `αὐτῷ` `εἶπεν` [`variant`](variant.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|this is XML attribute 
variant|`2` `1` @@ -255,4 +245,4 @@ Feature|Featuretype|Datatype|Description|Examples [`voice`](voice.md#readme)|[`Node`](featuresbytype.md#Node)|[`String`](featuresbydatatype.md#String)|verbal voice|`active` `passive` `middle` `middlepassive` -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/featuresbytype.md b/results/featuresbytype.md index 6ecd11f..44a6a1c 100644 --- a/results/featuresbytype.md +++ b/results/featuresbytype.md @@ -1,5 +1,6 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) -# Overview features per type +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) +# Overview features by feature type +Overview by [name](featuresbyname.md), [node type](featuresbynodetype.md), or [data type](featuresbydatatype.md). 
## Node Feature|Datatype|Available on nodes|Description|Examples @@ -23,28 +24,28 @@ Feature|Datatype|Available on nodes|Description|Examples [`framespec`](framespec.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute framespec|`A0:n00000000000` `A1:n00000000000` `A0:n47010001004` `A0:n46003022002` [`function`](function.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute function|`Pred-Obj` `Subj-PreC-PreC` `Cmpl-Pred` `Cmpl-Pred-Obj` [`gender`](gender.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical gender|`masculine` `neuter` `feminine` -[`gloss`](gloss.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |short translation|`not` `you` `is` `Him` +[`gloss`](gloss.md#readme)|[`String`](featuresbydatatype.md#string)|[`word`](featuresbynodetype.md#word) |English gloss (BGVB)|`the` `and, also, likewise` `he, she, it, himself, herself, itself; even, very; same` `you` [`id`](id.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |xml id|`n40001002001` `n40001002002` `n40001002005` `n40001002007` -[`junction`](junction.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) 
[`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |type of junction|`coordinate` `subordinate` +[`junction`](junction.md#readme)|[`String`](featuresbydatatype.md#string)|[`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |type of junction|`coordinate` `subordinate` [`lang`](lang.md#readme)|[`String`](featuresbydatatype.md#string)|[`book`](featuresbynodetype.md#book) |language the text is in|`el` [`lemma`](lemma.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |lexical lemma|`αὐτός` `λέγω` `εἰμί` `σύ` [`lemmatranslit`](lemmatranslit.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |transliteration of the word lemma|`autos` `lego` `eimi` `su` [`ln`](ln.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |ln|`92.11` `33.69` `69.3` `92.1` [`mood`](mood.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |verbal mood|`indicative` `participle` `infinitive` `subjunctive` [`morph`](morph.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological code|`V-PAI-3S` `ADV` `PRT-N` `V-2AAI-3S` -[`nodeid`](nodeid.md#readme)|[`Integer`](featuresbydatatype.md#integer)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) 
[`wg`](featuresbynodetype.md#wg) |node id (as in the XML source data|`400040070010120` `400040100010070` `400050030010120` `400050040010060` +[`nodeid`](nodeid.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) |node id (as in the XML source data)|`400040070010120` `400040100010070` `400050030010120` `400050040010060` [`normalized`](normalized.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |lemma normalized|`αὐτόν` `μή` `αὐτῷ` `οὐκ` [`note`](note.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |annotation of linguistic nature|`discontinuous discourse` [`num`](num.md#readme)|[`Integer`](featuresbydatatype.md#integer)|[`book`](featuresbynodetype.md#book) [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.|`1` `2` `3` `4` [`number`](number.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical number|`singular` `plural` [`otype`](otype.md#readme)|[`String`](featuresbydatatype.md#string)||No feature description|No values -[`person`](person.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) 
[`word`](featuresbynodetype.md#word) |grammatical person|`third` `second` `first` +[`person`](person.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |grammatical person|`p3` `p2` `p1` [`punctuation`](punctuation.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute punctuation|` ` `,` `.` `·` [`ref`](ref.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |biblical reference with word counting|`1CO 10:1!1` `1CO 10:1!15` `1CO 10:1!17` `1CO 10:1!2` [`referent`](referent.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |number of referent|`n40005001015` `n43014023002` `n43013023006 n43013037003 n43014005003 n43014008003 n43014022003` `n43017001003` [`rela`](rela.md#readme)|[`String`](featuresbydatatype.md#string)|[`wg`](featuresbynodetype.md#wg) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute rela|`Appo` -[`role`](role.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |role|`adv` `o` `s` `apposition` -[`rule`](rule.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) 
[`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical rule|`Conj-CL` `CLaCL` `sub-CL` `DetCL` +[`role`](role.md#readme)|[`String`](featuresbydatatype.md#string)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |role|`o` `s` `p` `adv` +[`rule`](rule.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical rule|`Conj-CL` `CLaCL` `ClCl` `ClCl2` [`sp`](sp.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |part-of-speach|`verb` `pron` `advb` `subs` [`strong`](strong.md#readme)|[`Integer`](featuresbydatatype.md#integer)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |strong number|`846` `3004` `1510` `4771` [`subjrefspec`](subjrefspec.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute subjrefspec|`n46003022002` `n66001009002` `n45001001001` `n47010001004` @@ -52,8 +53,8 @@ Feature|Datatype|Available on nodes|Description|Examples [`text`](text.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |the text of a word|`αὐτῷ` `μὴ` `οὐκ` `εἶπεν` 
[`trans`](trans.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |translation of the word surface text according to the Berean Interlinear Bible|`not` `you` `is` `Him` [`translit`](translit.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |transliteration of the word surface text|`me` `estin` `auton` `auto` -[`typ`](typ.md#readme)|[`String`](featuresbydatatype.md#string)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |this is XML attribute typ|`conjuncted` `apposition` -[`type`](type.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` `apposition-group` +[`typ`](typ.md#readme)|[`String`](featuresbydatatype.md#string)|[`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) |syntactical type (on sentence, group, clause or phrase)|`conjuncted` `apposition` +[`typems`](typems.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) 
[`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)|`wrapper-clause-scope` `group` [`unaccent`](unaccent.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |word in unicode characters without accents and diacritical markers|`εστιν` `αυτον` `μη` `αυτω` [`unicode`](unicode.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |word in unicode characters plus material after it|`μὴ` `οὐκ` `αὐτῷ` `εἶπεν` [`variant`](variant.md#readme)|[`String`](featuresbydatatype.md#string)|[`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute variant|`2` `1` @@ -66,8 +67,7 @@ Feature|Datatype|Available on nodes|Description|Examples [`frame`](frame.md#readme)|[`String`](featuresbydatatype.md#string)|[`word`](featuresbynodetype.md#word) |frame|`A0` `A1` `A2` `AA2` [`oslots`](oslots.md#readme)|[`String`](featuresbydatatype.md#string)||No feature description|No values [`parent`](parent.md#readme)|[`String`](featuresbydatatype.md#string)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |parent relationship between words|`Link` -[`sibling`](sibling.md#readme)|[`Integer`](featuresbydatatype.md#integer)|[`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) 
[`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) |this is XML attribute sibling|`1` `2` `3` `4` [`subjref`](subjref.md#readme)|[`String`](featuresbydatatype.md#string)|[`word`](featuresbynodetype.md#word) |number of subject referent|`Link` -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/frame.md b/results/frame.md index 1a94791..a9c528b 100644 --- a/results/frame.md +++ b/results/frame.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: frame Data type|Feature type|Available for nodes ---|---|--- @@ -13,6 +13,8 @@ A0|25654 A1|15570 A2|2577 AA2|92 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 43893. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/framespec.md b/results/framespec.md index 422abae..623ec76 100644 --- a/results/framespec.md +++ b/results/framespec.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: framespec Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ A0:n40005001015|30 A0:n45001001001|28 A0:n50001001001|25 A0:n42020034005|24 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 24783. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- A0:n00000000000|896 @@ -32,7 +34,9 @@ A0:n40005001015|31 A0:n45001001001|29 A0:n50001001001|27 A0:n42020034005|25 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 25493. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- A0:n00000000000|896 @@ -45,6 +49,8 @@ A0:n40005001015|31 A0:n45001001001|29 A0:n50001001001|27 A0:n42020034005|25 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 25493. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/function.md b/results/function.md index a41ca9b..b324813 100644 --- a/results/function.md +++ b/results/function.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: function Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Subj-Cmpl|23 Pred-Obj-Cmpl|22 Subj-Pred-Obj|20 Pred-Obj-Subj|19 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 778. Note: table truncated. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- Pred-Obj|2675 @@ -32,7 +34,9 @@ Pred-Subj|603 Pred-Obj-Cmpl|596 Subj-PreC-PreC|595 PreC-PreC|554 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 21568. Note: table truncated. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- Cmpl|11056 @@ -45,7 +49,9 @@ Cmpl-Pred|1185 Obj-Pred|1077 Cmpl-Pred-Obj|684 Subj-Pred|639 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 45276. Note: table truncated. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- Pred|24767 @@ -54,7 +60,9 @@ Subj|10198 Objc|9337 PreC|6097 Adv|5596 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 69007. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- Pred|24767 @@ -63,7 +71,9 @@ Subj|10198 Objc|9337 PreC|6097 Adv|5596 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 69007. 
+ ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- Pred|24767 @@ -72,6 +82,8 @@ Objc|4813 PreC|4487 Subj|4458 Cmpl|1956 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 46077. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/gender.md b/results/gender.md index c2adf36..05d0ba9 100644 --- a/results/gender.md +++ b/results/gender.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: gender Data type|Feature type|Available for nodes ---|---|--- @@ -12,18 +12,24 @@ Value|Occurences masculine|12430 neuter|3066 feminine|2162 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 17658. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- masculine|41486 feminine|18736 neuter|13753 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 73975. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- masculine|41486 feminine|18736 neuter|13753 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 73975. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/gloss.md b/results/gloss.md index 1dfe227..d0cb90f 100644 --- a/results/gloss.md +++ b/results/gloss.md @@ -1,50 +1,26 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: gloss Data type|Feature type|Available for nodes ---|---|--- -[`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) +[`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`word`](featuresbynodetype.md#word) ## Description -short translation +English gloss (BGVB) ## Feature Values -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) -Value|Occurences ----|--- -not|1619 -you|667 -is|578 -Him|535 -to you|453 -him|406 -them|394 -saying|391 -to them|373 -said|312 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) -Value|Occurences ----|--- -the|9857 -and|6212 --|5496 -in|2320 -And|2218 -not|2042 -of the|1551 -for|1501 -that|1498 -you|1226 ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- -the|9857 -and|6212 --|5496 -in|2320 -And|2218 -not|2042 -of the|1551 -for|1501 -that|1498 -you|1226 - +the|19783 +and, also, likewise|8978 +he, she, it, himself, herself, itself; even, very; same|5550 +you|2892 +but, and|2787 +(with dat.) in|2743 +I|2567 +am, exist|2457 +say, tell|2255 +no, not|1622 + +Total frequency of feature: 137779. Note: table truncated. + -Created on Jun. 
16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/id.md b/results/id.md index 67023fd..66062f0 100644 --- a/results/id.md +++ b/results/id.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: id Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ n40001003001|1 n40001003003|1 n40001003012|1 n40001003014|1 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- n40001001001|1 @@ -32,7 +34,9 @@ n40001001007|1 n40001001008|1 n40001002001|1 n40001002002|1 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- n40001001001|1 @@ -45,6 +49,8 @@ n40001001007|1 n40001001008|1 n40001002001|1 n40001002002|1 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/junction.md b/results/junction.md index 7386226..c2c6a96 100644 --- a/results/junction.md +++ b/results/junction.md @@ -1,35 +1,38 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: junction Data type|Feature type|Available for nodes ---|---|--- -[`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) +[`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) ## Description type of junction ## Feature Values -### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) -Value|Occurences ----|--- -coordinate|1117 -subordinate|989 ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -coordinate|8186 -subordinate|7449 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) +coordinate|9303 +subordinate|8438 + +Total frequency of feature: 17741. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- coordinate|9367 subordinate|8554 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 17921. 
+ ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- subordinate|57 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 57. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- subordinate|116 coordinate|64 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 180. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/lang.md b/results/lang.md index 452c565..a8f0822 100644 --- a/results/lang.md +++ b/results/lang.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: lang Data type|Feature type|Available for nodes ---|---|--- @@ -10,6 +10,8 @@ language the text is in Value|Occurences ---|--- el|27 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 27. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/lemma.md b/results/lemma.md index b6556f5..36ed9c5 100644 --- a/results/lemma.md +++ b/results/lemma.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: lemma Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences μή|779 ἔχω|707 γίνομαι|663 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- ὁ|19783 @@ -32,7 +34,9 @@ Value|Occurences εἰμί|2457 λέγω|2255 εἰς|1766 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- ὁ|19783 @@ -45,6 +49,8 @@ Value|Occurences εἰμί|2457 λέγω|2255 εἰς|1766 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/lemmatranslit.md b/results/lemmatranslit.md index 48d53ce..b6a212d 100644 --- a/results/lemmatranslit.md +++ b/results/lemmatranslit.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: lemmatranslit Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ os|1115 me|779 tis|722 ekho|707 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- o|19800 @@ -32,7 +34,9 @@ ego|2567 eimi|2457 lego|2255 eis|2102 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- o|19800 @@ -45,6 +49,8 @@ ego|2567 eimi|2457 lego|2255 eis|2102 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/ln.md b/results/ln.md index 31e3cb0..cb0e63a 100644 --- a/results/ln.md +++ b/results/ln.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: ln Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences 13.4|535 92.29|522 15.81|471 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 43153. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 92.24|19738 @@ -32,7 +34,9 @@ Value|Occurences 92.7|1494 12.1|1247 92.29|1090 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 126879. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 92.24|19738 @@ -45,6 +49,8 @@ Value|Occurences 92.7|1494 12.1|1247 92.29|1090 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 126879. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/mood.md b/results/mood.md index e48c85a..565e007 100644 --- a/results/mood.md +++ b/results/mood.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: mood Data type|Feature type|Available for nodes ---|---|--- @@ -15,7 +15,9 @@ infinitive|2228 subjunctive|1832 imperative|1663 optative|67 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 27355. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- indicative|15617 @@ -24,7 +26,9 @@ infinitive|2285 imperative|1877 subjunctive|1856 optative|69 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 28357. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- indicative|15617 @@ -33,6 +37,8 @@ infinitive|2285 imperative|1877 subjunctive|1856 optative|69 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 28357. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/morph.md b/results/morph.md index ebf9ef9..b4a5a3a 100644 --- a/results/morph.md +++ b/results/morph.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: morph Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ V-PAI-1S|765 P-ASM|746 V-PAN|730 P-DSM|700 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- CONJ|16316 @@ -32,7 +34,9 @@ N-ASF|2870 PRT-N|2701 N-ASM|2456 V-PAI-3S|2271 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- CONJ|16316 @@ -45,6 +49,8 @@ N-ASF|2870 PRT-N|2701 N-ASM|2456 V-PAI-3S|2271 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/nodeId.md b/results/nodeId.md index 28e34a7..665fec2 100644 --- a/results/nodeId.md +++ b/results/nodeId.md @@ -1,10 +1,10 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: nodeid Data type|Feature type|Available for nodes ---|---|--- -[`Integer`](featuresbydatatype.md#integer)|[`Node`](featuresbytype.md#node)| [`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) +[`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`sentence`](featuresbynodetype.md#sentence) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) ## Description -node id (as in the XML source data +node id (as in the XML source data) ## Feature Values ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences @@ -19,7 +19,9 @@ Value|Occurences 400050080010100|1 400050100010120|1 400050120010110|1 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 838. Note: table truncated. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- 400010200010490|1 @@ -32,7 +34,9 @@ Value|Occurences 400020020010200|1 400020050010370|1 400020050090290|1 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 4720. Note: table truncated. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- 400010200010490|1 @@ -45,6 +49,8 @@ Value|Occurences 400020020010200|1 400020050010370|1 400020050090290|1 - -Created on Jun. 
16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 5558. Note: table truncated. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/normalized.md b/results/normalized.md index 6c23a5b..d1e2565 100644 --- a/results/normalized.md +++ b/results/normalized.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: normalized Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences ὑμῖν|475 οὐ|378 λέγει|331 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- καί|8576 @@ -32,7 +34,9 @@ Value|Occurences τόν|1562 τήν|1523 αὐτοῦ|1411 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- καί|8576 @@ -45,6 +49,8 @@ Value|Occurences τόν|1562 τήν|1523 αὐτοῦ|1411 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/note.md b/results/note.md index 03cc38d..23d5a79 100644 --- a/results/note.md +++ b/results/note.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: note Data type|Feature type|Available for nodes ---|---|--- @@ -10,14 +10,20 @@ annotation of linguistic nature Value|Occurences ---|--- discontinuous discourse|1 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 1. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- discontinuous discourse|1 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 1. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- discontinuous discourse|1 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 1. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/num.md b/results/num.md index 43a4c21..52e2952 100644 --- a/results/num.md +++ b/results/num.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: num Data type|Feature type|Available for nodes ---|---|--- @@ -19,20 +19,9 @@ Value|Occurences 8|1 9|1 10|1 -### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) -Value|Occurences ----|--- -1|52 -3|38 -2|34 -4|31 -6|31 -15|31 -18|30 -5|29 -9|29 -11|29 -### Frequency for nodetype [group](featuresbynodetype.md#group) + +Total frequency of feature: 27. Note: table truncated. + ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences ---|--- 1|27 @@ -45,33 +34,54 @@ Value|Occurences 8|27 9|27 10|27 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 8011. Note: table truncated. + ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- -36|29 -13|28 -16|28 -37|28 -40|28 -42|28 +1|27 +2|27 +3|27 +4|27 5|27 +6|27 7|27 8|27 +9|27 10|27 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 8945. Note: table truncated. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -1|116 -4|99 -17|97 -7|96 -13|96 -15|96 -30|96 -8|94 -5|93 -20|93 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) +24|27 +33|27 +19|26 +27|26 +41|26 +68|26 +73|26 +7|25 +10|25 +11|25 + +Total frequency of feature: 42506. Note: table truncated. 
+ ### Frequency for nodetype [wg](featuresbynodetype.md#wg) +Value|Occurences +---|--- +1|88 +4|72 +30|71 +17|70 +15|69 +7|68 +13|68 +8|67 +27|67 +50|67 + +Total frequency of feature: 106868. Note: table truncated. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- 1|23 @@ -84,7 +94,9 @@ Value|Occurences 235|20 77|19 89|19 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 69007. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 159|41 @@ -97,7 +109,9 @@ Value|Occurences 79|38 129|38 155|38 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 185185. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 1|7943 @@ -110,6 +124,8 @@ Value|Occurences 8|7643 9|7441 10|7166 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/number.md b/results/number.md index 56bbf72..b166d41 100644 --- a/results/number.md +++ b/results/number.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: number Data type|Feature type|Available for nodes ---|---|--- @@ -11,16 +11,22 @@ Value|Occurences ---|--- singular|26293 plural|12967 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 39260. 
+ ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- singular|69846 plural|29091 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 98937. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- singular|69846 plural|29091 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 98937. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/oslots.md b/results/oslots.md index 97952a4..8bffc42 100644 --- a/results/oslots.md +++ b/results/oslots.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: oslots Data type|Feature type|Available for nodes ---|---|--- @@ -8,4 +8,4 @@ No feature description ## Feature Values -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/otype.md b/results/otype.md index 9162aaa..9f22233 100644 --- a/results/otype.md +++ b/results/otype.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: otype Data type|Feature type|Available for nodes ---|---|--- @@ -8,4 +8,4 @@ No feature description ## Feature Values -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/parent.md b/results/parent.md index 6107517..1d99e59 100644 --- a/results/parent.md +++ b/results/parent.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: parent Data type|Feature type|Available for nodes ---|---|--- @@ -9,31 +9,45 @@ parent relationship between words ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences ---|--- -Link|19703 -### Frequency for nodetype [group](featuresbynodetype.md#group) +Link|8011 + +Total frequency of feature: 8011. + ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- Link|8945 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 8945. 
+ ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -Link|30814 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) +Link|42506 + +Total frequency of feature: 42506. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- Link|106867 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 106867. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- Link|69007 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 69007. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- Link|69007 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 69007. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- Link|551116 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 551116. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/person.md b/results/person.md index a773195..d4a8072 100644 --- a/results/person.md +++ b/results/person.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: person Data type|Feature type|Available for nodes ---|---|--- @@ -9,21 +9,27 @@ grammatical person ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- -third|12474 -second|3447 -first|2886 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) +p3|12474 +p2|3447 +p1|2886 + +Total frequency of feature: 18807. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- -third|12747 -second|3729 -first|2943 -### Frequency for nodetype [word](featuresbynodetype.md#word) +p3|12747 +p2|3729 +p1|2943 + +Total frequency of feature: 19419. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- -third|12747 -second|3729 -first|2943 - +p3|12747 +p2|3729 +p1|2943 + +Total frequency of feature: 19419. + -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/punctuation.md b/results/punctuation.md index 312eacc..85d56e8 100644 --- a/results/punctuation.md +++ b/results/punctuation.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: punctuation Data type|Feature type|Available for nodes ---|---|--- @@ -14,7 +14,9 @@ space|37660 .|2731 ·|1189 ;|589 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46072. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- space|119264 @@ -22,7 +24,9 @@ space|119264 .|5717 ·|2359 ;|971 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137773. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- space|119264 @@ -30,6 +34,8 @@ space|119264 .|5717 ·|2359 ;|971 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137773. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/ref.md b/results/ref.md index d1c4a51..1dfbe84 100644 --- a/results/ref.md +++ b/results/ref.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: ref Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences 1CO 10:10!2|1 1CO 10:10!6|1 1CO 10:10!8|1 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 1CO 10:1!1|1 @@ -32,7 +34,9 @@ Value|Occurences 1CO 10:1!16|1 1CO 10:1!17|1 1CO 10:1!18|1 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 1CO 10:1!1|1 @@ -45,6 +49,8 @@ Value|Occurences 1CO 10:1!16|1 1CO 10:1!17|1 1CO 10:1!18|1 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/referent.md b/results/referent.md index e11f657..5e53179 100644 --- a/results/referent.md +++ b/results/referent.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: referent Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ n41006030007|29 n47008001004|29 n44021040005|27 n42020034005|26 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 7827. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- n40005001015|112 @@ -32,7 +34,9 @@ n51001002007|57 n43013023006 n43013037003 n43014005003 n43014008003 n43014022003|54 n41003007003|48 n42020034005|47 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 14471. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- n40005001015|112 @@ -45,6 +49,8 @@ n51001002007|57 n43013023006 n43013037003 n43014005003 n43014008003 n43014022003|54 n41003007003|48 n42020034005|47 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 14471. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/rela.md b/results/rela.md index 4042a22..a193c1c 100644 --- a/results/rela.md +++ b/results/rela.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: rela Data type|Feature type|Available for nodes ---|---|--- @@ -10,14 +10,20 @@ this is XML attribute rela Value|Occurences ---|--- Appo|969 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 969. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- Appo|979 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 979. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- Appo|10 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 10. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/role.md b/results/role.md index 6adda54..49f1ea1 100644 --- a/results/role.md +++ b/results/role.md @@ -1,22 +1,11 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: role Data type|Feature type|Available for nodes ---|---|--- -[`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) +[`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) ## Description role ## Feature Values -### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) -Value|Occurences ----|--- -adv|2069 -o|1691 -s|496 -apposition|478 -o2|104 -p|74 -io|62 -v|9 ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- @@ -27,20 +16,24 @@ adv|34 io|16 apposition|10 o2|2 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 335. 
+ ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -adv|3442 -o|2573 -apposition|972 -s|359 +adv|5511 +o|4264 +apposition|1450 +s|855 aux|184 -v|167 -p|60 -o2|24 +v|176 +p|134 +o2|128 +io|66 topic|23 -io|4 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 12795. Note: table truncated. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- adv|15981 @@ -53,7 +46,9 @@ v|405 aux|351 o2|218 topic|23 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 37426. Note: table truncated. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- v|24767 @@ -64,7 +59,9 @@ p|3504 vc|2593 io|2576 o2|229 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 69007. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- v|24996 @@ -77,7 +74,9 @@ io|2576 apposition|979 aux|872 o2|229 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 71088. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- v|24767 @@ -90,6 +89,8 @@ p|1904 aux|705 o2|141 apposition|10 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 46792. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/rule.md b/results/rule.md index 989122c..8a037db 100644 --- a/results/rule.md +++ b/results/rule.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: rule Data type|Feature type|Available for nodes ---|---|--- @@ -9,35 +9,41 @@ syntactical rule ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences ---|--- -Conj-CL|5574 -CLaCL|3505 -sub-CL|3015 -DetCL|1950 -ClCl|1552 -that-VP|886 -ClCl2|882 -PtclCL|468 -AdvpCL|56 +Conj-CL|5424 +CLaCL|395 +ClCl|223 +ClCl2|102 +PtclCL|84 V-O|51 -### Frequency for nodetype [group](featuresbynodetype.md#group) +sub-CL|47 +ADV-V|37 +ADV-V-O|33 +S-P|29 + +Total frequency of feature: 7173. Note: table truncated. + ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- NP-CL|856 CL-NP|14 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 870. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- +CLaCL|3434 +sub-CL|2982 V2CL|2842 V-O|2674 +DetCL|2011 V-ADV|1675 +ClCl|1356 ADV-V|1100 O-V|1064 -Np2CL|780 -ADV-V-O|628 -S-V|626 -V-S|603 -V-O-ADV|531 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) +that-VP|888 + +Total frequency of feature: 37786. Note: table truncated. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- DetNP|15696 @@ -50,7 +56,9 @@ V2CL|2843 V-O|2725 DetCL|2011 Np-Appos|1908 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 93234. Note: table truncated. 
+ ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- PrepNp|9512 @@ -63,7 +71,9 @@ AdvpNp|520 DetAdj|470 AdjpNp|455 All-NP|412 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 22930. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- DetNP|15696 @@ -76,6 +86,8 @@ NpaNp|1351 DetAdj|1282 All-NP|846 NpPp|676 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 47405. Note: table truncated. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/sibling.md b/results/sibling.md deleted file mode 100644 index 41431f7..0000000 --- a/results/sibling.md +++ /dev/null @@ -1,96 +0,0 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) -# Feature: sibling -Data type|Feature type|Available for nodes ----|---|--- -[`Integer`](featuresbydatatype.md#integer)|[`Edge`](featuresbytype.md#edge)| [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) -## Description -this is XML attribute sibling -## Feature Values -### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) -Value|Occurences ----|--- -1|10681 -2|8806 -3|8298 -4|8010 -5|7901 -6|7857 -7|7823 -8|7795 -9|7768 -10|7741 -### Frequency for nodetype [group](featuresbynodetype.md#group) -Value|Occurences ----|--- -1|1420 -2|401 -3|187 -4|102 -5|60 -6|36 -7|25 -8|18 -9|13 -10|8 
-### Frequency for nodetype [clause](featuresbynodetype.md#clause) -Value|Occurences ----|--- -1|9572 -2|3400 -3|1457 -4|556 -5|160 -6|59 -7|27 -8|18 -9|10 -10|7 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) -Value|Occurences ----|--- -1|38317 -2|18925 -3|12374 -4|9361 -5|8297 -6|8010 -7|7902 -8|7848 -9|7806 -10|7768 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) -Value|Occurences ----|--- -1|12438 -2|5882 -3|2294 -4|630 -5|138 -6|28 -7|5 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) -Value|Occurences ----|--- -1|12438 -2|5882 -3|2294 -4|630 -5|138 -6|28 -7|5 -### Frequency for nodetype [word](featuresbynodetype.md#word) -Value|Occurences ----|--- -1|139060 -2|27543 -3|9270 -4|2117 -5|476 -6|142 -7|56 -8|27 -9|17 -10|13 - - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/sp.md b/results/sp.md index 53313cf..71d5424 100644 --- a/results/sp.md +++ b/results/sp.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: sp Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ intj|90 conj|85 num|25 prep|4 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- subs|28455 @@ -32,7 +34,9 @@ adjv|8452 advb|6147 intj|788 num|476 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. 
+ ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- subs|28455 @@ -45,6 +49,8 @@ adjv|8452 advb|6147 intj|788 num|476 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/strong.md b/results/strong.md index a40044c..0b9a766 100644 --- a/results/strong.md +++ b/results/strong.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: strong Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences 3361|779 2192|707 1096|663 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 3588|19783 @@ -32,7 +34,9 @@ Value|Occurences 1510|2457 3004|2255 1519|1766 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 3588|19783 @@ -45,6 +49,8 @@ Value|Occurences 1510|2457 3004|2255 1519|1766 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/subjref.md b/results/subjref.md index 38a4079..8ce396a 100644 --- a/results/subjref.md +++ b/results/subjref.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: subjref Data type|Feature type|Available for nodes ---|---|--- @@ -10,6 +10,8 @@ number of subject referent Value|Occurences ---|--- Link|37748 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 37748. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/subjrefspec.md b/results/subjrefspec.md index 0d9ce4f..92ab106 100644 --- a/results/subjrefspec.md +++ b/results/subjrefspec.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: subjrefspec Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ n40005001015|76 n49003001013|69 n51001002007|64 n48001001001|62 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 16008. Note: table truncated. 
+ ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- n46003022002|172 @@ -32,7 +34,9 @@ n40005001015|78 n49003001013|73 n51001002007|71 n48001001001|66 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 16575. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- n46003022002|172 @@ -45,6 +49,8 @@ n40005001015|78 n49003001013|73 n51001002007|71 n48001001001|66 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 16575. Note: table truncated. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/tense.md b/results/tense.md index ef39f74..1d7c67c 100644 --- a/results/tense.md +++ b/results/tense.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: tense Data type|Feature type|Available for nodes ---|---|--- @@ -15,7 +15,9 @@ future|1592 imperfect|1547 perfect|1450 pluperfect|88 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 27355. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- aorist|11803 @@ -24,7 +26,9 @@ imperfect|1689 future|1626 perfect|1572 pluperfect|88 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 28357. 
+ ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- aorist|11803 @@ -33,6 +37,8 @@ imperfect|1689 future|1626 perfect|1572 pluperfect|88 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 28357. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/text.md b/results/text.md index 76b171c..c4e146d 100644 --- a/results/text.md +++ b/results/text.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: text Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences ὑμῖν|475 οὐ|378 λέγει|331 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- καὶ|8545 @@ -32,7 +34,9 @@ Value|Occurences τὸν|1556 τὴν|1518 αὐτοῦ|1411 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- καὶ|8545 @@ -45,6 +49,8 @@ Value|Occurences τὸν|1556 τὴν|1518 αὐτοῦ|1411 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/trans.md b/results/trans.md index 50a4d53..1475895 100644 --- a/results/trans.md +++ b/results/trans.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: trans Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ them|394 saying|391 to them|373 said|312 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- the|9857 @@ -32,7 +34,9 @@ of the|1551 for|1501 that|1498 you|1226 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- the|9857 @@ -45,6 +49,8 @@ of the|1551 for|1501 that|1498 you|1226 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/translit.md b/results/translit.md index 3960c6b..0745534 100644 --- a/results/translit.md +++ b/results/translit.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: translit Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ autois|491 umin|475 ou|467 o|446 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- kai|8576 @@ -32,7 +34,9 @@ tou|2497 eis|1851 ten|1523 auton|1514 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- kai|8576 @@ -45,6 +49,8 @@ tou|2497 eis|1851 ten|1523 auton|1514 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/typ.md b/results/typ.md index a967247..e045e5e 100644 --- a/results/typ.md +++ b/results/typ.md @@ -1,21 +1,25 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: typ Data type|Feature type|Available for nodes ---|---|--- [`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) ## Description -this is XML attribute typ +syntactical type (on sentence, group, clause or phrase) ## Feature Values ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- conjuncted|8075 apposition|870 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 8945. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- Voct|167 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) + +Total frequency of feature: 167. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- NP|30911 @@ -26,7 +30,9 @@ VP|207 AdjP|168 Voct|167 AdvP|166 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 51733. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- NP|10935 @@ -34,7 +40,9 @@ PP|9609 AdvP|154 AdjP|60 VP|10 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 20768. 
+ ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- NP|30911 @@ -42,6 +50,8 @@ PP|11169 VP|207 AdjP|168 AdvP|166 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 42621. + + +Created on Jul. 10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/type.md b/results/typems.md similarity index 62% rename from results/type.md rename to results/typems.md index fc70956..a67c31a 100644 --- a/results/type.md +++ b/results/typems.md @@ -1,5 +1,5 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) -# Feature: type +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) +# Feature: typems Data type|Feature type|Available for nodes ---|---|--- [`String`](featuresbydatatype.md#string)|[`Node`](featuresbytype.md#node)| [`sentence`](featuresbynodetype.md#sentence) [`group`](featuresbynodetype.md#group) [`clause`](featuresbynodetype.md#clause) [`wg`](featuresbynodetype.md#wg) [`phrase`](featuresbynodetype.md#phrase) [`subphrase`](featuresbynodetype.md#subphrase) [`word`](featuresbynodetype.md#word) @@ -9,21 +9,26 @@ morphological type (on word), syntactical type (on sentence, group, clause, phra ### Frequency for nodetype [sentence](featuresbynodetype.md#sentence) Value|Occurences ---|--- -wrapper-clause-scope|11975 -group|2525 -apposition-group|1 -### Frequency for nodetype [group](featuresbynodetype.md#group) +wrapper-clause-scope|5571 +group|375 + +Total frequency of feature: 5946. 
+ ### Frequency for nodetype [group](featuresbynodetype.md#group) Value|Occurences ---|--- conjuncted-wg|8075 apposition-group|870 -### Frequency for nodetype [clause](featuresbynodetype.md#clause) + +Total frequency of feature: 8945. + ### Frequency for nodetype [clause](featuresbynodetype.md#clause) Value|Occurences ---|--- -wrapper-clause-scope|191 -group|107 -apposition-group|20 -### Frequency for nodetype [wg](featuresbynodetype.md#wg) +wrapper-clause-scope|6595 +group|2257 +apposition-group|21 + +Total frequency of feature: 8873. + ### Frequency for nodetype [wg](featuresbynodetype.md#wg) Value|Occurences ---|--- modifier-scope|29645 @@ -33,7 +38,9 @@ conjuncted-wg|8075 group|4957 modifier-clause-scope|1712 apposition-group|891 -### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) + +Total frequency of feature: 68710. + ### Frequency for nodetype [phrase](featuresbynodetype.md#phrase) Value|Occurences ---|--- modifier-scope|10484 @@ -46,7 +53,9 @@ modifier-clause-scope|755 demonstrative|744 proper|683 interrogative|480 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 33293. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- modifier-scope|29645 @@ -59,7 +68,9 @@ demonstrative|1722 modifier-clause-scope|1712 relative|1674 interrogative|633 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 89404. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- common|23644 @@ -71,6 +82,8 @@ interrogative|633 indefinite|552 possessive|70 adverbial|3 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 44458. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/unaccent.md b/results/unaccent.md index 062e7e7..a2bd0e3 100644 --- a/results/unaccent.md +++ b/results/unaccent.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: unaccent Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences υμιν|475 ου|467 ο|372 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- και|8576 @@ -32,7 +34,9 @@ Value|Occurences τον|1562 την|1523 αυτου|1411 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- και|8576 @@ -45,6 +49,8 @@ Value|Occurences τον|1562 την|1523 αυτου|1411 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/unicode.md b/results/unicode.md index 8b742b6..b0d47fb 100644 --- a/results/unicode.md +++ b/results/unicode.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: unicode Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences οὐ|378 λέγει|318 ὑμῖν|283 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 46077. Note: table truncated. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- καὶ|8541 @@ -32,7 +34,9 @@ Value|Occurences τὸν|1556 τὴν|1518 τῆς|1300 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 137779. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- καὶ|8541 @@ -45,6 +49,8 @@ Value|Occurences τὸν|1556 τὴν|1518 τῆς|1300 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/variant.md b/results/variant.md index 72a4632..7f4e40d 100644 --- a/results/variant.md +++ b/results/variant.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: variant Data type|Feature type|Available for nodes ---|---|--- @@ -11,16 +11,22 @@ Value|Occurences ---|--- 2|17 1|10 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 27. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- 2|151 1|18 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 169. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 2|151 1|18 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 169. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/verse.md b/results/verse.md index 15a5700..3b751fb 100644 --- a/results/verse.md +++ b/results/verse.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: verse Data type|Feature type|Available for nodes ---|---|--- @@ -19,7 +19,9 @@ Value|Occurences 7|259 9|259 10|259 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 7944. Note: table truncated. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- 10|4669 @@ -32,6 +34,8 @@ Value|Occurences 11|4478 8|4467 2|4463 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 137779. Note: table truncated. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/results/voice.md b/results/voice.md index 7ca7871..f013fb8 100644 --- a/results/voice.md +++ b/results/voice.md @@ -1,4 +1,4 @@ -Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.7) +Doc4TF pages for [Nestle 1904 Greek New Testament](https://github.com/saulocantanhede/tfgreek2/tree/main/tf) (version 0.5.9) # Feature: voice Data type|Feature type|Available for nodes ---|---|--- @@ -13,20 +13,26 @@ active|20154 passive|3345 middle|2187 middlepassive|1669 -### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) + +Total frequency of feature: 27355. + ### Frequency for nodetype [subphrase](featuresbynodetype.md#subphrase) Value|Occurences ---|--- active|20742 passive|3493 middle|2408 middlepassive|1714 -### Frequency for nodetype [word](featuresbynodetype.md#word) + +Total frequency of feature: 28357. + ### Frequency for nodetype [word](featuresbynodetype.md#word) Value|Occurences ---|--- active|20742 passive|3493 middle|2408 middlepassive|1714 - -Created on Jun. 16, 2024 using [Doc4TF version 0.5.1 (June 16, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file +Total frequency of feature: 28357. + + +Created on Jul. 
10, 2024 using [Doc4TF version 0.5.2 (July 10, 2024)](https://github.com/tonyjurg/Doc4TF/blob/main/CreateFeatureDoc.ipynb) \ No newline at end of file diff --git a/tools/determineDeltaBetweenVersions.ipynb b/tools/determineDeltaBetweenVersions.ipynb new file mode 100644 index 0000000..9b2e82d --- /dev/null +++ b/tools/determineDeltaBetweenVersions.ipynb @@ -0,0 +1,2286 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "c1556425-a96e-41c8-9ee1-6ef9e296474f", + "metadata": {}, + "source": [ + "# [Doc4TF/tools/determineDeltaBetweenVersions](https://github.com/tonyjurg/Doc4TF/blob/main/tools/determineDeltaBetweenVersions.ipynb)\n", + "#### *Tool to determine which features and feature values were changed between two Text-Fabric datasets*\n", + "\n", + "Version: 0.1 (May. 12, 2024); implementation of feature [17](https://github.com/tonyjurg/Doc4TF/issues/17)." + ] + }, + { + "cell_type": "markdown", + "id": "73d4bb00-9972-42fb-b699-f48285c0ad9d", + "metadata": {}, + "source": [ + "## Table of contents \n", + "* 1 - Introduction\n", + "* 2 - Setting up the environment\n", + "* 3 - Load Text-Fabric data\n", + "* 4 - Creation of the dataset\n", + " * 4.1 - Setting up some global variables\n", + " * 4.2 - Store all relevant data into a dictionary\n", + "* 5 - Create the documentation pages\n", + " * 5.1 - Create the set of feature pages\n", + " * 5.2 - Create the index pages\n", + "* 6 - Licence" + ] + }, + { + "cell_type": "markdown", + "id": "fd0740e7-b222-4a88-92e9-199dd8c7ae69", + "metadata": {}, + "source": [ + "# 1 - Introduction \n", + "##### [Back to TOC](#TOC)\n", + "\n", + "The main steps in producing the comparison are:\n", + "* Load the two Text-Fabric datasets.\n", + "* Construct two Python dictionaries storing all the relevant data from both versions.\n", + "* Compare the two dictionaries.\n", + "* Print results. " + ] + }, + { + "cell_type": "markdown", + "id": "46c7ab99-57e7-460c-b0ab-4513c6d90c78", + "metadata": {}, + "source": [ + "# 2. 
Setting up the environment\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "2e28d9a6-ad38-475f-87ac-285b8326f837", + "metadata": {}, + "source": [ + "Your environment should (for obvious reasons) include the Python package `Text-Fabric`. If not installed yet, it can be installed using `pip`. Furthermore, you need to be able to load the Text-Fabric dataset (either from an online resource, or from a locally stored copy). There are no further requirements as the scripts basically operate 'stand-alone'. " + ] + }, + { + "cell_type": "markdown", + "id": "6dccab04-1f63-4021-9609-749cfac0ec47", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# 3 - Load Text-Fabric data \n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "216097a9-5328-4f3b-9e50-4c06faa90455", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "At this step, the Text-Fabric dataset is loaded, whose embedded data will be used to create a documentation set. \n", + "\n", + "Which dataset will be loaded is specified in the parameters as detailed below:\n", + "```\n", + "Ax = use (\"{GitHub user name}/{repository name}\", version=\"{version}\")\n", + "```\n", + "In this notebook, we will load two different versions of the same dataset. Each will be loaded into a different object, respectively A1 and A2. One of the consequences of working with two Text-Fabric datasets in one Python environment is that we need to address them individually when using advanced API functions. That also means the invocation needs to exclude the hoist=globals() option.\n", + "\n", + "For various options regarding other possible storage locations, and other load options, see the documentation for function [`use`](https://annotation.github.io/text-fabric/tf/app.html#tf.app.use)." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 1, + "id": "f1de2b3a-3d2e-457a-a710-423bdb0efe8c", + "metadata": { + "slideshow": { + "slide_type": "slide" + }, + "tags": [] + }, + "outputs": [], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "1a33b29e-d68f-4fae-9f2a-974bdb43e384", + "metadata": { + "slideshow": { + "slide_type": "slide" + }, + "tags": [] + }, + "outputs": [], + "source": [ + "# Loading the Text-Fabric code\n", + "# Note: it is assumed Text-Fabric is installed in your environment\n", + "from tf.fabric import Fabric\n", + "from tf.app import use" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "id": "210cab72-9658-4fdd-ac5d-9acbd8a8ca9c", + "metadata": { + "scrolled": true, + "slideshow": { + "slide_type": "slide" + }, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/markdown": [ + "**Locating corpus resources ...**" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The requested app is not available offline\n", + "\t~/text-fabric-data/github/saulocantanhede/tfgreek2/app not found\n" + ] + }, + { + "data": { + "text/html": [ + "Status: latest release online 0.5.7 versus None locally" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "downloading app, main data and requested additions ..." 
+ ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "app: ~/text-fabric-data/github/saulocantanhede/tfgreek2/app" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " | 0.56s T otype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 6.64s T oslots from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T before from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.16s T lemma from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.00s T punctuation from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.46s T verse from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.11s T lemmatranslit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.03s T after from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.15s T translit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.22s T text from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.47s T chapter from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.21s T unaccent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.99s T book from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | | 0.16s C __levels__ from otype, oslots, otext\n", + " | | 3.69s C __order__ from otype, oslots, __levels__\n", + " | | 0.15s C __rank__ from otype, __order__\n", + " | | 12s C __levUp__ from otype, oslots, __rank__\n", + " | | 6.63s C __levDown__ from otype, __levUp__, 
__rank__\n", + " | | 0.34s C __characters__ from otext\n", + " | | 2.24s C __boundary__ from otype, oslots, __rank__\n", + " | | 0.04s C __sections__ from otype, oslots, otext, __levUp__, __levels__, book, chapter, verse\n", + " | 0.02s T appositioncontainer from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.21s T articular from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.96s T bookshort from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.66s T case from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T clausetype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.59s T cls from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.03s T cltype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T criticalsign from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T crule from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.01s T degree from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T discontinuous from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.99s T domain from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.37s T frame from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.27s T framespec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.72s T function from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.61s T gender from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.19s T gloss from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.36s T id from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.17s T junction from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T lang from 
~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.13s T ln from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.27s T mood from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.14s T morph from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T nodeid from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.26s T normalized from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T note from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.70s T num from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.05s T number from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 2.91s T parent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.21s T person from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.40s T ref from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.15s T referent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.01s T rela from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.66s T role from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.78s T rule from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 29s T sibling from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.06s T sp from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.97s T strong from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.11s T subjref from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.18s T subjrefspec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n" + ] + }, + { + "ename": "KeyboardInterrupt", + "evalue": "", + "output_type": "error", + "traceback": [ + 
"\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "Cell \u001b[1;32mIn[68], line 2\u001b[0m\n\u001b[0;32m 1\u001b[0m \u001b[38;5;66;03m# Load the app and data from the first version in the set for comparison\u001b[39;00m\n\u001b[1;32m----> 2\u001b[0m A1 \u001b[38;5;241m=\u001b[39m use (\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124msaulocantanhede/tfgreek2\u001b[39m\u001b[38;5;124m\"\u001b[39m, version\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m0.5.7\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\app.py:56\u001b[0m, in \u001b[0;36muse\u001b[1;34m(appName, backend, *args, **kwargs)\u001b[0m\n\u001b[0;32m 23\u001b[0m \u001b[38;5;250m\u001b[39m\u001b[38;5;124;03m\"\"\"Make use of a corpus.\u001b[39;00m\n\u001b[0;32m 24\u001b[0m \n\u001b[0;32m 25\u001b[0m \u001b[38;5;124;03mFor a detailed description, see `tf.about.usefunc`.\u001b[39;00m\n\u001b[1;32m (...)\u001b[0m\n\u001b[0;32m 51\u001b[0m \u001b[38;5;124;03mtf.advanced.app.App\u001b[39;00m\n\u001b[0;32m 52\u001b[0m \u001b[38;5;124;03m\"\"\"\u001b[39;00m\n\u001b[0;32m 54\u001b[0m (appName, checkoutApp, dataLoc, backend) \u001b[38;5;241m=\u001b[39m useApp(appName, backend)\n\u001b[1;32m---> 56\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m findApp(appName, checkoutApp, dataLoc, backend, \u001b[38;5;28;01mFalse\u001b[39;00m, \u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\advanced\\app.py:630\u001b[0m, in \u001b[0;36mfindApp\u001b[1;34m(appName, checkoutApp, dataLoc, backend, _browse, silent, version, legacy, *args, **kwargs)\u001b[0m\n\u001b[0;32m 628\u001b[0m kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mmod\u001b[39m\u001b[38;5;124m\"\u001b[39m] 
\u001b[38;5;241m=\u001b[39m mod\n\u001b[0;32m 629\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m--> 630\u001b[0m app \u001b[38;5;241m=\u001b[39m appClass(\n\u001b[0;32m 631\u001b[0m cfg,\n\u001b[0;32m 632\u001b[0m appName,\n\u001b[0;32m 633\u001b[0m appPath,\n\u001b[0;32m 634\u001b[0m commit,\n\u001b[0;32m 635\u001b[0m release,\n\u001b[0;32m 636\u001b[0m local,\n\u001b[0;32m 637\u001b[0m backend,\n\u001b[0;32m 638\u001b[0m _browse,\n\u001b[0;32m 639\u001b[0m \u001b[38;5;241m*\u001b[39margs,\n\u001b[0;32m 640\u001b[0m version\u001b[38;5;241m=\u001b[39mversion,\n\u001b[0;32m 641\u001b[0m versionOverride\u001b[38;5;241m=\u001b[39m\u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m versionGiven,\n\u001b[0;32m 642\u001b[0m silent\u001b[38;5;241m=\u001b[39msilent,\n\u001b[0;32m 643\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs,\n\u001b[0;32m 644\u001b[0m )\n\u001b[0;32m 645\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mException\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m e:\n\u001b[0;32m 646\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m appClass \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m App:\n", + "File \u001b[1;32mC:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/app/app.py:60\u001b[0m, in \u001b[0;36mTfApp.__init__\u001b[1;34m(app, *args, **kwargs)\u001b[0m\n\u001b[0;32m 59\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21m__init__\u001b[39m(app, \u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs):\n\u001b[1;32m---> 60\u001b[0m \u001b[38;5;28msuper\u001b[39m()\u001b[38;5;241m.\u001b[39m\u001b[38;5;21m__init__\u001b[39m(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[0;32m 61\u001b[0m app\u001b[38;5;241m.\u001b[39mviewtype(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124msyntax\u001b[39m\u001b[38;5;124m'\u001b[39m) \u001b[38;5;66;03m#default option as 
syntax view\u001b[39;00m\n\u001b[0;32m 62\u001b[0m app\u001b[38;5;241m.\u001b[39mdm(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mSee [here](https://github.com/saulocantanhede/tfgreek2/blob/main/docs/viewtypes.md#start) for more information on viewtypes\u001b[39m\u001b[38;5;124m'\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\advanced\\app.py:190\u001b[0m, in \u001b[0;36mApp.__init__\u001b[1;34m(self, cfg, appName, appPath, commit, release, local, backend, _browse, hoist, version, versionOverride, checkout, mod, locations, modules, volume, collection, api, setFile, silent, loadData, _withGc, **configOverrides)\u001b[0m\n\u001b[0;32m 184\u001b[0m loadableFeatures \u001b[38;5;241m=\u001b[39m allFeatures[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mnodes\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m+\u001b[39m allFeatures[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124medges\u001b[39m\u001b[38;5;124m\"\u001b[39m]\n\u001b[0;32m 185\u001b[0m useFeatures \u001b[38;5;241m=\u001b[39m [\n\u001b[0;32m 186\u001b[0m f\n\u001b[0;32m 187\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m f \u001b[38;5;129;01min\u001b[39;00m loadableFeatures\n\u001b[0;32m 188\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m f \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;129;01min\u001b[39;00m excludedFeatures \u001b[38;5;129;01mand\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m f\u001b[38;5;241m.\u001b[39mstartswith(OMAP)\n\u001b[0;32m 189\u001b[0m ]\n\u001b[1;32m--> 190\u001b[0m result \u001b[38;5;241m=\u001b[39m TF\u001b[38;5;241m.\u001b[39mload(useFeatures, add\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m, silent\u001b[38;5;241m=\u001b[39msilent)\n\u001b[0;32m 191\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m result \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mFalse\u001b[39;00m:\n\u001b[0;32m 192\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mapi \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n", + 
"File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\fabric.py:414\u001b[0m, in \u001b[0;36mFabricCore.load\u001b[1;34m(self, features, add, silent)\u001b[0m\n\u001b[0;32m 412\u001b[0m reset()\n\u001b[0;32m 413\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m fName \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mfeaturesRequested:\n\u001b[1;32m--> 414\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_loadFeature(fName)\n\u001b[0;32m 415\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgood:\n\u001b[0;32m 416\u001b[0m indent(level\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m0\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\fabric.py:801\u001b[0m, in \u001b[0;36mFabricCore._loadFeature\u001b[1;34m(self, fName, optional)\u001b[0m\n\u001b[0;32m 799\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgood \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n\u001b[0;32m 800\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m--> 801\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mfeatures[fName]\u001b[38;5;241m.\u001b[39mload(silent\u001b[38;5;241m=\u001b[39msilent, _withGc\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_withGc):\n\u001b[0;32m 802\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgood \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\data.py:145\u001b[0m, in \u001b[0;36mData.load\u001b[1;34m(self, metaOnly, silent, _withGc)\u001b[0m\n\u001b[0;32m 143\u001b[0m actionRep \u001b[38;5;241m=\u001b[39m 
\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mM\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m 144\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m--> 145\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_writeDataBin()\n\u001b[0;32m 146\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 147\u001b[0m actionRep \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mB\u001b[39m\u001b[38;5;124m\"\u001b[39m\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\data.py:690\u001b[0m, in \u001b[0;36mData._writeDataBin\u001b[1;34m(self)\u001b[0m\n\u001b[0;32m 687\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[0;32m 688\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m gzip\u001b[38;5;241m.\u001b[39mopen(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbinPath, mode\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mwb\u001b[39m\u001b[38;5;124m\"\u001b[39m, compresslevel\u001b[38;5;241m=\u001b[39mGZIP_LEVEL) \u001b[38;5;28;01mas\u001b[39;00m f:\n\u001b[0;32m 689\u001b[0m \u001b[38;5;66;03m# pickle.dump(self.data, f, protocol=PICKLE_PROTOCOL)\u001b[39;00m\n\u001b[1;32m--> 690\u001b[0m f\u001b[38;5;241m.\u001b[39mwrite(optimize(pickle\u001b[38;5;241m.\u001b[39mdumps(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdata, protocol\u001b[38;5;241m=\u001b[39mPICKLE_PROTOCOL)))\n\u001b[0;32m 691\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mException\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m e:\n\u001b[0;32m 692\u001b[0m error(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mCannot write to file \u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbinPath\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m because: 
\u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mstr\u001b[39m(e)\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m'\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\gzip.py:289\u001b[0m, in \u001b[0;36mGzipFile.write\u001b[1;34m(self, data)\u001b[0m\n\u001b[0;32m 286\u001b[0m length \u001b[38;5;241m=\u001b[39m data\u001b[38;5;241m.\u001b[39mnbytes\n\u001b[0;32m 288\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m length \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m0\u001b[39m:\n\u001b[1;32m--> 289\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mfileobj\u001b[38;5;241m.\u001b[39mwrite(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcompress\u001b[38;5;241m.\u001b[39mcompress(data))\n\u001b[0;32m 290\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39msize \u001b[38;5;241m+\u001b[39m\u001b[38;5;241m=\u001b[39m length\n\u001b[0;32m 291\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcrc \u001b[38;5;241m=\u001b[39m zlib\u001b[38;5;241m.\u001b[39mcrc32(data, \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcrc)\n", + "\u001b[1;31mKeyboardInterrupt\u001b[0m: " + ] + } + ], + "source": [ + "# Load the app and data from the first version in the set for comparison\n", + "A1 = use (\"saulocantanhede/tfgreek2\", version=\"0.5.7\")" + ] + }, + { + "cell_type": "code", + "execution_count": 70, + "id": "0fd30d97-cd49-48d7-9781-448a0f6cca40", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/markdown": [ + "**Locating corpus resources ...**" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The requested app is not available offline\n", + "\t~/text-fabric-data/github/saulocantanhede/tfgreek2/app not found\n" + ] + }, + { + "data": { + "text/html": [ + "Status: latest release online 0.5.7 versus None locally" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + 
"output_type": "display_data" + }, + { + "data": { + "text/html": [ + "downloading app, main data and requested additions ..." + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "app: ~/text-fabric-data/github/saulocantanhede/tfgreek2/app" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The requested data is not available offline\n", + "\t~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6 not found\n", + "rate limit is 5000 requests per hour, with 4999 left for this hour\n", + "\tconnecting to online GitHub repo saulocantanhede/tfgreek2 ... connected\n", + "\ttf/0.5.6/after.tf...downloaded\n", + "\ttf/0.5.6/appositioncontainer.tf...downloaded\n", + "\ttf/0.5.6/articular.tf...downloaded\n", + "\ttf/0.5.6/before.tf...downloaded\n", + "\ttf/0.5.6/book.tf...downloaded\n", + "\ttf/0.5.6/bookshort.tf...downloaded\n", + "\ttf/0.5.6/case.tf...downloaded\n", + "\ttf/0.5.6/chapter.tf...downloaded\n", + "\ttf/0.5.6/clausetype.tf...downloaded\n", + "\ttf/0.5.6/cls.tf...downloaded\n", + "\ttf/0.5.6/cltype.tf...downloaded\n", + "\ttf/0.5.6/criticalsign.tf...downloaded\n", + "\ttf/0.5.6/crule.tf...downloaded\n", + "\ttf/0.5.6/degree.tf...downloaded\n", + "\ttf/0.5.6/discontinuous.tf...downloaded\n", + "\ttf/0.5.6/domain.tf...downloaded\n", + "\ttf/0.5.6/frame.tf...downloaded\n", + "\ttf/0.5.6/framespec.tf...downloaded\n", + "\ttf/0.5.6/function.tf...downloaded\n", + "\ttf/0.5.6/gender.tf...downloaded\n", + "\ttf/0.5.6/gloss.tf...downloaded\n", + "\ttf/0.5.6/id.tf...downloaded\n", + "\ttf/0.5.6/junction.tf...downloaded\n", + "\ttf/0.5.6/lang.tf...downloaded\n", + "\ttf/0.5.6/lemma.tf...downloaded\n", + "\ttf/0.5.6/lextranslit.tf...downloaded\n", + "\ttf/0.5.6/ln.tf...downloaded\n", + "\ttf/0.5.6/mood.tf...downloaded\n", + "\ttf/0.5.6/morph.tf...downloaded\n", + 
"\ttf/0.5.6/nodeid.tf...downloaded\n", + "\ttf/0.5.6/normalized.tf...downloaded\n", + "\ttf/0.5.6/note.tf...downloaded\n", + "\ttf/0.5.6/num.tf...downloaded\n", + "\ttf/0.5.6/number.tf...downloaded\n", + "\ttf/0.5.6/oslots.tf...downloaded\n", + "\ttf/0.5.6/otext.tf...downloaded\n", + "\ttf/0.5.6/otype.tf...downloaded\n", + "\ttf/0.5.6/parent.tf...downloaded\n", + "\ttf/0.5.6/person.tf...downloaded\n", + "\ttf/0.5.6/punctuation.tf...downloaded\n", + "\ttf/0.5.6/ref.tf...downloaded\n", + "\ttf/0.5.6/referent.tf...downloaded\n", + "\ttf/0.5.6/rela.tf...downloaded\n", + "\ttf/0.5.6/role.tf...downloaded\n", + "\ttf/0.5.6/rule.tf...downloaded\n", + "\ttf/0.5.6/sibling.zip...downloaded\n", + "\ttf/0.5.6/strong.tf...downloaded\n", + "\ttf/0.5.6/subjref.tf...downloaded\n", + "\ttf/0.5.6/subjrefspec.tf...downloaded\n", + "\ttf/0.5.6/tense.tf...downloaded\n", + "\ttf/0.5.6/text.tf...downloaded\n", + "\ttf/0.5.6/trans.tf...downloaded\n", + "\ttf/0.5.6/translit.tf...downloaded\n", + "\ttf/0.5.6/typ.tf...downloaded\n", + "\ttf/0.5.6/type.tf...downloaded\n", + "\ttf/0.5.6/unaccent.tf...downloaded\n", + "\ttf/0.5.6/unicode.tf...downloaded\n", + "\ttf/0.5.6/variant.tf...downloaded\n", + "\ttf/0.5.6/verse.tf...downloaded\n", + "\ttf/0.5.6/voice.tf...downloaded\n", + "\tOK\n" + ] + }, + { + "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " | 0.58s T otype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 6.26s T oslots from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T before from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.18s T lemma from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.03s T punctuation from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + 
" | 0.47s T verse from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.04s T after from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.18s T translit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.26s T text from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.54s T chapter from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.19s T lextranslit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.28s T unaccent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.03s T book from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | | 0.17s C __levels__ from otype, oslots, otext\n", + " | | 4.28s C __order__ from otype, oslots, __levels__\n", + " | | 0.14s C __rank__ from otype, __order__\n", + " | | 12s C __levUp__ from otype, oslots, __rank__\n", + " | | 6.64s C __levDown__ from otype, __levUp__, __rank__\n", + " | | 0.34s C __characters__ from otext\n", + " | | 1.83s C __boundary__ from otype, oslots, __rank__\n", + " | | 0.04s C __sections__ from otype, oslots, otext, __levUp__, __levels__, book, chapter, verse\n", + " | 0.02s T appositioncontainer from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.21s T articular from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.98s T bookshort from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.68s T case from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.05s T clausetype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.63s T cls from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.03s T cltype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T criticalsign from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.06s T crule from 
~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.01s T degree from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.05s T discontinuous from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.12s T domain from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.37s T frame from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.29s T framespec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.75s T function from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.60s T gender from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.56s T gloss from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.33s T id from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.15s T junction from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T lang from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.10s T ln from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.25s T mood from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.08s T morph from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.05s T nodeid from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.22s T normalized from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T note from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.65s T num from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.81s T number from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 3.17s T parent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.18s T person from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.33s T ref from 
~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.15s T referent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.01s T rela from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.68s T role from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.82s T rule from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.96s T strong from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.10s T subjref from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.18s T subjrefspec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.25s T tense from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.17s T trans from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.42s T typ from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.94s T type from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.25s T unicode from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T variant from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.25s T voice from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n" + ] + }, + { + "data": { + "text/html": [ + "\n", + " TF: TF API 12.4.4, saulocantanhede/tfgreek2/app v3, Search Reference
\n", + " Data: saulocantanhede - tfgreek2 0.5.6, Character table, Feature docs
\n", + "
Node types\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "
Name# of nodes# slots / node% coverage
book275102.93100
chapter260529.92100
verse794417.34100
sentence1976713.79198
group89647.0246
clause304797.19159
wg1068686.88533
phrase694031.9196
subphrase1160341.60135
word1377791.00100
\n", + " Sets: no custom sets
\n", + " Features:
\n", + "
Nestle 1904 Greek New Testament\n", + "
\n", + "\n", + "
\n", + "
\n", + "after\n", + "
\n", + "
str
\n", + "\n", + " material after the end of the word\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "appositioncontainer\n", + "
\n", + "
int
\n", + "\n", + " 1 if it is an apposition container\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "articular\n", + "
\n", + "
int
\n", + "\n", + " 1 if the sentence, group, clause, phrase or wg has an article\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "before\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute before\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "book\n", + "
\n", + "
str
\n", + "\n", + " book name (full name)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "bookshort\n", + "
\n", + "
str
\n", + "\n", + " book name (abbreviated) from ref attribute in xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "case\n", + "
\n", + "
str
\n", + "\n", + " grammatical case\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "chapter\n", + "
\n", + "
int
\n", + "\n", + " chapter number, from ref attribute in xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "clausetype\n", + "
\n", + "
str
\n", + "\n", + " clause type\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "cls\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute cls\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "cltype\n", + "
\n", + "
str
\n", + "\n", + " clause type\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "criticalsign\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute criticalsign\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "crule\n", + "
\n", + "
str
\n", + "\n", + " clause rule (from xml attribute Rule)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "degree\n", + "
\n", + "
str
\n", + "\n", + " grammatical degree\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "discontinuous\n", + "
\n", + "
int
\n", + "\n", + " 1 if the word is out of sequence in the xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "domain\n", + "
\n", + "
str
\n", + "\n", + " domain\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "framespec\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute framespec\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "function\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute function\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "gender\n", + "
\n", + "
str
\n", + "\n", + " grammatical gender\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "gloss\n", + "
\n", + "
str
\n", + "\n", + " English gloss (BGVB)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "id\n", + "
\n", + "
str
\n", + "\n", + " xml id\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "junction\n", + "
\n", + "
str
\n", + "\n", + " type of junction\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "lang\n", + "
\n", + "
str
\n", + "\n", + " language the text is in\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "lemma\n", + "
\n", + "
str
\n", + "\n", + " lexical lemma\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "lextranslit\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute lextranslit\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "ln\n", + "
\n", + "
str
\n", + "\n", + " ln\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "mood\n", + "
\n", + "
str
\n", + "\n", + " verbal mood\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "morph\n", + "
\n", + "
str
\n", + "\n", + " morphological code\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "nodeid\n", + "
\n", + "
int
\n", + "\n", + " node id (as in the XML source data\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "normalized\n", + "
\n", + "
str
\n", + "\n", + " lemma normalized\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "note\n", + "
\n", + "
str
\n", + "\n", + " annotation of linguistic nature\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "num\n", + "
\n", + "
int
\n", + "\n", + " generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "number\n", + "
\n", + "
str
\n", + "\n", + " grammatical number\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "otype\n", + "
\n", + "
str
\n", + "\n", + " \n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "person\n", + "
\n", + "
str
\n", + "\n", + " grammatical person\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "punctuation\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute punctuation\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "ref\n", + "
\n", + "
str
\n", + "\n", + " biblical reference with word counting\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "referent\n", + "
\n", + "
str
\n", + "\n", + " number of referent\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "rela\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute rela\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "role\n", + "
\n", + "
str
\n", + "\n", + " role\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "rule\n", + "
\n", + "
str
\n", + "\n", + " syntactical rule\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "strong\n", + "
\n", + "
int
\n", + "\n", + " strong number\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "subjrefspec\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute subjrefspec\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "tense\n", + "
\n", + "
str
\n", + "\n", + " verbal tense\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "text\n", + "
\n", + "
str
\n", + "\n", + " the text of a word\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "trans\n", + "
\n", + "
str
\n", + "\n", + " translation of the word surface text according to the Berean Study Bible\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "translit\n", + "
\n", + "
str
\n", + "\n", + " transliteration of the word surface text\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "typ\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute typ\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "type\n", + "
\n", + "
str
\n", + "\n", + " morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "unaccent\n", + "
\n", + "
str
\n", + "\n", + " word in unicode characters without accents and diacritical markers\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "unicode\n", + "
\n", + "
str
\n", + "\n", + " word in unicode characters plus material after it\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "variant\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute variant\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "verse\n", + "
\n", + "
int
\n", + "\n", + " verse number, from ref attribute in xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "voice\n", + "
\n", + "
str
\n", + "\n", + " verbal voice\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "frame\n", + "
\n", + "
str
\n", + "\n", + " frame\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "oslots\n", + "
\n", + "
none
\n", + "\n", + " \n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "parent\n", + "
\n", + "
none
\n", + "\n", + " parent relationship between words\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "subjref\n", + "
\n", + "
none
\n", + "\n", + " number of subject referent\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "\n", + " Settings:
specified
  1. apiVersion: 3
  2. appName: saulocantanhede/tfgreek2
  3. appPath:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/app
  4. commit: no value
  5. css: ''
  6. dataDisplay:
    • excludedFeatures: []
    • noneValues:
      • none
      • unknown
      • no value
      • NA
    • sectionSep1:
    • sectionSep2: :
    • textFormat: text-orig-full
  7. docs:
    • docBase: https://github.com/saulocantanhede/tfgreek2/tree/main/docs
    • docPage: about
    • docRoot: https://github.com/saulocantanhede/tfgreek2
    • featureBase:https://github.com/saulocantanhede/tfgreek2/tree/main/docs/features/<feature>.md
    • featurePage: README
  8. interfaceDefaults: {fmt: text-orig-full}
  9. isCompatible: True
  10. local: no value
  11. localDir:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/_temp
  12. provenanceSpec:
    • branch: main
    • corpus: Nestle 1904 Greek New Testament
    • doi: 10.5281/zenodo.notyet
    • moduleSpecs: []
    • org: saulocantanhede
    • relative: /tf
    • repo: tfgreek2
    • repro: tfgreek2
    • version: 0.5.6
    • webBase: https://learner.bible/text/show_text/nestle1904/
    • webHint: Show this on the website
    • webLang: en
    • webUrl:https://learner.bible/text/show_text/nestle1904/<1>/<2>/<3>
    • webUrlLex: {webBase}/word?version={version}&id=<lid>
  13. release: no value
  14. typeDisplay:
    • clause:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {cls} {role} {junction}
      • style: ''
    • group:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • phrase:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • sentence:
      • label: {typ} {function} {rela} \\\\ {role} {rule}
      • style: ''
    • subphrase:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • verse:
      • condense: True
      • label: {book} {chapter}:{verse}
      • style: ''
    • wg:
      • condense: True
      • label: {type} {role} {rule} {junction}
      • style: ''
    • word:
      • features:
        • lemma
        • sp
      • featuresBare: [gloss]
  15. writing: grc
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "App config error(s) in word:\n", + "\tfeatures: feature sp not loaded\n" + ] + }, + { + "data": { + "text/html": [ + "" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "Display is setup for viewtype [syntax-view](https://github.com/saulocantanhede/tfgreek2/blob/main/docs/syntax-view.md#start)" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "See [here](https://github.com/saulocantanhede/tfgreek2/blob/main/docs/viewtypes.md#start) for more information on viewtypes" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Load the app and data from the second version in the set for comparison\n", + "A2 = use (\"saulocantanhede/tfgreek2\", version=\"0.5.6\")" + ] + }, + { + "cell_type": "code", + "execution_count": 48, + "id": "eb297e94-cfa8-4cff-8ab2-6eaa29ea4f5e", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Data to be zipped:\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "fatal: not a git repository (or any of the parent directories): .git\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\tOK app (v?? ??) : ~/github/saulocantanhede/tfgreek2/app\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "fatal: not a git repository (or any of the parent directories): .git\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\tOK main data (v?? ??) 
: ~/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + "Writing zip file ...\n" + ] + }, + { + "data": { + "text/plain": [ + "'~/Downloads/github/saulocantanhede/tfgreek2/complete.zip'" + ] + }, + "execution_count": 48, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "A2.zipAll()\n" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "224ef8fe-fcd9-460d-b1a8-4790cfc0bf94", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "from tf.advanced.helpers import dm\n", + "from tf.advanced.repo import checkoutRepo" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "id": "f020c505-2782-41c0-96b5-b5d9ddfab6f4", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "def do(task):\n", + " md = f\"\"\"\n", + "commit | release | local | base | subdir\n", + "--- | --- | --- | --- | ---\n", + "`{task[0]}` | `{task[1]}` | `{task[2]}` | `{task[3]}` | `{task[4]}`\n", + "\"\"\"\n", + " dm(md)" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "id": "92e809b1-801d-4a68-a149-5f0d68df848a", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "\n", + "commit | release | local | base | subdir\n", + "--- | --- | --- | --- | ---\n", + "`77a9118c7cd97145e8b6d32d23cbf227b3d70727` | `0.5.6` | `local` | `C:/Users/tonyj/text-fabric-data/github` | `saulocantanhede/tfgreek2/tf`\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "do(checkoutRepo(backend='github', org=\"saulocantanhede\", repo=\"tfgreek2\", folder=\"tf\", version=\"0.5.6\", checkout=\"\"))" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "id": "a42f0a91-1a91-48bc-828d-ab593237da84", + "metadata": { + "tags": [] + }, + "outputs": [ + { 
+ "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "\n", + "commit | release | local | base | subdir\n", + "--- | --- | --- | --- | ---\n", + "`352af50c8ce86edd8a0e2d58519453a8f53ee084` | `None` | `local` | `C:/Users/tonyj/text-fabric-data/github` | `saulocantanhede/tfgreek2/tf`\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "do(checkoutRepo(backend='github', org=\"saulocantanhede\", repo=\"tfgreek2\", folder=\"tf\", version=\"0.5.7\", checkout=\"\"))" + ] + }, + { + "cell_type": "markdown", + "id": "b0127a3f-44ae-4ff7-a1f0-22a3c9c8b167", + "metadata": {}, + "source": [ + "# 4 - Creation of the dataset" + ] + }, + { + "cell_type": "markdown", + "id": "52079cb8-9820-40a3-b73e-4d06a8db8f01", + "metadata": { + "tags": [] + }, + "source": [ + "## 4.1 - Setting up some global variables\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "4d2ff4a6-a1fc-4cfa-8dd6-b07272cc8d97", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "# The version number of the script\n", + "scriptVersion=\"0.1\"\n", + "scriptDate=\"May. 12, 2024\"" + ] + }, + { + "cell_type": "markdown", + "id": "02a9fcc9-cc3e-4607-9f9e-fa60deae0757", + "metadata": {}, + "source": [ + "## 4.2 - Store all relevant data into a dictionary\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "996fcdb5-9214-470d-922f-b0ef35cdc646", + "metadata": {}, + "source": [ + "The following will create a dictionary containing all relevant information for the loaded node and edge features." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "42109e55-d4dc-4908-8b3f-56d9adf936db", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Gathering generic details\n", + "Analyzing Node Features: ..................................................\n", + "Analyzing Edge Features: ....\n", + "Finished in 12.62 seconds.\n" + ] + } + ], + "source": [ + "# Initialize an empty dictionary to store feature data\n", + "featureDict = {}\n", + "import time\n", + "overallTime = time.time()\n", + "\n", + "def getFeatureDescription(metaData):\n", + " \"\"\"\n", + " This function looks for the 'description' key in the metadata dictionary. If the key is found,\n", + " it returns the corresponding description. If the key is not present, it returns a default \n", + " message indicating that no description is available.\n", + "\n", + " Parameters:\n", + " metaData (dict): A dictionary containing metadata about a feature.\n", + "\n", + " Returns:\n", + " str: The description of the feature if available, otherwise a default message.\n", + " \"\"\"\n", + " return metaData.get('description', \"No feature description\")\n", + "\n", + "def setDataType(metaData):\n", + " \"\"\"\n", + " This function checks for the 'valueType' key in the metadata. If the key is present, it\n", + " returns 'String' if the value is 'str', and 'Integer' for other types. 
If the 'valueType' key\n", + " is not present, it returns 'Unknown'.\n", + "\n", + " Parameters:\n", + " metaData (dict): A dictionary containing metadata, including the 'valueType' of a feature.\n", + "\n", + " Returns:\n", + " str: A string indicating the determined data type ('String', 'Integer', or 'Unknown').\n", + " \"\"\"\n", + " if 'valueType' in metaData:\n", + " return \"String\" if metaData[\"valueType\"] == 'str' else \"Integer\"\n", + " return \"Unknown\"\n", + "\n", + "\n", + "def processFeature(feature, featureType, featureMethod):\n", + " \"\"\"\n", + " Processes a given feature by extracting metadata, description, and data type, and then\n", + " compiles frequency data for different node types in a feature dictionary. Certain features\n", + " are skipped based on their type. The processed data is added to a global feature dictionary.\n", + "\n", + " Parameters:\n", + " feature (str): The name of the feature to be processed.\n", + " featureType (str): The type of the feature ('Node' or 'Edge').\n", + " featureMethod (function): A function to obtain feature data.\n", + "\n", + " Returns:\n", + " None: The function updates a global dictionary with processed feature data and does not return anything.\n", + " \"\"\"\n", + " \n", + " # Obtain the meta data\n", + " featureMetaData = featureMethod(feature).meta\n", + " featureDescription = getFeatureDescription(featureMetaData)\n", + " dataType = setDataType(featureMetaData)\n", + "\n", + " # Initialize dictionary to store feature frequency data\n", + " featureFrequencyDict = {}\n", + "\n", + " # Skip for specific features based on type\n", + " if not (featureType == 'Node' and feature == 'otype') and not (featureType == 'Edge' and feature == 'oslots'):\n", + " for nodeType in F.otype.all:\n", + " frequencyLists = featureMethod(feature).freqList(nodeType)\n", + " if not isinstance(frequencyLists, int):\n", + " if len(frequencyLists)!=0:\n", + " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 
'freq': frequencyLists[:tableLimit]}\n", + " elif isinstance(frequencyLists, int):\n", + " if frequencyLists != 0:\n", + " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 'freq': [(\"Link\", frequencyLists)]}\n", + "\n", + " # Add processed feature data to the main dictionary\n", + " featureDict[feature] = {'name': feature, 'descr': featureDescription, 'type': featureType, 'datatype': dataType, 'freqlist': featureFrequencyDict}\n", + " \n", + "########################################################\n", + "# MAIN FUNCTION #\n", + "########################################################\n", + "\n", + "########################################################\n", + "# Gather general information #\n", + "########################################################\n", + "\n", + "print('Gathering generic details')\n", + "\n", + "# Initialize default values\n", + "corpusName = A.appName\n", + "liveName = ''\n", + "versionName = A.version\n", + "\n", + "# Trying to locate corpus information\n", + "if A.provenance:\n", + " for parts in A.provenance[0]: \n", + " if isinstance(parts, tuple):\n", + " key, value = parts[0], parts[1]\n", + " if verbose: print (f'General info: {key}={value}')\n", + " if key == 'corpus': corpusName = value\n", + " if key == 'version': versionName = value\n", + " # value for live is a tuple\n", + " if key == 'live': liveName=value[1]\n", + "if liveName is not None and len(liveName)>1:\n", + " # an URL was found\n", + " pageTitleMD = f'Doc4TF pages for [{corpusName}]({liveName}) (version {versionName})'\n", + " pageTitleHTML = f'

Doc4TF pages for {corpusName} (version {versionName})

'\n", + "else:\n", + " # No URL found\n", + " pageTitleMD = f'Doc4TF pages for {corpusName} (version {versionName})'\n", + " pageTitleHTML = f'

Doc4TF pages for {corpusName} (version {versionName})

'\n", + "\n", + "# Overwrite in case user provided a title\n", + "if 'customPageTitleMD_' in globals():\n", + " pageTitleMD = customPageTitleMD\n", + "if 'customPageTitleHTML' in globals():\n", + " pageTitleMD = customPageTitleHTML\n", + "\n", + " \n", + "########################################################\n", + "# Processing node features #\n", + "########################################################\n", + "\n", + "print('Analyzing Node Features: ', end='')\n", + "for nodeFeature in Fall():\n", + " if not verbose: print('.', end='') # Progress indicator\n", + " processFeature(nodeFeature, 'Node', Fs)\n", + " if verbose: print(f'\\nFeature {nodeFeature} = {featureDict[nodeFeature]}\\n') # Print feature data if verbose\n", + "\n", + "########################################################\n", + "# Processing edge features #\n", + "########################################################\n", + "\n", + "print('\\nAnalyzing Edge Features: ', end='')\n", + "for edgeFeature in Eall():\n", + " if not verbose: print('.', end='') # Progress indicator\n", + " processFeature(edgeFeature, 'Edge', Es)\n", + " if verbose: print(f'\\nFeature {edgeFeature} = {featureDict[edgeFeature]}\\n') # Print feature data if verbose\n", + "\n", + "print(f'\\nFinished in {time.time() - overallTime:.2f} seconds.')" + ] + }, + { + "cell_type": "markdown", + "id": "5fb116d0-abc5-41a4-ac9c-3192da7e8252", + "metadata": {}, + "source": [ + "# 6 - License\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "3dc84f14-d918-4b19-9d20-151a1a2f2dc2", + "metadata": {}, + "source": [ + "Licenced under [Creative Commons Attribution 4.0 International (CC BY 4.0)](https://github.com/tonyjurg/Doc4TF/blob/main/LICENCE.md)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + 
"mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.5" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/tools/versionMapping.ipynb b/tools/versionMapping.ipynb new file mode 100644 index 0000000..59517f5 --- /dev/null +++ b/tools/versionMapping.ipynb @@ -0,0 +1,2432 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "c1556425-a96e-41c8-9ee1-6ef9e296474f", + "metadata": {}, + "source": [ + "# [Doc4TF/tools/versionMapping](https://github.com/tonyjurg/Doc4TF/tools/versionMapping.ipynb)\n", + "#### *Mapping nodes changes between two Text-Fabric datasets*\n", + "\n", + "Version: 0.1 (May. 13, 2024)." + ] + }, + { + "cell_type": "markdown", + "id": "73d4bb00-9972-42fb-b699-f48285c0ad9d", + "metadata": {}, + "source": [ + "## Table of content \n", + "* 1 - Introduction\n", + "* 2 - Setting up the environment\n", + "* 3 - Load Text-Fabric data\n", + "* 4 - Creation of the dataset\n", + " * 4.1 - Setting up some global variables\n", + " * 4.2 - Store all relevant data into a dictionary\n", + "* 5 - Create the documentation pages\n", + " * 5.1 - Create the set of feature pages\n", + " * 5.2 - Create the index pages\n", + "* 6 - Licence" + ] + }, + { + "cell_type": "markdown", + "id": "fd0740e7-b222-4a88-92e9-199dd8c7ae69", + "metadata": {}, + "source": [ + "# 1 - Introduction \n", + "##### [Back to TOC](#TOC)\n", + "\n", + "This notebook is utilizing the module [tf.dataset.nodemaps](https://annotation.github.io/text-fabric/tf/dataset/nodemaps.html). See also the description provided with the module." + ] + }, + { + "cell_type": "markdown", + "id": "46c7ab99-57e7-460c-b0ab-4513c6d90c78", + "metadata": {}, + "source": [ + "# 2. 
Setting up the environment\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "2e28d9a6-ad38-475f-87ac-285b8326f837", + "metadata": {}, + "source": [ + "Your environment should (for obvious reasons) include the Python package `Text-Fabric`. If not installed yet, it can be installed using `pip`. Further it is required to be able to invoke the Text-Fabric data sets (either from an online resource, or from a localy stored copy)." + ] + }, + { + "cell_type": "markdown", + "id": "6dccab04-1f63-4021-9609-749cfac0ec47", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# 3 - Load Text-Fabric data \n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "216097a9-5328-4f3b-9e50-4c06faa90455", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "See also notebook [map.ipynb](https://nbviewer.org/github/clariah/wp6-missieven/blob/master/programs/map.ipynb).\n", + "\n", + "See [dataset.Versions](https://annotation.github.io/text-fabric/tf/dataset/nodemaps.html#tf.dataset.nodemaps.Versions) in the Text-Fabric documentation." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 7, + "id": "f1de2b3a-3d2e-457a-a710-423bdb0efe8c", + "metadata": { + "slideshow": { + "slide_type": "slide" + }, + "tags": [] + }, + "outputs": [], + "source": [ + "%load_ext autoreload\n", + "%autoreload 2" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "id": "1a33b29e-d68f-4fae-9f2a-974bdb43e384", + "metadata": { + "slideshow": { + "slide_type": "slide" + }, + "tags": [] + }, + "outputs": [ + { + "ename": "NameError", + "evalue": "name 'TF_DIR' is not defined", + "output_type": "error", + "traceback": [ + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mNameError\u001b[0m Traceback (most recent call last)", + "Cell \u001b[1;32mIn[25], line 10\u001b[0m\n\u001b[0;32m 7\u001b[0m vb \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m0.5.7\u001b[39m\u001b[38;5;124m\"\u001b[39m \u001b[38;5;66;03m#\u001b[39;00m\n\u001b[0;32m 9\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m v \u001b[38;5;129;01min\u001b[39;00m (va, vb):\n\u001b[1;32m---> 10\u001b[0m TF[v] \u001b[38;5;241m=\u001b[39m Fabric(locations\u001b[38;5;241m=\u001b[39mTF_DIR, modules\u001b[38;5;241m=\u001b[39mv)\n\u001b[0;32m 11\u001b[0m api[v] \u001b[38;5;241m=\u001b[39m TF[v]\u001b[38;5;241m.\u001b[39mload(features[v])\n", + "\u001b[1;31mNameError\u001b[0m: name 'TF_DIR' is not defined" + ] + } + ], + "source": [ + "# Loading the Text-Fabric code and module versions\n", + "from tf.fabric import Fabric\n", + "from tf.dataset import Versions\n", + "from tf.app import use\n", + "\n", + "va = \"0.5.6\" # \n", + "vb = \"0.5.7\" #\n", + "\n", + "for v in (va, vb):\n", + " TF[v] = Fabric(locations=TF_DIR, modules=v)\n", + " api[v] = TF[v].load(features[v])" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "id": "946c2f74-3dfd-4f8f-84ea-392397af2692", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + 
"text": [ + "Collecting marimo\n", + " Downloading marimo-0.5.2-py3-none-any.whl.metadata (26 kB)\n", + "Requirement already satisfied: click<9,>=8.0 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from marimo) (8.1.7)\n", + "Requirement already satisfied: jedi>=0.18.0 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from marimo) (0.18.1)\n", + "Requirement already satisfied: markdown<4,>=3.4 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from marimo) (3.5.1)\n", + "Collecting pymdown-extensions<11,>=9.0 (from marimo)\n", + " Downloading pymdown_extensions-10.8.1-py3-none-any.whl.metadata (3.0 kB)\n", + "Requirement already satisfied: pygments<3,>=2.13 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from marimo) (2.15.1)\n", + "Collecting tomlkit>=0.12.0 (from marimo)\n", + " Downloading tomlkit-0.12.5-py3-none-any.whl.metadata (2.7 kB)\n", + "Collecting uvicorn>=0.22.0 (from marimo)\n", + " Downloading uvicorn-0.29.0-py3-none-any.whl.metadata (6.3 kB)\n", + "Collecting starlette!=0.36.0,>=0.26.1 (from marimo)\n", + " Downloading starlette-0.37.2-py3-none-any.whl.metadata (5.9 kB)\n", + "Collecting websockets<13.0.0,>=10.0.0 (from marimo)\n", + " Downloading websockets-12.0-cp311-cp311-win_amd64.whl.metadata (6.8 kB)\n", + "Collecting docutils>=0.17.0 (from marimo)\n", + " Downloading docutils-0.21.2-py3-none-any.whl.metadata (2.8 kB)\n", + "Requirement already satisfied: psutil>=5.0 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from marimo) (5.9.0)\n", + "Collecting black (from marimo)\n", + " Downloading black-24.4.2-cp311-cp311-win_amd64.whl.metadata (77 kB)\n", + " ---------------------------------------- 0.0/77.1 kB ? 
eta -:--:--\n", + " ---------------------------------------- 77.1/77.1 kB 2.1 MB/s eta 0:00:00\n", + "Requirement already satisfied: colorama in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from click<9,>=8.0->marimo) (0.4.6)\n", + "Requirement already satisfied: parso<0.9.0,>=0.8.0 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from jedi>=0.18.0->marimo) (0.8.3)\n", + "Collecting markdown<4,>=3.4 (from marimo)\n", + " Downloading Markdown-3.6-py3-none-any.whl.metadata (7.0 kB)\n", + "Requirement already satisfied: pyyaml in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from pymdown-extensions<11,>=9.0->marimo) (6.0.1)\n", + "Requirement already satisfied: anyio<5,>=3.4.0 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from starlette!=0.36.0,>=0.26.1->marimo) (3.5.0)\n", + "Requirement already satisfied: h11>=0.8 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from uvicorn>=0.22.0->marimo) (0.14.0)\n", + "Collecting mypy-extensions>=0.4.3 (from black->marimo)\n", + " Downloading mypy_extensions-1.0.0-py3-none-any.whl.metadata (1.1 kB)\n", + "Requirement already satisfied: packaging>=22.0 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from black->marimo) (23.1)\n", + "Collecting pathspec>=0.9.0 (from black->marimo)\n", + " Downloading pathspec-0.12.1-py3-none-any.whl.metadata (21 kB)\n", + "Requirement already satisfied: platformdirs>=2 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from black->marimo) (3.10.0)\n", + "Requirement already satisfied: idna>=2.8 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from anyio<5,>=3.4.0->starlette!=0.36.0,>=0.26.1->marimo) (3.4)\n", + "Requirement already satisfied: sniffio>=1.1 in c:\\users\\tonyj\\anaconda3\\envs\\text-fabric\\lib\\site-packages (from anyio<5,>=3.4.0->starlette!=0.36.0,>=0.26.1->marimo) (1.2.0)\n", + "Downloading 
marimo-0.5.2-py3-none-any.whl (10.1 MB)\n", + " ---------------------------------------- 0.0/10.1 MB ? eta -:--:--\n", + " - -------------------------------------- 0.3/10.1 MB 6.9 MB/s eta 0:00:02\n", + " -- ------------------------------------- 0.7/10.1 MB 6.9 MB/s eta 0:00:02\n", + " ---- ----------------------------------- 1.0/10.1 MB 7.2 MB/s eta 0:00:02\n", + " ---- ----------------------------------- 1.1/10.1 MB 6.1 MB/s eta 0:00:02\n", + " ----- ---------------------------------- 1.3/10.1 MB 5.4 MB/s eta 0:00:02\n", + " ------ --------------------------------- 1.6/10.1 MB 5.5 MB/s eta 0:00:02\n", + " ------- -------------------------------- 1.9/10.1 MB 5.7 MB/s eta 0:00:02\n", + " -------- ------------------------------- 2.2/10.1 MB 5.9 MB/s eta 0:00:02\n", + " ---------- ----------------------------- 2.5/10.1 MB 6.0 MB/s eta 0:00:02\n", + " ----------- ---------------------------- 2.9/10.1 MB 6.1 MB/s eta 0:00:02\n", + " ------------ --------------------------- 3.1/10.1 MB 6.0 MB/s eta 0:00:02\n", + " ------------- -------------------------- 3.5/10.1 MB 6.2 MB/s eta 0:00:02\n", + " --------------- ------------------------ 3.8/10.1 MB 6.2 MB/s eta 0:00:02\n", + " ---------------- ----------------------- 4.1/10.1 MB 6.3 MB/s eta 0:00:01\n", + " ----------------- ---------------------- 4.5/10.1 MB 6.3 MB/s eta 0:00:01\n", + " ------------------- -------------------- 4.8/10.1 MB 6.4 MB/s eta 0:00:01\n", + " -------------------- ------------------- 5.2/10.1 MB 6.5 MB/s eta 0:00:01\n", + " --------------------- ------------------ 5.5/10.1 MB 6.6 MB/s eta 0:00:01\n", + " ----------------------- ---------------- 5.8/10.1 MB 6.5 MB/s eta 0:00:01\n", + " ------------------------ --------------- 6.1/10.1 MB 6.5 MB/s eta 0:00:01\n", + " ------------------------- -------------- 6.5/10.1 MB 6.6 MB/s eta 0:00:01\n", + " --------------------------- ------------ 6.8/10.1 MB 6.6 MB/s eta 0:00:01\n", + " --------------------------- ------------ 7.0/10.1 MB 6.7 MB/s eta 
0:00:01\n", + " ---------------------------- ----------- 7.1/10.1 MB 6.3 MB/s eta 0:00:01\n", + " ----------------------------- ---------- 7.4/10.1 MB 6.3 MB/s eta 0:00:01\n", + " ------------------------------ --------- 7.7/10.1 MB 6.3 MB/s eta 0:00:01\n", + " ------------------------------- -------- 8.0/10.1 MB 6.3 MB/s eta 0:00:01\n", + " --------------------------------- ------ 8.3/10.1 MB 6.3 MB/s eta 0:00:01\n", + " ---------------------------------- ----- 8.6/10.1 MB 6.4 MB/s eta 0:00:01\n", + " ---------------------------------- ----- 8.7/10.1 MB 6.3 MB/s eta 0:00:01\n", + " ----------------------------------- ---- 8.8/10.1 MB 6.1 MB/s eta 0:00:01\n", + " ----------------------------------- ---- 8.9/10.1 MB 6.0 MB/s eta 0:00:01\n", + " ------------------------------------ --- 9.1/10.1 MB 5.9 MB/s eta 0:00:01\n", + " ------------------------------------ --- 9.2/10.1 MB 5.8 MB/s eta 0:00:01\n", + " ------------------------------------- -- 9.4/10.1 MB 5.8 MB/s eta 0:00:01\n", + " -------------------------------------- - 9.6/10.1 MB 5.8 MB/s eta 0:00:01\n", + " --------------------------------------- 9.8/10.1 MB 5.7 MB/s eta 0:00:01\n", + " --------------------------------------- 10.1/10.1 MB 5.7 MB/s eta 0:00:01\n", + " ---------------------------------------- 10.1/10.1 MB 5.6 MB/s eta 0:00:00\n", + "Downloading docutils-0.21.2-py3-none-any.whl (587 kB)\n", + " ---------------------------------------- 0.0/587.4 kB ? eta -:--:--\n", + " --------------- ------------------------ 225.3/587.4 kB 4.6 MB/s eta 0:00:01\n", + " ------------------------------- -------- 460.8/587.4 kB 4.8 MB/s eta 0:00:01\n", + " ---------------------------------------- 587.4/587.4 kB 4.6 MB/s eta 0:00:00\n", + "Downloading pymdown_extensions-10.8.1-py3-none-any.whl (250 kB)\n", + " ---------------------------------------- 0.0/250.8 kB ? 
eta -:--:--\n", + " --------------------------------------- 245.8/250.8 kB 5.0 MB/s eta 0:00:01\n", + " ---------------------------------------- 250.8/250.8 kB 5.1 MB/s eta 0:00:00\n", + "Downloading Markdown-3.6-py3-none-any.whl (105 kB)\n", + " ---------------------------------------- 0.0/105.4 kB ? eta -:--:--\n", + " ---------------------------------------- 105.4/105.4 kB 5.9 MB/s eta 0:00:00\n", + "Downloading starlette-0.37.2-py3-none-any.whl (71 kB)\n", + " ---------------------------------------- 0.0/71.9 kB ? eta -:--:--\n", + " ---------------------------------------- 71.9/71.9 kB 3.9 MB/s eta 0:00:00\n", + "Downloading tomlkit-0.12.5-py3-none-any.whl (37 kB)\n", + "Downloading uvicorn-0.29.0-py3-none-any.whl (60 kB)\n", + " ---------------------------------------- 0.0/60.8 kB ? eta -:--:--\n", + " ---------------------------------------- 60.8/60.8 kB 3.2 MB/s eta 0:00:00\n", + "Downloading websockets-12.0-cp311-cp311-win_amd64.whl (124 kB)\n", + " ---------------------------------------- 0.0/125.0 kB ? eta -:--:--\n", + " ---------------------------------------- 125.0/125.0 kB 7.2 MB/s eta 0:00:00\n", + "Downloading black-24.4.2-cp311-cp311-win_amd64.whl (1.4 MB)\n", + " ---------------------------------------- 0.0/1.4 MB ? 
eta -:--:--\n", + " -------- ------------------------------- 0.3/1.4 MB 6.3 MB/s eta 0:00:01\n", + " ---------------- ----------------------- 0.6/1.4 MB 6.1 MB/s eta 0:00:01\n", + " ------------------------ --------------- 0.9/1.4 MB 6.0 MB/s eta 0:00:01\n", + " -------------------------------- ------- 1.2/1.4 MB 6.1 MB/s eta 0:00:01\n", + " --------------------------------------- 1.4/1.4 MB 6.4 MB/s eta 0:00:01\n", + " ---------------------------------------- 1.4/1.4 MB 6.0 MB/s eta 0:00:00\n", + "Downloading mypy_extensions-1.0.0-py3-none-any.whl (4.7 kB)\n", + "Downloading pathspec-0.12.1-py3-none-any.whl (31 kB)\n", + "Installing collected packages: websockets, tomlkit, pathspec, mypy-extensions, markdown, docutils, uvicorn, starlette, pymdown-extensions, black, marimo\n", + " Attempting uninstall: markdown\n", + " Found existing installation: Markdown 3.5.1\n", + " Uninstalling Markdown-3.5.1:\n", + " Successfully uninstalled Markdown-3.5.1\n", + "Successfully installed black-24.4.2 docutils-0.21.2 marimo-0.5.2 markdown-3.6 mypy-extensions-1.0.0 pathspec-0.12.1 pymdown-extensions-10.8.1 starlette-0.37.2 tomlkit-0.12.5 uvicorn-0.29.0 websockets-12.0\n" + ] + } + ], + "source": [ + "# also required: module marimo\n", + "!pip install marimo" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "id": "210cab72-9658-4fdd-ac5d-9acbd8a8ca9c", + "metadata": { + "scrolled": true, + "slideshow": { + "slide_type": "slide" + }, + "tags": [] + }, + "outputs": [ + { + "data": { + "text/markdown": [ + "**Locating corpus resources ...**" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The requested app is not available offline\n", + "\t~/text-fabric-data/github/saulocantanhede/tfgreek2/app not found\n" + ] + }, + { + "data": { + "text/html": [ + "Status: latest release online 0.5.7 versus None locally" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + 
"output_type": "display_data" + }, + { + "data": { + "text/html": [ + "downloading app, main data and requested additions ..." + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "app: ~/text-fabric-data/github/saulocantanhede/tfgreek2/app" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " | 0.56s T otype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 6.64s T oslots from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T before from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.16s T lemma from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.00s T punctuation from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.46s T verse from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.11s T lemmatranslit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.03s T after from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.15s T translit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.22s T text from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.47s T chapter from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.21s T unaccent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.99s T book from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | | 0.16s C __levels__ from otype, oslots, otext\n", + " | | 3.69s C __order__ from otype, oslots, __levels__\n", + " | | 0.15s C __rank__ from otype, 
__order__\n", + " | | 12s C __levUp__ from otype, oslots, __rank__\n", + " | | 6.63s C __levDown__ from otype, __levUp__, __rank__\n", + " | | 0.34s C __characters__ from otext\n", + " | | 2.24s C __boundary__ from otype, oslots, __rank__\n", + " | | 0.04s C __sections__ from otype, oslots, otext, __levUp__, __levels__, book, chapter, verse\n", + " | 0.02s T appositioncontainer from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.21s T articular from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.96s T bookshort from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.66s T case from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T clausetype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.59s T cls from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.03s T cltype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T criticalsign from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T crule from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.01s T degree from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T discontinuous from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.99s T domain from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.37s T frame from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.27s T framespec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.72s T function from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.61s T gender from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.19s T gloss from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.36s T id from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " 
| 0.17s T junction from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T lang from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.13s T ln from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.27s T mood from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.14s T morph from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.05s T nodeid from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.26s T normalized from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.00s T note from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.70s T num from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.05s T number from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 2.91s T parent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.21s T person from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.40s T ref from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.15s T referent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.01s T rela from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.66s T role from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.78s T rule from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 29s T sibling from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 1.06s T sp from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.97s T strong from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.11s T subjref from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n", + " | 0.18s T subjrefspec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7\n" + ] + }, + { + "ename": 
"KeyboardInterrupt", + "evalue": "", + "output_type": "error", + "traceback": [ + "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[1;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "Cell \u001b[1;32mIn[68], line 2\u001b[0m\n\u001b[0;32m 1\u001b[0m \u001b[38;5;66;03m# Load the app and data from the first version in the set for comparison\u001b[39;00m\n\u001b[1;32m----> 2\u001b[0m A1 \u001b[38;5;241m=\u001b[39m use (\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124msaulocantanhede/tfgreek2\u001b[39m\u001b[38;5;124m\"\u001b[39m, version\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m0.5.7\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\app.py:56\u001b[0m, in \u001b[0;36muse\u001b[1;34m(appName, backend, *args, **kwargs)\u001b[0m\n\u001b[0;32m 23\u001b[0m \u001b[38;5;250m\u001b[39m\u001b[38;5;124;03m\"\"\"Make use of a corpus.\u001b[39;00m\n\u001b[0;32m 24\u001b[0m \n\u001b[0;32m 25\u001b[0m \u001b[38;5;124;03mFor a detailed description, see `tf.about.usefunc`.\u001b[39;00m\n\u001b[1;32m (...)\u001b[0m\n\u001b[0;32m 51\u001b[0m \u001b[38;5;124;03mtf.advanced.app.App\u001b[39;00m\n\u001b[0;32m 52\u001b[0m \u001b[38;5;124;03m\"\"\"\u001b[39;00m\n\u001b[0;32m 54\u001b[0m (appName, checkoutApp, dataLoc, backend) \u001b[38;5;241m=\u001b[39m useApp(appName, backend)\n\u001b[1;32m---> 56\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m findApp(appName, checkoutApp, dataLoc, backend, \u001b[38;5;28;01mFalse\u001b[39;00m, \u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\advanced\\app.py:630\u001b[0m, in \u001b[0;36mfindApp\u001b[1;34m(appName, checkoutApp, dataLoc, backend, _browse, silent, version, legacy, *args, **kwargs)\u001b[0m\n\u001b[0;32m 628\u001b[0m 
kwargs[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mmod\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m=\u001b[39m mod\n\u001b[0;32m 629\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[1;32m--> 630\u001b[0m app \u001b[38;5;241m=\u001b[39m appClass(\n\u001b[0;32m 631\u001b[0m cfg,\n\u001b[0;32m 632\u001b[0m appName,\n\u001b[0;32m 633\u001b[0m appPath,\n\u001b[0;32m 634\u001b[0m commit,\n\u001b[0;32m 635\u001b[0m release,\n\u001b[0;32m 636\u001b[0m local,\n\u001b[0;32m 637\u001b[0m backend,\n\u001b[0;32m 638\u001b[0m _browse,\n\u001b[0;32m 639\u001b[0m \u001b[38;5;241m*\u001b[39margs,\n\u001b[0;32m 640\u001b[0m version\u001b[38;5;241m=\u001b[39mversion,\n\u001b[0;32m 641\u001b[0m versionOverride\u001b[38;5;241m=\u001b[39m\u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m versionGiven,\n\u001b[0;32m 642\u001b[0m silent\u001b[38;5;241m=\u001b[39msilent,\n\u001b[0;32m 643\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs,\n\u001b[0;32m 644\u001b[0m )\n\u001b[0;32m 645\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mException\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m e:\n\u001b[0;32m 646\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m appClass \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m App:\n", + "File \u001b[1;32mC:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/app/app.py:60\u001b[0m, in \u001b[0;36mTfApp.__init__\u001b[1;34m(app, *args, **kwargs)\u001b[0m\n\u001b[0;32m 59\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21m__init__\u001b[39m(app, \u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs):\n\u001b[1;32m---> 60\u001b[0m \u001b[38;5;28msuper\u001b[39m()\u001b[38;5;241m.\u001b[39m\u001b[38;5;21m__init__\u001b[39m(\u001b[38;5;241m*\u001b[39margs, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs)\n\u001b[0;32m 61\u001b[0m 
app\u001b[38;5;241m.\u001b[39mviewtype(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124msyntax\u001b[39m\u001b[38;5;124m'\u001b[39m) \u001b[38;5;66;03m#default option as syntax view\u001b[39;00m\n\u001b[0;32m 62\u001b[0m app\u001b[38;5;241m.\u001b[39mdm(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mSee [here](https://github.com/saulocantanhede/tfgreek2/blob/main/docs/viewtypes.md#start) for more information on viewtypes\u001b[39m\u001b[38;5;124m'\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\advanced\\app.py:190\u001b[0m, in \u001b[0;36mApp.__init__\u001b[1;34m(self, cfg, appName, appPath, commit, release, local, backend, _browse, hoist, version, versionOverride, checkout, mod, locations, modules, volume, collection, api, setFile, silent, loadData, _withGc, **configOverrides)\u001b[0m\n\u001b[0;32m 184\u001b[0m loadableFeatures \u001b[38;5;241m=\u001b[39m allFeatures[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mnodes\u001b[39m\u001b[38;5;124m\"\u001b[39m] \u001b[38;5;241m+\u001b[39m allFeatures[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124medges\u001b[39m\u001b[38;5;124m\"\u001b[39m]\n\u001b[0;32m 185\u001b[0m useFeatures \u001b[38;5;241m=\u001b[39m [\n\u001b[0;32m 186\u001b[0m f\n\u001b[0;32m 187\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m f \u001b[38;5;129;01min\u001b[39;00m loadableFeatures\n\u001b[0;32m 188\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m f \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;129;01min\u001b[39;00m excludedFeatures \u001b[38;5;129;01mand\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m f\u001b[38;5;241m.\u001b[39mstartswith(OMAP)\n\u001b[0;32m 189\u001b[0m ]\n\u001b[1;32m--> 190\u001b[0m result \u001b[38;5;241m=\u001b[39m TF\u001b[38;5;241m.\u001b[39mload(useFeatures, add\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m, silent\u001b[38;5;241m=\u001b[39msilent)\n\u001b[0;32m 191\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m result \u001b[38;5;129;01mis\u001b[39;00m 
\u001b[38;5;28;01mFalse\u001b[39;00m:\n\u001b[0;32m 192\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mapi \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mNone\u001b[39;00m\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\fabric.py:414\u001b[0m, in \u001b[0;36mFabricCore.load\u001b[1;34m(self, features, add, silent)\u001b[0m\n\u001b[0;32m 412\u001b[0m reset()\n\u001b[0;32m 413\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m fName \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mfeaturesRequested:\n\u001b[1;32m--> 414\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_loadFeature(fName)\n\u001b[0;32m 415\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgood:\n\u001b[0;32m 416\u001b[0m indent(level\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m0\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\fabric.py:801\u001b[0m, in \u001b[0;36mFabricCore._loadFeature\u001b[1;34m(self, fName, optional)\u001b[0m\n\u001b[0;32m 799\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgood \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n\u001b[0;32m 800\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m--> 801\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mfeatures[fName]\u001b[38;5;241m.\u001b[39mload(silent\u001b[38;5;241m=\u001b[39msilent, _withGc\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_withGc):\n\u001b[0;32m 802\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mgood \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\data.py:145\u001b[0m, in 
\u001b[0;36mData.load\u001b[1;34m(self, metaOnly, silent, _withGc)\u001b[0m\n\u001b[0;32m 143\u001b[0m actionRep \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mM\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[0;32m 144\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[1;32m--> 145\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_writeDataBin()\n\u001b[0;32m 146\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 147\u001b[0m actionRep \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mB\u001b[39m\u001b[38;5;124m\"\u001b[39m\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\site-packages\\tf\\core\\data.py:690\u001b[0m, in \u001b[0;36mData._writeDataBin\u001b[1;34m(self)\u001b[0m\n\u001b[0;32m 687\u001b[0m \u001b[38;5;28;01mtry\u001b[39;00m:\n\u001b[0;32m 688\u001b[0m \u001b[38;5;28;01mwith\u001b[39;00m gzip\u001b[38;5;241m.\u001b[39mopen(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbinPath, mode\u001b[38;5;241m=\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mwb\u001b[39m\u001b[38;5;124m\"\u001b[39m, compresslevel\u001b[38;5;241m=\u001b[39mGZIP_LEVEL) \u001b[38;5;28;01mas\u001b[39;00m f:\n\u001b[0;32m 689\u001b[0m \u001b[38;5;66;03m# pickle.dump(self.data, f, protocol=PICKLE_PROTOCOL)\u001b[39;00m\n\u001b[1;32m--> 690\u001b[0m f\u001b[38;5;241m.\u001b[39mwrite(optimize(pickle\u001b[38;5;241m.\u001b[39mdumps(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mdata, protocol\u001b[38;5;241m=\u001b[39mPICKLE_PROTOCOL)))\n\u001b[0;32m 691\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mException\u001b[39;00m \u001b[38;5;28;01mas\u001b[39;00m e:\n\u001b[0;32m 692\u001b[0m error(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mCannot write to file 
\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mbinPath\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m because: \u001b[39m\u001b[38;5;132;01m{\u001b[39;00m\u001b[38;5;28mstr\u001b[39m(e)\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m'\u001b[39m)\n", + "File \u001b[1;32m~\\anaconda3\\envs\\Text-Fabric\\Lib\\gzip.py:289\u001b[0m, in \u001b[0;36mGzipFile.write\u001b[1;34m(self, data)\u001b[0m\n\u001b[0;32m 286\u001b[0m length \u001b[38;5;241m=\u001b[39m data\u001b[38;5;241m.\u001b[39mnbytes\n\u001b[0;32m 288\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m length \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m0\u001b[39m:\n\u001b[1;32m--> 289\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mfileobj\u001b[38;5;241m.\u001b[39mwrite(\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcompress\u001b[38;5;241m.\u001b[39mcompress(data))\n\u001b[0;32m 290\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39msize \u001b[38;5;241m+\u001b[39m\u001b[38;5;241m=\u001b[39m length\n\u001b[0;32m 291\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcrc \u001b[38;5;241m=\u001b[39m zlib\u001b[38;5;241m.\u001b[39mcrc32(data, \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcrc)\n", + "\u001b[1;31mKeyboardInterrupt\u001b[0m: " + ] + } + ], + "source": [ + "# Load the app and data from the first version in the set for comparison\n", + "A1 = use (\"saulocantanhede/tfgreek2\", version=\"0.5.7\")" + ] + }, + { + "cell_type": "code", + "execution_count": 70, + "id": "0fd30d97-cd49-48d7-9781-448a0f6cca40", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/markdown": [ + "**Locating corpus resources ...**" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The requested app is not available offline\n", + 
"\t~/text-fabric-data/github/saulocantanhede/tfgreek2/app not found\n" + ] + }, + { + "data": { + "text/html": [ + "Status: latest release online 0.5.7 versus None locally" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "downloading app, main data and requested additions ..." + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "app: ~/text-fabric-data/github/saulocantanhede/tfgreek2/app" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The requested data is not available offline\n", + "\t~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6 not found\n", + "rate limit is 5000 requests per hour, with 4999 left for this hour\n", + "\tconnecting to online GitHub repo saulocantanhede/tfgreek2 ... connected\n", + "\ttf/0.5.6/after.tf...downloaded\n", + "\ttf/0.5.6/appositioncontainer.tf...downloaded\n", + "\ttf/0.5.6/articular.tf...downloaded\n", + "\ttf/0.5.6/before.tf...downloaded\n", + "\ttf/0.5.6/book.tf...downloaded\n", + "\ttf/0.5.6/bookshort.tf...downloaded\n", + "\ttf/0.5.6/case.tf...downloaded\n", + "\ttf/0.5.6/chapter.tf...downloaded\n", + "\ttf/0.5.6/clausetype.tf...downloaded\n", + "\ttf/0.5.6/cls.tf...downloaded\n", + "\ttf/0.5.6/cltype.tf...downloaded\n", + "\ttf/0.5.6/criticalsign.tf...downloaded\n", + "\ttf/0.5.6/crule.tf...downloaded\n", + "\ttf/0.5.6/degree.tf...downloaded\n", + "\ttf/0.5.6/discontinuous.tf...downloaded\n", + "\ttf/0.5.6/domain.tf...downloaded\n", + "\ttf/0.5.6/frame.tf...downloaded\n", + "\ttf/0.5.6/framespec.tf...downloaded\n", + "\ttf/0.5.6/function.tf...downloaded\n", + "\ttf/0.5.6/gender.tf...downloaded\n", + "\ttf/0.5.6/gloss.tf...downloaded\n", + "\ttf/0.5.6/id.tf...downloaded\n", + "\ttf/0.5.6/junction.tf...downloaded\n", + "\ttf/0.5.6/lang.tf...downloaded\n", + 
"\ttf/0.5.6/lemma.tf...downloaded\n", + "\ttf/0.5.6/lextranslit.tf...downloaded\n", + "\ttf/0.5.6/ln.tf...downloaded\n", + "\ttf/0.5.6/mood.tf...downloaded\n", + "\ttf/0.5.6/morph.tf...downloaded\n", + "\ttf/0.5.6/nodeid.tf...downloaded\n", + "\ttf/0.5.6/normalized.tf...downloaded\n", + "\ttf/0.5.6/note.tf...downloaded\n", + "\ttf/0.5.6/num.tf...downloaded\n", + "\ttf/0.5.6/number.tf...downloaded\n", + "\ttf/0.5.6/oslots.tf...downloaded\n", + "\ttf/0.5.6/otext.tf...downloaded\n", + "\ttf/0.5.6/otype.tf...downloaded\n", + "\ttf/0.5.6/parent.tf...downloaded\n", + "\ttf/0.5.6/person.tf...downloaded\n", + "\ttf/0.5.6/punctuation.tf...downloaded\n", + "\ttf/0.5.6/ref.tf...downloaded\n", + "\ttf/0.5.6/referent.tf...downloaded\n", + "\ttf/0.5.6/rela.tf...downloaded\n", + "\ttf/0.5.6/role.tf...downloaded\n", + "\ttf/0.5.6/rule.tf...downloaded\n", + "\ttf/0.5.6/sibling.zip...downloaded\n", + "\ttf/0.5.6/strong.tf...downloaded\n", + "\ttf/0.5.6/subjref.tf...downloaded\n", + "\ttf/0.5.6/subjrefspec.tf...downloaded\n", + "\ttf/0.5.6/tense.tf...downloaded\n", + "\ttf/0.5.6/text.tf...downloaded\n", + "\ttf/0.5.6/trans.tf...downloaded\n", + "\ttf/0.5.6/translit.tf...downloaded\n", + "\ttf/0.5.6/typ.tf...downloaded\n", + "\ttf/0.5.6/type.tf...downloaded\n", + "\ttf/0.5.6/unaccent.tf...downloaded\n", + "\ttf/0.5.6/unicode.tf...downloaded\n", + "\ttf/0.5.6/variant.tf...downloaded\n", + "\ttf/0.5.6/verse.tf...downloaded\n", + "\ttf/0.5.6/voice.tf...downloaded\n", + "\tOK\n" + ] + }, + { + "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + " | 0.58s T otype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 6.26s T oslots from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T before from 
~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.18s T lemma from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.03s T punctuation from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.47s T verse from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.04s T after from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.18s T translit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.26s T text from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.54s T chapter from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.19s T lextranslit from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.28s T unaccent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.03s T book from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | | 0.17s C __levels__ from otype, oslots, otext\n", + " | | 4.28s C __order__ from otype, oslots, __levels__\n", + " | | 0.14s C __rank__ from otype, __order__\n", + " | | 12s C __levUp__ from otype, oslots, __rank__\n", + " | | 6.64s C __levDown__ from otype, __levUp__, __rank__\n", + " | | 0.34s C __characters__ from otext\n", + " | | 1.83s C __boundary__ from otype, oslots, __rank__\n", + " | | 0.04s C __sections__ from otype, oslots, otext, __levUp__, __levels__, book, chapter, verse\n", + " | 0.02s T appositioncontainer from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.21s T articular from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.98s T bookshort from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.68s T case from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.05s T clausetype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.63s T cls from 
~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.03s T cltype from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T criticalsign from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.06s T crule from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.01s T degree from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.05s T discontinuous from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.12s T domain from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.37s T frame from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.29s T framespec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.75s T function from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.60s T gender from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.56s T gloss from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.33s T id from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.15s T junction from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T lang from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.10s T ln from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.25s T mood from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.08s T morph from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.05s T nodeid from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.22s T normalized from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T note from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.65s T num from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.81s T number from 
~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 3.17s T parent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.18s T person from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.33s T ref from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.15s T referent from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.01s T rela from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.68s T role from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.82s T rule from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.96s T strong from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.10s T subjref from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.18s T subjrefspec from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.25s T tense from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.17s T trans from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.42s T typ from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.94s T type from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 1.25s T unicode from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.00s T variant from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + " | 0.25s T voice from ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6\n" + ] + }, + { + "data": { + "text/html": [ + "\n", + " TF: TF API 12.4.4, saulocantanhede/tfgreek2/app v3, Search Reference
\n", + " Data: saulocantanhede - tfgreek2 0.5.6, Character table, Feature docs
\n", + "
Node types\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + "\n", + "
Name# of nodes# slots / node% coverage
book275102.93100
chapter260529.92100
verse794417.34100
sentence1976713.79198
group89647.0246
clause304797.19159
wg1068686.88533
phrase694031.9196
subphrase1160341.60135
word1377791.00100
\n", + " Sets: no custom sets
\n", + " Features:
\n", + "
Nestle 1904 Greek New Testament\n", + "
\n", + "\n", + "
\n", + "
\n", + "after\n", + "
\n", + "
str
\n", + "\n", + " material after the end of the word\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "appositioncontainer\n", + "
\n", + "
int
\n", + "\n", + " 1 if it is an apposition container\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "articular\n", + "
\n", + "
int
\n", + "\n", + " 1 if the sentence, group, clause, phrase or wg has an article\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "before\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute before\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "book\n", + "
\n", + "
str
\n", + "\n", + " book name (full name)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "bookshort\n", + "
\n", + "
str
\n", + "\n", + " book name (abbreviated) from ref attribute in xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "case\n", + "
\n", + "
str
\n", + "\n", + " grammatical case\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "chapter\n", + "
\n", + "
int
\n", + "\n", + " chapter number, from ref attribute in xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "clausetype\n", + "
\n", + "
str
\n", + "\n", + " clause type\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "cls\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute cls\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "cltype\n", + "
\n", + "
str
\n", + "\n", + " clause type\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "criticalsign\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute criticalsign\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "crule\n", + "
\n", + "
str
\n", + "\n", + " clause rule (from xml attribute Rule)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "degree\n", + "
\n", + "
str
\n", + "\n", + " grammatical degree\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "discontinuous\n", + "
\n", + "
int
\n", + "\n", + " 1 if the word is out of sequence in the xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "domain\n", + "
\n", + "
str
\n", + "\n", + " domain\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "framespec\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute framespec\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "function\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute function\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "gender\n", + "
\n", + "
str
\n", + "\n", + " grammatical gender\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "gloss\n", + "
\n", + "
str
\n", + "\n", + " English gloss (BGVB)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "id\n", + "
\n", + "
str
\n", + "\n", + " xml id\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "junction\n", + "
\n", + "
str
\n", + "\n", + " type of junction\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "lang\n", + "
\n", + "
str
\n", + "\n", + " language the text is in\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "lemma\n", + "
\n", + "
str
\n", + "\n", + " lexical lemma\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "lextranslit\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute lextranslit\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "ln\n", + "
\n", + "
str
\n", + "\n", + " ln\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "mood\n", + "
\n", + "
str
\n", + "\n", + " verbal mood\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "morph\n", + "
\n", + "
str
\n", + "\n", + " morphological code\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "nodeid\n", + "
\n", + "
int
\n", + "\n", + " node id (as in the XML source data\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "normalized\n", + "
\n", + "
str
\n", + "\n", + " lemma normalized\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "note\n", + "
\n", + "
str
\n", + "\n", + " annotation of linguistic nature\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "num\n", + "
\n", + "
int
\n", + "\n", + " generated number (not in xml): book: (Matthew=1, Mark=2, ..., Revelation=27); sentence: numbered per chapter; word: numbered per verse.\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "number\n", + "
\n", + "
str
\n", + "\n", + " grammatical number\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "otype\n", + "
\n", + "
str
\n", + "\n", + " \n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "person\n", + "
\n", + "
str
\n", + "\n", + " grammatical person\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "punctuation\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute punctuation\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "ref\n", + "
\n", + "
str
\n", + "\n", + " biblical reference with word counting\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "referent\n", + "
\n", + "
str
\n", + "\n", + " number of referent\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "rela\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute rela\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "role\n", + "
\n", + "
str
\n", + "\n", + " role\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "rule\n", + "
\n", + "
str
\n", + "\n", + " syntactical rule\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "strong\n", + "
\n", + "
int
\n", + "\n", + " strong number\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "subjrefspec\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute subjrefspec\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "tense\n", + "
\n", + "
str
\n", + "\n", + " verbal tense\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "text\n", + "
\n", + "
str
\n", + "\n", + " the text of a word\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "trans\n", + "
\n", + "
str
\n", + "\n", + " translation of the word surface text according to the Berean Study Bible\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "translit\n", + "
\n", + "
str
\n", + "\n", + " transliteration of the word surface text\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "typ\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute typ\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "type\n", + "
\n", + "
str
\n", + "\n", + " morphological type (on word), syntactical type (on sentence, group, clause, phrase or wg)\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "unaccent\n", + "
\n", + "
str
\n", + "\n", + " word in unicode characters without accents and diacritical markers\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "unicode\n", + "
\n", + "
str
\n", + "\n", + " word in unicode characters plus material after it\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "variant\n", + "
\n", + "
str
\n", + "\n", + " this is XML attribute variant\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "verse\n", + "
\n", + "
int
\n", + "\n", + " verse number, from ref attribute in xml\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "voice\n", + "
\n", + "
str
\n", + "\n", + " verbal voice\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "frame\n", + "
\n", + "
str
\n", + "\n", + " frame\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "oslots\n", + "
\n", + "
none
\n", + "\n", + " \n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "parent\n", + "
\n", + "
none
\n", + "\n", + " parent relationship between words\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "subjref\n", + "
\n", + "
none
\n", + "\n", + " number of subject referent\n", + "\n", + "
\n", + "\n", + "
\n", + "
\n", + "\n", + " Settings:
specified
  1. apiVersion: 3
  2. appName: saulocantanhede/tfgreek2
  3. appPath:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/app
  4. commit: no value
  5. css: ''
  6. dataDisplay:
    • excludedFeatures: []
    • noneValues:
      • none
      • unknown
      • no value
      • NA
    • sectionSep1:
    • sectionSep2: :
    • textFormat: text-orig-full
  7. docs:
    • docBase: https://github.com/saulocantanhede/tfgreek2/tree/main/docs
    • docPage: about
    • docRoot: https://github.com/saulocantanhede/tfgreek2
    • featureBase:https://github.com/saulocantanhede/tfgreek2/tree/main/docs/features/<feature>.md
    • featurePage: README
  8. interfaceDefaults: {fmt: text-orig-full}
  9. isCompatible: True
  10. local: no value
  11. localDir:C:/Users/tonyj/text-fabric-data/github/saulocantanhede/tfgreek2/_temp
  12. provenanceSpec:
    • branch: main
    • corpus: Nestle 1904 Greek New Testament
    • doi: 10.5281/zenodo.notyet
    • moduleSpecs: []
    • org: saulocantanhede
    • relative: /tf
    • repo: tfgreek2
    • repro: tfgreek2
    • version: 0.5.6
    • webBase: https://learner.bible/text/show_text/nestle1904/
    • webHint: Show this on the website
    • webLang: en
    • webUrl:https://learner.bible/text/show_text/nestle1904/<1>/<2>/<3>
    • webUrlLex: {webBase}/word?version={version}&id=<lid>
  13. release: no value
  14. typeDisplay:
    • clause:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {cls} {role} {junction}
      • style: ''
    • group:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • phrase:
      • condense: True
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • sentence:
      • label: {typ} {function} {rela} \\\\ {role} {rule}
      • style: ''
    • subphrase:
      • label: {typ} {function} {rela} \\\\ {type} {role} {rule}
      • style: ''
    • verse:
      • condense: True
      • label: {book} {chapter}:{verse}
      • style: ''
    • wg:
      • condense: True
      • label: {type} {role} {rule} {junction}
      • style: ''
    • word:
      • features:
        • lemma
        • sp
      • featuresBare: [gloss]
  15. writing: grc
\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "App config error(s) in word:\n", + "\tfeatures: feature sp not loaded\n" + ] + }, + { + "data": { + "text/html": [ + "" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "Display is setup for viewtype [syntax-view](https://github.com/saulocantanhede/tfgreek2/blob/main/docs/syntax-view.md#start)" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "See [here](https://github.com/saulocantanhede/tfgreek2/blob/main/docs/viewtypes.md#start) for more information on viewtypes" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Load the app and data from the second version in the set for comparison\n", + "A2 = use (\"saulocantanhede/tfgreek2\", version=\"0.5.6\")" + ] + }, + { + "cell_type": "code", + "execution_count": 48, + "id": "eb297e94-cfa8-4cff-8ab2-6eaa29ea4f5e", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Data to be zipped:\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "fatal: not a git repository (or any of the parent directories): .git\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\tOK app (v?? ??) : ~/github/saulocantanhede/tfgreek2/app\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "fatal: not a git repository (or any of the parent directories): .git\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\tOK main data (v?? ??) 
: ~/github/saulocantanhede/tfgreek2/tf/0.5.6\n", + "Writing zip file ...\n" + ] + }, + { + "data": { + "text/plain": [ + "'~/Downloads/github/saulocantanhede/tfgreek2/complete.zip'" + ] + }, + "execution_count": 48, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "A2.zipAll()\n" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "224ef8fe-fcd9-460d-b1a8-4790cfc0bf94", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "from tf.advanced.helpers import dm\n", + "from tf.advanced.repo import checkoutRepo" + ] + }, + { + "cell_type": "code", + "execution_count": 56, + "id": "f020c505-2782-41c0-96b5-b5d9ddfab6f4", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "def do(task):\n", + " md = f\"\"\"\n", + "commit | release | local | base | subdir\n", + "--- | --- | --- | --- | ---\n", + "`{task[0]}` | `{task[1]}` | `{task[2]}` | `{task[3]}` | `{task[4]}`\n", + "\"\"\"\n", + " dm(md)" + ] + }, + { + "cell_type": "code", + "execution_count": 58, + "id": "92e809b1-801d-4a68-a149-5f0d68df848a", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.6" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "\n", + "commit | release | local | base | subdir\n", + "--- | --- | --- | --- | ---\n", + "`77a9118c7cd97145e8b6d32d23cbf227b3d70727` | `0.5.6` | `local` | `C:/Users/tonyj/text-fabric-data/github` | `saulocantanhede/tfgreek2/tf`\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "do(checkoutRepo(backend='github', org=\"saulocantanhede\", repo=\"tfgreek2\", folder=\"tf\", version=\"0.5.6\", checkout=\"\"))" + ] + }, + { + "cell_type": "code", + "execution_count": 62, + "id": "a42f0a91-1a91-48bc-828d-ab593237da84", + "metadata": { + "tags": [] + }, + "outputs": [ + { 
+ "data": { + "text/html": [ + "data: ~/text-fabric-data/github/saulocantanhede/tfgreek2/tf/0.5.7" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/markdown": [ + "\n", + "commit | release | local | base | subdir\n", + "--- | --- | --- | --- | ---\n", + "`352af50c8ce86edd8a0e2d58519453a8f53ee084` | `None` | `local` | `C:/Users/tonyj/text-fabric-data/github` | `saulocantanhede/tfgreek2/tf`\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "do(checkoutRepo(backend='github', org=\"saulocantanhede\", repo=\"tfgreek2\", folder=\"tf\", version=\"0.5.7\", checkout=\"\"))" + ] + }, + { + "cell_type": "markdown", + "id": "b0127a3f-44ae-4ff7-a1f0-22a3c9c8b167", + "metadata": {}, + "source": [ + "# 4 - Creation of the dataset" + ] + }, + { + "cell_type": "markdown", + "id": "52079cb8-9820-40a3-b73e-4d06a8db8f01", + "metadata": { + "tags": [] + }, + "source": [ + "## 4.1 - Setting up some global variables\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "4d2ff4a6-a1fc-4cfa-8dd6-b07272cc8d97", + "metadata": { + "tags": [] + }, + "outputs": [], + "source": [ + "# The version number of the script\n", + "scriptVersion=\"0.1\"\n", + "scriptDate=\"May. 12, 2024\"" + ] + }, + { + "cell_type": "markdown", + "id": "02a9fcc9-cc3e-4607-9f9e-fa60deae0757", + "metadata": {}, + "source": [ + "## 4.2 - Store all relevant data into a dictionary\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "996fcdb5-9214-470d-922f-b0ef35cdc646", + "metadata": {}, + "source": [ + "The following will create a dictionary containing all relevant information for the loaded node and edge features." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "42109e55-d4dc-4908-8b3f-56d9adf936db", + "metadata": { + "tags": [] + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Gathering generic details\n", + "Analyzing Node Features: ..................................................\n", + "Analyzing Edge Features: ....\n", + "Finished in 12.62 seconds.\n" + ] + } + ], + "source": [ + "# Initialize an empty dictionary to store feature data\n", + "featureDict = {}\n", + "import time\n", + "overallTime = time.time()\n", + "\n", + "def getFeatureDescription(metaData):\n", + " \"\"\"\n", + " This function looks for the 'description' key in the metadata dictionary. If the key is found,\n", + " it returns the corresponding description. If the key is not present, it returns a default \n", + " message indicating that no description is available.\n", + "\n", + " Parameters:\n", + " metaData (dict): A dictionary containing metadata about a feature.\n", + "\n", + " Returns:\n", + " str: The description of the feature if available, otherwise a default message.\n", + " \"\"\"\n", + " return metaData.get('description', \"No feature description\")\n", + "\n", + "def setDataType(metaData):\n", + " \"\"\"\n", + " This function checks for the 'valueType' key in the metadata. If the key is present, it\n", + " returns 'String' if the value is 'str', and 'Integer' for other types. 
If the 'valueType' key\n", + " is not present, it returns 'Unknown'.\n", + "\n", + " Parameters:\n", + " metaData (dict): A dictionary containing metadata, including the 'valueType' of a feature.\n", + "\n", + " Returns:\n", + " str: A string indicating the determined data type ('String', 'Integer', or 'Unknown').\n", + " \"\"\"\n", + " if 'valueType' in metaData:\n", + " return \"String\" if metaData[\"valueType\"] == 'str' else \"Integer\"\n", + " return \"Unknown\"\n", + "\n", + "\n", + "def processFeature(feature, featureType, featureMethod):\n", + " \"\"\"\n", + " Processes a given feature by extracting metadata, description, and data type, and then\n", + " compiles frequency data for different node types in a feature dictionary. Certain features\n", + " are skipped based on their type. The processed data is added to a global feature dictionary.\n", + "\n", + " Parameters:\n", + " feature (str): The name of the feature to be processed.\n", + " featureType (str): The type of the feature ('Node' or 'Edge').\n", + " featureMethod (function): A function to obtain feature data.\n", + "\n", + " Returns:\n", + " None: The function updates a global dictionary with processed feature data and does not return anything.\n", + " \"\"\"\n", + " \n", + " # Obtain the meta data\n", + " featureMetaData = featureMethod(feature).meta\n", + " featureDescription = getFeatureDescription(featureMetaData)\n", + " dataType = setDataType(featureMetaData)\n", + "\n", + " # Initialize dictionary to store feature frequency data\n", + " featureFrequencyDict = {}\n", + "\n", + " # Skip for specific features based on type\n", + " if not (featureType == 'Node' and feature == 'otype') and not (featureType == 'Edge' and feature == 'oslots'):\n", + " for nodeType in F.otype.all:\n", + " frequencyLists = featureMethod(feature).freqList(nodeType)\n", + " if not isinstance(frequencyLists, int):\n", + " if len(frequencyLists)!=0:\n", + " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 
'freq': frequencyLists[:tableLimit]}\n", + " elif isinstance(frequencyLists, int):\n", + " if frequencyLists != 0:\n", + " featureFrequencyDict[nodeType] = {'nodetype': nodeType, 'freq': [(\"Link\", frequencyLists)]}\n", + "\n", + " # Add processed feature data to the main dictionary\n", + " featureDict[feature] = {'name': feature, 'descr': featureDescription, 'type': featureType, 'datatype': dataType, 'freqlist': featureFrequencyDict}\n", + " \n", + "########################################################\n", + "# MAIN FUNCTION #\n", + "########################################################\n", + "\n", + "########################################################\n", + "# Gather general information #\n", + "########################################################\n", + "\n", + "print('Gathering generic details')\n", + "\n", + "# Initialize default values\n", + "corpusName = A.appName\n", + "liveName = ''\n", + "versionName = A.version\n", + "\n", + "# Trying to locate corpus information\n", + "if A.provenance:\n", + " for parts in A.provenance[0]: \n", + " if isinstance(parts, tuple):\n", + " key, value = parts[0], parts[1]\n", + " if verbose: print (f'General info: {key}={value}')\n", + " if key == 'corpus': corpusName = value\n", + " if key == 'version': versionName = value\n", + " # value for live is a tuple\n", + " if key == 'live': liveName=value[1]\n", + "if liveName is not None and len(liveName)>1:\n", + " # an URL was found\n", + " pageTitleMD = f'Doc4TF pages for [{corpusName}]({liveName}) (version {versionName})'\n", + " pageTitleHTML = f'

Doc4TF pages for {corpusName} (version {versionName})

'\n", + "else:\n", + " # No URL found\n", + " pageTitleMD = f'Doc4TF pages for {corpusName} (version {versionName})'\n", + " pageTitleHTML = f'

Doc4TF pages for {corpusName} (version {versionName})

'\n", + "\n", + "# Overwrite in case user provided a title\n", + "if 'customPageTitleMD_' in globals():\n", + " pageTitleMD = customPageTitleMD\n", + "if 'customPageTitleHTML' in globals():\n", + " pageTitleMD = customPageTitleHTML\n", + "\n", + " \n", + "########################################################\n", + "# Processing node features #\n", + "########################################################\n", + "\n", + "print('Analyzing Node Features: ', end='')\n", + "for nodeFeature in Fall():\n", + " if not verbose: print('.', end='') # Progress indicator\n", + " processFeature(nodeFeature, 'Node', Fs)\n", + " if verbose: print(f'\\nFeature {nodeFeature} = {featureDict[nodeFeature]}\\n') # Print feature data if verbose\n", + "\n", + "########################################################\n", + "# Processing edge features #\n", + "########################################################\n", + "\n", + "print('\\nAnalyzing Edge Features: ', end='')\n", + "for edgeFeature in Eall():\n", + " if not verbose: print('.', end='') # Progress indicator\n", + " processFeature(edgeFeature, 'Edge', Es)\n", + " if verbose: print(f'\\nFeature {edgeFeature} = {featureDict[edgeFeature]}\\n') # Print feature data if verbose\n", + "\n", + "print(f'\\nFinished in {time.time() - overallTime:.2f} seconds.')" + ] + }, + { + "cell_type": "markdown", + "id": "5fb116d0-abc5-41a4-ac9c-3192da7e8252", + "metadata": {}, + "source": [ + "# 6 - License\n", + "##### [Back to TOC](#TOC)" + ] + }, + { + "cell_type": "markdown", + "id": "3dc84f14-d918-4b19-9d20-151a1a2f2dc2", + "metadata": {}, + "source": [ + "Licenced under [Creative Commons Attribution 4.0 International (CC BY 4.0)](https://github.com/tonyjurg/Doc4TF/blob/main/LICENCE.md)" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + 
"mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.5" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +}