Skip to content

Commit 8737b2b

Browse files
committed
arrival of data version 2021
1 parent 035e9ce commit 8737b2b

File tree

742 files changed

+36122961
-18169
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

742 files changed

+36122961
-18169
lines changed

.flake8

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,4 @@
1+
[flake8]
2+
select = C,E,F,W,B,B950
3+
ignore = E203, E501, W503
4+
builtins = C,E,Eall,Es,F,Fall,Fs,L,N,S,T,TF

docs/features/0_home.md

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,7 @@
1-
This is *continuous* version **c**.
1+
This is data version **2021**.
22

3-
To be updated regularly.
4-
5-
Viewable in [SHEBANQ]({{shebanq}}).
6-
7-
**the weekly updates have not started yet**.
3+
Viewable in [SHEBANQ]({{shebanq}}) shortly
4+
(currently the newest stable version in SHEBANQ is 2017).
85

96
## Introduction
107
This is the key to the meaning of the features of the

docs/mql.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ The good news is the existence of the other tool,
1717
This is an **offline** tool based on exactly the same data that powers SHEBANQ.
1818
The programming researcher can use Text-Fabric as a preprocessing tool for transforming the complex BHSA data into the formats that are suitable to
1919
R, spreadsheets, or any format of choice.
20-
Text-Fabric is open source, downloadable from [GitHub]({{tf}}),
20+
Text-Fabric is open source and can be installed with `pip install text-fabric`,
2121
and the data is downloadable from [bhsa]({{repo}}).
2222

2323
It can be installed on MacOS, Windows and Linux.

docs/news.md

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,10 @@
11
# Updates
22

3+
## 2021-08-24
4+
5+
Data version `2021` has arrived from the ETCBC. According to Constantijn Sikkel, it is the most
6+
consistent version ever.
7+
38
## 2019-01-31
49

510
Some features only had values for lexeme nodes: `gloss nametype voc_lex voc_lex_utf8`.
@@ -26,6 +31,8 @@ So I added the values of these features for lexemes to all of their occurrences.
2631
There is a fixed version, 2017 (imported on 2017-10-06), and a nearly identical version `c`,
2732
imported at the same time.
2833
Version `c` is continuous and will be frequently updated.
34+
(Spoiler as of 2021-08-24: these updates have only happened a few times.
35+
We discontinue continuous versions. All new versions will be stable versions.)
2936

3037
## 2017-10-05
3138

mkdocs.yml

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -13,8 +13,6 @@ extra:
1313
repo: https://github.com/ETCBC/bhsa
1414
tfBase: https://github.com/annotation/text-fabric/blob/master
1515
tut: https://nbviewer.jupyter.org/github/annotation/tutorials/blob/master/bhsa
16-
tf: https://github.com/Dans-labs/text-fabric
17-
tfw: https://github.com/Dans-labs/text-fabric/wiki
1816
tfd: https://annotation.github.io/text-fabric/tf
1917
lf: https://github.com/Dans-labs/laf-fabric
2018
shebanq: https://shebanq.ancient-data.org

primer/example10a.ipynb

Lines changed: 16 additions & 17 deletions
Original file line numberDiff line numberDiff line change
@@ -48,9 +48,8 @@
4848
"outputs": [],
4949
"source": [
5050
"from tf.app import use\n",
51-
"from tf.core.helpers import project\n",
5251
"\n",
53-
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS"
52+
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS\n"
5453
]
5554
},
5655
{
@@ -628,9 +627,9 @@
628627
}
629628
],
630629
"source": [
631-
"VERSION = '2017'\n",
630+
"VERSION = \"2017\"\n",
632631
"# A = use('bhsa', hoist=globals(), version=VERSION)\n",
633-
"A = use('bhsa:clone', checkout=\"clone\", hoist=globals(), version=VERSION)"
632+
"A = use(\"bhsa:clone\", checkout=\"clone\", hoist=globals(), version=VERSION)"
634633
]
635634
},
636635
{
@@ -814,8 +813,7 @@
814813
"clause\n",
815814
" =: phrases1\n",
816815
" <: phraseNTNps\n",
817-
"```\n",
818-
" "
816+
"```\n"
819817
]
820818
},
821819
{
@@ -973,7 +971,8 @@
973971
" consecutivePhrases.append(phrase)\n",
974972
" maxPos = end\n",
975973
" return tuple(consecutivePhrases)\n",
976-
" \n",
974+
"\n",
975+
"\n",
977976
"results = []\n",
978977
"\n",
979978
"objlike = {\"Objc\", \"Cmpl\"}\n",
@@ -983,15 +982,15 @@
983982
" ntn = r[1]\n",
984983
" obj = r[3] if len(r) == 4 else -1\n",
985984
" phrases = getPhrases(cl)\n",
986-
" \n",
985+
"\n",
987986
" predSeen = False\n",
988987
" objSeen = False\n",
989-
" \n",
988+
"\n",
990989
" good = True\n",
991-
" \n",
990+
"\n",
992991
" for p in getPhrases(cl):\n",
993992
" fn = F.function.v(p)\n",
994-
" \n",
993+
"\n",
995994
" if not predSeen and not objSeen:\n",
996995
" if p == ntn:\n",
997996
" predSeen = True\n",
@@ -1024,24 +1023,24 @@
10241023
" break\n",
10251024
" else:\n",
10261025
" continue\n",
1027-
" \n",
1026+
"\n",
10281027
" if not good:\n",
10291028
" continue\n",
1030-
" \n",
1029+
"\n",
10311030
" if not predSeen:\n",
10321031
" continue\n",
1033-
" \n",
1032+
"\n",
10341033
" pfn = F.function.v(ntn)\n",
1035-
" \n",
1034+
"\n",
10361035
" if objSeen:\n",
10371036
" if pfn == \"PreO\":\n",
10381037
" continue\n",
10391038
" else:\n",
10401039
" if pfn != \"PreO\":\n",
10411040
" continue\n",
1042-
" \n",
1041+
"\n",
10431042
" results.append((cl, ntn, obj))\n",
1044-
" \n",
1043+
"\n",
10451044
"print(f\"{len(results)} results\")"
10461045
]
10471046
},

primer/example10b.ipynb

Lines changed: 7 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -48,9 +48,8 @@
4848
"outputs": [],
4949
"source": [
5050
"from tf.app import use\n",
51-
"from tf.core.helpers import project\n",
5251
"\n",
53-
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS"
52+
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS\n"
5453
]
5554
},
5655
{
@@ -628,9 +627,9 @@
628627
}
629628
],
630629
"source": [
631-
"VERSION = '2017'\n",
630+
"VERSION = \"2017\"\n",
632631
"# A = use('bhsa', hoist=globals(), version=VERSION)\n",
633-
"A = use('bhsa:clone', checkout=\"clone\", hoist=globals(), version=VERSION)"
632+
"A = use(\"bhsa:clone\", checkout=\"clone\", hoist=globals(), version=VERSION)"
634633
]
635634
},
636635
{
@@ -708,7 +707,7 @@
708707
" word vs=qal lex=NTN[\n",
709708
" phrase function=Cmpl\n",
710709
" =: word lex=L\n",
711-
"\"\"\" "
710+
"\"\"\""
712711
]
713712
},
714713
{
@@ -1058,7 +1057,7 @@
10581057
" word vs=qal lex=NTN[\n",
10591058
" phrase function=Cmpl\n",
10601059
" =: word lex=L\n",
1061-
"\"\"\" "
1060+
"\"\"\""
10621061
]
10631062
},
10641063
{
@@ -1169,7 +1168,7 @@
11691168
" word vs=qal lex=NTN[\n",
11701169
" <: phrase function=Cmpl\n",
11711170
" =: word lex=L\n",
1172-
"\"\"\" "
1171+
"\"\"\""
11731172
]
11741173
},
11751174
{
@@ -1284,7 +1283,7 @@
12841283
" word lex=NTN[\n",
12851284
" phrase function=Subj\n",
12861285
" =: word lex=HJ>\n",
1287-
"\"\"\" "
1286+
"\"\"\""
12881287
]
12891288
},
12901289
{

primer/example2.ipynb

Lines changed: 10 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -48,9 +48,8 @@
4848
"outputs": [],
4949
"source": [
5050
"from tf.app import use\n",
51-
"from tf.core.helpers import project\n",
5251
"\n",
53-
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS"
52+
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS\n"
5453
]
5554
},
5655
{
@@ -628,9 +627,9 @@
628627
}
629628
],
630629
"source": [
631-
"VERSION = '2017'\n",
630+
"VERSION = \"2017\"\n",
632631
"# A = use('bhsa', hoist=globals(), version=VERSION)\n",
633-
"A = use('bhsa:clone', checkout=\"clone\", hoist=globals(), version=VERSION)"
632+
"A = use(\"bhsa:clone\", checkout=\"clone\", hoist=globals(), version=VERSION)"
634633
]
635634
},
636635
{
@@ -799,7 +798,7 @@
799798
"\n",
800799
"is *not* matched by words 116853 and **116854**, because 116854 is not part of the embedding clause.\n",
801800
"\n",
802-
"The Text-Fabric notion of adjacency is more crude. \n",
801+
"The Text-Fabric notion of adjacency is more crude.\n",
803802
"The reason is that in Text-Fabric, the query does not have to be a tree, where each object has a unique\n",
804803
"immediate embedder object. There could be several embedder objects in the query, and each of them may have different\n",
805804
"gaps, and if we had the concept of relative adjacency, our query language would need a way to express relative to which object\n",
@@ -969,19 +968,19 @@
969968
"Let's make a mental shift: what *is* the intention of the MQL query?\n",
970969
"Here is a bit of query-exegesis, in that the query itself is the object of the exegesis.\n",
971970
"\n",
972-
"The MQL query mentions three `[word]` objects, but it puts only the first two of them in `FOCUS`. \n",
971+
"The MQL query mentions three `[word]` objects, but it puts only the first two of them in `FOCUS`.\n",
973972
"\n",
974973
"1. it is not interested in the actual value of the third one;\n",
975974
"2. the third `[word]` is constrained by a very loose restriction: it can be anything, except two specific values.\n",
976975
"\n",
977976
"These two things point to the intended meaning of the query, namely:\n",
978977
"\n",
979-
"> find a clause with the word `FJM[`, and somewhere after that the word `L`, \n",
978+
"> find a clause with the word `FJM[`, and somewhere after that the word `L`,\n",
980979
"which is not followed by either the word `<JN/` or the word `PNH/`.\n",
981980
"\n",
982981
"This differs subtly from what the query actually says:\n",
983982
"\n",
984-
"> find a clause with the word `FJM[`, and somewhere after that the word `L`, \n",
983+
"> find a clause with the word `FJM[`, and somewhere after that the word `L`,\n",
985984
"which is followed by another word that is not `<JN/` and not `PNH/`.\n",
986985
"\n",
987986
"The difference is one of *quantification*.\n",
@@ -1013,7 +1012,7 @@
10131012
"\n",
10141013
"```\n",
10151014
"\n",
1016-
"See \n",
1015+
"See\n",
10171016
"[Dirk Roorda: Example 2: not exist](https://shebanq.ancient-data.org/hebrew/query?version=2017&id=4467)"
10181017
]
10191018
},
@@ -1319,15 +1318,15 @@
13191318
"\n",
13201319
"We tried to improve the MQL query by using `NOTEXIST`, but that did not work out.\n",
13211320
"\n",
1322-
"However, the TF query might include (contrived) cases that the MQL query would rightfully skip. \n",
1321+
"However, the TF query might include (contrived) cases that the MQL query would rightfully skip.\n",
13231322
"We can verify whether those cases actually exist by running a separate TF query, and it turns out they do not exist.\n",
13241323
"\n",
13251324
"**Lesson**\n",
13261325
"\n",
13271326
"Whenever an exegesis hinges on the results of a query, check and double check.\n",
13281327
"You probably will have to run multiple queries in SHEBANQ and combine the results.\n",
13291328
"This will quickly get very cumbersome.\n",
1330-
"If that happens, it starts to pay off to use Text-Fabric, where you have more complete power over \n",
1329+
"If that happens, it starts to pay off to use Text-Fabric, where you have more complete power over\n",
13311330
"the computations and their results."
13321331
]
13331332
}

primer/example7.ipynb

Lines changed: 7 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -48,9 +48,8 @@
4848
"outputs": [],
4949
"source": [
5050
"from tf.app import use\n",
51-
"from tf.core.helpers import project\n",
5251
"\n",
53-
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS"
52+
"from util import getTfVerses, getShebanqData, compareResults, MQL_RESULTS\n"
5453
]
5554
},
5655
{
@@ -628,9 +627,9 @@
628627
}
629628
],
630629
"source": [
631-
"VERSION = '2017'\n",
630+
"VERSION = \"2017\"\n",
632631
"# A = use('bhsa', hoist=globals(), version=VERSION)\n",
633-
"A = use('bhsa:clone', checkout=\"clone\", hoist=globals(), version=VERSION)"
632+
"A = use(\"bhsa:clone\", checkout=\"clone\", hoist=globals(), version=VERSION)"
634633
]
635634
},
636635
{
@@ -754,7 +753,7 @@
754753
"metadata": {},
755754
"outputs": [],
756755
"source": [
757-
"query1= \"\"\"\n",
756+
"query1 = \"\"\"\n",
758757
"clause\n",
759758
" phrase function=PreO|PtcO\n",
760759
" word sp=verb vs=qal lex=FJM[\n",
@@ -995,6 +994,9 @@
995994
}
996995
],
997996
"metadata": {
997+
"jupytext": {
998+
"encoding": "# -*- coding: utf-8 -*-"
999+
},
9981000
"kernelspec": {
9991001
"display_name": "Python 3",
10001002
"language": "python",

0 commit comments

Comments
 (0)