From e84c2da7f42e95b39eb76268599a5a8bb4faca73 Mon Sep 17 00:00:00 2001 From: MuffinLinwist Date: Mon, 5 Aug 2024 12:43:30 +0200 Subject: [PATCH 1/2] =?UTF-8?q?=E2=80=9Cupdate=E2=80=9D?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .github/workflows/cldf-validation.yml | 2 +- .zenodo.json | 4 +- CONTRIBUTORS.md | 2 +- README.md | 10 ++--- cldf/README.md | 6 +-- cldf/cldf-metadata.json | 12 +++--- cldf/languages.csv | 4 +- cldf/lingpy-rcParams.json | 4 +- cldf/parameters.csv | 2 +- cldf/requirements.txt | 62 +++++++++++++-------------- etc/languages.csv | 4 +- lexibank_luangthongkumkaren.py | 1 + metadata.json | 2 +- 13 files changed, 57 insertions(+), 58 deletions(-) diff --git a/.github/workflows/cldf-validation.yml b/.github/workflows/cldf-validation.yml index 48ab092..b2f938e 100644 --- a/.github/workflows/cldf-validation.yml +++ b/.github/workflows/cldf-validation.yml @@ -12,7 +12,7 @@ jobs: runs-on: ubuntu-latest strategy: matrix: - python-version: [3.9] + python-version: [3.12] steps: - uses: actions/checkout@v2 diff --git a/.zenodo.json b/.zenodo.json index a7d70a6..9b07a23 100644 --- a/.zenodo.json +++ b/.zenodo.json @@ -7,7 +7,7 @@ ], "creators": [ { - "name": "Luangthongkum, T." + "name": "Luangthongkum, Theraphan" } ], "contributors": [ @@ -22,7 +22,7 @@ } ], "upload_type": "dataset", - "description": "

Cite the source of the dataset as:

\n\n
\n

Luangthongkum, T. (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441

\n
", + "description": "

Cite the source of the dataset as:

\n\n
\n

Luangthongkum, Theraphan (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441

\n
", "license": { "id": "CC-BY-NC-ND-4.0" } diff --git a/CONTRIBUTORS.md b/CONTRIBUTORS.md index 9700004..6550ef1 100644 --- a/CONTRIBUTORS.md +++ b/CONTRIBUTORS.md @@ -2,5 +2,5 @@ Name | GitHub user | Description | Role --- | --- | --- | --- -Luangthongkum, T. | | data collection | Author +Luangthongkum, Theraphan | | data collection | Author Johann-Mattis List | @lingulist | code, integration | Editor diff --git a/README.md b/README.md index 1684ed0..117235f 100644 --- a/README.md +++ b/README.md @@ -6,7 +6,7 @@ If you use these data please cite - the original source - > Luangthongkum, T. (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441 + > Luangthongkum, Theraphan (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441 - the derived dataset using the DOI of the [particular released version](../../releases/) you were using ## Description @@ -23,14 +23,14 @@ Conceptlists in Concepticon: [![CLDF validation](https://github.com/lexibank/luangthongkumkaren/workflows/CLDF-validation/badge.svg)](https://github.com/lexibank/luangthongkumkaren/actions?query=workflow%3ACLDF-validation) -![Glottolog: 81%](https://img.shields.io/badge/Glottolog-81%25-yellowgreen.svg "Glottolog: 81%") +![Glottolog: 100%](https://img.shields.io/badge/Glottolog-100%25-brightgreen.svg "Glottolog: 100%") ![Concepticon: 74%](https://img.shields.io/badge/Concepticon-74%25-yellow.svg "Concepticon: 74%") ![Source: 0%](https://img.shields.io/badge/Source-0%25-red.svg "Source: 0%") ![BIPA: 100%](https://img.shields.io/badge/BIPA-100%25-brightgreen.svg "BIPA: 100%") ![CLTS SoundClass: 100%](https://img.shields.io/badge/CLTS%20SoundClass-100%25-brightgreen.svg "CLTS SoundClass: 100%") -- **Varieties:** 11 -- **Concepts:** 341 +- **Varieties:** 11 (linked to 11 different Glottocodes) +- **Concepts:** 341 (linked to 249 different Concepticon concept sets) - **Lexemes:** 3,233 - **Sources:** 0 - **Synonymy:** 1.01 @@ -51,7 +51,7 @@ Conceptlists in Concepticon: Name | GitHub user | Description | Role --- | --- | --- | --- -Luangthongkum, T. | | data collection | Author +Luangthongkum, Theraphan | | data collection | Author Johann-Mattis List | @lingulist | code, integration | Editor diff --git a/cldf/README.md b/cldf/README.md index e7e09e3..f1f9ff3 100644 --- a/cldf/README.md +++ b/cldf/README.md @@ -8,14 +8,14 @@ property | value --- | --- -[dc:bibliographicCitation](http://purl.org/dc/terms/bibliographicCitation) | Luangthongkum, T. (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441 +[dc:bibliographicCitation](http://purl.org/dc/terms/bibliographicCitation) | Luangthongkum, Theraphan (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441 [dc:conformsTo](http://purl.org/dc/terms/conformsTo) | [CLDF Wordlist](http://cldf.clld.org/v1.0/terms.rdf#Wordlist) [dc:format](http://purl.org/dc/terms/format) |
  1. http://concepticon.clld.org/contributions/Luangthongkum-2019-341
[dc:identifier](http://purl.org/dc/terms/identifier) | http://hdl.handle.net/10524/52441 [dc:license](http://purl.org/dc/terms/license) | https://creativecommons.org/licenses/by-nc-nd/4.0/ [dcat:accessURL](http://www.w3.org/ns/dcat#accessURL) | https://github.com/lexibank/luangthongkumkaren -[prov:wasDerivedFrom](http://www.w3.org/ns/prov#wasDerivedFrom) |
  1. lexibank/luangthongkumkaren v1.0-6-gd0de437
  2. Glottolog v4.8
  3. Concepticon v3.1.0
  4. CLTS v2.2.0
-[prov:wasGeneratedBy](http://www.w3.org/ns/prov#wasGeneratedBy) |
  1. lingpy-rcParams: lingpy-rcParams.json
  2. python: 3.11.7
  3. python-packages: requirements.txt
+[prov:wasDerivedFrom](http://www.w3.org/ns/prov#wasDerivedFrom) |
  1. lexibank/luangthongkumkaren v1.0-1-gce3eb62
  2. Glottolog v5.0
  3. Concepticon v3.2.0
  4. CLTS v2.3.0
+[prov:wasGeneratedBy](http://www.w3.org/ns/prov#wasGeneratedBy) |
  1. lingpy-rcParams: lingpy-rcParams.json
  2. python: 3.9.6
  3. python-packages: requirements.txt
[rdf:ID](http://www.w3.org/1999/02/22-rdf-syntax-ns#ID) | luangthongkumkaren [rdf:type](http://www.w3.org/1999/02/22-rdf-syntax-ns#type) | http://www.w3.org/ns/dcat#Distribution diff --git a/cldf/cldf-metadata.json b/cldf/cldf-metadata.json index 25b2597..dbd0a84 100644 --- a/cldf/cldf-metadata.json +++ b/cldf/cldf-metadata.json @@ -1,7 +1,7 @@ { "@context": "http://www.w3.org/ns/csvw", "aboutUrl": null, - "dc:bibliographicCitation": "Luangthongkum, T. (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441", + "dc:bibliographicCitation": "Luangthongkum, Theraphan (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441", "dc:conformsTo": "http://cldf.clld.org/v1.0/terms.rdf#Wordlist", "dc:format": [ "http://concepticon.clld.org/contributions/Luangthongkum-2019-341" @@ -17,25 +17,25 @@ { "rdf:about": "https://github.com/lexibank/luangthongkumkaren", "rdf:type": "prov:Entity", - "dc:created": "v1.0-6-gd0de437", + "dc:created": "v1.0-1-gce3eb62", "dc:title": "Repository" }, { "rdf:about": "https://github.com/glottolog/glottolog", "rdf:type": "prov:Entity", - "dc:created": "v4.8", + "dc:created": "v5.0", "dc:title": "Glottolog" }, { "rdf:about": "https://github.com/concepticon/concepticon-data", "rdf:type": "prov:Entity", - "dc:created": "v3.1.0", + "dc:created": "v3.2.0", "dc:title": "Concepticon" }, { "rdf:about": "https://github.com/cldf-clts/clts", "rdf:type": "prov:Entity", - "dc:created": "v2.2.0", + "dc:created": "v2.3.0", "dc:title": "CLTS" } ], @@ -46,7 +46,7 @@ }, { "dc:title": "python", - "dc:description": "3.11.7" + "dc:description": "3.9.6" }, { "dc:title": "python-packages", diff --git a/cldf/languages.csv b/cldf/languages.csv index e7e020c..6fae392 100644 --- a/cldf/languages.csv +++ b/cldf/languages.csv @@ -5,8 +5,8 @@ Kayan,Kayan,kaya1315,Kayan Lahwi,pdu,Eurasia,19.5183,97.4138,Sino-Tibetan Kayaw,Kayaw,brek1238,Brek Karen,kvl,Eurasia,19.0561,96.8365,Sino-Tibetan NorthernPao,Northern Pa-O,nort2705,Northern Pa'o,,Eurasia,,,Sino-Tibetan NorthernPwo,Northern Pwo,pwon1235,Pwo Northern Karen,pww,Eurasia,18.016,98.2709,Sino-Tibetan -NorthernSgaw,Northern Sgaw,,,,,,, +NorthernSgaw,Northern Sgaw,wewa1238,Wewaw,wea,Eurasia,19.020577,96.540526,Sino-Tibetan SouthernPao,Southern Pa-O,sout2712,Southern Pa'o,,Eurasia,,,Sino-Tibetan -SouthernPwo,Southern Pwo,,,,,,, +SouthernPwo,Southern Pwo,pwoe1235,Pwo Eastern Karen,kjp,Eurasia,15.1915,98.7355,Sino-Tibetan SouthernSgaw,Southern Sgaw,sgaw1245,S'gaw Karen,ksw,Eurasia,17.9872,97.7126,Sino-Tibetan WesternBwe,Western Bwe,bwek1238,Bwe Karen,bwe,Eurasia,18.9796,96.9936,Sino-Tibetan diff --git a/cldf/lingpy-rcParams.json b/cldf/lingpy-rcParams.json index 5e1b443..9e8c502 100644 --- a/cldf/lingpy-rcParams.json +++ b/cldf/lingpy-rcParams.json @@ -64,7 +64,7 @@ 10, 10 ], - "filename": "lingpy-2024-02-14", + "filename": "lingpy-2024-08-05", "gap_symbol": "-", "gap_weight": 0.5, "gop": -2, @@ -123,7 +123,7 @@ "scorer": {}, "sonar": true, "stress": "\u02c8\u02cc'", - "timestamp": "2024-02-14 12:49", + "timestamp": "2024-08-05 12:40", "tones": "\u00b9\u00b2\u00b3\u2074\u2075\u2076\u2077\u2078\u2079\u2070\u2081\u2082\u2083\u2084\u2085\u2086\u2087\u2088\u2089\u20800123456789\u02e5\u02e6\u02e7\u02e8\u02e9\u02ea\u02eb-\ua708-\ua709-\ua70a-\ua70b-\ua70c-\ua70d-\ua70e-\ua70f-\ua710-\ua711-\ua712-\ua713-\ua714-\ua715-\ua716-\ua717-\ua718-\ua719-\ua71a-\ua700-\ua701-\ua702-\ua703-\ua704-\ua705-\ua706-\ua707", "tree_calc": "neighbor", "unique_sequences": true, diff --git a/cldf/parameters.csv b/cldf/parameters.csv index 4543bda..44c4548 100644 --- a/cldf/parameters.csv +++ b/cldf/parameters.csv @@ -219,7 +219,7 @@ ID,Name,Concepticon_ID,Concepticon_Gloss 218_pig,pig,1337,PIG 219_pile,pile,, 220_pointedasofneedlessharppoint,"pointed (as of needles), sharp point",372,POINTED -221_pole,pole,282,POLE +221_pole,pole,281,POST 222_porcupine,porcupine,2510,PORCUPINE 223_porcupinebrushtailed,porcupine (brush-tailed~),, 224_pot,pot,1462,POT diff --git a/cldf/requirements.txt b/cldf/requirements.txt index 0ed49d6..9d8144f 100644 --- a/cldf/requirements.txt +++ b/cldf/requirements.txt @@ -1,59 +1,57 @@ appdirs==1.4.4 -attrs==23.2.0 -Babel==2.14.0 -bibtexparser==2.0.0b6 +attrs==24.1.0 +Babel==2.15.0 +bibtexparser==2.0.0b7 bs4==0.0.2 -certifi==2024.2.2 +certifi==2024.7.4 cldfbench==1.14.0 cldfcatalog==1.5.1 -cldfzenodo==2.1.0 -clldutils==3.22.1 +cldfzenodo==2.1.1 +clldutils==3.22.2 colorama==0.4.6 colorlog==6.8.2 csvw==3.3.0 +exceptiongroup==1.2.2 gitdb==4.0.11 -greenlet==3.0.3 -idna==3.6 +idna==3.7 iniconfig==2.0.0 isodate==0.6.1 -jsonschema==4.21.1 -lexibank_luangthongkumkaren==0.0.0 +jsonschema==4.23.0 lingpy==2.6.13 -lxml==5.1.0 -Markdown==3.5.2 +lxml==5.2.2 +Markdown==3.6 nameparser==1.1.3 networkx==3.2.1 newick==1.9.0 -numpy==1.26.4 -openpyxl==3.1.2 -packaging==23.2 -pluggy==1.4.0 -purl==1.6 +numpy==2.0.1 +openpyxl==3.1.5 +packaging==24.1 +pluggy==1.5.0 pybtex==0.24.0 -pycldf==1.37.0 -pyclts==3.1.1 -pyconcepticon==3.0.0 -pycountry==23.12.11 -pyedictor==0.4 -pyglottolog==3.12.0 +pycldf==1.38.1 +pyclts==3.2.0 +pyconcepticon==3.1.0 +pycountry==24.6.1 +pyedictor==0.5 +pyglottolog==3.13.0 pylatexenc==2.10 -pylexibank==3.4.0 -pytest==8.0.0 -python-dateutil==2.8.2 +pylexibank==3.5.0 +pytest==8.3.2 +python-dateutil==2.9.0.post0 rdflib==7.0.0 -referencing==0.33.0 -regex==2023.12.25 -requests==2.31.0 +referencing==0.35.1 +regex==2024.7.24 +requests==2.32.3 rfc3986==1.5.0 segments==2.2.1 six==1.16.0 smmap==5.0.1 soupsieve==2.5 -SQLAlchemy==1.4.51 +SQLAlchemy==1.4.53 tabulate==0.9.0 termcolor==2.4.0 -tqdm==4.66.2 +tqdm==4.66.5 uritemplate==4.1.1 -urllib3==2.2.0 +urllib3==2.2.2 xlrd==2.0.1 zenodoclient==0.5.1 \ No newline at end of file diff --git a/etc/languages.csv b/etc/languages.csv index 797302d..39c3cf6 100644 --- a/etc/languages.csv +++ b/etc/languages.csv @@ -9,8 +9,8 @@ Kayan,Kayan,kaya1315 Kayaw,Kayaw,brek1238 NorthernPao,Northern Pa-O,nort2705 NorthernPwo,Northern Pwo,pwon1235 -NorthernSgaw,Northern Sgaw, +NorthernSgaw,Northern Sgaw,wewa1238 SouthernPao,Southern Pa-O,sout2712 -SouthernPwo,Southern Pwo, +SouthernPwo,Southern Pwo,pwoe1235 SouthernSgaw,Southern Sgaw,sgaw1245 WesternBwe,Western Bwe,bwek1238 diff --git a/lexibank_luangthongkumkaren.py b/lexibank_luangthongkumkaren.py index f3a0c87..b1641dd 100644 --- a/lexibank_luangthongkumkaren.py +++ b/lexibank_luangthongkumkaren.py @@ -21,6 +21,7 @@ class Dataset(BaseDataset): id = "luangthongkumkaren" cognate_class = CustomCognate lexeme_class = CustomLexeme + writer_options = dict(keep_languages=False, keep_parameters=False) form_spec = FormSpec( separators="/,", missing_data=["---", "- (?)"], diff --git a/metadata.json b/metadata.json index cde4468..d06eda4 100644 --- a/metadata.json +++ b/metadata.json @@ -1,6 +1,6 @@ { "url": "http://hdl.handle.net/10524/52441", - "citation": "Luangthongkum, T. (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441", + "citation": "Luangthongkum, Theraphan (2019). A View on Proto-Karen Phonology and Lexicon, Journal of Southest Asian Linguistics Society, 12.1, i-lii. doi: http://hdl.handle.net/10524/52441", "conceptlist": ["Luangthongkum-2019-341"], "license": "CC-BY-NC-ND-4.0", "title": "CLDF dataset derived from Luangthongkum's \"Proto-Karen Phonology and Lexicon\" from 2019" From 1b2799f2872540fa9652d9c2b406f02cc6441f90 Mon Sep 17 00:00:00 2001 From: MuffinLinwist Date: Mon, 5 Aug 2024 12:51:59 +0200 Subject: [PATCH 2/2] glottocodes --- cldf/README.md | 2 +- cldf/cldf-metadata.json | 2 +- cldf/languages.csv | 2 +- cldf/lingpy-rcParams.json | 2 +- etc/languages.csv | 2 +- 5 files changed, 5 insertions(+), 5 deletions(-) diff --git a/cldf/README.md b/cldf/README.md index f1f9ff3..2046248 100644 --- a/cldf/README.md +++ b/cldf/README.md @@ -14,7 +14,7 @@ property | value [dc:identifier](http://purl.org/dc/terms/identifier) | http://hdl.handle.net/10524/52441 [dc:license](http://purl.org/dc/terms/license) | https://creativecommons.org/licenses/by-nc-nd/4.0/ [dcat:accessURL](http://www.w3.org/ns/dcat#accessURL) | https://github.com/lexibank/luangthongkumkaren -[prov:wasDerivedFrom](http://www.w3.org/ns/prov#wasDerivedFrom) |
  1. lexibank/luangthongkumkaren v1.0-1-gce3eb62
  2. Glottolog v5.0
  3. Concepticon v3.2.0
  4. CLTS v2.3.0
+[prov:wasDerivedFrom](http://www.w3.org/ns/prov#wasDerivedFrom) |
  1. lexibank/luangthongkumkaren v1.0-2-ge84c2da
  2. Glottolog v5.0
  3. Concepticon v3.2.0
  4. CLTS v2.3.0
[prov:wasGeneratedBy](http://www.w3.org/ns/prov#wasGeneratedBy) |
  1. lingpy-rcParams: lingpy-rcParams.json
  2. python: 3.9.6
  3. python-packages: requirements.txt
[rdf:ID](http://www.w3.org/1999/02/22-rdf-syntax-ns#ID) | luangthongkumkaren [rdf:type](http://www.w3.org/1999/02/22-rdf-syntax-ns#type) | http://www.w3.org/ns/dcat#Distribution diff --git a/cldf/cldf-metadata.json b/cldf/cldf-metadata.json index dbd0a84..9cc7046 100644 --- a/cldf/cldf-metadata.json +++ b/cldf/cldf-metadata.json @@ -17,7 +17,7 @@ { "rdf:about": "https://github.com/lexibank/luangthongkumkaren", "rdf:type": "prov:Entity", - "dc:created": "v1.0-1-gce3eb62", + "dc:created": "v1.0-2-ge84c2da", "dc:title": "Repository" }, { diff --git a/cldf/languages.csv b/cldf/languages.csv index 6fae392..f4575cf 100644 --- a/cldf/languages.csv +++ b/cldf/languages.csv @@ -1,6 +1,6 @@ ID,Name,Glottocode,Glottolog_Name,ISO639P3code,Macroarea,Latitude,Longitude,Family ProtoKaren,Proto-Karen,kare1337,Karenic,,,,,Sino-Tibetan -Kayah,Kayah,east2342,Eastern Kayah,eky,Eurasia,19.8939,98.3359,Sino-Tibetan +Kayah,Kayah,kaya1317,Kayah,,,,,Sino-Tibetan Kayan,Kayan,kaya1315,Kayan Lahwi,pdu,Eurasia,19.5183,97.4138,Sino-Tibetan Kayaw,Kayaw,brek1238,Brek Karen,kvl,Eurasia,19.0561,96.8365,Sino-Tibetan NorthernPao,Northern Pa-O,nort2705,Northern Pa'o,,Eurasia,,,Sino-Tibetan diff --git a/cldf/lingpy-rcParams.json b/cldf/lingpy-rcParams.json index 9e8c502..2d0646a 100644 --- a/cldf/lingpy-rcParams.json +++ b/cldf/lingpy-rcParams.json @@ -123,7 +123,7 @@ "scorer": {}, "sonar": true, "stress": "\u02c8\u02cc'", - "timestamp": "2024-08-05 12:40", + "timestamp": "2024-08-05 12:51", "tones": "\u00b9\u00b2\u00b3\u2074\u2075\u2076\u2077\u2078\u2079\u2070\u2081\u2082\u2083\u2084\u2085\u2086\u2087\u2088\u2089\u20800123456789\u02e5\u02e6\u02e7\u02e8\u02e9\u02ea\u02eb-\ua708-\ua709-\ua70a-\ua70b-\ua70c-\ua70d-\ua70e-\ua70f-\ua710-\ua711-\ua712-\ua713-\ua714-\ua715-\ua716-\ua717-\ua718-\ua719-\ua71a-\ua700-\ua701-\ua702-\ua703-\ua704-\ua705-\ua706-\ua707", "tree_calc": "neighbor", "unique_sequences": true, diff --git a/etc/languages.csv b/etc/languages.csv index 39c3cf6..827b7f8 100644 --- a/etc/languages.csv +++ b/etc/languages.csv @@ -4,7 +4,7 @@ ProtoKarenBurling,Proto-Karen (Burling),kare1337 ProtoNorthernkaren,Proto-Northern-Karen,nort2703 ProtoCentralKaren,Proto-Central-Karen,cent1999 ProtoSouthernKaren,Proto-Southern-Karen,sout1554 -Kayah,Kayah,east2342 +Kayah,Kayah,kaya1317 Kayan,Kayan,kaya1315 Kayaw,Kayaw,brek1238 NorthernPao,Northern Pa-O,nort2705