From 9329960011eaa9fb929e63a962f492f9686e578d Mon Sep 17 00:00:00 2001 From: Andrew Tavis McAllister Date: Thu, 24 Oct 2024 14:48:23 +0200 Subject: [PATCH] #405 finalize Northern Sami and fix proper noun docstrings --- .../basque/proper_nouns/query_proper_nouns.sparql | 4 ++-- .../bengali/proper_nouns/query_proper_nouns.sparql | 2 +- .../english/proper_nouns/query_proper_nouns.sparql | 2 +- .../finnish/proper_nouns/query_proper_nouns.sparql | 2 +- .../hebrew/proper_nouns/query_proper_nouns.sparql | 2 +- .../italian/proper_nouns/query_proper_nouns.sparql | 2 +- .../japanese/proper_nouns/query_proper_nouns.sparql | 2 +- .../kurmanji/proper_nouns/query_proper_nouns.sparql | 2 +- .../malay/proper_nouns/query_proper_nouns.sparql | 2 +- .../proper_nouns/query_proper_nouns.sparql | 2 +- .../polish/proper_nouns/query_proper_nouns.sparql | 2 +- .../proper_nouns/query_proper_nouns.sparql | 2 +- .../gurmukhi/proper_nouns/query_proper_nouns.sparql | 2 +- .../proper_nouns/query_proper_nouns.sparql | 2 +- .../russian/proper_nouns/query_proper_nouns.sparql | 2 +- .../northern/prepositions/query_prepositions.sparql | 13 +++++++++++++ .../northern/proper_nouns/query_proper_nouns.sparql | 13 +++++++++++++ .../spanish/proper_nouns/query_proper_nouns.sparql | 2 +- .../tajik/proper_nouns/query_proper_nouns.sparql | 2 +- .../tamil/proper_nouns/query_proper_nouns.sparql | 2 +- .../yoruba/proper_nouns/query_proper_nouns.sparql | 2 +- 21 files changed, 46 insertions(+), 20 deletions(-) create mode 100644 src/scribe_data/wikidata/language_data_extraction/sami/northern/prepositions/query_prepositions.sparql create mode 100644 src/scribe_data/wikidata/language_data_extraction/sami/northern/proper_nouns/query_proper_nouns.sparql diff --git a/src/scribe_data/wikidata/language_data_extraction/basque/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/basque/proper_nouns/query_proper_nouns.sparql index 5414cef9d..a6be52e77 100644 --- 
a/src/scribe_data/wikidata/language_data_extraction/basque/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/basque/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Basque (Q8752) nouns (Q1084) and the given forms. +# All Basque (Q8752) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT @@ -8,6 +8,6 @@ SELECT WHERE { ?lexeme dct:language wd:Q8752 ; - wikibase:lexicalCategory wd:Q147276; + wikibase:lexicalCategory wd:Q147276 ; wikibase:lemma ?properNoun . } diff --git a/src/scribe_data/wikidata/language_data_extraction/bengali/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/bengali/proper_nouns/query_proper_nouns.sparql index f795cc083..d463fc848 100644 --- a/src/scribe_data/wikidata/language_data_extraction/bengali/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/bengali/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Bengali (Bangla Q9610) nouns (Q1084) and the given forms. +# All Bengali (Bangla Q9610) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/english/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/english/proper_nouns/query_proper_nouns.sparql index 732b7e61e..7d56acbd2 100644 --- a/src/scribe_data/wikidata/language_data_extraction/english/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/english/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All English (Q1860) nouns (Q1084) and the given forms. +# All English (Q1860) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. 
SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/finnish/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/finnish/proper_nouns/query_proper_nouns.sparql index 78c6b30ba..47bdd90e2 100644 --- a/src/scribe_data/wikidata/language_data_extraction/finnish/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/finnish/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Finnish (Q1412) nouns (Q1084) and the given forms. +# All Finnish (Q1412) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/hebrew/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/hebrew/proper_nouns/query_proper_nouns.sparql index c252b0b60..f3ed756f5 100644 --- a/src/scribe_data/wikidata/language_data_extraction/hebrew/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/hebrew/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Hebrew (Q9288) nouns (Q1084) and the given forms. +# All Hebrew (Q9288) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/italian/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/italian/proper_nouns/query_proper_nouns.sparql index f6f3518ab..e24635171 100644 --- a/src/scribe_data/wikidata/language_data_extraction/italian/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/italian/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Italian (Q652) nouns (Q1084) and the given forms. +# All Italian (Q652) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. 
SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/japanese/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/japanese/proper_nouns/query_proper_nouns.sparql index 98761a1a7..5295ba897 100644 --- a/src/scribe_data/wikidata/language_data_extraction/japanese/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/japanese/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Japanese (Q5287) nouns (Q1084) and the given forms. +# All Japanese (Q5287) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/kurmanji/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/kurmanji/proper_nouns/query_proper_nouns.sparql index 13f6609ae..5e4c53c96 100644 --- a/src/scribe_data/wikidata/language_data_extraction/kurmanji/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/kurmanji/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Kurmanji (Q36163) nouns (Q1084) and the given forms. +# All Kurmanji (Q36163) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/malay/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/malay/proper_nouns/query_proper_nouns.sparql index 8c8f4c869..e447e0a6a 100644 --- a/src/scribe_data/wikidata/language_data_extraction/malay/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/malay/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Malay (Q9237) nouns (Q1084) and the given forms. +# All Malay (Q9237) proper nouns (Q147276) and the given forms. 
# Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/malayalam/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/malayalam/proper_nouns/query_proper_nouns.sparql index b8d830057..72dc68a8b 100644 --- a/src/scribe_data/wikidata/language_data_extraction/malayalam/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/malayalam/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Malayalam (Q36236) nouns (Q1084) and the given forms and the given forms. +# All Malayalam (Q36236) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/polish/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/polish/proper_nouns/query_proper_nouns.sparql index 1c0091615..1c94ce1e1 100644 --- a/src/scribe_data/wikidata/language_data_extraction/polish/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/polish/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Polish (Q809) nouns (Q1084) and the given forms. +# All Polish (Q809) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/portuguese/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/portuguese/proper_nouns/query_proper_nouns.sparql index 602bbdfde..3484a9b08 100644 --- a/src/scribe_data/wikidata/language_data_extraction/portuguese/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/portuguese/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Portuguese (Q5146) nouns (Q1084) and the given forms. 
+# All Portuguese (Q5146) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/punjabi/gurmukhi/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/punjabi/gurmukhi/proper_nouns/query_proper_nouns.sparql index 3027ba33b..ebea83057 100644 --- a/src/scribe_data/wikidata/language_data_extraction/punjabi/gurmukhi/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/punjabi/gurmukhi/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Gurmukhi (from Punjabi Q58635) nouns (Q1084) and the given forms. +# All Gurmukhi (from Punjabi Q58635) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. # Note: We need to filter for "pa" to select Gurmukhi words. diff --git a/src/scribe_data/wikidata/language_data_extraction/punjabi/shahmukhi/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/punjabi/shahmukhi/proper_nouns/query_proper_nouns.sparql index aef337511..40c90d7c3 100644 --- a/src/scribe_data/wikidata/language_data_extraction/punjabi/shahmukhi/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/punjabi/shahmukhi/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Shahmukhi (from Punjabi Q58635) nouns (Q1084) and the given forms. +# All Shahmukhi (from Punjabi Q58635) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. # Note: We need to filter for "pnb" to select Shahmukhi words. 
diff --git a/src/scribe_data/wikidata/language_data_extraction/russian/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/russian/proper_nouns/query_proper_nouns.sparql index 2f0e79f82..63f8c9d31 100644 --- a/src/scribe_data/wikidata/language_data_extraction/russian/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/russian/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Russian (Q7737) nouns (Q1084) and the given forms. +# All Russian (Q7737) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/sami/northern/prepositions/query_prepositions.sparql b/src/scribe_data/wikidata/language_data_extraction/sami/northern/prepositions/query_prepositions.sparql new file mode 100644 index 000000000..37d3ac9e2 --- /dev/null +++ b/src/scribe_data/wikidata/language_data_extraction/sami/northern/prepositions/query_prepositions.sparql @@ -0,0 +1,13 @@ +# tool: scribe-data +# All Northern Sami (Q33947) prepositions (Q4833830) and the given forms. +# Enter this query at https://query.wikidata.org/. + +SELECT + (REPLACE(STR(?lexeme), "http://www.wikidata.org/entity/", "") AS ?lexemeID) + ?preposition + +WHERE { + ?lexeme dct:language wd:Q33947 ; + wikibase:lexicalCategory wd:Q4833830 ; + wikibase:lemma ?preposition . +} diff --git a/src/scribe_data/wikidata/language_data_extraction/sami/northern/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/sami/northern/proper_nouns/query_proper_nouns.sparql new file mode 100644 index 000000000..2d0a70540 --- /dev/null +++ b/src/scribe_data/wikidata/language_data_extraction/sami/northern/proper_nouns/query_proper_nouns.sparql @@ -0,0 +1,13 @@ +# tool: scribe-data +# All Northern Sami (Q33947) proper nouns (Q147276) and the given forms. +# Enter this query at https://query.wikidata.org/. 
+ +SELECT + (REPLACE(STR(?lexeme), "http://www.wikidata.org/entity/", "") AS ?lexemeID) + ?properNoun + +WHERE { + ?lexeme dct:language wd:Q33947 ; + wikibase:lexicalCategory wd:Q147276 ; + wikibase:lemma ?properNoun . +} diff --git a/src/scribe_data/wikidata/language_data_extraction/spanish/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/spanish/proper_nouns/query_proper_nouns.sparql index 3197d13b7..5c98d4bb4 100644 --- a/src/scribe_data/wikidata/language_data_extraction/spanish/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/spanish/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Spanish (Q1321) nouns (Q1084) and the given forms. +# All Spanish (Q1321) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/tajik/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/tajik/proper_nouns/query_proper_nouns.sparql index 5fecf6c2c..0d782fec3 100644 --- a/src/scribe_data/wikidata/language_data_extraction/tajik/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/tajik/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Tajik (Q9260) nouns (Q1084) and the given forms. +# All Tajik (Q9260) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. 
SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/tamil/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/tamil/proper_nouns/query_proper_nouns.sparql index 9d225f60c..92373a5a4 100644 --- a/src/scribe_data/wikidata/language_data_extraction/tamil/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/tamil/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Tamil (Q5885) nouns (Q1084) and the given forms. +# All Tamil (Q5885) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT diff --git a/src/scribe_data/wikidata/language_data_extraction/yoruba/proper_nouns/query_proper_nouns.sparql b/src/scribe_data/wikidata/language_data_extraction/yoruba/proper_nouns/query_proper_nouns.sparql index 39332a043..94d40b35c 100644 --- a/src/scribe_data/wikidata/language_data_extraction/yoruba/proper_nouns/query_proper_nouns.sparql +++ b/src/scribe_data/wikidata/language_data_extraction/yoruba/proper_nouns/query_proper_nouns.sparql @@ -1,5 +1,5 @@ # tool: scribe-data -# All Yoruba (Q34311) nouns (Q1084) and the given forms. +# All Yoruba (Q34311) proper nouns (Q147276) and the given forms. # Enter this query at https://query.wikidata.org/. SELECT