forked from MapComplete/MapComplete
Improve metadata in language translations, remove wikidata-downloading-script
This commit is contained in:
parent
cba1a4340e
commit
30a835a232
4 changed files with 66 additions and 197 deletions
|
@ -132,6 +132,7 @@
|
||||||
"en"
|
"en"
|
||||||
],
|
],
|
||||||
"CN": [
|
"CN": [
|
||||||
|
"zh",
|
||||||
"zh"
|
"zh"
|
||||||
],
|
],
|
||||||
"CO": [
|
"CO": [
|
||||||
|
@ -148,6 +149,7 @@
|
||||||
],
|
],
|
||||||
"CY": [
|
"CY": [
|
||||||
"tr",
|
"tr",
|
||||||
|
"el",
|
||||||
"el"
|
"el"
|
||||||
],
|
],
|
||||||
"CZ": [
|
"CZ": [
|
||||||
|
@ -247,6 +249,9 @@
|
||||||
"es",
|
"es",
|
||||||
"pt"
|
"pt"
|
||||||
],
|
],
|
||||||
|
"GR": [
|
||||||
|
"el"
|
||||||
|
],
|
||||||
"GT": [
|
"GT": [
|
||||||
"es"
|
"es"
|
||||||
],
|
],
|
||||||
|
@ -453,8 +458,7 @@
|
||||||
"fr"
|
"fr"
|
||||||
],
|
],
|
||||||
"NG": [
|
"NG": [
|
||||||
"en",
|
"en"
|
||||||
"yo"
|
|
||||||
],
|
],
|
||||||
"NI": [
|
"NI": [
|
||||||
"es"
|
"es"
|
||||||
|
@ -502,9 +506,7 @@
|
||||||
"en"
|
"en"
|
||||||
],
|
],
|
||||||
"PK": [
|
"PK": [
|
||||||
"ur",
|
"ur"
|
||||||
"en",
|
|
||||||
"ar"
|
|
||||||
],
|
],
|
||||||
"PL": [
|
"PL": [
|
||||||
"pl",
|
"pl",
|
||||||
|
@ -559,7 +561,6 @@
|
||||||
"ar"
|
"ar"
|
||||||
],
|
],
|
||||||
"SE": [
|
"SE": [
|
||||||
"sv",
|
|
||||||
"sv"
|
"sv"
|
||||||
],
|
],
|
||||||
"SG": [
|
"SG": [
|
||||||
|
@ -648,6 +649,9 @@
|
||||||
"en",
|
"en",
|
||||||
"en"
|
"en"
|
||||||
],
|
],
|
||||||
|
"TW": [
|
||||||
|
"zh"
|
||||||
|
],
|
||||||
"TZ": [
|
"TZ": [
|
||||||
"en",
|
"en",
|
||||||
"sw"
|
"sw"
|
||||||
|
@ -693,16 +697,16 @@
|
||||||
"ar"
|
"ar"
|
||||||
],
|
],
|
||||||
"ZA": [
|
"ZA": [
|
||||||
|
"en",
|
||||||
|
"zu",
|
||||||
|
"xh",
|
||||||
"af",
|
"af",
|
||||||
"ve",
|
"ve",
|
||||||
"ss",
|
"ss",
|
||||||
"tn",
|
"tn",
|
||||||
"ts",
|
"ts",
|
||||||
"st",
|
"st",
|
||||||
"nr",
|
"nr"
|
||||||
"en",
|
|
||||||
"zu",
|
|
||||||
"xh"
|
|
||||||
],
|
],
|
||||||
"ZM": [
|
"ZM": [
|
||||||
"en"
|
"en"
|
||||||
|
|
|
@ -54,7 +54,7 @@
|
||||||
"weblate-fix-heavy": "git remote rm weblate-layers; git remote add weblate-layers https://hosted.weblate.org/git/mapcomplete/layers/; git remote update weblate-layers; git merge weblate-layers/master",
|
"weblate-fix-heavy": "git remote rm weblate-layers; git remote add weblate-layers https://hosted.weblate.org/git/mapcomplete/layers/; git remote update weblate-layers; git merge weblate-layers/master",
|
||||||
"housekeeping": "npm run generate && npm run generate:docs && npm run generate:contributor-list && npm run format && git add assets/ langs/ Docs/ **/*.ts Docs/* && git commit -m 'Housekeeping...'",
|
"housekeeping": "npm run generate && npm run generate:docs && npm run generate:contributor-list && npm run format && git add assets/ langs/ Docs/ **/*.ts Docs/* && git commit -m 'Housekeeping...'",
|
||||||
"parseSchools": "ts-node scripts/schools/amendSchoolData.ts",
|
"parseSchools": "ts-node scripts/schools/amendSchoolData.ts",
|
||||||
"steal": "ts-node scripts/thieves/stealLanguages.ts"
|
"steal": "ts-node scripts/fetchLanguages.ts"
|
||||||
},
|
},
|
||||||
"keywords": [
|
"keywords": [
|
||||||
"OpenStreetMap",
|
"OpenStreetMap",
|
||||||
|
|
|
@ -1,5 +1,6 @@
|
||||||
/**
|
/**
|
||||||
* Fetches all 'modern languages' from wikidata, then exports their names in every language
|
* Fetches all 'modern languages' from wikidata, then exports their names in every language.
|
||||||
|
* Some meta-info (e.g. RTL) is exported too
|
||||||
*/
|
*/
|
||||||
|
|
||||||
import * as wds from "wikidata-sdk"
|
import * as wds from "wikidata-sdk"
|
||||||
|
@ -21,12 +22,15 @@ async function fetchRegularLanguages() {
|
||||||
console.log("Fetching languages")
|
console.log("Fetching languages")
|
||||||
|
|
||||||
const sparql =
|
const sparql =
|
||||||
"SELECT ?lang ?label ?code \n" +
|
"SELECT ?lang ?label ?code ?directionalityLabel \n" +
|
||||||
"WHERE \n" +
|
"WHERE \n" +
|
||||||
"{ \n" +
|
"{ \n" +
|
||||||
" ?lang wdt:P31 wd:Q1288568. \n" + // language instanceOf (p31) modern language(Q1288568)
|
" ?lang wdt:P31 wd:Q1288568. \n" + // language instanceOf (p31) modern language(Q1288568)
|
||||||
" ?lang rdfs:label ?label. \n" +
|
" ?lang rdfs:label ?label. \n" +
|
||||||
" ?lang wdt:P424 ?code" + // Wikimedia language code seems to be close to the weblate entries
|
" ?lang wdt:P282 ?writing_system. \n"+
|
||||||
|
" ?writing_system wdt:P1406 ?directionality. \n" +
|
||||||
|
" ?lang wdt:P424 ?code. \n" +// Wikimedia language code seems to be close to the weblate entries
|
||||||
|
" SERVICE wikibase:label { bd:serviceParam wikibase:language \"en\". } \n" +
|
||||||
"} "
|
"} "
|
||||||
const url = wds.sparqlQuery(sparql)
|
const url = wds.sparqlQuery(sparql)
|
||||||
|
|
||||||
|
@ -67,16 +71,19 @@ async function fetchSpecial(id: number, code: string) {
|
||||||
return bindings
|
return bindings
|
||||||
}
|
}
|
||||||
|
|
||||||
function getNativeList(langs: Map<string, Map<string, string>>) {
|
function getNativeList(langs: Map<string, { translations: Map<string, string> }>) {
|
||||||
const native = {}
|
const native = {}
|
||||||
const keys: string[] = Array.from(langs.keys())
|
const keys: string[] = Array.from(langs.keys())
|
||||||
keys.sort()
|
keys.sort()
|
||||||
for (const key of keys) {
|
for (const key of keys) {
|
||||||
const translations: Map<string, string> = langs.get(key)
|
const translations: Map<string, string> = langs.get(key).translations
|
||||||
if (!LanguageUtils.usedLanguages.has(key)) {
|
if (!LanguageUtils.usedLanguages.has(key)) {
|
||||||
continue
|
continue
|
||||||
}
|
}
|
||||||
native[key] = translations.get(key)
|
native[key] = translations.get(key)
|
||||||
|
if(native[key] === undefined){
|
||||||
|
console.log("No native translation found for "+key)
|
||||||
|
}
|
||||||
}
|
}
|
||||||
return native
|
return native
|
||||||
}
|
}
|
||||||
|
@ -108,33 +115,7 @@ async function getOfficialLanguagesPerCountry(): Promise<Map<string, string[]>>
|
||||||
return lngs
|
return lngs
|
||||||
}
|
}
|
||||||
|
|
||||||
async function main(wipeCache = false) {
|
async function getOfficialLanguagesPerCountryCached(wipeCache: boolean): Promise<Record<string /*Country code*/, string[] /*Language codes*/>>{
|
||||||
const cacheFile = "./assets/generated/languages-wd.json"
|
|
||||||
if (wipeCache || !existsSync(cacheFile)) {
|
|
||||||
console.log("Refreshing cache")
|
|
||||||
await fetch(cacheFile)
|
|
||||||
} else {
|
|
||||||
console.log("Reusing the cached file")
|
|
||||||
}
|
|
||||||
const data = JSON.parse(readFileSync(cacheFile, "UTF8"))
|
|
||||||
const perId = WikidataUtils.extractLanguageData(data, WikidataUtils.languageRemapping)
|
|
||||||
const nativeList = getNativeList(perId)
|
|
||||||
writeFileSync("./assets/language_native.json", JSON.stringify(nativeList, null, " "))
|
|
||||||
|
|
||||||
const translations = Utils.MapToObj(perId, (value, key) => {
|
|
||||||
if (!LanguageUtils.usedLanguages.has(key)) {
|
|
||||||
return undefined // Remove unused languages
|
|
||||||
}
|
|
||||||
return Utils.MapToObj(value, (v, k) => {
|
|
||||||
if (!LanguageUtils.usedLanguages.has(k)) {
|
|
||||||
return undefined
|
|
||||||
}
|
|
||||||
return v
|
|
||||||
})
|
|
||||||
})
|
|
||||||
|
|
||||||
writeFileSync("./assets/language_translations.json", JSON.stringify(translations, null, " "))
|
|
||||||
|
|
||||||
let officialLanguages: Record<string, string[]>
|
let officialLanguages: Record<string, string[]>
|
||||||
const officialLanguagesPath = "./assets/language_in_country.json"
|
const officialLanguagesPath = "./assets/language_in_country.json"
|
||||||
if (existsSync("./assets/languages_in_country.json") && !wipeCache) {
|
if (existsSync("./assets/languages_in_country.json") && !wipeCache) {
|
||||||
|
@ -143,37 +124,48 @@ async function main(wipeCache = false) {
|
||||||
officialLanguages = Utils.MapToObj(await getOfficialLanguagesPerCountry(), (t) => t)
|
officialLanguages = Utils.MapToObj(await getOfficialLanguagesPerCountry(), (t) => t)
|
||||||
writeFileSync(officialLanguagesPath, JSON.stringify(officialLanguages, null, " "))
|
writeFileSync(officialLanguagesPath, JSON.stringify(officialLanguages, null, " "))
|
||||||
}
|
}
|
||||||
|
return officialLanguages
|
||||||
|
}
|
||||||
|
|
||||||
const perLanguage = Utils.TransposeMap(officialLanguages)
|
async function main(wipeCache = false) {
|
||||||
console.log(JSON.stringify(perLanguage, null, " "))
|
const cacheFile = "./assets/generated/languages-wd.json"
|
||||||
const mappings: { if: string; then: Record<string, string>; hideInAnswer: string }[] = []
|
if (wipeCache || !existsSync(cacheFile)) {
|
||||||
for (const language of Object.keys(perLanguage)) {
|
console.log("Refreshing cache")
|
||||||
const countries = Utils.Dedup(perLanguage[language].map((c) => c.toLowerCase()))
|
await fetch(cacheFile)
|
||||||
mappings.push({
|
} else {
|
||||||
if: "language=" + language,
|
console.log("Reusing the cached file")
|
||||||
then: translations[language],
|
}
|
||||||
hideInAnswer: "_country=" + countries.join("|"),
|
|
||||||
|
|
||||||
|
const data = JSON.parse(readFileSync(cacheFile, "UTF8"))
|
||||||
|
const perId = WikidataUtils.extractLanguageData(data, WikidataUtils.languageRemapping)
|
||||||
|
const nativeList = getNativeList(perId)
|
||||||
|
writeFileSync("./assets/language_native.json", JSON.stringify(nativeList, null, " "))
|
||||||
|
const languagesPerCountry = Utils.TransposeMap(await getOfficialLanguagesPerCountryCached(wipeCache))
|
||||||
|
const translations = Utils.MapToObj(perId, (value, key) => {
|
||||||
|
// We keep all language codes in the list...
|
||||||
|
const translatedForId : Record<string, string | {countries?: string[], dir: string[]}> = Utils.MapToObj(value.translations, (v, k) => {
|
||||||
|
if (!LanguageUtils.usedLanguages.has(k)) {
|
||||||
|
// ... but don't keep translations if we don't have a displayed language for them
|
||||||
|
return undefined
|
||||||
|
}
|
||||||
|
return v
|
||||||
})
|
})
|
||||||
}
|
|
||||||
|
|
||||||
const tagRenderings = <QuestionableTagRenderingConfigJson>{
|
translatedForId["_meta"] = {
|
||||||
id: "official-language",
|
countries : Utils.Dedup( languagesPerCountry[key]),
|
||||||
mappings,
|
dir: value.directionality
|
||||||
question: "What languages are spoken here?",
|
}
|
||||||
}
|
|
||||||
|
return translatedForId
|
||||||
|
})
|
||||||
|
|
||||||
|
writeFileSync("./assets/language_translations.json", JSON.stringify(translations, null, " "))
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
writeFileSync(
|
|
||||||
"./assets/layers/language/language.json",
|
|
||||||
JSON.stringify(
|
|
||||||
<LayerConfigJson>{
|
|
||||||
id: "language",
|
|
||||||
description: "Various tagRenderings to help language tooling",
|
|
||||||
tagRenderings,
|
|
||||||
},
|
|
||||||
null,
|
|
||||||
" "
|
|
||||||
)
|
|
||||||
)
|
|
||||||
}
|
}
|
||||||
|
|
||||||
const forceRefresh = process.argv[2] === "--force-refresh"
|
const forceRefresh = process.argv[2] === "--force-refresh"
|
||||||
|
|
|
@ -1,127 +0,0 @@
|
||||||
/*
|
|
||||||
* Uses the languages in and to every translation from wikidata to generate a language question in wikidata/wikidata
|
|
||||||
* */
|
|
||||||
|
|
||||||
import WikidataUtils from "../../Utils/WikidataUtils"
|
|
||||||
import { existsSync, mkdirSync, readFileSync, writeFileSync } from "fs"
|
|
||||||
import { LayerConfigJson } from "../../Models/ThemeConfig/Json/LayerConfigJson"
|
|
||||||
import { MappingConfigJson } from "../../Models/ThemeConfig/Json/QuestionableTagRenderingConfigJson"
|
|
||||||
import LanguageUtils from "../../Utils/LanguageUtils"
|
|
||||||
import * as perCountry from "../../assets/language_in_country.json"
|
|
||||||
import { Utils } from "../../Utils"
|
|
||||||
function main() {
|
|
||||||
const sourcepath = "assets/generated/languages-wd.json"
|
|
||||||
console.log(`Converting language data file '${sourcepath}' into a tagMapping`)
|
|
||||||
const languages = WikidataUtils.extractLanguageData(
|
|
||||||
JSON.parse(readFileSync(sourcepath, "utf8")),
|
|
||||||
{}
|
|
||||||
)
|
|
||||||
const mappings: MappingConfigJson[] = []
|
|
||||||
const schoolmappings: MappingConfigJson[] = []
|
|
||||||
const brailemappings: MappingConfigJson[] = []
|
|
||||||
|
|
||||||
const countryToLanguage: Record<string, string[]> = perCountry
|
|
||||||
const officialLanguagesPerCountry = Utils.TransposeMap(countryToLanguage)
|
|
||||||
|
|
||||||
languages.forEach((l, code) => {
|
|
||||||
const then: Record<string, string> = {}
|
|
||||||
l.forEach((tr, lng) => {
|
|
||||||
const languageCodeWeblate = WikidataUtils.languageRemapping[lng] ?? lng
|
|
||||||
if (!LanguageUtils.usedLanguages.has(languageCodeWeblate)) {
|
|
||||||
return
|
|
||||||
}
|
|
||||||
then[languageCodeWeblate] = tr
|
|
||||||
})
|
|
||||||
|
|
||||||
const officialCountries = Utils.Dedup(
|
|
||||||
officialLanguagesPerCountry[code]?.map((s) => s.toLowerCase()) ?? []
|
|
||||||
)
|
|
||||||
const prioritySearch =
|
|
||||||
officialCountries.length > 0
|
|
||||||
? "_country~" + officialCountries.map((c) => "((^|;)" + c + "($|;))").join("|")
|
|
||||||
: undefined
|
|
||||||
mappings.push(<MappingConfigJson>{
|
|
||||||
if: "language:" + code + "=yes",
|
|
||||||
ifnot: "language:" + code + "=",
|
|
||||||
searchTerms: {
|
|
||||||
"*": [code],
|
|
||||||
},
|
|
||||||
then,
|
|
||||||
priorityIf: prioritySearch,
|
|
||||||
})
|
|
||||||
|
|
||||||
schoolmappings.push(<MappingConfigJson>{
|
|
||||||
if: "school:language=" + code,
|
|
||||||
then,
|
|
||||||
priorityIf: prioritySearch,
|
|
||||||
searchTerms: {
|
|
||||||
"*": [code],
|
|
||||||
},
|
|
||||||
})
|
|
||||||
|
|
||||||
brailemappings.push(<MappingConfigJson>{
|
|
||||||
if: "tactile_writing:braille:" + code + "=yes",
|
|
||||||
ifnot: "tactile_writing:braille:" + code + "=",
|
|
||||||
searchTerms: {
|
|
||||||
"*": [code],
|
|
||||||
},
|
|
||||||
then,
|
|
||||||
priorityIf: prioritySearch,
|
|
||||||
})
|
|
||||||
})
|
|
||||||
|
|
||||||
const wikidataLayer = <LayerConfigJson>{
|
|
||||||
id: "wikidata",
|
|
||||||
description: {
|
|
||||||
en: "Various tagrenderings which are generated from Wikidata. Automatically generated with a script, don't edit manually",
|
|
||||||
},
|
|
||||||
"#dont-translate": "*",
|
|
||||||
source: {
|
|
||||||
osmTags: "id~*",
|
|
||||||
},
|
|
||||||
title: null,
|
|
||||||
mapRendering: null,
|
|
||||||
tagRenderings: [
|
|
||||||
{
|
|
||||||
id: "language",
|
|
||||||
// @ts-ignore
|
|
||||||
description: "Enables to pick *a single* 'language:<lng>=yes' within the mappings",
|
|
||||||
mappings,
|
|
||||||
},
|
|
||||||
{
|
|
||||||
builtin: "wikidata.language",
|
|
||||||
override: {
|
|
||||||
id: "language-multi",
|
|
||||||
// @ts-ignore
|
|
||||||
description:
|
|
||||||
"Enables to pick *multiple* 'language:<lng>=yes' within the mappings",
|
|
||||||
multiAnswer: true,
|
|
||||||
},
|
|
||||||
},
|
|
||||||
{
|
|
||||||
id: "school-language",
|
|
||||||
// @ts-ignore
|
|
||||||
description: "Enables to pick a single 'school:language=<lng>' within the mappings",
|
|
||||||
multiAnswer: true,
|
|
||||||
mappings: schoolmappings,
|
|
||||||
},
|
|
||||||
{
|
|
||||||
id: "tactile_writing-braille",
|
|
||||||
// @ts-ignore
|
|
||||||
description:
|
|
||||||
"Enables to pick *multiple* 'tactile_writing:braille=<lng>' within the mappings",
|
|
||||||
multiAnswer: true,
|
|
||||||
mappings: brailemappings,
|
|
||||||
},
|
|
||||||
],
|
|
||||||
}
|
|
||||||
const dir = "./assets/layers/wikidata/"
|
|
||||||
if (!existsSync(dir)) {
|
|
||||||
mkdirSync(dir)
|
|
||||||
}
|
|
||||||
const path = dir + "wikidata.json"
|
|
||||||
writeFileSync(path, JSON.stringify(wikidataLayer, null, " "))
|
|
||||||
console.log("Written " + path)
|
|
||||||
}
|
|
||||||
|
|
||||||
main()
|
|
Loading…
Add table
Reference in a new issue