forked from MapComplete/MapComplete
		
	
		
			
				
	
	
		
			177 lines
		
	
	
	
		
			6.3 KiB
		
	
	
	
		
			TypeScript
		
	
	
	
	
	
			
		
		
	
	
			177 lines
		
	
	
	
		
			6.3 KiB
		
	
	
	
		
			TypeScript
		
	
	
	
	
	
/**
 | 
						|
 * Fetches all 'modern languages' from wikidata, then exports their names in every language
 | 
						|
 */
 | 
						|
 | 
						|
import * as wds from "wikidata-sdk"
 | 
						|
import {Utils} from "../Utils";
 | 
						|
import ScriptUtils from "./ScriptUtils";
 | 
						|
import {existsSync, readFileSync, writeFileSync} from "fs";
 | 
						|
import {QuestionableTagRenderingConfigJson} from "../Models/ThemeConfig/Json/QuestionableTagRenderingConfigJson";
 | 
						|
import {LayerConfigJson} from "../Models/ThemeConfig/Json/LayerConfigJson";
 | 
						|
import WikidataUtils from "../Utils/WikidataUtils";
 | 
						|
import LanguageUtils from "../Utils/LanguageUtils";
 | 
						|
 | 
						|
async function fetch(target: string){
 | 
						|
    const regular = await fetchRegularLanguages()
 | 
						|
    writeFileSync(target, JSON.stringify(regular, null, "  "))
 | 
						|
    console.log("Written to "+target)
 | 
						|
}
 | 
						|
 | 
						|
async function fetchRegularLanguages() {
 | 
						|
 | 
						|
    console.log("Fetching languages")
 | 
						|
 | 
						|
    const sparql = 'SELECT ?lang ?label ?code \n' +
 | 
						|
        'WHERE \n' +
 | 
						|
        '{ \n' +
 | 
						|
        '  ?lang wdt:P31 wd:Q1288568. \n' + // language instanceOf (p31) modern language(Q1288568)
 | 
						|
        '  ?lang rdfs:label ?label. \n' +
 | 
						|
        '  ?lang wdt:P424 ?code' + // Wikimedia language code seems to be close to the weblate entries
 | 
						|
        '} ' 
 | 
						|
    const url = wds.sparqlQuery(sparql)
 | 
						|
 | 
						|
// request the generated URL with your favorite HTTP request library
 | 
						|
    const result = await Utils.downloadJson(url, {"User-Agent": "MapComplete script"})
 | 
						|
    const bindings = result.results.bindings
 | 
						|
    
 | 
						|
    const zh_hant = await fetchSpecial(18130932, "zh_Hant")
 | 
						|
    const zh_hans = await fetchSpecial(13414913, "zh_Hant")
 | 
						|
    const pt_br = await fetchSpecial( 750553, "pt_BR")
 | 
						|
    const fil = await fetchSpecial( 33298, "fil")
 | 
						|
 | 
						|
    bindings.push(...zh_hant)
 | 
						|
    bindings.push(...zh_hans)
 | 
						|
    bindings.push(...pt_br)
 | 
						|
    bindings.push(...fil)
 | 
						|
    
 | 
						|
    return result.results.bindings
 | 
						|
 | 
						|
}
 | 
						|
 | 
						|
async function fetchSpecial(id: number, code: string) {
 | 
						|
 | 
						|
    ScriptUtils.fixUtils()
 | 
						|
    console.log("Fetching languages")
 | 
						|
 | 
						|
    const sparql = 'SELECT ?lang ?label ?code \n' +
 | 
						|
        'WHERE \n' +
 | 
						|
        '{ \n' +
 | 
						|
        '  wd:Q'+id+' rdfs:label ?label. \n' +
 | 
						|
        '} '
 | 
						|
    const url = wds.sparqlQuery(sparql)
 | 
						|
 | 
						|
    const result = await Utils.downloadJson(url, {"User-Agent": "MapComplete script"})
 | 
						|
    const bindings = result.results.bindings
 | 
						|
    bindings.forEach(binding => binding["code"] = {value: code})
 | 
						|
    return bindings
 | 
						|
}
 | 
						|
 | 
						|
function getNativeList(langs: Map<string, Map<string, string>>){
 | 
						|
    const native = {}
 | 
						|
    const keys: string[] = Array.from(langs.keys())
 | 
						|
    keys.sort()
 | 
						|
    for (const key of keys) {
 | 
						|
        const translations: Map<string, string> = langs.get(key)
 | 
						|
        if(!LanguageUtils.usedLanguages.has(key)){
 | 
						|
            continue
 | 
						|
        }
 | 
						|
        native[key] = translations.get(key)
 | 
						|
    }
 | 
						|
    return native
 | 
						|
}
 | 
						|
 | 
						|
async function getOfficialLanguagesPerCountry() : Promise<Map<string, string[]>>{
 | 
						|
    const lngs = new Map<string, string[]>();
 | 
						|
    const sparql = `SELECT ?country ?countryLabel ?countryCode ?language ?languageCode ?languageLabel
 | 
						|
    WHERE
 | 
						|
    {
 | 
						|
            ?country wdt:P31/wdt:P279* wd:Q3624078;
 | 
						|
        wdt:P297 ?countryCode;
 | 
						|
        wdt:P37 ?language.
 | 
						|
            ?language wdt:P218 ?languageCode.
 | 
						|
            SERVICE wikibase:label { bd:serviceParam wikibase:language "en". }
 | 
						|
    }`
 | 
						|
    const url = wds.sparqlQuery(sparql)
 | 
						|
 | 
						|
    const result = await Utils.downloadJson(url, {"User-Agent": "MapComplete script"})
 | 
						|
    const bindings : {countryCode: {value: string}, languageCode: {value: string}}[]= result.results.bindings
 | 
						|
    for (const binding of bindings) {
 | 
						|
        const countryCode = binding.countryCode.value
 | 
						|
        const language = binding.languageCode.value
 | 
						|
        if(lngs.get(countryCode) === undefined){
 | 
						|
            lngs.set(countryCode, [])
 | 
						|
        }
 | 
						|
        lngs.get(countryCode).push(language)
 | 
						|
    }
 | 
						|
    return lngs;
 | 
						|
}
 | 
						|
 | 
						|
async function main(wipeCache = false){
 | 
						|
    const cacheFile = "./assets/generated/languages-wd.json"
 | 
						|
    if(wipeCache || !existsSync(cacheFile)){
 | 
						|
        console.log("Refreshing cache")
 | 
						|
        await fetch(cacheFile);
 | 
						|
    }else{
 | 
						|
        console.log("Reusing the cached file")
 | 
						|
    }
 | 
						|
    const data = JSON.parse(readFileSync( cacheFile, "UTF8"))
 | 
						|
    const perId = WikidataUtils.extractLanguageData(data, WikidataUtils.languageRemapping)
 | 
						|
    const nativeList = getNativeList(perId)
 | 
						|
    writeFileSync("./assets/language_native.json", JSON.stringify(nativeList, null, "  "))
 | 
						|
    
 | 
						|
 | 
						|
    const translations = Utils.MapToObj(perId, (value, key) => {
 | 
						|
        if(!LanguageUtils.usedLanguages.has(key)){
 | 
						|
            return undefined // Remove unused languages
 | 
						|
        }
 | 
						|
        return Utils.MapToObj(value, (v, k ) => {
 | 
						|
            if(!LanguageUtils.usedLanguages.has(k)){
 | 
						|
                return undefined
 | 
						|
            }
 | 
						|
            return v
 | 
						|
        })
 | 
						|
    })
 | 
						|
    
 | 
						|
    writeFileSync("./assets/language_translations.json", 
 | 
						|
        JSON.stringify(translations, null, "  "))
 | 
						|
    
 | 
						|
    
 | 
						|
    let officialLanguages : Record<string, string[]>;
 | 
						|
    const officialLanguagesPath = "./assets/language_in_country.json"
 | 
						|
    if(existsSync("./assets/languages_in_country.json") && !wipeCache){
 | 
						|
        officialLanguages = JSON.parse(readFileSync(officialLanguagesPath, "utf8"))
 | 
						|
    }else {
 | 
						|
        officialLanguages = Utils.MapToObj(await getOfficialLanguagesPerCountry(), t => t)
 | 
						|
        writeFileSync(officialLanguagesPath, JSON.stringify(officialLanguages, null, "  "))
 | 
						|
    }
 | 
						|
    
 | 
						|
    const perLanguage = Utils.TransposeMap(officialLanguages);
 | 
						|
    console.log(JSON.stringify(perLanguage, null, " "))
 | 
						|
    const mappings: {if: string, then: Record<string, string>, hideInAnswer: string}[] = []
 | 
						|
    for (const language of Object.keys(perLanguage)) {
 | 
						|
        const countries = Utils.Dedup(perLanguage[language].map(c => c.toLowerCase()))
 | 
						|
        mappings.push({
 | 
						|
            if: "language="+language,
 | 
						|
            then: translations[language],
 | 
						|
            hideInAnswer : "_country="+countries.join("|")
 | 
						|
        })
 | 
						|
    }
 | 
						|
    
 | 
						|
    const tagRenderings =  <QuestionableTagRenderingConfigJson> {
 | 
						|
        id: "official-language",
 | 
						|
        mappings,
 | 
						|
        question: "What languages are spoken here?"
 | 
						|
    }
 | 
						|
    
 | 
						|
    writeFileSync("./assets/layers/language/language.json", JSON.stringify(<LayerConfigJson>{
 | 
						|
        id:"language",
 | 
						|
        description: "Various tagRenderings to help language tooling",
 | 
						|
        tagRenderings
 | 
						|
    }, null, "  "))
 | 
						|
    
 | 
						|
}
 | 
						|
 | 
						|
const forceRefresh = process.argv[2] === "--force-refresh"
 | 
						|
ScriptUtils.fixUtils()
 | 
						|
main(forceRefresh).then(() => console.log("Done!"))
 | 
						|
 |