| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
/**
 * Fetches all 'modern languages' from Wikidata, then exports their names in every language
 */
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import * as wds from "wikidata-sdk" | 
					
						
							|  |  |  | import {Utils} from "../Utils"; | 
					
						
							|  |  |  | import ScriptUtils from "./ScriptUtils"; | 
					
						
							|  |  |  | import {existsSync, readFileSync, writeFileSync} from "fs"; | 
					
						
							| 
									
										
										
										
											2022-02-25 01:50:15 +01:00
										 |  |  | import * as used_languages from "../assets/generated/used_languages.json" | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  | const languageRemap = { | 
					
						
							|  |  |  |     // MapComplete (or weblate) on the left, language of wikimedia on the right
 | 
					
						
							|  |  |  |     "nb":"nb_NO", | 
					
						
							|  |  |  |     "zh-hant":"zh_Hant", | 
					
						
							|  |  |  |     "zh-hans":"zh_Hans", | 
					
						
							|  |  |  |     "pt-br":"pt_BR" | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-25 01:50:15 +01:00
										 |  |  | const usedLanguages : Set<string> = new Set(used_languages.languages) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  | async function fetch(target: string){ | 
					
						
							|  |  |  |     const regular = await fetchRegularLanguages() | 
					
						
							|  |  |  |     writeFileSync(target, JSON.stringify(regular, null, "  ")) | 
					
						
							|  |  |  |     console.log("Written to "+target) | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | async function fetchRegularLanguages() { | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  |     ScriptUtils.fixUtils() | 
					
						
							|  |  |  |     console.log("Fetching languages") | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     const sparql = 'SELECT ?lang ?label ?code \n' + | 
					
						
							|  |  |  |         'WHERE \n' + | 
					
						
							|  |  |  |         '{ \n' + | 
					
						
							|  |  |  |         '  ?lang wdt:P31 wd:Q1288568. \n' + // language instanceOf (p31) modern language(Q1288568)
 | 
					
						
							|  |  |  |         '  ?lang rdfs:label ?label. \n' + | 
					
						
							|  |  |  |         '  ?lang wdt:P424 ?code' + // Wikimedia language code seems to be close to the weblate entries
 | 
					
						
							|  |  |  |         '} '  | 
					
						
							|  |  |  |     const url = wds.sparqlQuery(sparql) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // request the generated URL with your favorite HTTP request library
 | 
					
						
							|  |  |  |     const result = await Utils.downloadJson(url, {"User-Agent": "MapComplete script"}) | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  |     const bindings = result.results.bindings | 
					
						
							|  |  |  |      | 
					
						
							|  |  |  |     const zh_hant = await fetchSpecial(18130932, "zh_Hant") | 
					
						
							|  |  |  |     const zh_hans = await fetchSpecial(13414913, "zh_Hant") | 
					
						
							|  |  |  |     const pt_br = await fetchSpecial( 750553, "pt_BR") | 
					
						
							| 
									
										
										
										
											2022-04-22 16:51:49 +02:00
										 |  |  |     const fil = await fetchSpecial( 33298, "fil") | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  |     bindings.push(...zh_hant) | 
					
						
							|  |  |  |     bindings.push(...zh_hans) | 
					
						
							|  |  |  |     bindings.push(...pt_br) | 
					
						
							| 
									
										
										
										
											2022-04-22 16:51:49 +02:00
										 |  |  |     bindings.push(...fil) | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  |      | 
					
						
							|  |  |  |     return result.results.bindings | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | async function fetchSpecial(id: number, code: string) { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     ScriptUtils.fixUtils() | 
					
						
							|  |  |  |     console.log("Fetching languages") | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     const sparql = 'SELECT ?lang ?label ?code \n' + | 
					
						
							|  |  |  |         'WHERE \n' + | 
					
						
							|  |  |  |         '{ \n' + | 
					
						
							|  |  |  |         '  wd:Q'+id+' rdfs:label ?label. \n' + | 
					
						
							|  |  |  |         '} ' | 
					
						
							|  |  |  |     const url = wds.sparqlQuery(sparql) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // request the generated URL with your favorite HTTP request library
 | 
					
						
							|  |  |  |     const result = await Utils.downloadJson(url, {"User-Agent": "MapComplete script"}) | 
					
						
							|  |  |  |     const bindings = result.results.bindings | 
					
						
							|  |  |  |     bindings.forEach(binding => binding["code"] = {value: code}) | 
					
						
							|  |  |  |     return bindings | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | function extract(data){ | 
					
						
							|  |  |  |     console.log("Got "+data.length+" entries") | 
					
						
							|  |  |  |     const perId = new Map<string, Map<string, string>>(); | 
					
						
							|  |  |  |     for (const element of data) { | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  |         let id = element.code.value | 
					
						
							|  |  |  |         id = languageRemap[id] ?? id | 
					
						
							|  |  |  |         let labelLang = element.label["xml:lang"] | 
					
						
							|  |  |  |         labelLang = languageRemap[labelLang] ?? labelLang | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |         const value = element.label.value | 
					
						
							|  |  |  |         if(!perId.has(id)){ | 
					
						
							|  |  |  |             perId.set(id, new Map<string, string>()) | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         perId.get(id).set(labelLang, value) | 
					
						
							|  |  |  |     } | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |     console.log("Got "+perId.size+" languages") | 
					
						
							|  |  |  |     return perId | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | function getNativeList(langs: Map<string, Map<string, string>>){ | 
					
						
							|  |  |  |     const native = {} | 
					
						
							| 
									
										
										
										
											2022-04-19 01:55:14 +02:00
										 |  |  |     const keys: string[] = Array.from(langs.keys()) | 
					
						
							|  |  |  |     keys.sort() | 
					
						
							|  |  |  |     for (const key of keys) { | 
					
						
							|  |  |  |         const translations: Map<string, string> = langs.get(key) | 
					
						
							| 
									
										
										
										
											2022-02-25 01:50:15 +01:00
										 |  |  |         if(!usedLanguages.has(key)){ | 
					
						
							| 
									
										
										
										
											2022-04-19 01:55:14 +02:00
										 |  |  |             continue | 
					
						
							| 
									
										
										
										
											2022-02-25 01:50:15 +01:00
										 |  |  |         } | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |         native[key] = translations.get(key) | 
					
						
							| 
									
										
										
										
											2022-04-19 01:55:14 +02:00
										 |  |  |     } | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |     return native | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  | async function main(wipeCache = false){ | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |     const cacheFile = "./assets/generated/languages-wd.json" | 
					
						
							|  |  |  |     if(wipeCache || !existsSync(cacheFile)){ | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  |         console.log("Refreshing cache") | 
					
						
							|  |  |  |         await fetch(cacheFile); | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |     }else{ | 
					
						
							|  |  |  |         console.log("Reusing the cached file") | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |     const data = JSON.parse(readFileSync( cacheFile, "UTF8")) | 
					
						
							|  |  |  |     const perId = extract(data) | 
					
						
							|  |  |  |     const nativeList = getNativeList(perId) | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  |     writeFileSync("./assets/language_native.json", JSON.stringify(nativeList, null, "  ")) | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |      | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-25 01:50:15 +01:00
										 |  |  |     const translations = Utils.MapToObj<Map<string, string>>(perId, (value, key) => { | 
					
						
							|  |  |  |         if(!usedLanguages.has(key)){ | 
					
						
							|  |  |  |             return undefined // Remove unused languages
 | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         return Utils.MapToObj(value, (v, k ) => { | 
					
						
							|  |  |  |             if(!usedLanguages.has(k)){ | 
					
						
							|  |  |  |                 return undefined | 
					
						
							|  |  |  |             } | 
					
						
							|  |  |  |             return v | 
					
						
							|  |  |  |         }) | 
					
						
							|  |  |  |     }) | 
					
						
							|  |  |  |      | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  |     writeFileSync("./assets/language_translations.json",  | 
					
						
							| 
									
										
										
										
											2022-02-25 01:50:15 +01:00
										 |  |  |         JSON.stringify(translations, null, "  ")) | 
					
						
							| 
									
										
										
										
											2022-02-24 02:33:20 +01:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-02-25 01:15:16 +01:00
										 |  |  | const forceRefresh = process.argv[2] === "--force-refresh" | 
					
						
							|  |  |  | main(forceRefresh).then(() => console.log("Done!")) |