import known_layers from "../src/assets/generated/known_layers.json" import { LayerConfigJson } from "../src/Models/ThemeConfig/Json/LayerConfigJson" import { TagUtils } from "../src/Logic/Tags/TagUtils" import { Utils } from "../src/Utils" import { copyFileSync, existsSync, readFileSync, writeFileSync } from "fs" import ScriptUtils from "./ScriptUtils" import TagRenderingConfig from "../src/Models/ThemeConfig/TagRenderingConfig" import { And } from "../src/Logic/Tags/And" import Script from "./Script" import NameSuggestionIndex from "../src/Logic/Web/NameSuggestionIndex" import TagInfo from "../src/Logic/Web/TagInfo" class Utilities { static mapValues( record: Record, f: (t: T) => TOut ): Record { const newR = >{} for (const x in record) { newR[x] = f(record[x]) } return newR } } class GenerateStats extends Script { async createOptimizationFile(includeTags = true) { ScriptUtils.fixUtils() const layers = known_layers["layers"] const keysAndTags = new Map>() for (const layer of layers) { if (layer.source["geoJson"] !== undefined && !layer.source["isOsmCache"]) { continue } if (layer.source == null || typeof layer.source === "string") { continue } const sourcesList = [TagUtils.Tag(layer.source["osmTags"])] if (layer?.title) { sourcesList.push(...new TagRenderingConfig(layer.title).usedTags()) } const sources = new And(sourcesList) const allKeys = sources.usedKeys() for (const key of allKeys) { if (!keysAndTags.has(key)) { keysAndTags.set(key, new Set()) } } const allTags = includeTags ? sources.usedTags() : [] for (const tag of allTags) { if (!keysAndTags.has(tag.key)) { keysAndTags.set(tag.key, new Set()) } keysAndTags.get(tag.key).add(tag.value) } } const keyTotal = new Map() const tagTotal = new Map>() await Promise.all( Array.from(keysAndTags.keys()).map(async (key) => { const values = keysAndTags.get(key) const data = await TagInfo.global.getStats(key) const count = data.data.find((item) => item.type === "all").count keyTotal.set(key, count) console.log(key, "-->", count) if (values.size > 0) { tagTotal.set(key, new Map()) await Promise.all( Array.from(values).map(async (value) => { const tagData = await TagInfo.global.getStats(key, value) const count = tagData.data.find((item) => item.type === "all").count tagTotal.get(key).set(value, count) console.log(key + "=" + value, "-->", count) }) ) } }) ) writeFileSync( "./src/assets/key_totals.json", JSON.stringify( { "#": "Generated with generateStats.ts", date: new Date().toISOString(), keys: Utils.MapToObj(keyTotal, (t) => t), tags: Utils.MapToObj(tagTotal, (v) => Utils.MapToObj(v, (t) => t)), }, null, " " ) ) } private summarizeNSI(sourcefile: string, pathNoExtension: string): void { const data = >>( JSON.parse(readFileSync(sourcefile, "utf8")) ) const allCountries: Set = new Set() for (const brand in data) { const perCountry = data[brand] for (const country in perCountry) { allCountries.add(country) const count = perCountry[country] if (count === 0) { delete perCountry[country] } } } const pathOut = pathNoExtension + ".summarized.json" writeFileSync(pathOut, JSON.stringify(data, null, " "), "utf8") console.log("Written", pathOut) const allBrands = Object.keys(data) allBrands.sort() for (const country of allCountries) { const summary = >{} for (const brand of allBrands) { const count = data[brand][country] if (count > 2) { // EƩntje is geentje // We ignore count == 1 as they are rather exceptional summary[brand] = data[brand][country] } } const countryPath = pathNoExtension + "." + country + ".json" writeFileSync(countryPath, JSON.stringify(summary), "utf8") console.log("Written", countryPath) } } async createNameSuggestionIndexFile(basepath: string, type: "brand" | "operator" | string) { const path = basepath + type + ".json" let allBrands: Record> = {} if (existsSync(path)) { allBrands = JSON.parse(readFileSync(path, "utf8")) console.log( "Loaded", Object.keys(allBrands).length, " previously loaded " + type, "from", path ) } const nsi = await NameSuggestionIndex.getNsiIndex() const allBrandNames: string[] = Utils.Dedup( nsi.allPossible(type).map((item) => item.tags[type]) ) const batchSize = 50 for (let i = 0; i < allBrandNames.length; i += batchSize) { console.warn( "Downloading ", batchSize, "occurence counts, items: ", i + "/" + allBrandNames.length ) let downloaded = 0 await Promise.all( Utils.TimesT(batchSize, async (j) => { const brand = allBrandNames[i + j] if (!allBrands[brand]) { allBrands[brand] = {} } const writeInto = allBrands[brand] const dloaded = await TagInfo.getGlobalDistributionsFor( writeInto, (stats) => stats.data.find((t) => t.type === "all").count, type, brand ) downloaded += dloaded }) ) console.log("Downloaded ", downloaded, " values this batch") writeFileSync(path, JSON.stringify(allBrands), "utf8") console.log("Checkpointed", path) } console.log("Written:", path) writeFileSync(path, JSON.stringify(allBrands), "utf8") } constructor() { super( "Downloads stats on osmSource-tags and keys from tagInfo. There are two usecases with separate outputs:\n 1. To optimize the query before sending it to overpass (generates ./src/assets/key_totals.json) \n 2. To amend the Name Suggestion Index " ) } async main(_: string[]) { const target = "./public/assets/data/nsi/" const basepath = target + "stats/" { const src = "./node_modules/name-suggestion-index/dist/" const files = ["featureCollection.min.json", "nsi.min.json", "wikidata.min.json"] console.log(process.cwd()) for (const file of files) { console.log("Copying ", src + file, target + "/" + file) copyFileSync(src + file, target + file) } } for (const type of ["operator", "brand"]) { await this.createNameSuggestionIndexFile(basepath, type) this.summarizeNSI(basepath + type + ".json", "./public/assets/data/nsi/stats/" + type) } await this.createOptimizationFile() } } new GenerateStats().run()