MapComplete/scripts/generateCache.ts

572 lines
20 KiB
TypeScript
Raw Normal View History

/**
* Generates a collection of geojson files based on an overpass query for a given theme
*/
2023-07-15 18:55:03 +02:00
import { Utils } from "../src/Utils"
import { Overpass } from "../src/Logic/Osm/Overpass"
import { existsSync, readFileSync, writeFileSync } from "fs"
2023-07-15 18:55:03 +02:00
import { TagsFilter } from "../src/Logic/Tags/TagsFilter"
import { Or } from "../src/Logic/Tags/Or"
import { AllKnownLayouts } from "../src/Customizations/AllKnownLayouts"
2022-09-08 21:40:48 +02:00
import * as OsmToGeoJson from "osmtogeojson"
2023-07-15 18:55:03 +02:00
import MetaTagging from "../src/Logic/MetaTagging"
import { UIEventSource } from "../src/Logic/UIEventSource"
import { TileRange, Tiles } from "../src/Models/TileRange"
import LayoutConfig from "../src/Models/ThemeConfig/LayoutConfig"
2022-09-08 21:40:48 +02:00
import ScriptUtils from "./ScriptUtils"
2023-07-15 18:55:03 +02:00
import PerLayerFeatureSourceSplitter from "../src/Logic/FeatureSource/PerLayerFeatureSourceSplitter"
import FilteredLayer from "../src/Models/FilteredLayer"
import StaticFeatureSource from "../src/Logic/FeatureSource/Sources/StaticFeatureSource"
import Constants from "../src/Models/Constants"
import { GeoOperations } from "../src/Logic/GeoOperations"
import SimpleMetaTaggers, { ReferencingWaysMetaTagger } from "../src/Logic/SimpleMetaTagger"
import FilteringFeatureSource from "../src/Logic/FeatureSource/Sources/FilteringFeatureSource"
import { Feature } from "geojson"
2023-07-15 18:55:03 +02:00
import { BBox } from "../src/Logic/BBox"
import { FeatureSource } from "../src/Logic/FeatureSource/FeatureSource"
import OsmObjectDownloader from "../src/Logic/Osm/OsmObjectDownloader"
import FeaturePropertiesStore from "../src/Logic/FeatureSource/Actors/FeaturePropertiesStore"
2022-01-16 01:59:06 +01:00
2021-09-10 00:00:48 +02:00
ScriptUtils.fixUtils()
function createOverpassObject(theme: LayoutConfig, backend: string) {
2022-09-08 21:40:48 +02:00
let filters: TagsFilter[] = []
let extraScripts: string[] = []
for (const layer of theme.layers) {
2022-09-08 21:40:48 +02:00
if (typeof layer === "string") {
throw "A layer was not expanded!"
}
if (layer.doNotDownload) {
2022-09-08 21:40:48 +02:00
continue
}
2023-05-17 13:18:00 +02:00
if (!layer.source) {
continue
}
if (layer.source.geojsonSource) {
// This layer defines a geoJson-source
// SHould it be cached?
if (layer.source.isOsmCacheLayer !== true) {
2022-09-08 21:40:48 +02:00
continue
}
}
filters.push(layer.source.osmTags)
}
filters = Utils.NoNull(filters)
extraScripts = Utils.NoNull(extraScripts)
if (filters.length + extraScripts.length === 0) {
throw "Nothing to download! The theme doesn't declare anything to download"
}
return new Overpass(new Or(filters), extraScripts, backend, new UIEventSource<number>(60))
}
function rawJsonName(targetDir: string, x: number, y: number, z: number): string {
return targetDir + "_" + z + "_" + x + "_" + y + ".json"
}
function geoJsonName(targetDir: string, x: number, y: number, z: number): string {
return targetDir + "_" + z + "_" + x + "_" + y + ".geojson"
}
2023-02-06 22:23:56 +01:00
/// Downloads the given tilerange from overpass and saves them to disk
2022-09-08 21:40:48 +02:00
async function downloadRaw(
targetdir: string,
r: TileRange,
theme: LayoutConfig
2023-02-06 22:23:56 +01:00
): Promise<{ failed: number; skipped: number }> {
let downloaded = 0
2021-04-22 16:01:43 +02:00
let failed = 0
let skipped = 0
2021-10-13 01:28:20 +02:00
const startTime = new Date().getTime()
for (let x = r.xstart; x <= r.xend; x++) {
for (let y = r.ystart; y <= r.yend; y++) {
2022-09-08 21:40:48 +02:00
downloaded++
const filename = rawJsonName(targetdir, x, y, r.zoomlevel)
if (existsSync(filename)) {
console.log("Already exists (not downloading again): ", filename)
2021-04-22 16:01:43 +02:00
skipped++
2022-09-08 21:40:48 +02:00
continue
}
2021-10-13 01:28:20 +02:00
const runningSeconds = (new Date().getTime() - startTime) / 1000
const resting = failed + (r.total - downloaded)
2022-09-08 21:40:48 +02:00
const perTile = runningSeconds / (downloaded - skipped)
2021-11-07 16:34:51 +01:00
const estimated = Math.floor(resting * perTile)
2022-09-08 21:40:48 +02:00
console.log(
"total: ",
downloaded,
"/",
r.total,
"failed: ",
failed,
"skipped: ",
skipped,
"running time: ",
Utils.toHumanTime(runningSeconds) + "s",
"estimated left: ",
Utils.toHumanTime(estimated),
"(" + Math.floor(perTile) + "s/tile)"
)
const boundsArr = Tiles.tile_bounds(r.zoomlevel, x, y)
const bounds = {
north: Math.max(boundsArr[0][0], boundsArr[1][0]),
south: Math.min(boundsArr[0][0], boundsArr[1][0]),
east: Math.max(boundsArr[0][1], boundsArr[1][1]),
2022-09-08 21:40:48 +02:00
west: Math.min(boundsArr[0][1], boundsArr[1][1]),
}
2022-09-08 21:40:48 +02:00
const overpass = createOverpassObject(
theme,
Constants.defaultOverpassUrls[failed % Constants.defaultOverpassUrls.length]
)
const url = overpass.buildQuery(
"[bbox:" +
bounds.south +
"," +
bounds.west +
"," +
bounds.north +
"," +
bounds.east +
"]"
2022-09-08 21:40:48 +02:00
)
2021-10-03 01:38:57 +02:00
try {
2022-02-14 01:15:20 +01:00
const json = await Utils.downloadJson(url)
if ((<string>json.remark ?? "").startsWith("runtime error")) {
console.error("Got a runtime error: ", json.remark)
2022-09-08 21:40:48 +02:00
failed++
2021-11-07 16:34:51 +01:00
} else if (json.elements.length === 0) {
console.log("Got an empty response! Writing anyway")
}
2021-10-03 01:38:57 +02:00
2022-09-08 21:40:48 +02:00
console.log(
"Got the response - writing ",
json.elements.length,
" elements to ",
filename
)
writeFileSync(filename, JSON.stringify(json, null, " "))
2021-10-03 01:38:57 +02:00
} catch (err) {
console.log(url)
2022-09-08 21:40:48 +02:00
console.log(
"Could not download - probably hit the rate limit; waiting a bit. (" + err + ")"
)
failed++
2023-05-17 13:18:00 +02:00
await ScriptUtils.sleep(1)
2021-09-10 00:00:48 +02:00
}
}
}
2021-04-22 16:01:43 +02:00
return { failed: failed, skipped: skipped }
}
2022-09-08 21:40:48 +02:00
/*
* Downloads extra geojson sources and returns the features.
* Extra geojson layers should not be tiled
*/
2022-09-08 21:40:48 +02:00
async function downloadExtraData(theme: LayoutConfig) /* : any[] */ {
const allFeatures: any[] = []
for (const layer of theme.layers) {
if (!layer.source?.geojsonSource) {
2022-09-08 21:40:48 +02:00
continue
}
2023-05-17 13:18:00 +02:00
const source = layer.source.geojsonSource
2021-09-10 00:00:48 +02:00
if (layer.source.isOsmCacheLayer !== undefined && layer.source.isOsmCacheLayer !== false) {
// Cached layers are not considered here
2022-09-08 21:40:48 +02:00
continue
}
if (source.startsWith("https://api.openstreetmap.org/api/0.6/notes.json")) {
2023-05-17 13:18:00 +02:00
// We ignore map notes
continue
}
console.log("Downloading extra data: ", source)
2022-09-08 21:40:48 +02:00
await Utils.downloadJson(source).then((json) => allFeatures.push(...json.features))
}
2022-09-08 21:40:48 +02:00
return allFeatures
}
2022-09-08 21:40:48 +02:00
function loadAllTiles(
targetdir: string,
r: TileRange,
theme: LayoutConfig,
extraFeatures: any[]
): FeatureSource {
let allFeatures = [...extraFeatures]
2022-09-08 21:40:48 +02:00
let processed = 0
for (let x = r.xstart; x <= r.xend; x++) {
for (let y = r.ystart; y <= r.yend; y++) {
2022-09-08 21:40:48 +02:00
processed++
const filename = rawJsonName(targetdir, x, y, r.zoomlevel)
console.log(" Loading and processing", processed, "/", r.total, filename)
if (!existsSync(filename)) {
console.error("Not found - and not downloaded. Run this script again!: " + filename)
2022-09-08 21:40:48 +02:00
continue
}
// We read the raw OSM-file and convert it to a geojson
const rawOsm = JSON.parse(readFileSync(filename, { encoding: "utf8" }))
// Create and save the geojson file - which is the main chunk of the data
2022-09-08 21:40:48 +02:00
const geojson = OsmToGeoJson.default(rawOsm)
2022-01-16 01:59:06 +01:00
console.log(" which as", geojson.features.length, "features")
2021-04-23 20:09:27 +02:00
allFeatures.push(...geojson.features)
}
}
return StaticFeatureSource.fromGeojson(allFeatures)
}
/**
* Load all the tiles into memory from disk
*/
2023-05-17 13:18:00 +02:00
async function sliceToTiles(
2022-09-08 21:40:48 +02:00
allFeatures: FeatureSource,
theme: LayoutConfig,
targetdir: string,
2023-02-14 00:08:21 +01:00
pointsOnlyLayers: string[],
2023-05-17 13:18:00 +02:00
clip: boolean,
targetzoomLevel: number = 9
2022-09-08 21:40:48 +02:00
) {
const skippedLayers = new Set<string>()
2022-01-16 01:59:06 +01:00
const indexedFeatures: Map<string, any> = new Map<string, any>()
2022-09-08 21:40:48 +02:00
let indexisBuilt = false
2023-05-17 13:18:00 +02:00
const osmObjectDownloader = new OsmObjectDownloader()
2022-01-16 01:59:06 +01:00
function buildIndex() {
for (const f of allFeatures.features.data) {
2021-12-07 17:46:57 +01:00
indexedFeatures.set(f.properties.id, f)
}
2022-09-08 21:40:48 +02:00
indexisBuilt = true
2021-12-07 17:46:57 +01:00
}
2022-01-16 01:59:06 +01:00
function getFeatureById(id) {
if (!indexisBuilt) {
2021-12-07 17:46:57 +01:00
buildIndex()
}
return indexedFeatures.get(id)
}
2022-01-16 01:59:06 +01:00
2023-05-17 13:18:00 +02:00
const flayers: FilteredLayer[] = theme.layers.map((l) => new FilteredLayer(l))
const perLayer = new PerLayerFeatureSourceSplitter(flayers, allFeatures)
2023-05-17 13:18:00 +02:00
for (const [layerId, source] of perLayer.perLayer) {
const layer = flayers.find((flayer) => flayer.layerDef.id === layerId).layerDef
const targetZoomLevel = layer.source.geojsonZoomLevel ?? targetzoomLevel
if (layer.source.geojsonSource && layer.source.isOsmCacheLayer !== true) {
console.log("Skipping layer ", layerId, ": not a caching layer")
skippedLayers.add(layer.id)
continue
}
const flayer: FilteredLayer = new FilteredLayer(layer)
console.log(
"Handling layer ",
layerId,
"which has",
source.features.data.length,
"features"
)
if (source.features.data.length === 0) {
continue
}
const featureProperties: FeaturePropertiesStore = new FeaturePropertiesStore(source)
MetaTagging.addMetatags(
source.features.data,
{
getFeaturesWithin: (_) => {
return <any>[allFeatures.features.data]
},
getFeatureById: getFeatureById,
},
layer,
theme,
osmObjectDownloader,
featureProperties,
{
includeDates: false,
includeNonDates: true,
evaluateStrict: true,
2023-05-17 13:18:00 +02:00
}
)
while (SimpleMetaTaggers.country.runningTasks.size > 0) {
2022-09-08 21:40:48 +02:00
console.log(
"Still waiting for ",
SimpleMetaTaggers.country.runningTasks.size,
" features which don't have a country yet"
2022-09-08 21:40:48 +02:00
)
await ScriptUtils.sleep(250)
}
const createdTiles = []
// At this point, we have all the features of the entire area.
// However, we want to export them per tile of a fixed size, so we use a dynamicTileSOurce to split it up
const features = source.features.data
const perBbox = GeoOperations.spreadIntoBboxes(features, targetZoomLevel)
2022-01-16 01:59:06 +01:00
for (let [tileIndex, features] of perBbox) {
const bbox = BBox.fromTileIndex(tileIndex).asGeoJson({})
console.log("Got tile:", tileIndex, layer.id)
if (features.length === 0) {
continue
2023-05-17 13:18:00 +02:00
}
const filteredTile = new FilteringFeatureSource(
flayer,
new StaticFeatureSource(features)
)
console.log(
"Tile " +
2023-05-17 13:18:00 +02:00
layer.id +
"." +
tileIndex +
" contains " +
filteredTile.features.data.length +
" features after filtering (" +
features.length +
") features before"
)
if (filteredTile.features.data.length === 0) {
continue
}
let strictlyCalculated = 0
let featureCount = 0
2023-05-17 13:18:00 +02:00
for (const feature of features) {
// Some cleanup
if (layer.calculatedTags !== undefined) {
// Evaluate all the calculated tags strictly
const calculatedTagKeys = layer.calculatedTags.map((ct) => ct[0])
featureCount++
const props = feature.properties
for (const calculatedTagKey of calculatedTagKeys) {
const strict = props[calculatedTagKey]
if (props.hasOwnProperty(calculatedTagKey)) {
delete props[calculatedTagKey]
}
props[calculatedTagKey] = strict
strictlyCalculated++
if (strictlyCalculated % 100 === 0) {
console.log(
"Strictly calculated ",
strictlyCalculated,
"values for tile",
tileIndex,
": now at ",
featureCount,
"/",
filteredTile.features.data.length,
"examle value: ",
strict
)
}
}
}
delete feature["bbox"]
}
2023-02-14 00:08:21 +01:00
if (clip) {
console.log("Clipping features")
features = [].concat(
...features.map((f: Feature) => GeoOperations.clipWith(<any>f, bbox))
2022-09-08 21:40:48 +02:00
)
2023-05-17 13:18:00 +02:00
}
// Lets save this tile!
const [z, x, y] = Tiles.tile_from_index(tileIndex)
// console.log("Writing tile ", z, x, y, layerId)
const targetPath = geoJsonName(targetdir + "_" + layerId, x, y, z)
createdTiles.push(tileIndex)
// This is the geojson file containing all features for this tile
writeFileSync(
targetPath,
JSON.stringify(
{
type: "FeatureCollection",
features,
},
null,
" "
2022-09-08 21:40:48 +02:00
)
)
console.log("Written tile", targetPath, "with", filteredTile.features.data.length)
}
// All the tiles are written at this point
// Only thing left to do is to create the index
const path = targetdir + "_" + layerId + "_" + targetZoomLevel + "_overview.json"
const perX = {}
createdTiles
.map((i) => Tiles.tile_from_index(i))
.forEach(([z, x, y]) => {
const key = "" + x
if (perX[key] === undefined) {
perX[key] = []
}
perX[key].push(y)
})
console.log("Written overview: ", path, "with ", createdTiles.length, "tiles")
writeFileSync(path, JSON.stringify(perX))
// And, if needed, to create a points-only layer
if (pointsOnlyLayers.indexOf(layer.id) >= 0) {
const filtered = new FilteringFeatureSource(flayer, source)
const features = filtered.features.data
const points = features.map((feature) => GeoOperations.centerpoint(feature))
console.log("Writing points overview for ", layerId)
const targetPath = targetdir + "_" + layerId + "_points.geojson"
// This is the geojson file containing all features for this tile
writeFileSync(
targetPath,
JSON.stringify(
{
type: "FeatureCollection",
features: points,
},
null,
" "
2023-05-17 13:18:00 +02:00
)
)
2023-05-17 13:18:00 +02:00
}
}
const skipped = Array.from(skippedLayers)
if (skipped.length > 0) {
2022-09-08 21:40:48 +02:00
console.warn(
"Did not save any cache files for layers " +
skipped.join(", ") +
" as these didn't set the flag `isOsmCache` to true"
2022-09-08 21:40:48 +02:00
)
}
}
2021-04-23 20:09:27 +02:00
2022-02-14 01:15:20 +01:00
export async function main(args: string[]) {
2023-05-17 13:18:00 +02:00
console.log("Cache builder started with args ", args.join(" "))
2023-02-09 00:10:59 +01:00
ReferencingWaysMetaTagger.enabled = false
if (args.length < 6) {
2022-09-08 21:40:48 +02:00
console.error(
2023-02-14 00:08:21 +01:00
"Expected arguments are: theme zoomlevel targetdirectory lat0 lon0 lat1 lon1 [--generate-point-overview layer-name,layer-name,...] [--force-zoom-level z] [--clip]" +
"--force-zoom-level causes non-cached-layers to be donwnloaded\n" +
"--clip will erase parts of the feature falling outside of the bounding box"
2022-09-08 21:40:48 +02:00
)
return
}
const themeName = args[0]
const zoomlevel = Number(args[1])
console.log(
"Target zoomlevel for the tiles is",
zoomlevel,
"; this can be overridden by the individual layers"
)
const targetdir = args[2] + "/" + themeName
if (!existsSync(args[2])) {
console.log("Directory not found")
throw `The directory ${args[2]} does not exist`
}
const lat0 = Number(args[3])
const lon0 = Number(args[4])
const lat1 = Number(args[5])
const lon1 = Number(args[6])
2023-02-14 00:08:21 +01:00
const clip = args.indexOf("--clip") >= 0
2021-11-07 16:34:51 +01:00
2022-01-26 21:40:38 +01:00
if (isNaN(lat0)) {
2022-01-25 18:20:15 +01:00
throw "The first number (a latitude) is not a valid number"
}
2022-01-26 21:40:38 +01:00
if (isNaN(lon0)) {
2022-01-25 18:20:15 +01:00
throw "The second number (a longitude) is not a valid number"
}
2022-01-26 21:40:38 +01:00
if (isNaN(lat1)) {
2022-01-25 18:20:15 +01:00
throw "The third number (a latitude) is not a valid number"
}
2022-01-26 21:40:38 +01:00
if (isNaN(lon1)) {
2022-02-14 01:15:20 +01:00
throw "The fourth number (a longitude) is not a valid number"
2022-01-25 18:20:15 +01:00
}
2022-01-26 21:40:38 +01:00
const tileRange = Tiles.TileRangeBetween(zoomlevel, lat0, lon0, lat1, lon1)
2022-01-26 21:40:38 +01:00
if (isNaN(tileRange.total)) {
2022-01-25 18:20:15 +01:00
throw "Something has gone wrong: tilerange is NAN"
}
2022-01-26 21:40:38 +01:00
if (tileRange.total === 0) {
console.log("Tilerange has zero tiles - this is probably an error")
return
}
const theme = AllKnownLayouts.allKnownLayouts.get(themeName)
if (theme === undefined) {
const keys = Array.from(AllKnownLayouts.allKnownLayouts.keys())
2023-05-19 11:48:04 +02:00
console.error("The theme " + themeName + " was not found; try one of ", keys)
return
}
2021-12-07 17:46:57 +01:00
theme.layers = theme.layers.filter(
(l) =>
Constants.priviliged_layers.indexOf(<any>l.id) < 0 && !l.id.startsWith("note_import_")
)
console.log("Layers to download:", theme.layers.map((l) => l.id).join(", "))
2023-05-17 13:18:00 +02:00
2021-12-07 17:46:57 +01:00
let generatePointLayersFor = []
if (args[7] == "--generate-point-overview") {
2022-01-16 01:59:06 +01:00
if (args[8] === undefined) {
2021-12-07 17:46:57 +01:00
throw "--generate-point-overview needs a list of layers to generate the overview for (or * for all)"
2022-09-08 21:40:48 +02:00
} else if (args[8] === "*") {
generatePointLayersFor = theme.layers.map((l) => l.id)
2022-01-16 01:59:06 +01:00
} else {
2021-12-07 17:46:57 +01:00
generatePointLayersFor = args[8].split(",")
}
2022-09-08 21:40:48 +02:00
console.log(
"Also generating a point overview for layers ",
generatePointLayersFor.join(",")
)
2021-12-07 17:46:57 +01:00
}
{
2022-01-16 01:59:06 +01:00
const index = args.indexOf("--force-zoom-level")
if (index >= 0) {
const forcedZoomLevel = Number(args[index + 1])
for (const layer of theme.layers) {
layer.source.geojsonSource = "https://127.0.0.1/cache_{layer}_{z}_{x}_{y}.geojson"
layer.source.isOsmCacheLayer = true
layer.source.geojsonZoomLevel = forcedZoomLevel
}
2021-12-07 17:46:57 +01:00
}
}
2022-01-16 01:59:06 +01:00
2022-09-08 21:40:48 +02:00
let failed = 0
2021-04-22 16:01:43 +02:00
do {
try {
const cachingResult = await downloadRaw(targetdir, tileRange, theme)
failed = cachingResult.failed
if (failed > 0) {
await ScriptUtils.sleep(30000)
}
} catch (e) {
2023-05-17 13:18:00 +02:00
console.error(e)
return
}
2021-04-22 16:01:43 +02:00
} while (failed > 0)
2022-09-08 21:40:48 +02:00
const extraFeatures = await downloadExtraData(theme)
const allFeaturesSource = loadAllTiles(targetdir, tileRange, theme, extraFeatures)
2023-05-17 13:18:00 +02:00
await sliceToTiles(allFeaturesSource, theme, targetdir, generatePointLayersFor, clip, zoomlevel)
}
let args = [...process.argv]
if (!args[1]?.endsWith("test/TestAll.ts")) {
args.splice(0, 2)
try {
main(args)
.then(() => console.log("All done!"))
2022-09-08 21:40:48 +02:00
.catch((e) => console.error("Error building cache:", e))
} catch (e) {
console.error("Error building cache:", e)
}
}