MapComplete/scripts/generateCache.ts

479 lines
19 KiB
TypeScript
Raw Normal View History

/**
* Generates a collection of geojson files based on an overpass query for a given theme
*/
2021-07-10 21:03:41 +02:00
import {Utils} from "../Utils";
import {Overpass} from "../Logic/Osm/Overpass";
2021-04-23 12:58:49 +02:00
import {existsSync, readFileSync, writeFileSync} from "fs";
import {TagsFilter} from "../Logic/Tags/TagsFilter";
import {Or} from "../Logic/Tags/Or";
import {AllKnownLayouts} from "../Customizations/AllKnownLayouts";
import RelationsTracker from "../Logic/Osm/RelationsTracker";
import * as OsmToGeoJson from "osmtogeojson";
import MetaTagging from "../Logic/MetaTagging";
2022-07-22 11:50:25 +02:00
import {ImmutableStore, UIEventSource} from "../Logic/UIEventSource";
import {TileRange, Tiles} from "../Models/TileRange";
import LayoutConfig from "../Models/ThemeConfig/LayoutConfig";
2021-09-10 00:00:48 +02:00
import ScriptUtils from "./ScriptUtils";
import PerLayerFeatureSourceSplitter from "../Logic/FeatureSource/PerLayerFeatureSourceSplitter";
import FilteredLayer from "../Models/FilteredLayer";
import FeatureSource, {FeatureSourceForLayer} from "../Logic/FeatureSource/FeatureSource";
import StaticFeatureSource from "../Logic/FeatureSource/Sources/StaticFeatureSource";
import TiledFeatureSource from "../Logic/FeatureSource/TiledFeatureSource/TiledFeatureSource";
2021-10-03 01:38:57 +02:00
import Constants from "../Models/Constants";
2021-10-13 00:08:41 +02:00
import {GeoOperations} from "../Logic/GeoOperations";
import SimpleMetaTaggers from "../Logic/SimpleMetaTagger";
import FilteringFeatureSource from "../Logic/FeatureSource/Sources/FilteringFeatureSource";
import Loc from "../Models/Loc";
2022-01-16 01:59:06 +01:00
2021-09-10 00:00:48 +02:00
// Runs once when this module is loaded, before any of the functions below are called.
// NOTE(review): presumably prepares `Utils` for running under node instead of the browser - confirm in ScriptUtils
ScriptUtils.fixUtils()
2021-10-03 01:38:57 +02:00
/**
 * Builds the Overpass-object which queries the data of every layer of the theme that has to be downloaded.
 *
 * A layer is left out if it is flagged with `doNotDownload`, or if it defines a geojson-source which is not
 * flagged as OSM-cache layer. A layer with a custom `overpassScript` contributes that script; every other
 * layer contributes its `osmTags`. All tag filters are combined in a single `Or`.
 *
 * @param theme the theme of which the layers are inspected
 * @param relationTracker passed on to the Overpass-object as is
 * @param backend passed on to the Overpass-object as is; the caller in this file passes the URL of an Overpass-server
 * @returns the Overpass-object
 * @throws a string if a layer is still a string (thus: not expanded), or if no layer has anything to download
 */
function createOverpassObject(theme: LayoutConfig, relationTracker: RelationsTracker, backend: string) {
    let filters: TagsFilter[] = [];
    let extraScripts: string[] = [];
    for (const layer of theme.layers) {
        if (typeof (layer) === "string") {
            throw "A layer was not expanded!"
        }
        if (layer.doNotDownload) {
            continue;
        }
        if (layer.source.geojsonSource !== undefined) {
            // This layer defines a geoJson-source
            // Should it be cached?
            if (layer.source.isOsmCacheLayer !== true) {
                continue;
            }
        }

        // A custom overpass script replaces the tag filter of the layer
        if (layer.source.overpassScript !== undefined) {
            extraScripts.push(layer.source.overpassScript)
        } else {
            filters.push(layer.source.osmTags);
        }
    }
    filters = Utils.NoNull(filters)
    extraScripts = Utils.NoNull(extraScripts)
    if (filters.length + extraScripts.length === 0) {
        throw "Nothing to download! The theme doesn't declare anything to download"
    }

    // NOTE(review): the 60 is presumably the query timeout in seconds - confirm against the constructor of Overpass
    return new Overpass(new Or(filters), extraScripts, backend,
        new UIEventSource<number>(60), relationTracker);
}
/**
 * Path of the file holding the raw, downloaded data of a single tile.
 * The result is `<targetDir>_<z>_<x>_<y>.json`; note that the zoom level comes first in the name.
 */
function rawJsonName(targetDir: string, x: number, y: number, z: number): string {
    return `${targetDir}_${z}_${x}_${y}.json`
}
/**
 * Path of the geojson-file of a single tile.
 * The result is `<targetDir>_<z>_<x>_<y>.geojson`; note that the zoom level comes first in the name.
 */
function geoJsonName(targetDir: string, x: number, y: number, z: number): string {
    return `${targetDir}_${z}_${x}_${y}.geojson`
}
/**
 * Downloads the raw data of every tile in the given range and saves it to disk, one JSON-file per tile
 * (named by `rawJsonName`). A tile of which the file already exists is not downloaded again.
 *
 * A download which throws, or a response of which the `remark` starts with "runtime error", counts as failed.
 * Nothing is written for a failed tile, so that calling this function again will retry it.
 *
 * @param targetdir prefix of the files to write
 * @param r the range of tiles to download
 * @param theme the theme which determines what is queried
 * @param relationTracker passed on to `createOverpassObject`
 * @returns the number of tiles which failed and the number of tiles which were skipped because they already exist
 */
async function downloadRaw(targetdir: string, r: TileRange, theme: LayoutConfig, relationTracker: RelationsTracker)/* : {failed: number, skipped :number} */ {
    let downloaded = 0
    let failed = 0
    let skipped = 0
    const startTime = new Date().getTime()
    for (let x = r.xstart; x <= r.xend; x++) {
        for (let y = r.ystart; y <= r.yend; y++) {
            // 'downloaded' counts every tile seen so far, including the skipped and the failed ones
            downloaded++;
            const filename = rawJsonName(targetdir, x, y, r.zoomlevel)
            if (existsSync(filename)) {
                console.log("Already exists (not downloading again): ", filename)
                skipped++
                continue;
            }

            const runningSeconds = (new Date().getTime() - startTime) / 1000
            const resting = failed + (r.total - downloaded)
            // Skipped tiles took no time, so they are left out of the average
            const perTile = (runningSeconds / (downloaded - skipped))
            const estimated = Math.floor(resting * perTile)
            console.log("total: ", downloaded, "/", r.total, "failed: ", failed, "skipped: ", skipped, "running time: ", Utils.toHumanTime(runningSeconds) + "s", "estimated left: ", Utils.toHumanTime(estimated), "(" + Math.floor(perTile) + "s/tile)")

            // Index 0 of a corner is used as latitude, index 1 as longitude.
            // min/max is used as the order of the two corners is not relied upon
            const boundsArr = Tiles.tile_bounds(r.zoomlevel, x, y)
            const bounds = {
                north: Math.max(boundsArr[0][0], boundsArr[1][0]),
                south: Math.min(boundsArr[0][0], boundsArr[1][0]),
                east: Math.max(boundsArr[0][1], boundsArr[1][1]),
                west: Math.min(boundsArr[0][1], boundsArr[1][1])
            }

            // Every failure moves on to the next server of the list
            const overpass = createOverpassObject(theme, relationTracker, Constants.defaultOverpassUrls[(failed) % Constants.defaultOverpassUrls.length])
            const url = overpass.buildQuery("[bbox:" + bounds.south + "," + bounds.west + "," + bounds.north + "," + bounds.east + "]")

            try {
                const json = await Utils.downloadJson(url)
                if ((<string>json.remark ?? "").startsWith("runtime error")) {
                    console.error("Got a runtime error: ", json.remark)
                    failed++;
                    // Do not save this response: the existing file would make the next run skip this tile,
                    // which would cache the incomplete data forever
                    continue;
                }
                if (json.elements.length === 0) {
                    console.log("Got an empty response! Writing anyway")
                }

                console.log("Got the response - writing ",json.elements.length," elements to ", filename)
                writeFileSync(filename, JSON.stringify(json, null, " "));
            } catch (err) {
                console.log(url)
                console.log("Could not download - probably hit the rate limit; waiting a bit. (" + err + ")")
                failed++;
                await ScriptUtils.sleep(1000)
            }
        }
    }

    return {failed: failed, skipped: skipped}
}
/**
 * Downloads the extra geojson sources and returns their features.
 * Extra geojson layers should not be tiled.
 *
 * Only layers which define a `geojsonSource` are downloaded. Layers of which `isOsmCacheLayer` is set to
 * anything but `false` are left out.
 *
 * @param theme the theme of which the layers are inspected
 * @returns the features of all downloaded sources, in the order of the layers
 */
async function downloadExtraData(theme: LayoutConfig)/* : any[] */ {
    const allFeatures: any[] = []
    for (const layer of theme.layers) {
        const source = layer.source.geojsonSource;
        if (source === undefined) {
            continue;
        }
        if (layer.source.isOsmCacheLayer !== undefined && layer.source.isOsmCacheLayer !== false) {
            // Cached layers are not considered here
            continue;
        }
        console.log("Downloading extra data: ", source)
        const json = await Utils.downloadJson(source)
        // Added one by one: 'push(...features)' passes every feature as an argument,
        // which throws a RangeError if the collection is big
        for (const feature of json.features) {
            allFeatures.push(feature)
        }
    }
    return allFeatures;
}
/**
 * Loads the raw data of all the tiles in the range from disk, converts every tile to geojson and
 * collects all the features, together with the given extra features, in a single feature source.
 *
 * A tile of which the file does not exist is reported on the console and left out.
 *
 * @param targetdir prefix of the files to read (the files are named by `rawJsonName`)
 * @param r the range of tiles to load
 * @param theme not used by this function
 * @param extraFeatures features which are put in front of the loaded features; this list is not modified
 * @returns the result of `StaticFeatureSource.fromGeojson` on all the features
 */
function loadAllTiles(targetdir: string, r: TileRange, theme: LayoutConfig, extraFeatures: any[]): FeatureSource {
    let allFeatures = [...extraFeatures]
    let processed = 0;
    for (let x = r.xstart; x <= r.xend; x++) {
        for (let y = r.ystart; y <= r.yend; y++) {
            processed++;
            const filename = rawJsonName(targetdir, x, y, r.zoomlevel)
            console.log(" Loading and processing", processed, "/", r.total, filename)
            if (!existsSync(filename)) {
                console.error("Not found - and not downloaded. Run this script again!: " + filename)
                continue;
            }

            // We read the raw OSM-file and convert it to a geojson
            const rawOsm = JSON.parse(readFileSync(filename, "utf8"))

            // Create the geojson - which is the main chunk of the data
            const geojson = OsmToGeoJson.default(rawOsm);
            console.log(" which as", geojson.features.length, "features")

            // Added one by one: 'push(...features)' passes every feature as an argument,
            // which throws a RangeError if a tile contains a lot of features
            for (const feature of geojson.features) {
                allFeatures.push(feature)
            }
        }
    }
    return StaticFeatureSource.fromGeojson(allFeatures)
}
/**
 * Splits all the features per layer and saves every layer which is flagged as OSM-cache layer to disk:
 * - one geojson-file per tile (named by `geoJsonName`), at the `geojsonZoomLevel` of the layer (0 if not set)
 * - an overview-file which lists, per x-coordinate, the y-coordinates of the tiles that were written
 * - for the layers listed in `pointsOnlyLayers`: a geojson-file with the centerpoint of every feature
 *
 * Layers which are not flagged as OSM-cache layer are skipped and reported in a warning.
 *
 * NOTE(review): `handleLayer` is async and this function returns synchronously without awaiting it.
 * Whether `PerLayerFeatureSourceSplitter` waits for the handler cannot be seen from here - files might still be
 * written after this function has returned.
 *
 * @param allFeatures all the features, of all the layers
 * @param theme the theme of which the layers are handled
 * @param relationsTracker passed on to the metatagging as `memberships`
 * @param targetdir prefix of all the files that are written
 * @param pointsOnlyLayers the ids of the layers for which a points-only file is written
 */
function sliceToTiles(allFeatures: FeatureSource, theme: LayoutConfig, relationsTracker: RelationsTracker, targetdir: string, pointsOnlyLayers: string[]) {
    const skippedLayers = new Set<string>()

    // Index of all the features by id; built lazily on the first lookup
    const indexedFeatures: Map<string, any> = new Map<string, any>()
    let indexisBuilt = false;

    function buildIndex() {
        for (const ff of allFeatures.features.data) {
            const f = ff.feature
            indexedFeatures.set(f.properties.id, f)
        }
        indexisBuilt = true;
    }

    function getFeatureById(id) {
        if (!indexisBuilt) {
            buildIndex()
        }
        return indexedFeatures.get(id)
    }

    async function handleLayer(source: FeatureSourceForLayer) {
        const layer = source.layer.layerDef;
        const targetZoomLevel = layer.source.geojsonZoomLevel ?? 0

        const layerId = layer.id
        if (layer.source.isOsmCacheLayer !== true) {
            console.log("Skipping layer ", layerId, ": not a caching layer")
            skippedLayers.add(layer.id)
            return;
        }
        console.log("Handling layer ", layerId, "which has", source.features.data.length, "features")
        if (source.features.data.length === 0) {
            return;
        }
        MetaTagging.addMetatags(source.features.data,
            {
                memberships: relationsTracker,
                // The bounding box is ignored: all the features are returned, as a single list
                getFeaturesWithin: _ => {
                    return [allFeatures.features.data.map(f => f.feature)]
                },
                getFeatureById: getFeatureById
            },
            layer,
            {},
            {
                includeDates: false,
                includeNonDates: true,
                evaluateStrict: true
            });

        // Poll until no country-task is running anymore
        while (SimpleMetaTaggers.country.runningTasks.size > 0) {
            console.log("Still waiting for ", SimpleMetaTaggers.country.runningTasks.size, " features which don't have a country yet")
            await ScriptUtils.sleep(1)
        }

        const createdTiles = []
        // At this point, we have all the features of the entire area.
        // However, we want to export them per tile of a fixed size, so we use a tiled feature source to split it up
        TiledFeatureSource.createHierarchy(source, {
            minZoomLevel: targetZoomLevel,
            maxZoomLevel: targetZoomLevel,
            maxFeatureCount: undefined,
            registerTile: tile => {
                const tileIndex = tile.tileIndex;
                console.log("Got tile:", tileIndex, tile.layer.layerDef.id)
                if (tile.features.data.length === 0) {
                    return
                }

                const filteredTile = new FilteringFeatureSource({
                        locationControl: new ImmutableStore<Loc>(undefined),
                        allElements: undefined,
                        selectedElement: new ImmutableStore<any>(undefined),
                        globalFilters: new ImmutableStore([])
                    },
                    tileIndex,
                    tile,
                    new UIEventSource<any>(undefined)
                )

                console.log("Tile " + layer.id + "." + tileIndex + " contains " + filteredTile.features.data.length + " features after filtering (" + tile.features.data.length + ") features before")
                if (filteredTile.features.data.length === 0) {
                    return
                }

                let strictlyCalculated = 0
                let featureCount = 0
                for (const feature of filteredTile.features.data) {
                    // Some cleanup
                    delete feature.feature["bbox"]

                    if (tile.layer.layerDef.calculatedTags !== undefined) {
                        // Evaluate all the calculated tags strictly
                        const calculatedTagKeys = tile.layer.layerDef.calculatedTags.map(ct => ct[0])
                        featureCount++
                        const props = feature.feature.properties
                        for (const calculatedTagKey of calculatedTagKeys) {
                            // The value is read, the property is removed and the value is assigned again.
                            // NOTE(review): presumably this replaces a lazily evaluated getter by its plain value,
                            // so that the value ends up in the written file - confirm against MetaTagging
                            const strict = props[calculatedTagKey]
                            if(props.hasOwnProperty(calculatedTagKey)){
                                delete props[calculatedTagKey]
                            }
                            props[calculatedTagKey] = strict
                            strictlyCalculated++;
                            if (strictlyCalculated % 100 === 0) {
                                console.log("Strictly calculated ", strictlyCalculated, "values for tile", tileIndex, ": now at ", featureCount, "/", filteredTile.features.data.length, "examle value: ", strict)
                            }
                        }
                    }
                }

                // Lets save this tile!
                const [z, x, y] = Tiles.tile_from_index(tileIndex)
                // console.log("Writing tile ", z, x, y, layerId)
                const targetPath = geoJsonName(targetdir + "_" + layerId, x, y, z)
                createdTiles.push(tileIndex)
                // This is the geojson file containing all features for this tile
                writeFileSync(targetPath, JSON.stringify({
                    type: "FeatureCollection",
                    features: filteredTile.features.data.map(f => f.feature)
                }, null, " "))
                console.log("Written tile", targetPath, "with", filteredTile.features.data.length)
            }
        })

        // All the tiles are written at this point
        // Only thing left to do is to create the index
        const path = targetdir + "_" + layerId + "_" + targetZoomLevel + "_overview.json"
        // Maps every x-coordinate (as string) onto the list of y-coordinates for which a tile was written
        const perX = {}
        createdTiles.map(i => Tiles.tile_from_index(i)).forEach(([z, x, y]) => {
            const key = "" + x
            if (perX[key] === undefined) {
                perX[key] = []
            }
            perX[key].push(y)
        })
        console.log("Written overview: ", path, "with ", createdTiles.length, "tiles")
        writeFileSync(path, JSON.stringify(perX))

        // And, if needed, to create a points-only layer
        if (pointsOnlyLayers.indexOf(layer.id) >= 0) {
            const filtered = new FilteringFeatureSource({
                    locationControl: new ImmutableStore<Loc>(undefined),
                    allElements: undefined,
                    selectedElement: new ImmutableStore<any>(undefined),
                    globalFilters: new ImmutableStore([])
                },
                Tiles.tile_index(0, 0, 0),
                source,
                new UIEventSource<any>(undefined)
            )
            const features = filtered.features.data.map(f => f.feature)

            const points = features.map(feature => GeoOperations.centerpoint(feature))
            console.log("Writing points overview for ", layerId)
            const targetPath = targetdir + "_" + layerId + "_points.geojson"
            // This is the geojson file containing the centerpoint of every (filtered) feature of the layer
            writeFileSync(targetPath, JSON.stringify({
                type: "FeatureCollection",
                features: points
            }, null, " "))
        }
    }

    // Every layer of the theme is handed to the splitter as a displayed layer without applied filters;
    // 'handleLayer' is passed as the handler
    new PerLayerFeatureSourceSplitter(
        new UIEventSource<FilteredLayer[]>(theme.layers.map(l => ({
            layerDef: l,
            isDisplayed: new UIEventSource<boolean>(true),
            appliedFilters: new UIEventSource(undefined)
        }))),
        handleLayer,
        allFeatures
    )

    const skipped = Array.from(skippedLayers)
    if (skipped.length > 0) {
        console.warn("Did not save any cache files for layers " + skipped.join(", ") + " as these didn't set the flag `isOsmCache` to true")
    }
}
2021-04-23 20:09:27 +02:00
2022-02-14 01:15:20 +01:00
/**
 * Entry point of the cache builder: downloads the raw data of a theme for a bounding box and
 * slices it into cache files per layer and per tile.
 *
 * Expected arguments: `theme zoomlevel targetdirectory lat0 lon0 lat1 lon1`, optionally followed by
 * `--generate-point-overview layer-name,layer-name,...` (or `*` for all layers) and/or `--force-zoom-level z`.
 * The options are recognised in any order.
 *
 * The usage is printed (and nothing is done) if not all seven required arguments are given.
 * Nothing is done either if the tile range is empty or if the theme is not known.
 *
 * @param args the command line arguments, without the executable and the script name
 * @throws a string if the target directory does not exist, if a coordinate or the forced zoom level
 *         is not a number, or if `--generate-point-overview` is not followed by a list of layers
 */
export async function main(args: string[]) {
    console.log("Cache builder started with args ", args.join(", "))
    // Seven arguments are required: the theme, the zoomlevel, the target directory and four coordinates
    if (args.length < 7) {
        console.error("Expected arguments are: theme zoomlevel targetdirectory lat0 lon0 lat1 lon1 [--generate-point-overview layer-name,layer-name,...] [--force-zoom-level z] \n" +
            "Note: a new directory named <theme> will be created in targetdirectory")
        return;
    }
    const themeName = args[0]
    const zoomlevel = Number(args[1])
    const targetdir = args[2] + "/" + themeName
    if (!existsSync(args[2])) {
        console.log("Directory not found")
        throw `The directory ${args[2]} does not exist`
    }
    const lat0 = Number(args[3])
    const lon0 = Number(args[4])
    const lat1 = Number(args[5])
    const lon1 = Number(args[6])

    if (isNaN(lat0)) {
        throw "The first number (a latitude) is not a valid number"
    }
    if (isNaN(lon0)) {
        throw "The second number (a longitude) is not a valid number"
    }
    if (isNaN(lat1)) {
        throw "The third number (a latitude) is not a valid number"
    }
    if (isNaN(lon1)) {
        throw "The fourth number (a longitude) is not a valid number"
    }

    const tileRange = Tiles.TileRangeBetween(zoomlevel, lat0, lon0, lat1, lon1)
    if (isNaN(tileRange.total)) {
        throw "Something has gone wrong: tilerange is NAN"
    }
    if (tileRange.total === 0) {
        console.log("Tilerange has zero tiles - this is probably an error")
        return
    }

    const theme = AllKnownLayouts.allKnownLayouts.get(themeName)
    if (theme === undefined) {
        const keys = []
        AllKnownLayouts.allKnownLayouts.forEach((_, key) => {
            keys.push(key)
        })
        // 'theme' is undefined here, the requested name is what has to be reported
        console.error("The theme " + themeName + " was not found; try one of ", keys);
        return
    }

    let generatePointLayersFor: string[] = []
    // Only searched behind the seven required arguments; the option might come before or after --force-zoom-level
    const pointOverviewIndex = args.indexOf("--generate-point-overview", 7)
    if (pointOverviewIndex >= 0) {
        const layerList = args[pointOverviewIndex + 1]
        if (layerList === undefined) {
            throw "--generate-point-overview needs a list of layers to generate the overview for (or * for all)"
        } else if (layerList === '*') {
            generatePointLayersFor = theme.layers.map(l => l.id)
        } else {
            generatePointLayersFor = layerList.split(",")
        }
        console.log("Also generating a point overview for layers ", generatePointLayersFor.join(","))
    }

    {
        const index = args.indexOf("--force-zoom-level")
        if (index >= 0) {
            const forcedZoomLevel = Number(args[index + 1])
            if (isNaN(forcedZoomLevel)) {
                throw "--force-zoom-level needs a zoom level (a number)"
            }
            // Every layer is turned into a cache layer, which is to be sliced at the forced zoom level
            for (const layer of theme.layers) {
                layer.source.geojsonSource = "https://127.0.0.1/cache_{layer}_{z}_{x}_{y}.geojson"
                layer.source.isOsmCacheLayer = true
                layer.source.geojsonZoomLevel = forcedZoomLevel
            }
        }
    }

    const relationTracker = new RelationsTracker()

    // Keep downloading until no tile fails anymore, with a pause of 30000ms between two rounds.
    // downloadRaw does not download the tiles again which are already saved to disk
    let failed = 0;
    do {
        const cachingResult = await downloadRaw(targetdir, tileRange, theme, relationTracker)
        failed = cachingResult.failed
        if (failed > 0) {
            await ScriptUtils.sleep(30000)
        }
    } while (failed > 0)

    const extraFeatures = await downloadExtraData(theme);
    const allFeaturesSource = loadAllTiles(targetdir, tileRange, theme, extraFeatures)
    sliceToTiles(allFeaturesSource, theme, relationTracker, targetdir, generatePointLayersFor)
}
// Command line entry point. Nothing is started if the second element of the process arguments ends
// with "test/TestAll.ts"; in every other case, 'main' is run.
let args = [...process.argv]
if (args[1]?.endsWith("test/TestAll.ts")) {
    // Do not build anything
} else {
    const reportFailure = (e) => console.error("Error building cache:", e)
    // The first two elements are the executable and the script itself, only the rest is of interest to 'main'
    args.splice(0, 2)
    try {
        main(args)
            .then(() => {
                console.log("All done!")
            })
            .catch(reportFailure);
    } catch (e) {
        reportFailure(e)
    }
}