MapComplete/Docs/Tools/GenerateSeries.ts

862 lines
29 KiB
TypeScript
Raw Normal View History

import {existsSync, mkdirSync, readdirSync, readFileSync, writeFileSync} from "fs";
2021-08-22 15:53:05 +02:00
import ScriptUtils from "../../scripts/ScriptUtils";
import {Utils} from "../../Utils";
import {exec} from "child_process"
import {GeoOperations} from "../../Logic/GeoOperations";
2022-02-14 01:15:20 +01:00
ScriptUtils.fixUtils()
2021-08-22 15:53:05 +02:00
class StatsDownloader {
private readonly startYear = 2020
private readonly startMonth = 5;
private readonly urlTemplate = "https://osmcha.org/api/v1/changesets/?date__gte={start_date}&date__lte={end_date}&page={page}&comment=%23mapcomplete&page_size=100"
2021-08-22 15:53:05 +02:00
private readonly _targetDirectory: string;
constructor(targetDirectory = ".") {
this._targetDirectory = targetDirectory;
}
public async DownloadStats() {
2022-07-16 01:01:51 +02:00
const today = new Date();
const currentYear = today.getFullYear()
const currentMonth = today.getMonth() + 1
2021-08-22 15:53:05 +02:00
for (let year = this.startYear; year <= currentYear; year++) {
for (let month = 1; month <= 12; month++) {
if (year === this.startYear && month < this.startMonth) {
continue;
}
if (year === currentYear && month > currentMonth) {
2022-07-16 01:01:51 +02:00
break
2021-08-22 15:53:05 +02:00
}
2022-07-16 01:01:51 +02:00
const pathM = `${this._targetDirectory}/stats.${year}-${month}.json`
if (existsSync(pathM)) {
continue;
}
for (let day = 1; day <= 31; day++) {
if (year === currentYear && month === currentMonth && day === today.getDate() ) {
break;
2021-08-22 15:53:05 +02:00
}
2022-07-29 23:25:22 +02:00
const path = `${this._targetDirectory}/stats.${year}-${month}-${(day < 10 ? "0" : "") + day}.json`
2022-07-16 01:01:51 +02:00
if(existsSync(path)){
2022-07-29 23:25:22 +02:00
console.log("Skipping ", path,": already exists")
2022-07-16 01:01:51 +02:00
continue
}
2022-07-29 23:25:22 +02:00
try{
2022-07-16 01:01:51 +02:00
await this.DownloadStatsForDay(year, month, day, path)
2022-07-29 23:25:22 +02:00
}catch(e){
console.error(e)
console.error("Could not download "+year+"-"+month+"-"+day+"... Trying again")
try{
await this.DownloadStatsForDay(year, month, day, path)
}catch(e){
console.error("Could not download "+year+"-"+month+"-"+day+", skipping for now")
}
}
2021-08-22 15:53:05 +02:00
}
}
}
}
2022-07-16 01:01:51 +02:00
public async DownloadStatsForDay(year: number, month: number, day: number, path: string) {
2021-08-22 15:53:05 +02:00
let page = 1;
let allFeatures = []
2022-07-16 01:01:51 +02:00
let endDay = new Date(year,month - 1 /* Zero-indexed: 0 = january*/,day + 1);
let endDate = `${endDay.getFullYear()}-${Utils.TwoDigits(endDay.getMonth()+1)}-${Utils.TwoDigits(endDay.getDate())}`
let url = this.urlTemplate.replace("{start_date}", year + "-" + Utils.TwoDigits(month) + "-" + Utils.TwoDigits(day))
2021-08-22 15:53:05 +02:00
.replace("{end_date}", endDate)
.replace("{page}", "" + page)
let headers = {
'User-Agent': 'Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:86.0) Gecko/20100101 Firefox/86.0',
'Accept-Language': 'en-US,en;q=0.5',
'Referer': 'https://osmcha.org/?filters=%7B%22date__gte%22%3A%5B%7B%22label%22%3A%222020-07-05%22%2C%22value%22%3A%222020-07-05%22%7D%5D%2C%22editor%22%3A%5B%7B%22label%22%3A%22mapcomplete%22%2C%22value%22%3A%22mapcomplete%22%7D%5D%7D',
'Content-Type': 'application/json',
'Authorization': 'Token 6e422e2afedb79ef66573982012000281f03dc91',
'DNT': '1',
'Connection': 'keep-alive',
'TE': 'Trailers',
'Pragma': 'no-cache',
'Cache-Control': 'no-cache'
}
while (url) {
2022-07-16 01:01:51 +02:00
ScriptUtils.erasableLog(`Downloading stats for ${year}-${month}-${day}, page ${page} ${url}`)
2022-02-14 01:15:20 +01:00
const result = await Utils.downloadJson(url, headers)
2021-08-22 15:53:05 +02:00
page++;
allFeatures.push(...result.features)
if (result.features === undefined) {
console.log("ERROR", result)
return
}
url = result.next
}
2022-01-16 02:52:46 +01:00
console.log(`Writing ${allFeatures.length} features to `, path, Utils.Times(_ => " ", 80))
allFeatures = Utils.NoNull(allFeatures)
allFeatures.forEach(f => {
f.properties.id = f.id
})
2021-08-22 15:53:05 +02:00
writeFileSync(path, JSON.stringify({
features: allFeatures
}, undefined, 2))
}
}
interface ChangeSetData {
"id": number,
"type": "Feature",
"geometry": {
"type": "Polygon",
"coordinates": [number, number][][]
},
"properties": {
"check_user": null,
"reasons": [],
"tags": [],
"features": [],
"user": string,
"uid": string,
"editor": string,
"comment": string,
"comments_count": number,
"source": string,
"imagery_used": string,
"date": string,
"reviewed_features": [],
"create": number,
"modify": number,
"delete": number,
"area": number,
"is_suspect": boolean,
"harmful": any,
"checked": boolean,
"check_date": any,
"metadata": {
"host": string,
"theme": string,
"imagery": string,
"language": string
}
}
}
const theme_remappings = {
"metamap": "maps",
"groen": "buurtnatuur",
"updaten van metadata met mapcomplete": "buurtnatuur",
"Toevoegen of dit natuurreservaat toegangkelijk is": "buurtnatuur",
"wiki:mapcomplete/fritures": "fritures",
"wiki:MapComplete/Fritures": "fritures",
"lits": "lit",
"pomp": "cyclofix",
"wiki:user:joost_schouppe/campersite": "campersite",
"wiki-user-joost_schouppe-geveltuintjes": "geveltuintjes",
"wiki-user-joost_schouppe-campersite": "campersite",
"wiki-User-joost_schouppe-campersite": "campersite",
"wiki-User-joost_schouppe-geveltuintjes": "geveltuintjes",
"wiki:User:joost_schouppe/campersite": "campersite",
"arbres": "arbres_llefia",
"aed_brugge": "aed",
"https://llefia.org/arbres/mapcomplete.json": "arbres_llefia",
"https://llefia.org/arbres/mapcomplete1.json": "arbres_llefia",
"toevoegen of dit natuurreservaat toegangkelijk is": "buurtnatuur",
"testing mapcomplete 0.0.0": "buurtnatuur",
"https://raw.githubusercontent.com/osmbe/play/master/mapcomplete/geveltuinen/geveltuinen.json": "geveltuintjes"
}
class ChangesetDataTools {
public static cleanChangesetData(cs: ChangeSetData): ChangeSetData {
if (cs.properties.metadata.theme === undefined) {
cs.properties.metadata.theme = cs.properties.comment.substr(cs.properties.comment.lastIndexOf("#") + 1)
}
cs.properties.metadata.theme = cs.properties.metadata.theme.toLowerCase()
const remapped = theme_remappings[cs.properties.metadata.theme]
cs.properties.metadata.theme = remapped ?? cs.properties.metadata.theme
if (cs.properties.metadata.theme.startsWith("https://raw.githubusercontent.com/")) {
cs.properties.metadata.theme = "gh://" + cs.properties.metadata.theme.substr("https://raw.githubusercontent.com/".length)
}
if (cs.properties.modify + cs.properties.delete + cs.properties.create == 0) {
cs.properties.metadata.theme = "EMPTY CS"
2022-03-17 16:40:53 +01:00
}
try {
cs.properties.metadata.host = new URL(cs.properties.metadata.host).host
} catch (e) {
}
2022-07-16 01:01:51 +02:00
if (cs.properties.metadata["answer"] > 100) {
console.log("Lots of answers for https://osm.org/changeset/" + cs.id)
2021-08-22 15:53:05 +02:00
}
return cs
}
}
interface PlotSpec {
name: string,
interpetKeysAs: "date" | "number" | "string" | string
plot: {
type: "pie" | "bar" | "line"
2021-08-22 15:53:05 +02:00
count: { key: string, value: number }[]
} | {
type: "stacked-bar"
count: {
label: string,
2022-03-17 16:40:53 +01:00
values: { key: string | Date, value: number }[],
color?: string
2021-08-22 15:53:05 +02:00
}[]
},
2022-03-17 16:40:53 +01:00
render(): Promise<void>
2021-08-22 15:53:05 +02:00
}
function createGraph(
title: string,
2022-03-17 16:40:53 +01:00
...options: PlotSpec[]): Promise<void> {
console.log("Creating graph", title, "...")
2022-07-16 01:01:51 +02:00
const process = exec("python3 Docs/Tools/GenPlot.py \"graphs/" + title + "\"", ((error, stdout, stderr) => {
2021-08-22 15:53:05 +02:00
console.log("Python: ", stdout)
if (error !== null) {
console.error(error)
}
if (stderr !== "") {
console.error(stderr)
}
}))
for (const option of options) {
const d = JSON.stringify(option) + "\n"
process.stdin._write(d, "utf-8", undefined)
2021-08-22 15:53:05 +02:00
}
process.stdin._write("\n", "utf-8", undefined)
2022-03-17 16:40:53 +01:00
return new Promise((resolve) => {
process.on("exit", () => resolve())
})
2021-08-22 15:53:05 +02:00
}
class Histogram<K> {
public counts: Map<K, number> = new Map<K, number>()
private sortAtEnd: K[] = []
constructor(keys?: K[]) {
const self = this
keys?.forEach(key => self.bump(key))
}
total(): number {
let total = 0
Array.from(this.counts.values()).forEach(i => total = total + i)
return total
}
2021-08-22 15:53:05 +02:00
public bump(key: K, increase = 1) {
2021-08-22 15:53:05 +02:00
if (this.counts.has(key)) {
this.counts.set(key, increase + this.counts.get(key))
} else {
this.counts.set(key, increase)
}
}
/**
* Adds all the values of the given histogram to this histogram
* @param hist
*/
public bumpHist(hist: Histogram<K>) {
const self = this
hist.counts.forEach((value, key) => {
self.bump(key, value)
})
}
/**
* Creates a new histogram. All entries with less then 'cutoff' count are lumped together into the 'other' category
*/
public createOthersCategory(otherName: K, cutoff: number | ((key: K, value: number) => boolean) = 15): Histogram<K> {
const hist = new Histogram<K>()
hist.sortAtEnd.push(otherName)
if (typeof cutoff === "number") {
this.counts.forEach((value, key) => {
if (value <= cutoff) {
hist.bump(otherName, value)
} else {
hist.bump(key, value)
}
})
} else {
this.counts.forEach((value, key) => {
if (cutoff(key, value)) {
hist.bump(otherName, value)
} else {
hist.bump(key, value)
}
})
}
return hist;
}
public addCountToName(): Histogram<string> {
const self = this;
const hist = new Histogram<string>()
hist.sortAtEnd = this.sortAtEnd.map(name => `${name} (${self.counts.get(name)})`)
this.counts.forEach((value, key) => {
hist.bump(`${key} (${value})`, value)
})
return hist;
}
public Clone(): Histogram<K> {
const hist = new Histogram<K>()
hist.bumpHist(this)
hist.sortAtEnd = [...this.sortAtEnd];
return hist;
}
public keyToDate(addMissingDays: boolean = false): Histogram<Date> {
const hist = new Histogram<Date>()
hist.sortAtEnd = this.sortAtEnd.map(name => new Date("" + name))
let earliest = undefined;
let latest = undefined;
this.counts.forEach((value, key) => {
const d = new Date("" + key);
if (earliest === undefined) {
earliest = d
} else if (d < earliest) {
earliest = d
}
if (latest === undefined) {
latest = d
} else if (d > latest) {
latest = d
}
hist.bump(d, value)
})
if (addMissingDays) {
while (earliest < latest) {
earliest.setDate(earliest.getDate() + 1)
hist.bump(earliest, 0)
}
}
return hist
}
public asRunningAverages(convertToRange: ((key: K) => K[])) {
const newCount = new Histogram<K>()
const self = this
this.counts.forEach((_, key) => {
const keysToCheck = convertToRange(key)
let sum = 0
for (const k of keysToCheck) {
sum += self.counts.get(k) ?? 0
}
newCount.bump(key, sum / keysToCheck.length)
})
return newCount
}
2021-08-22 15:53:05 +02:00
/**
* Given a histogram:
* 'a': 3
* 'b': 5
* 'c': 3
* 'd': 1
*
* This will create a new histogram, which counts how much every count occurs, thus:
* 5: 1 // as only 'b' had 5 counts
* 3: 2 // as both 'a' and 'c' had 3 counts
* 1: 1 // as only 'd' has 1 count
*/
public binPerCount(): Histogram<number> {
const hist = new Histogram<number>()
this.counts.forEach((value) => {
hist.bump(value)
})
return hist;
}
public stringifyName(): Histogram<string> {
const hist = new Histogram<string>()
this.counts.forEach((value, key) => {
hist.bump("" + key, value)
})
return hist;
}
public asPie(options: {
name: string
compare?: (a: K, b: K) => number
}): PlotSpec {
const self = this
const entriesArray = Array.from(this.counts.entries())
let type: string = (typeof entriesArray[0][0])
if (entriesArray[0][0] instanceof Date) {
type = "date"
}
const entries = entriesArray.map(kv => {
return ({key: kv[0], value: kv[1]});
})
if (options.compare) {
entries.sort((a, b) => options.compare(a.key, b.key))
} else {
entries.sort((a, b) => b.value - a.value)
}
entries.sort((a, b) => self.sortAtEnd.indexOf(a.key) - self.sortAtEnd.indexOf(b.key))
const graph: PlotSpec = {
name: options.name,
interpetKeysAs: type,
plot: {
type: "pie",
count: entries.map(kv => {
if (kv.key instanceof Date) {
return ({key: kv.key.toISOString(), value: kv.value})
}
return ({key: kv.key + "", value: kv.value});
})
},
render: undefined
}
2022-03-17 16:40:53 +01:00
graph.render = async () => await createGraph(graph.name, graph)
2021-08-22 15:53:05 +02:00
return graph;
}
public asBar(options: {
name: string
2022-03-17 16:40:53 +01:00
compare?: (a: K, b: K) => number,
color?: string
2021-08-22 15:53:05 +02:00
}): PlotSpec {
const spec = this.asPie(options)
spec.plot.type = "bar"
2022-03-17 16:40:53 +01:00
spec.plot["color"] = options.color
2021-08-22 15:53:05 +02:00
return spec;
}
public asLine(options: {
name: string
compare?: (a: K, b: K) => number
}) {
const spec = this.asPie(options)
spec.plot.type = "line"
return spec
}
2021-08-22 15:53:05 +02:00
}
2022-03-17 16:40:53 +01:00
/**
* A group keeps track of a matrix of changes, e.g.
* 'All contributors per day'. This will be stored internally, e.g. as {'2022-03-16' --> ['Pieter Vander Vennet', 'Pieter Vander Vennet', 'Joost Schouppe', 'Pieter Vander Vennet', 'dentonny', ...]}
*/
2021-08-22 15:53:05 +02:00
class Group<K, V> {
public groups: Map<K, V[]> = new Map<K, V[]>()
constructor(features?: any[], fkey?: (feature: any) => K, fvalue?: (feature: any) => V) {
const self = this;
features?.forEach(f => {
self.bump(fkey(f), fvalue(f))
})
}
public static createStackedBarChartPerDay(name: string, features: any, extractV: (feature: any) => string, minNeededTotal = 1): void {
const perDay = new Group<string, string>(
features,
f => f.properties.date.substr(0, 10),
extractV
)
createGraph(
name,
...Array.from(
stackHists<string, string>(
perDay.asGroupedHists()
.filter(tpl => tpl[1].total() > minNeededTotal)
.map(tpl => [`${tpl[0]} (${tpl[1].total()})`, tpl[1]])
)
)
.map(
tpl => {
const [name, hist] = tpl
return hist
.keyToDate(true)
.asBar({
name: name
});
}
)
)
}
public bump(key: K, value: V) {
if (!this.groups.has(key)) {
this.groups.set(key, [])
}
this.groups.get(key).push(value)
}
public asHist(dedup = false): Histogram<K> {
const hist = new Histogram<K>()
this.groups.forEach((values, key) => {
if (dedup) {
hist.bump(key, new Set(values).size)
} else {
hist.bump(key, values.length)
}
})
return hist
}
2022-03-17 16:40:53 +01:00
/**
* Given a group, creates a kind of histogram.
* E.g: if the Group is {'2022-03-16' --> ['Pieter Vander Vennet', 'Pieter Vander Vennet', 'Seppe Santens']}, the resulting 'groupedHists' will be:
* [['Pieter Vander Vennet', {'2022-03-16' --> 2}],['Seppe Santens', {'2022-03-16' --> 1}]]
*/
2021-08-22 15:53:05 +02:00
asGroupedHists(): [V, Histogram<K>][] {
const allHists = new Map<V, Histogram<K>>()
const allValues = new Set<V>();
Array.from(this.groups.values()).forEach(vs =>
vs.forEach(v => {
allValues.add(v)
})
)
allValues.forEach(v => allHists.set(v, new Histogram<K>()))
this.groups.forEach((values, key) => {
values.forEach(v => {
allHists.get(v).bump(key)
})
})
return Array.from(allHists.entries())
}
}
2022-03-17 16:40:53 +01:00
/**
*
* @param hists
*/
2021-08-22 15:53:05 +02:00
function stackHists<K, V>(hists: [V, Histogram<K>][]): [V, Histogram<K>][] {
const runningTotals = new Histogram<K>()
const result: [V, Histogram<K>][] = []
hists.forEach(vhist => {
const hist = vhist[1]
const clone = hist.Clone()
clone.bumpHist(runningTotals)
runningTotals.bumpHist(hist)
result.push([vhist[0], clone])
})
2022-02-22 14:13:41 +01:00
result.reverse(/* Changes in place, safe copy*/)
2021-08-22 15:53:05 +02:00
return result
}
2022-03-17 16:40:53 +01:00
/**
* Given histograms which should be shown as bars on top of each other, creates a new list of histograms with adjusted heights in order to create a coherent sum
* e.g.: for a given day, there are 2 deletions, 3 additions and 5 answers, this will be ordered as 2, 5 and 10 in order to mimic a coherent bar
* @param hists
*/
function stackHistsSimple<K>(hists: Histogram<K>[]): Histogram<K>[] {
const runningTotals = new Histogram<K>()
const result: Histogram<K>[] = []
for (const hist of hists) {
const clone = hist.Clone()
clone.bumpHist(runningTotals) // "Copies" one histogram into the other
runningTotals.bumpHist(hist)
result.push(clone)
}
result.reverse(/* Changes in place, safe copy*/)
return result
}
function createActualChangesGraph(allFeatures: ChangeSetData[], appliedFilterDescription: string) {
const metadataOptions = {
"answer": "#5b5bdc",
"create": "#46ea46",
"move": "#ffa600",
"deletion": "#ff0000",
"soft-delete": "#ff8888",
"add-image": "#8888ff",
"import": "#00ff00",
"conflation": "#ffff00",
"split": "#000000",
"relation-fix": "#cccccc",
"delete-image": "#ff00ff"
}
const metadataKeys: string[] = Object.keys(metadataOptions)
const histograms: Map<string, Histogram<string>> = new Map<string, Histogram<string>>() // {metakey --> Histogram<date>}
allFeatures.forEach(f => {
const day = f.properties.date.substr(0, 10)
for (const key of metadataKeys) {
const v = f.properties.metadata[key]
if (v === undefined) {
continue
}
const count = Number(v)
if (isNaN(count)) {
continue
}
if (!histograms.has(key)) {
histograms.set(key, new Histogram<string>())
}
histograms.get(key).bump(day, count)
}
})
2021-08-22 15:53:05 +02:00
2022-03-17 16:40:53 +01:00
const entries = stackHists(Array.from(histograms.entries()))
const allGraphs = entries.map(([name, stackedHist]) => {
const hist = histograms.get(name)
return stackedHist
.keyToDate(true)
.asBar({name: `${name} (${hist.total()})`, color: metadataOptions[name]});
}
)
createGraph("Actual changes" + appliedFilterDescription, ...allGraphs)
}
async function createGraphs(allFeatures: ChangeSetData[], appliedFilterDescription: string, cutoff = undefined) {
2021-08-22 15:53:05 +02:00
const hist = new Histogram<string>(allFeatures.map(f => f.properties.metadata.theme))
2022-03-17 16:40:53 +01:00
await hist
2022-03-11 00:17:34 +01:00
.createOthersCategory("other", cutoff ?? 20)
2021-08-22 15:53:05 +02:00
.addCountToName()
.asBar({name: "Changesets per theme (bar)" + appliedFilterDescription})
2022-03-17 16:40:53 +01:00
.render()
2021-08-22 15:53:05 +02:00
2022-03-17 16:40:53 +01:00
await new Histogram<string>(allFeatures.map(f => f.properties.user))
2021-08-22 15:53:05 +02:00
.binPerCount()
.stringifyName()
2022-03-17 16:40:53 +01:00
.createOthersCategory("25 or more", (key, _) => Number(key) >= (cutoff ?? 25)).asBar(
{
compare: (a, b) => Number(a) - Number(b),
name: "Contributors per changeset count" + appliedFilterDescription
})
.render()
const csPerDay = new Histogram<string>(allFeatures.map(f => f.properties.date.substr(0, 10)))
const perDayLine = csPerDay
.keyToDate()
.asLine({
compare: (a, b) => a.getTime() - b.getTime(),
name: "Changesets per day" + appliedFilterDescription
})
const perDayAvg = csPerDay.asRunningAverages(key => {
const keys = []
for (let i = 0; i < 7; i++) {
const otherDay = new Date(new Date(key).getTime() - i * 1000 * 60 * 60 * 24)
keys.push(otherDay.toISOString().substr(0, 10))
}
return keys
})
2022-03-17 16:40:53 +01:00
.keyToDate(true)
.asLine({
2022-03-17 16:40:53 +01:00
compare: (a, b) => a.getTime() - b.getTime(),
name: "Rolling 7 day average" + appliedFilterDescription
})
2021-12-13 17:50:47 +01:00
const perDayAvgMonth = csPerDay.asRunningAverages(key => {
const keys = []
for (let i = 0; i < 31; i++) {
const otherDay = new Date(new Date(key).getTime() - i * 1000 * 60 * 60 * 24)
keys.push(otherDay.toISOString().substr(0, 10))
}
return keys
})
.keyToDate()
.asLine({
2022-03-17 16:40:53 +01:00
compare: (a, b) => a.getTime() - b.getTime(),
name: "Rolling 31 day average" + appliedFilterDescription
})
await createGraph("Changesets per day (line)" + appliedFilterDescription, perDayLine, perDayAvg, perDayAvgMonth)
2021-08-22 15:53:05 +02:00
2022-03-17 16:40:53 +01:00
await new Histogram<string>(allFeatures.map(f => f.properties.metadata.host))
2021-08-22 15:53:05 +02:00
.asPie({
2021-08-22 22:08:14 +02:00
name: "Changesets per host" + appliedFilterDescription
2021-08-22 15:53:05 +02:00
}).render()
2022-03-17 16:40:53 +01:00
await new Histogram<string>(allFeatures.map(f => f.properties.metadata.theme))
2022-03-11 00:17:34 +01:00
.createOthersCategory("< 25 changesets", (cutoff ?? 25))
2021-09-08 17:32:31 +02:00
.addCountToName()
.asPie({
name: "Changesets per theme (pie)" + appliedFilterDescription
}).render()
2021-08-22 15:53:05 +02:00
Group.createStackedBarChartPerDay(
"Changesets per theme" + appliedFilterDescription,
allFeatures,
f => f.properties.metadata.theme,
2022-03-11 00:17:34 +01:00
cutoff ?? 25
2021-08-22 15:53:05 +02:00
)
2022-03-17 16:40:53 +01:00
2021-08-22 15:53:05 +02:00
Group.createStackedBarChartPerDay(
"Changesets per version number" + appliedFilterDescription,
allFeatures,
f => f.properties.editor?.substr("MapComplete ".length, 6)?.replace(/[a-zA-Z-/]/g, '') ?? "UNKNOWN",
2022-03-11 00:17:34 +01:00
cutoff ?? 1
2021-08-22 15:53:05 +02:00
)
2022-03-17 16:40:53 +01:00
2022-02-16 03:30:23 +01:00
Group.createStackedBarChartPerDay(
"Changesets per minor version number" + appliedFilterDescription,
allFeatures,
f => {
2022-03-17 16:40:53 +01:00
const base = f.properties.editor?.substr("MapComplete ".length)?.replace(/[a-zA-Z-/]/g, '') ?? "UNKNOWN"
const [major, minor, patch] = base.split(".")
return major + "." + minor
2022-02-16 03:30:23 +01:00
},
2022-03-17 16:40:53 +01:00
cutoff ?? 1
2022-02-16 03:30:23 +01:00
)
2021-08-22 15:53:05 +02:00
2021-08-24 12:13:21 +02:00
Group.createStackedBarChartPerDay(
"Deletion-changesets per theme" + appliedFilterDescription,
allFeatures.filter(f => f.properties.delete > 0),
f => f.properties.metadata.theme,
2022-03-11 00:17:34 +01:00
cutoff ?? 1
2021-08-24 12:13:21 +02:00
)
2021-08-22 15:53:05 +02:00
{
// Contributors (unique + unique new) per day
const contributorCountPerDay = new Group<string, string>()
const newContributorsPerDay = new Group<string, string>()
const seenContributors = new Set<string>()
allFeatures.forEach(f => {
const user = f.properties.user
const day = f.properties.date.substr(0, 10)
contributorCountPerDay.bump(day, user)
if (!seenContributors.has(user)) {
seenContributors.add(user)
newContributorsPerDay.bump(day, user)
}
})
const total = new Set(allFeatures.map(f => f.properties.user)).size
2022-03-17 16:40:53 +01:00
await createGraph(
2021-09-04 15:46:18 +02:00
`Contributors per day${appliedFilterDescription}`,
2021-08-22 15:53:05 +02:00
contributorCountPerDay
.asHist(true)
.keyToDate(true)
.asBar({
name: `Unique contributors per day (${total} total)`
2021-08-22 15:53:05 +02:00
}),
newContributorsPerDay
.asHist(true)
.keyToDate(true)
.asBar({
name: "New, unique contributors per day"
}),
)
2022-03-17 16:40:53 +01:00
await createActualChangesGraph(allFeatures, appliedFilterDescription);
2021-08-22 15:53:05 +02:00
}
}
2022-03-17 16:40:53 +01:00
async function createMiscGraphs(allFeatures: ChangeSetData[], emptyCS: ChangeSetData[]) {
await new Histogram(emptyCS.map(f => f.properties.date)).keyToDate().asBar({
name: "Empty changesets by date"
}).render()
const geojson = {
type: "FeatureCollection",
features: Utils.NoNull(allFeatures
.map(f => {
try {
const point = GeoOperations.centerpoint(f.geometry);
point.properties = {...f.properties, ...f.properties.metadata}
delete point.properties.metadata
for (const key in f.properties.metadata) {
point.properties[key] = f.properties.metadata[key]
}
2022-03-17 16:40:53 +01:00
return point
} catch (e) {
console.error("Could not create center point: ", e, f)
return undefined
}
2022-03-17 16:40:53 +01:00
}))
}
writeFileSync("centerpoints.geojson", JSON.stringify(geojson, undefined, 2))
}
2022-03-17 16:40:53 +01:00
async function main(): Promise<void> {
if (!existsSync("graphs")) {
mkdirSync("graphs")
}
2022-03-17 16:40:53 +01:00
2022-07-16 01:01:51 +02:00
const targetDir = "Docs/Tools/stats"
2022-03-17 16:40:53 +01:00
if (process.argv.indexOf("--no-download") < 0) {
2022-07-16 01:01:51 +02:00
await new StatsDownloader(targetDir).DownloadStats()
2022-03-14 02:48:50 +01:00
}
2022-07-16 01:01:51 +02:00
const allPaths = readdirSync(targetDir)
2022-01-16 02:52:46 +01:00
.filter(p => p.startsWith("stats.") && p.endsWith(".json"));
let allFeatures: ChangeSetData[] = [].concat(...allPaths
2022-07-16 01:01:51 +02:00
.map(path => JSON.parse(readFileSync("Docs/Tools/stats/" + path, "utf-8")).features
2022-01-16 02:52:46 +01:00
.map(cs => ChangesetDataTools.cleanChangesetData(cs))));
2022-03-14 02:48:50 +01:00
allFeatures = allFeatures.filter(f => f.properties.editor === null || f.properties.editor.toLowerCase().startsWith("mapcomplete"))
2022-01-16 02:52:46 +01:00
const emptyCS = allFeatures.filter(f => f.properties.metadata.theme === "EMPTY CS")
allFeatures = allFeatures.filter(f => f.properties.metadata.theme !== "EMPTY CS")
2022-03-17 16:40:53 +01:00
const noEditor = allFeatures.filter(f => f.properties.editor === null).map(f => "https://www.osm.org/changeset/" + f.id)
2022-03-14 02:48:50 +01:00
writeFileSync("missing_editor.json", JSON.stringify(noEditor, null, " "));
2022-01-16 02:52:46 +01:00
2022-03-17 16:40:53 +01:00
if (process.argv.indexOf("--no-graphs") >= 0) {
return
2022-03-14 02:48:50 +01:00
}
2022-07-29 23:25:22 +02:00
const allFiles = readdirSync("Docs/Tools/stats").filter(p => p.endsWith(".json"))
writeFileSync("Docs/Tools/stats/file-overview.json", JSON.stringify(allFiles))
/*
await createMiscGraphs(allFeatures, emptyCS)
const grbOnly = allFeatures.filter(f => f.properties.metadata.theme === "grb")
allFeatures = allFeatures.filter(f => f.properties.metadata.theme !== "grb")
await createGraphs(allFeatures, "")
await createGraphs(allFeatures.filter(f => f.properties.date.startsWith("2020")), " in 2020")
await createGraphs(allFeatures.filter(f => f.properties.date.startsWith("2021")), " in 2021")
await createGraphs(allFeatures.filter(f => f.properties.date.startsWith("2022")), " in 2022")
await createGraphs(allFeatures.filter(f => f.properties.metadata.theme === "toerisme_vlaanderen"), " met pin je punt", 0)
await createGraphs(grbOnly, " with the GRB import tool", 0)
*/
2022-01-16 02:52:46 +01:00
}
2021-08-22 15:53:05 +02:00
2022-01-16 02:52:46 +01:00
main().then(_ => console.log("All done!"))
2021-08-22 15:53:05 +02:00