2022-03-14 01:37:50 +01:00
|
|
|
import {existsSync, mkdirSync, readdirSync, readFileSync, writeFileSync} from "fs";
|
2021-08-22 15:53:05 +02:00
|
|
|
import ScriptUtils from "../../scripts/ScriptUtils";
|
|
|
|
import {Utils} from "../../Utils";
|
|
|
|
import {exec} from "child_process"
|
|
|
|
import {GeoOperations} from "../../Logic/GeoOperations";
|
|
|
|
|
2022-02-14 01:15:20 +01:00
|
|
|
ScriptUtils.fixUtils()
|
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
class StatsDownloader {
|
|
|
|
|
|
|
|
private readonly startYear = 2020
|
|
|
|
private readonly startMonth = 5;
|
2022-03-14 01:37:50 +01:00
|
|
|
private readonly urlTemplate = "https://osmcha.org/api/v1/changesets/?date__gte={start_date}&date__lte={end_date}&page={page}&comment=%23mapcomplete&page_size=100"
|
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
private readonly _targetDirectory: string;
|
|
|
|
|
|
|
|
|
|
|
|
constructor(targetDirectory = ".") {
|
|
|
|
this._targetDirectory = targetDirectory;
|
|
|
|
}
|
|
|
|
|
|
|
|
public async DownloadStats() {
|
|
|
|
|
2022-07-16 01:01:51 +02:00
|
|
|
const today = new Date();
|
|
|
|
const currentYear = today.getFullYear()
|
|
|
|
const currentMonth = today.getMonth() + 1
|
2021-08-22 15:53:05 +02:00
|
|
|
for (let year = this.startYear; year <= currentYear; year++) {
|
|
|
|
for (let month = 1; month <= 12; month++) {
|
|
|
|
|
|
|
|
if (year === this.startYear && month < this.startMonth) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (year === currentYear && month > currentMonth) {
|
2022-07-16 01:01:51 +02:00
|
|
|
break
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
|
2022-07-16 01:01:51 +02:00
|
|
|
const pathM = `${this._targetDirectory}/stats.${year}-${month}.json`
|
|
|
|
if (existsSync(pathM)) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (let day = 1; day <= 31; day++) {
|
|
|
|
if (year === currentYear && month === currentMonth && day === today.getDate() ) {
|
|
|
|
break;
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
2022-07-29 23:25:22 +02:00
|
|
|
const path = `${this._targetDirectory}/stats.${year}-${month}-${(day < 10 ? "0" : "") + day}.json`
|
2022-07-16 01:01:51 +02:00
|
|
|
if(existsSync(path)){
|
2022-07-29 23:25:22 +02:00
|
|
|
console.log("Skipping ", path,": already exists")
|
2022-07-16 01:01:51 +02:00
|
|
|
continue
|
|
|
|
}
|
2022-07-29 23:25:22 +02:00
|
|
|
try{
|
|
|
|
|
2022-07-16 01:01:51 +02:00
|
|
|
await this.DownloadStatsForDay(year, month, day, path)
|
2022-07-29 23:25:22 +02:00
|
|
|
}catch(e){
|
|
|
|
console.error(e)
|
|
|
|
console.error("Could not download "+year+"-"+month+"-"+day+"... Trying again")
|
|
|
|
try{
|
|
|
|
await this.DownloadStatsForDay(year, month, day, path)
|
|
|
|
}catch(e){
|
|
|
|
console.error("Could not download "+year+"-"+month+"-"+day+", skipping for now")
|
|
|
|
}
|
|
|
|
}
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2022-07-16 01:01:51 +02:00
|
|
|
public async DownloadStatsForDay(year: number, month: number, day: number, path: string) {
|
2021-08-22 15:53:05 +02:00
|
|
|
|
|
|
|
let page = 1;
|
|
|
|
let allFeatures = []
|
2022-07-16 01:01:51 +02:00
|
|
|
let endDay = new Date(year,month - 1 /* Zero-indexed: 0 = january*/,day + 1);
|
|
|
|
let endDate = `${endDay.getFullYear()}-${Utils.TwoDigits(endDay.getMonth()+1)}-${Utils.TwoDigits(endDay.getDate())}`
|
|
|
|
let url = this.urlTemplate.replace("{start_date}", year + "-" + Utils.TwoDigits(month) + "-" + Utils.TwoDigits(day))
|
2021-08-22 15:53:05 +02:00
|
|
|
.replace("{end_date}", endDate)
|
|
|
|
.replace("{page}", "" + page)
|
|
|
|
|
|
|
|
|
|
|
|
let headers = {
|
|
|
|
'User-Agent': 'Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:86.0) Gecko/20100101 Firefox/86.0',
|
|
|
|
'Accept-Language': 'en-US,en;q=0.5',
|
|
|
|
'Referer': 'https://osmcha.org/?filters=%7B%22date__gte%22%3A%5B%7B%22label%22%3A%222020-07-05%22%2C%22value%22%3A%222020-07-05%22%7D%5D%2C%22editor%22%3A%5B%7B%22label%22%3A%22mapcomplete%22%2C%22value%22%3A%22mapcomplete%22%7D%5D%7D',
|
|
|
|
'Content-Type': 'application/json',
|
|
|
|
'Authorization': 'Token 6e422e2afedb79ef66573982012000281f03dc91',
|
|
|
|
'DNT': '1',
|
|
|
|
'Connection': 'keep-alive',
|
|
|
|
'TE': 'Trailers',
|
|
|
|
'Pragma': 'no-cache',
|
|
|
|
'Cache-Control': 'no-cache'
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
while (url) {
|
2022-07-16 01:01:51 +02:00
|
|
|
ScriptUtils.erasableLog(`Downloading stats for ${year}-${month}-${day}, page ${page} ${url}`)
|
2022-02-14 01:15:20 +01:00
|
|
|
const result = await Utils.downloadJson(url, headers)
|
2021-08-22 15:53:05 +02:00
|
|
|
page++;
|
|
|
|
allFeatures.push(...result.features)
|
|
|
|
if (result.features === undefined) {
|
|
|
|
console.log("ERROR", result)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
url = result.next
|
|
|
|
}
|
2022-01-16 02:52:46 +01:00
|
|
|
console.log(`Writing ${allFeatures.length} features to `, path, Utils.Times(_ => " ", 80))
|
|
|
|
allFeatures = Utils.NoNull(allFeatures)
|
|
|
|
allFeatures.forEach(f => {
|
|
|
|
f.properties.id = f.id
|
|
|
|
})
|
2021-08-22 15:53:05 +02:00
|
|
|
writeFileSync(path, JSON.stringify({
|
|
|
|
features: allFeatures
|
|
|
|
}, undefined, 2))
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
interface ChangeSetData {
|
|
|
|
"id": number,
|
|
|
|
"type": "Feature",
|
|
|
|
"geometry": {
|
|
|
|
"type": "Polygon",
|
|
|
|
"coordinates": [number, number][][]
|
|
|
|
},
|
|
|
|
"properties": {
|
|
|
|
"check_user": null,
|
|
|
|
"reasons": [],
|
|
|
|
"tags": [],
|
|
|
|
"features": [],
|
|
|
|
"user": string,
|
|
|
|
"uid": string,
|
|
|
|
"editor": string,
|
|
|
|
"comment": string,
|
|
|
|
"comments_count": number,
|
|
|
|
"source": string,
|
|
|
|
"imagery_used": string,
|
|
|
|
"date": string,
|
|
|
|
"reviewed_features": [],
|
|
|
|
"create": number,
|
|
|
|
"modify": number,
|
|
|
|
"delete": number,
|
|
|
|
"area": number,
|
|
|
|
"is_suspect": boolean,
|
|
|
|
"harmful": any,
|
|
|
|
"checked": boolean,
|
|
|
|
"check_date": any,
|
|
|
|
"metadata": {
|
|
|
|
"host": string,
|
|
|
|
"theme": string,
|
|
|
|
"imagery": string,
|
|
|
|
"language": string
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
const theme_remappings = {
|
|
|
|
"metamap": "maps",
|
|
|
|
"groen": "buurtnatuur",
|
|
|
|
"updaten van metadata met mapcomplete": "buurtnatuur",
|
|
|
|
"Toevoegen of dit natuurreservaat toegangkelijk is": "buurtnatuur",
|
|
|
|
"wiki:mapcomplete/fritures": "fritures",
|
|
|
|
"wiki:MapComplete/Fritures": "fritures",
|
|
|
|
"lits": "lit",
|
|
|
|
"pomp": "cyclofix",
|
|
|
|
"wiki:user:joost_schouppe/campersite": "campersite",
|
|
|
|
"wiki-user-joost_schouppe-geveltuintjes": "geveltuintjes",
|
|
|
|
"wiki-user-joost_schouppe-campersite": "campersite",
|
|
|
|
"wiki-User-joost_schouppe-campersite": "campersite",
|
|
|
|
"wiki-User-joost_schouppe-geveltuintjes": "geveltuintjes",
|
|
|
|
"wiki:User:joost_schouppe/campersite": "campersite",
|
|
|
|
"arbres": "arbres_llefia",
|
|
|
|
"aed_brugge": "aed",
|
|
|
|
"https://llefia.org/arbres/mapcomplete.json": "arbres_llefia",
|
|
|
|
"https://llefia.org/arbres/mapcomplete1.json": "arbres_llefia",
|
|
|
|
"toevoegen of dit natuurreservaat toegangkelijk is": "buurtnatuur",
|
|
|
|
"testing mapcomplete 0.0.0": "buurtnatuur",
|
|
|
|
"https://raw.githubusercontent.com/osmbe/play/master/mapcomplete/geveltuinen/geveltuinen.json": "geveltuintjes"
|
|
|
|
}
|
|
|
|
|
|
|
|
class ChangesetDataTools {
|
|
|
|
|
|
|
|
public static cleanChangesetData(cs: ChangeSetData): ChangeSetData {
|
|
|
|
if (cs.properties.metadata.theme === undefined) {
|
|
|
|
cs.properties.metadata.theme = cs.properties.comment.substr(cs.properties.comment.lastIndexOf("#") + 1)
|
|
|
|
}
|
|
|
|
cs.properties.metadata.theme = cs.properties.metadata.theme.toLowerCase()
|
|
|
|
const remapped = theme_remappings[cs.properties.metadata.theme]
|
|
|
|
cs.properties.metadata.theme = remapped ?? cs.properties.metadata.theme
|
|
|
|
if (cs.properties.metadata.theme.startsWith("https://raw.githubusercontent.com/")) {
|
|
|
|
cs.properties.metadata.theme = "gh://" + cs.properties.metadata.theme.substr("https://raw.githubusercontent.com/".length)
|
|
|
|
}
|
|
|
|
if (cs.properties.modify + cs.properties.delete + cs.properties.create == 0) {
|
|
|
|
cs.properties.metadata.theme = "EMPTY CS"
|
2022-03-17 16:40:53 +01:00
|
|
|
}
|
|
|
|
try {
|
|
|
|
cs.properties.metadata.host = new URL(cs.properties.metadata.host).host
|
|
|
|
} catch (e) {
|
|
|
|
|
2022-03-29 00:20:10 +02:00
|
|
|
}
|
2022-07-16 01:01:51 +02:00
|
|
|
if (cs.properties.metadata["answer"] > 100) {
|
|
|
|
console.log("Lots of answers for https://osm.org/changeset/" + cs.id)
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
return cs
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
interface PlotSpec {
|
|
|
|
name: string,
|
|
|
|
interpetKeysAs: "date" | "number" | "string" | string
|
|
|
|
plot: {
|
2021-11-23 00:15:10 +01:00
|
|
|
type: "pie" | "bar" | "line"
|
2021-08-22 15:53:05 +02:00
|
|
|
count: { key: string, value: number }[]
|
|
|
|
} | {
|
|
|
|
type: "stacked-bar"
|
|
|
|
count: {
|
|
|
|
label: string,
|
2022-03-17 16:40:53 +01:00
|
|
|
values: { key: string | Date, value: number }[],
|
|
|
|
color?: string
|
2021-08-22 15:53:05 +02:00
|
|
|
}[]
|
|
|
|
},
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
render(): Promise<void>
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
function createGraph(
|
|
|
|
title: string,
|
2022-03-17 16:40:53 +01:00
|
|
|
...options: PlotSpec[]): Promise<void> {
|
|
|
|
console.log("Creating graph", title, "...")
|
2022-07-16 01:01:51 +02:00
|
|
|
const process = exec("python3 Docs/Tools/GenPlot.py \"graphs/" + title + "\"", ((error, stdout, stderr) => {
|
2021-08-22 15:53:05 +02:00
|
|
|
console.log("Python: ", stdout)
|
|
|
|
if (error !== null) {
|
|
|
|
console.error(error)
|
|
|
|
}
|
|
|
|
if (stderr !== "") {
|
|
|
|
console.error(stderr)
|
|
|
|
}
|
|
|
|
}))
|
|
|
|
|
|
|
|
for (const option of options) {
|
2021-11-23 00:15:10 +01:00
|
|
|
const d = JSON.stringify(option) + "\n"
|
|
|
|
process.stdin._write(d, "utf-8", undefined)
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
process.stdin._write("\n", "utf-8", undefined)
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
|
|
|
|
return new Promise((resolve) => {
|
|
|
|
process.on("exit", () => resolve())
|
|
|
|
})
|
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
class Histogram<K> {
|
|
|
|
public counts: Map<K, number> = new Map<K, number>()
|
|
|
|
private sortAtEnd: K[] = []
|
|
|
|
|
|
|
|
constructor(keys?: K[]) {
|
|
|
|
const self = this
|
|
|
|
keys?.forEach(key => self.bump(key))
|
|
|
|
}
|
|
|
|
|
2021-09-09 00:05:51 +02:00
|
|
|
total(): number {
|
|
|
|
let total = 0
|
|
|
|
Array.from(this.counts.values()).forEach(i => total = total + i)
|
|
|
|
return total
|
|
|
|
}
|
2021-08-22 15:53:05 +02:00
|
|
|
|
|
|
|
public bump(key: K, increase = 1) {
|
2021-11-23 00:15:10 +01:00
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
if (this.counts.has(key)) {
|
|
|
|
this.counts.set(key, increase + this.counts.get(key))
|
|
|
|
} else {
|
|
|
|
this.counts.set(key, increase)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Adds all the values of the given histogram to this histogram
|
|
|
|
* @param hist
|
|
|
|
*/
|
|
|
|
public bumpHist(hist: Histogram<K>) {
|
|
|
|
const self = this
|
|
|
|
hist.counts.forEach((value, key) => {
|
|
|
|
self.bump(key, value)
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Creates a new histogram. All entries with less then 'cutoff' count are lumped together into the 'other' category
|
|
|
|
*/
|
|
|
|
public createOthersCategory(otherName: K, cutoff: number | ((key: K, value: number) => boolean) = 15): Histogram<K> {
|
|
|
|
const hist = new Histogram<K>()
|
|
|
|
hist.sortAtEnd.push(otherName)
|
|
|
|
|
|
|
|
if (typeof cutoff === "number") {
|
|
|
|
this.counts.forEach((value, key) => {
|
|
|
|
if (value <= cutoff) {
|
|
|
|
hist.bump(otherName, value)
|
|
|
|
} else {
|
|
|
|
hist.bump(key, value)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
} else {
|
|
|
|
this.counts.forEach((value, key) => {
|
|
|
|
if (cutoff(key, value)) {
|
|
|
|
hist.bump(otherName, value)
|
|
|
|
} else {
|
|
|
|
hist.bump(key, value)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
return hist;
|
|
|
|
}
|
|
|
|
|
|
|
|
public addCountToName(): Histogram<string> {
|
|
|
|
const self = this;
|
|
|
|
const hist = new Histogram<string>()
|
|
|
|
hist.sortAtEnd = this.sortAtEnd.map(name => `${name} (${self.counts.get(name)})`)
|
|
|
|
|
|
|
|
this.counts.forEach((value, key) => {
|
|
|
|
hist.bump(`${key} (${value})`, value)
|
|
|
|
})
|
|
|
|
|
|
|
|
return hist;
|
|
|
|
}
|
|
|
|
|
|
|
|
public Clone(): Histogram<K> {
|
|
|
|
const hist = new Histogram<K>()
|
|
|
|
hist.bumpHist(this)
|
|
|
|
hist.sortAtEnd = [...this.sortAtEnd];
|
|
|
|
return hist;
|
|
|
|
}
|
|
|
|
|
|
|
|
public keyToDate(addMissingDays: boolean = false): Histogram<Date> {
|
|
|
|
const hist = new Histogram<Date>()
|
|
|
|
hist.sortAtEnd = this.sortAtEnd.map(name => new Date("" + name))
|
|
|
|
|
|
|
|
let earliest = undefined;
|
|
|
|
let latest = undefined;
|
|
|
|
this.counts.forEach((value, key) => {
|
|
|
|
const d = new Date("" + key);
|
|
|
|
if (earliest === undefined) {
|
|
|
|
earliest = d
|
|
|
|
} else if (d < earliest) {
|
|
|
|
earliest = d
|
|
|
|
}
|
|
|
|
if (latest === undefined) {
|
|
|
|
latest = d
|
|
|
|
} else if (d > latest) {
|
|
|
|
latest = d
|
|
|
|
}
|
|
|
|
hist.bump(d, value)
|
|
|
|
})
|
|
|
|
|
|
|
|
if (addMissingDays) {
|
|
|
|
while (earliest < latest) {
|
|
|
|
earliest.setDate(earliest.getDate() + 1)
|
|
|
|
hist.bump(earliest, 0)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return hist
|
|
|
|
}
|
|
|
|
|
2021-11-23 00:15:10 +01:00
|
|
|
public asRunningAverages(convertToRange: ((key: K) => K[])) {
|
|
|
|
const newCount = new Histogram<K>()
|
|
|
|
const self = this
|
|
|
|
this.counts.forEach((_, key) => {
|
|
|
|
const keysToCheck = convertToRange(key)
|
|
|
|
let sum = 0
|
|
|
|
for (const k of keysToCheck) {
|
|
|
|
sum += self.counts.get(k) ?? 0
|
|
|
|
}
|
|
|
|
newCount.bump(key, sum / keysToCheck.length)
|
|
|
|
})
|
|
|
|
return newCount
|
|
|
|
}
|
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
/**
|
|
|
|
* Given a histogram:
|
|
|
|
* 'a': 3
|
|
|
|
* 'b': 5
|
|
|
|
* 'c': 3
|
|
|
|
* 'd': 1
|
|
|
|
*
|
|
|
|
* This will create a new histogram, which counts how much every count occurs, thus:
|
|
|
|
* 5: 1 // as only 'b' had 5 counts
|
|
|
|
* 3: 2 // as both 'a' and 'c' had 3 counts
|
|
|
|
* 1: 1 // as only 'd' has 1 count
|
|
|
|
*/
|
|
|
|
public binPerCount(): Histogram<number> {
|
|
|
|
const hist = new Histogram<number>()
|
|
|
|
this.counts.forEach((value) => {
|
|
|
|
hist.bump(value)
|
|
|
|
})
|
|
|
|
return hist;
|
|
|
|
}
|
|
|
|
|
|
|
|
public stringifyName(): Histogram<string> {
|
|
|
|
const hist = new Histogram<string>()
|
|
|
|
this.counts.forEach((value, key) => {
|
|
|
|
hist.bump("" + key, value)
|
|
|
|
})
|
|
|
|
return hist;
|
|
|
|
}
|
|
|
|
|
|
|
|
public asPie(options: {
|
|
|
|
name: string
|
|
|
|
compare?: (a: K, b: K) => number
|
|
|
|
}): PlotSpec {
|
|
|
|
const self = this
|
|
|
|
const entriesArray = Array.from(this.counts.entries())
|
|
|
|
let type: string = (typeof entriesArray[0][0])
|
|
|
|
if (entriesArray[0][0] instanceof Date) {
|
|
|
|
type = "date"
|
|
|
|
}
|
|
|
|
const entries = entriesArray.map(kv => {
|
|
|
|
return ({key: kv[0], value: kv[1]});
|
|
|
|
})
|
|
|
|
|
|
|
|
if (options.compare) {
|
|
|
|
entries.sort((a, b) => options.compare(a.key, b.key))
|
|
|
|
} else {
|
|
|
|
entries.sort((a, b) => b.value - a.value)
|
|
|
|
}
|
|
|
|
entries.sort((a, b) => self.sortAtEnd.indexOf(a.key) - self.sortAtEnd.indexOf(b.key))
|
|
|
|
|
|
|
|
|
|
|
|
const graph: PlotSpec = {
|
|
|
|
name: options.name,
|
|
|
|
interpetKeysAs: type,
|
|
|
|
plot: {
|
|
|
|
|
|
|
|
type: "pie",
|
|
|
|
count: entries.map(kv => {
|
|
|
|
if (kv.key instanceof Date) {
|
|
|
|
return ({key: kv.key.toISOString(), value: kv.value})
|
|
|
|
}
|
|
|
|
return ({key: kv.key + "", value: kv.value});
|
|
|
|
})
|
|
|
|
},
|
|
|
|
render: undefined
|
|
|
|
}
|
2022-03-17 16:40:53 +01:00
|
|
|
graph.render = async () => await createGraph(graph.name, graph)
|
2021-08-22 15:53:05 +02:00
|
|
|
return graph;
|
|
|
|
}
|
|
|
|
|
|
|
|
public asBar(options: {
|
|
|
|
name: string
|
2022-03-17 16:40:53 +01:00
|
|
|
compare?: (a: K, b: K) => number,
|
|
|
|
color?: string
|
2021-08-22 15:53:05 +02:00
|
|
|
}): PlotSpec {
|
|
|
|
const spec = this.asPie(options)
|
|
|
|
spec.plot.type = "bar"
|
2022-03-17 16:40:53 +01:00
|
|
|
spec.plot["color"] = options.color
|
2021-08-22 15:53:05 +02:00
|
|
|
return spec;
|
|
|
|
}
|
|
|
|
|
2021-11-23 00:15:10 +01:00
|
|
|
public asLine(options: {
|
|
|
|
name: string
|
|
|
|
compare?: (a: K, b: K) => number
|
|
|
|
}) {
|
|
|
|
const spec = this.asPie(options)
|
|
|
|
spec.plot.type = "line"
|
|
|
|
return spec
|
|
|
|
}
|
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
/**
|
|
|
|
* A group keeps track of a matrix of changes, e.g.
|
|
|
|
* 'All contributors per day'. This will be stored internally, e.g. as {'2022-03-16' --> ['Pieter Vander Vennet', 'Pieter Vander Vennet', 'Joost Schouppe', 'Pieter Vander Vennet', 'dentonny', ...]}
|
|
|
|
*/
|
2021-08-22 15:53:05 +02:00
|
|
|
class Group<K, V> {
|
|
|
|
|
|
|
|
public groups: Map<K, V[]> = new Map<K, V[]>()
|
|
|
|
|
|
|
|
constructor(features?: any[], fkey?: (feature: any) => K, fvalue?: (feature: any) => V) {
|
|
|
|
const self = this;
|
|
|
|
features?.forEach(f => {
|
|
|
|
self.bump(fkey(f), fvalue(f))
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
public static createStackedBarChartPerDay(name: string, features: any, extractV: (feature: any) => string, minNeededTotal = 1): void {
|
|
|
|
const perDay = new Group<string, string>(
|
|
|
|
features,
|
|
|
|
f => f.properties.date.substr(0, 10),
|
|
|
|
extractV
|
|
|
|
)
|
|
|
|
|
|
|
|
createGraph(
|
|
|
|
name,
|
|
|
|
...Array.from(
|
|
|
|
stackHists<string, string>(
|
|
|
|
perDay.asGroupedHists()
|
|
|
|
.filter(tpl => tpl[1].total() > minNeededTotal)
|
|
|
|
.map(tpl => [`${tpl[0]} (${tpl[1].total()})`, tpl[1]])
|
|
|
|
)
|
|
|
|
)
|
|
|
|
.map(
|
|
|
|
tpl => {
|
|
|
|
const [name, hist] = tpl
|
|
|
|
return hist
|
|
|
|
.keyToDate(true)
|
|
|
|
.asBar({
|
|
|
|
name: name
|
|
|
|
});
|
|
|
|
}
|
|
|
|
)
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
|
|
|
public bump(key: K, value: V) {
|
|
|
|
if (!this.groups.has(key)) {
|
|
|
|
this.groups.set(key, [])
|
|
|
|
}
|
|
|
|
this.groups.get(key).push(value)
|
|
|
|
}
|
|
|
|
|
|
|
|
public asHist(dedup = false): Histogram<K> {
|
|
|
|
const hist = new Histogram<K>()
|
|
|
|
this.groups.forEach((values, key) => {
|
|
|
|
if (dedup) {
|
|
|
|
hist.bump(key, new Set(values).size)
|
|
|
|
} else {
|
|
|
|
hist.bump(key, values.length)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
return hist
|
|
|
|
}
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
/**
|
|
|
|
* Given a group, creates a kind of histogram.
|
|
|
|
* E.g: if the Group is {'2022-03-16' --> ['Pieter Vander Vennet', 'Pieter Vander Vennet', 'Seppe Santens']}, the resulting 'groupedHists' will be:
|
|
|
|
* [['Pieter Vander Vennet', {'2022-03-16' --> 2}],['Seppe Santens', {'2022-03-16' --> 1}]]
|
|
|
|
*/
|
2021-08-22 15:53:05 +02:00
|
|
|
asGroupedHists(): [V, Histogram<K>][] {
|
|
|
|
|
|
|
|
const allHists = new Map<V, Histogram<K>>()
|
|
|
|
|
|
|
|
const allValues = new Set<V>();
|
|
|
|
Array.from(this.groups.values()).forEach(vs =>
|
|
|
|
vs.forEach(v => {
|
|
|
|
allValues.add(v)
|
|
|
|
})
|
|
|
|
)
|
|
|
|
|
|
|
|
allValues.forEach(v => allHists.set(v, new Histogram<K>()))
|
|
|
|
|
|
|
|
this.groups.forEach((values, key) => {
|
|
|
|
values.forEach(v => {
|
|
|
|
allHists.get(v).bump(key)
|
|
|
|
})
|
|
|
|
})
|
|
|
|
|
|
|
|
return Array.from(allHists.entries())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
/**
|
|
|
|
*
|
|
|
|
* @param hists
|
|
|
|
*/
|
2021-08-22 15:53:05 +02:00
|
|
|
function stackHists<K, V>(hists: [V, Histogram<K>][]): [V, Histogram<K>][] {
|
|
|
|
const runningTotals = new Histogram<K>()
|
|
|
|
const result: [V, Histogram<K>][] = []
|
|
|
|
hists.forEach(vhist => {
|
|
|
|
const hist = vhist[1]
|
|
|
|
const clone = hist.Clone()
|
|
|
|
clone.bumpHist(runningTotals)
|
|
|
|
runningTotals.bumpHist(hist)
|
|
|
|
result.push([vhist[0], clone])
|
|
|
|
})
|
2022-02-22 14:13:41 +01:00
|
|
|
result.reverse(/* Changes in place, safe copy*/)
|
2021-08-22 15:53:05 +02:00
|
|
|
return result
|
|
|
|
}
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
/**
|
|
|
|
* Given histograms which should be shown as bars on top of each other, creates a new list of histograms with adjusted heights in order to create a coherent sum
|
|
|
|
* e.g.: for a given day, there are 2 deletions, 3 additions and 5 answers, this will be ordered as 2, 5 and 10 in order to mimic a coherent bar
|
|
|
|
* @param hists
|
|
|
|
*/
|
|
|
|
function stackHistsSimple<K>(hists: Histogram<K>[]): Histogram<K>[] {
|
|
|
|
const runningTotals = new Histogram<K>()
|
|
|
|
const result: Histogram<K>[] = []
|
|
|
|
for (const hist of hists) {
|
|
|
|
const clone = hist.Clone()
|
|
|
|
clone.bumpHist(runningTotals) // "Copies" one histogram into the other
|
|
|
|
runningTotals.bumpHist(hist)
|
|
|
|
result.push(clone)
|
|
|
|
}
|
|
|
|
result.reverse(/* Changes in place, safe copy*/)
|
|
|
|
return result
|
|
|
|
}
|
|
|
|
|
|
|
|
function createActualChangesGraph(allFeatures: ChangeSetData[], appliedFilterDescription: string) {
|
|
|
|
const metadataOptions = {
|
|
|
|
"answer": "#5b5bdc",
|
|
|
|
"create": "#46ea46",
|
|
|
|
"move": "#ffa600",
|
|
|
|
"deletion": "#ff0000",
|
|
|
|
"soft-delete": "#ff8888",
|
|
|
|
"add-image": "#8888ff",
|
|
|
|
"import": "#00ff00",
|
|
|
|
"conflation": "#ffff00",
|
|
|
|
"split": "#000000",
|
|
|
|
"relation-fix": "#cccccc",
|
|
|
|
"delete-image": "#ff00ff"
|
|
|
|
}
|
|
|
|
|
|
|
|
const metadataKeys: string[] = Object.keys(metadataOptions)
|
|
|
|
const histograms: Map<string, Histogram<string>> = new Map<string, Histogram<string>>() // {metakey --> Histogram<date>}
|
|
|
|
allFeatures.forEach(f => {
|
|
|
|
const day = f.properties.date.substr(0, 10)
|
|
|
|
|
|
|
|
for (const key of metadataKeys) {
|
|
|
|
const v = f.properties.metadata[key]
|
|
|
|
if (v === undefined) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
const count = Number(v)
|
|
|
|
if (isNaN(count)) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if (!histograms.has(key)) {
|
|
|
|
histograms.set(key, new Histogram<string>())
|
|
|
|
}
|
|
|
|
histograms.get(key).bump(day, count)
|
|
|
|
}
|
|
|
|
|
|
|
|
})
|
2021-08-22 15:53:05 +02:00
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
|
|
|
|
const entries = stackHists(Array.from(histograms.entries()))
|
|
|
|
|
|
|
|
const allGraphs = entries.map(([name, stackedHist]) => {
|
|
|
|
const hist = histograms.get(name)
|
|
|
|
return stackedHist
|
|
|
|
.keyToDate(true)
|
|
|
|
.asBar({name: `${name} (${hist.total()})`, color: metadataOptions[name]});
|
|
|
|
}
|
|
|
|
)
|
|
|
|
|
|
|
|
createGraph("Actual changes" + appliedFilterDescription, ...allGraphs)
|
|
|
|
}
|
|
|
|
|
|
|
|
async function createGraphs(allFeatures: ChangeSetData[], appliedFilterDescription: string, cutoff = undefined) {
|
2021-08-22 15:53:05 +02:00
|
|
|
const hist = new Histogram<string>(allFeatures.map(f => f.properties.metadata.theme))
|
2022-03-17 16:40:53 +01:00
|
|
|
await hist
|
2022-03-11 00:17:34 +01:00
|
|
|
.createOthersCategory("other", cutoff ?? 20)
|
2021-08-22 15:53:05 +02:00
|
|
|
.addCountToName()
|
2021-11-23 00:15:10 +01:00
|
|
|
.asBar({name: "Changesets per theme (bar)" + appliedFilterDescription})
|
2022-03-17 16:40:53 +01:00
|
|
|
.render()
|
2021-08-22 15:53:05 +02:00
|
|
|
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
await new Histogram<string>(allFeatures.map(f => f.properties.user))
|
2021-08-22 15:53:05 +02:00
|
|
|
.binPerCount()
|
|
|
|
.stringifyName()
|
2022-03-17 16:40:53 +01:00
|
|
|
.createOthersCategory("25 or more", (key, _) => Number(key) >= (cutoff ?? 25)).asBar(
|
|
|
|
{
|
|
|
|
compare: (a, b) => Number(a) - Number(b),
|
|
|
|
name: "Contributors per changeset count" + appliedFilterDescription
|
|
|
|
})
|
|
|
|
.render()
|
2021-11-23 00:15:10 +01:00
|
|
|
|
|
|
|
|
|
|
|
const csPerDay = new Histogram<string>(allFeatures.map(f => f.properties.date.substr(0, 10)))
|
|
|
|
|
|
|
|
const perDayLine = csPerDay
|
|
|
|
.keyToDate()
|
|
|
|
.asLine({
|
|
|
|
compare: (a, b) => a.getTime() - b.getTime(),
|
|
|
|
name: "Changesets per day" + appliedFilterDescription
|
|
|
|
})
|
|
|
|
|
|
|
|
const perDayAvg = csPerDay.asRunningAverages(key => {
|
|
|
|
const keys = []
|
|
|
|
for (let i = 0; i < 7; i++) {
|
|
|
|
const otherDay = new Date(new Date(key).getTime() - i * 1000 * 60 * 60 * 24)
|
|
|
|
keys.push(otherDay.toISOString().substr(0, 10))
|
|
|
|
}
|
|
|
|
return keys
|
|
|
|
})
|
2022-03-17 16:40:53 +01:00
|
|
|
.keyToDate(true)
|
2021-11-23 00:15:10 +01:00
|
|
|
.asLine({
|
2022-03-17 16:40:53 +01:00
|
|
|
compare: (a, b) => a.getTime() - b.getTime(),
|
|
|
|
name: "Rolling 7 day average" + appliedFilterDescription
|
|
|
|
})
|
|
|
|
|
2021-12-13 17:50:47 +01:00
|
|
|
const perDayAvgMonth = csPerDay.asRunningAverages(key => {
|
|
|
|
const keys = []
|
|
|
|
for (let i = 0; i < 31; i++) {
|
|
|
|
const otherDay = new Date(new Date(key).getTime() - i * 1000 * 60 * 60 * 24)
|
|
|
|
keys.push(otherDay.toISOString().substr(0, 10))
|
|
|
|
}
|
|
|
|
return keys
|
|
|
|
})
|
|
|
|
.keyToDate()
|
|
|
|
.asLine({
|
2022-03-17 16:40:53 +01:00
|
|
|
compare: (a, b) => a.getTime() - b.getTime(),
|
|
|
|
name: "Rolling 31 day average" + appliedFilterDescription
|
|
|
|
})
|
|
|
|
|
|
|
|
await createGraph("Changesets per day (line)" + appliedFilterDescription, perDayLine, perDayAvg, perDayAvgMonth)
|
2021-08-22 15:53:05 +02:00
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
|
|
|
|
await new Histogram<string>(allFeatures.map(f => f.properties.metadata.host))
|
2021-08-22 15:53:05 +02:00
|
|
|
.asPie({
|
2021-08-22 22:08:14 +02:00
|
|
|
name: "Changesets per host" + appliedFilterDescription
|
2021-08-22 15:53:05 +02:00
|
|
|
}).render()
|
2021-09-09 00:05:51 +02:00
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
await new Histogram<string>(allFeatures.map(f => f.properties.metadata.theme))
|
2022-03-11 00:17:34 +01:00
|
|
|
.createOthersCategory("< 25 changesets", (cutoff ?? 25))
|
2021-09-08 17:32:31 +02:00
|
|
|
.addCountToName()
|
|
|
|
.asPie({
|
|
|
|
name: "Changesets per theme (pie)" + appliedFilterDescription
|
|
|
|
}).render()
|
2021-08-22 15:53:05 +02:00
|
|
|
|
|
|
|
Group.createStackedBarChartPerDay(
|
|
|
|
"Changesets per theme" + appliedFilterDescription,
|
|
|
|
allFeatures,
|
|
|
|
f => f.properties.metadata.theme,
|
2022-03-11 00:17:34 +01:00
|
|
|
cutoff ?? 25
|
2021-08-22 15:53:05 +02:00
|
|
|
)
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
Group.createStackedBarChartPerDay(
|
|
|
|
"Changesets per version number" + appliedFilterDescription,
|
|
|
|
allFeatures,
|
2022-03-14 01:37:50 +01:00
|
|
|
f => f.properties.editor?.substr("MapComplete ".length, 6)?.replace(/[a-zA-Z-/]/g, '') ?? "UNKNOWN",
|
2022-03-11 00:17:34 +01:00
|
|
|
cutoff ?? 1
|
2021-08-22 15:53:05 +02:00
|
|
|
)
|
2022-03-17 16:40:53 +01:00
|
|
|
|
2022-02-16 03:30:23 +01:00
|
|
|
Group.createStackedBarChartPerDay(
|
|
|
|
"Changesets per minor version number" + appliedFilterDescription,
|
|
|
|
allFeatures,
|
|
|
|
f => {
|
2022-03-17 16:40:53 +01:00
|
|
|
const base = f.properties.editor?.substr("MapComplete ".length)?.replace(/[a-zA-Z-/]/g, '') ?? "UNKNOWN"
|
|
|
|
const [major, minor, patch] = base.split(".")
|
|
|
|
return major + "." + minor
|
|
|
|
|
2022-02-16 03:30:23 +01:00
|
|
|
},
|
2022-03-17 16:40:53 +01:00
|
|
|
cutoff ?? 1
|
2022-02-16 03:30:23 +01:00
|
|
|
)
|
2021-08-22 15:53:05 +02:00
|
|
|
|
2021-08-24 12:13:21 +02:00
|
|
|
Group.createStackedBarChartPerDay(
|
|
|
|
"Deletion-changesets per theme" + appliedFilterDescription,
|
|
|
|
allFeatures.filter(f => f.properties.delete > 0),
|
|
|
|
f => f.properties.metadata.theme,
|
2022-03-11 00:17:34 +01:00
|
|
|
cutoff ?? 1
|
2021-08-24 12:13:21 +02:00
|
|
|
)
|
|
|
|
|
2021-08-22 15:53:05 +02:00
|
|
|
{
|
|
|
|
// Contributors (unique + unique new) per day
|
|
|
|
const contributorCountPerDay = new Group<string, string>()
|
|
|
|
const newContributorsPerDay = new Group<string, string>()
|
|
|
|
const seenContributors = new Set<string>()
|
|
|
|
allFeatures.forEach(f => {
|
|
|
|
const user = f.properties.user
|
|
|
|
const day = f.properties.date.substr(0, 10)
|
|
|
|
contributorCountPerDay.bump(day, user)
|
|
|
|
if (!seenContributors.has(user)) {
|
|
|
|
seenContributors.add(user)
|
|
|
|
newContributorsPerDay.bump(day, user)
|
|
|
|
}
|
|
|
|
})
|
|
|
|
const total = new Set(allFeatures.map(f => f.properties.user)).size
|
2022-03-17 16:40:53 +01:00
|
|
|
await createGraph(
|
2021-09-04 15:46:18 +02:00
|
|
|
`Contributors per day${appliedFilterDescription}`,
|
2021-08-22 15:53:05 +02:00
|
|
|
contributorCountPerDay
|
|
|
|
.asHist(true)
|
|
|
|
.keyToDate(true)
|
|
|
|
.asBar({
|
2021-08-26 11:48:25 +02:00
|
|
|
name: `Unique contributors per day (${total} total)`
|
2021-08-22 15:53:05 +02:00
|
|
|
}),
|
|
|
|
newContributorsPerDay
|
|
|
|
.asHist(true)
|
|
|
|
.keyToDate(true)
|
|
|
|
.asBar({
|
|
|
|
name: "New, unique contributors per day"
|
|
|
|
}),
|
|
|
|
)
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
await createActualChangesGraph(allFeatures, appliedFilterDescription);
|
2021-08-22 15:53:05 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
async function createMiscGraphs(allFeatures: ChangeSetData[], emptyCS: ChangeSetData[]) {
|
|
|
|
await new Histogram(emptyCS.map(f => f.properties.date)).keyToDate().asBar({
|
2021-11-23 00:15:10 +01:00
|
|
|
name: "Empty changesets by date"
|
|
|
|
}).render()
|
|
|
|
const geojson = {
|
|
|
|
type: "FeatureCollection",
|
2022-01-16 01:58:02 +01:00
|
|
|
features: Utils.NoNull(allFeatures
|
|
|
|
.map(f => {
|
|
|
|
try {
|
|
|
|
const point = GeoOperations.centerpoint(f.geometry);
|
|
|
|
point.properties = {...f.properties, ...f.properties.metadata}
|
|
|
|
delete point.properties.metadata
|
|
|
|
for (const key in f.properties.metadata) {
|
|
|
|
point.properties[key] = f.properties.metadata[key]
|
|
|
|
}
|
2022-03-17 16:40:53 +01:00
|
|
|
|
2022-01-16 01:58:02 +01:00
|
|
|
return point
|
|
|
|
} catch (e) {
|
|
|
|
console.error("Could not create center point: ", e, f)
|
|
|
|
return undefined
|
|
|
|
}
|
2022-03-17 16:40:53 +01:00
|
|
|
}))
|
2021-11-23 00:15:10 +01:00
|
|
|
}
|
|
|
|
writeFileSync("centerpoints.geojson", JSON.stringify(geojson, undefined, 2))
|
|
|
|
}
|
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
async function main(): Promise<void> {
|
|
|
|
if (!existsSync("graphs")) {
|
2022-03-14 01:37:50 +01:00
|
|
|
mkdirSync("graphs")
|
|
|
|
}
|
2022-03-17 16:40:53 +01:00
|
|
|
|
2022-07-16 01:01:51 +02:00
|
|
|
const targetDir = "Docs/Tools/stats"
|
2022-03-17 16:40:53 +01:00
|
|
|
if (process.argv.indexOf("--no-download") < 0) {
|
2022-07-16 01:01:51 +02:00
|
|
|
await new StatsDownloader(targetDir).DownloadStats()
|
2022-03-14 02:48:50 +01:00
|
|
|
}
|
2022-07-16 01:01:51 +02:00
|
|
|
const allPaths = readdirSync(targetDir)
|
2022-01-16 02:52:46 +01:00
|
|
|
.filter(p => p.startsWith("stats.") && p.endsWith(".json"));
|
|
|
|
let allFeatures: ChangeSetData[] = [].concat(...allPaths
|
2022-07-16 01:01:51 +02:00
|
|
|
.map(path => JSON.parse(readFileSync("Docs/Tools/stats/" + path, "utf-8")).features
|
2022-01-16 02:52:46 +01:00
|
|
|
.map(cs => ChangesetDataTools.cleanChangesetData(cs))));
|
2022-03-14 02:48:50 +01:00
|
|
|
allFeatures = allFeatures.filter(f => f.properties.editor === null || f.properties.editor.toLowerCase().startsWith("mapcomplete"))
|
2022-01-16 02:52:46 +01:00
|
|
|
|
|
|
|
const emptyCS = allFeatures.filter(f => f.properties.metadata.theme === "EMPTY CS")
|
|
|
|
allFeatures = allFeatures.filter(f => f.properties.metadata.theme !== "EMPTY CS")
|
2022-03-17 16:40:53 +01:00
|
|
|
|
|
|
|
const noEditor = allFeatures.filter(f => f.properties.editor === null).map(f => "https://www.osm.org/changeset/" + f.id)
|
2022-03-14 02:48:50 +01:00
|
|
|
writeFileSync("missing_editor.json", JSON.stringify(noEditor, null, " "));
|
2022-01-16 02:52:46 +01:00
|
|
|
|
2022-03-17 16:40:53 +01:00
|
|
|
if (process.argv.indexOf("--no-graphs") >= 0) {
|
|
|
|
return
|
2022-03-14 02:48:50 +01:00
|
|
|
}
|
2022-07-29 23:25:22 +02:00
|
|
|
const allFiles = readdirSync("Docs/Tools/stats").filter(p => p.endsWith(".json"))
|
|
|
|
writeFileSync("Docs/Tools/stats/file-overview.json", JSON.stringify(allFiles))
|
|
|
|
|
|
|
|
/*
|
|
|
|
await createMiscGraphs(allFeatures, emptyCS)
|
|
|
|
|
|
|
|
const grbOnly = allFeatures.filter(f => f.properties.metadata.theme === "grb")
|
|
|
|
allFeatures = allFeatures.filter(f => f.properties.metadata.theme !== "grb")
|
|
|
|
await createGraphs(allFeatures, "")
|
|
|
|
await createGraphs(allFeatures.filter(f => f.properties.date.startsWith("2020")), " in 2020")
|
|
|
|
await createGraphs(allFeatures.filter(f => f.properties.date.startsWith("2021")), " in 2021")
|
|
|
|
await createGraphs(allFeatures.filter(f => f.properties.date.startsWith("2022")), " in 2022")
|
|
|
|
await createGraphs(allFeatures.filter(f => f.properties.metadata.theme === "toerisme_vlaanderen"), " met pin je punt", 0)
|
|
|
|
await createGraphs(grbOnly, " with the GRB import tool", 0)
|
|
|
|
*/
|
2022-01-16 02:52:46 +01:00
|
|
|
}
|
2021-08-22 15:53:05 +02:00
|
|
|
|
2022-01-16 02:52:46 +01:00
|
|
|
main().then(_ => console.log("All done!"))
|
2021-08-22 15:53:05 +02:00
|
|
|
|