MapComplete/src/Logic/ImageProviders/WikimediaImageProvider.ts

188 lines
6.6 KiB
TypeScript
Raw Normal View History

2022-09-08 21:40:48 +02:00
import ImageProvider, { ProvidedImage } from "./ImageProvider"
import BaseUIElement from "../../UI/BaseUIElement"
import { Utils } from "../../Utils"
import { LicenseInfo } from "./LicenseInfo"
import Wikimedia from "../Web/Wikimedia"
import SvelteUIElement from "../../UI/Base/SvelteUIElement"
import Wikimedia_commons_white from "../../assets/svg/Wikimedia_commons_white.svelte"
/**
* This module provides endpoints for wikimedia and others
*/
export class WikimediaImageProvider extends ImageProvider {
2022-09-08 21:40:48 +02:00
public static readonly singleton = new WikimediaImageProvider()
2023-09-27 22:21:35 +02:00
public static readonly apiUrls = [
2022-09-08 21:40:48 +02:00
"https://commons.wikimedia.org/wiki/",
2024-04-13 02:40:21 +02:00
"https://upload.wikimedia.org",
2022-09-08 21:40:48 +02:00
]
2023-09-27 22:21:35 +02:00
public static readonly commonsPrefixes = [...WikimediaImageProvider.apiUrls, "File:"]
2021-11-07 16:34:51 +01:00
private readonly commons_key = "wikimedia_commons"
public readonly defaultKeyPrefixes = [this.commons_key, "image"]
public readonly name = "Wikimedia"
private constructor() {
2022-09-08 21:40:48 +02:00
super()
}
private static ExtractFileName(url: string) {
if (!url.startsWith("http")) {
2022-09-08 21:40:48 +02:00
return url
}
const path = new URL(url).pathname
2022-09-08 21:40:48 +02:00
return path.substring(path.lastIndexOf("/") + 1)
}
private static PrepareUrl(value: string, useHd = false): string {
2021-11-07 16:34:51 +01:00
if (value.toLowerCase().startsWith("https://commons.wikimedia.org/wiki/")) {
2022-09-08 21:40:48 +02:00
return value
2021-11-07 16:34:51 +01:00
}
const baseUrl = `https://commons.wikimedia.org/wiki/Special:FilePath/${encodeURIComponent(
2022-09-08 21:40:48 +02:00
value
)}`
if (useHd) {
return baseUrl
}
return baseUrl + `?width=500&height=400`
2021-11-07 16:34:51 +01:00
}
private static startsWithCommonsPrefix(value: string): boolean {
2022-09-08 21:40:48 +02:00
return WikimediaImageProvider.commonsPrefixes.some((prefix) => value.startsWith(prefix))
2021-11-07 16:34:51 +01:00
}
private static removeCommonsPrefix(value: string): string {
if (value.startsWith("https://upload.wikimedia.org/")) {
value = value.substring(value.lastIndexOf("/") + 1)
value = decodeURIComponent(value)
if (!value.startsWith("File:")) {
value = "File:" + value
}
2022-09-08 21:40:48 +02:00
return value
2021-11-07 16:34:51 +01:00
}
for (const prefix of WikimediaImageProvider.commonsPrefixes) {
if (value.startsWith(prefix)) {
let part = value.substr(prefix.length)
if (prefix.startsWith("http")) {
part = decodeURIComponent(part)
}
return part
}
}
2022-09-08 21:40:48 +02:00
return value
2021-11-07 16:34:51 +01:00
}
2023-09-27 22:21:35 +02:00
apiUrls(): string[] {
return WikimediaImageProvider.apiUrls
}
2023-12-02 03:12:34 +01:00
SourceIcon(): BaseUIElement {
return new SvelteUIElement(Wikimedia_commons_white).SetStyle("width:2em;height: 2em")
}
public PrepUrl(value: NonNullable<string>): ProvidedImage
public PrepUrl(value: undefined): undefined
public PrepUrl(value: string): ProvidedImage
public PrepUrl(value: string | undefined): ProvidedImage | undefined{
if(value === undefined){
return undefined
}
2021-11-07 16:34:51 +01:00
value = WikimediaImageProvider.removeCommonsPrefix(value)
2021-11-07 16:34:51 +01:00
if (value.startsWith("File:")) {
return this.UrlForImage(value)
}
2021-11-07 16:34:51 +01:00
// We do a last effort and assume this is a file
return this.UrlForImage("File:" + value)
}
public async ExtractUrls(key: string, value: string): Promise<Promise<ProvidedImage>[]> {
const hasCommonsPrefix = WikimediaImageProvider.startsWithCommonsPrefix(value)
if (key !== undefined && key !== this.commons_key && !hasCommonsPrefix) {
return []
}
value = WikimediaImageProvider.removeCommonsPrefix(value)
if (value.startsWith("Category:")) {
const urls = await Wikimedia.GetCategoryContents(value)
2022-09-08 21:40:48 +02:00
return urls
.filter((url) => url.startsWith("File:"))
.map((image) => Promise.resolve(this.UrlForImage(image)))
2021-11-07 16:34:51 +01:00
}
if (value.startsWith("File:")) {
return [Promise.resolve(this.UrlForImage(value))]
}
if (value.startsWith("http")) {
// PRobably an error
return []
}
// We do a last effort and assume this is a file
return [Promise.resolve(this.UrlForImage("File:" + value))]
}
2024-07-19 11:57:53 +02:00
public async DownloadAttribution(img: {url: string}): Promise<LicenseInfo> {
2024-04-01 02:00:48 +02:00
const filename = WikimediaImageProvider.ExtractFileName(img.url)
if (filename === "") {
2022-09-08 21:40:48 +02:00
return undefined
}
2022-09-08 21:40:48 +02:00
const url =
"https://en.wikipedia.org/w/" +
"api.php?action=query&prop=imageinfo&iiprop=extmetadata&" +
2022-09-08 21:40:48 +02:00
"titles=" +
filename +
"&format=json&origin=*"
const data = await Utils.downloadJsonCached<{query: {pages: {title: string, imageinfo: { extmetadata} []}[]}}>(url, 365 * 24 * 60 * 60)
2022-09-08 21:40:48 +02:00
const licenseInfo = new LicenseInfo()
const pageInfo = data.query.pages.at(-1)
2021-11-07 16:34:51 +01:00
if (pageInfo === undefined) {
2022-09-08 21:40:48 +02:00
return undefined
}
2022-09-08 21:40:48 +02:00
const license = (pageInfo.imageinfo ?? [])[0]?.extmetadata
if (license === undefined) {
2022-09-08 21:40:48 +02:00
console.warn(
"The file",
filename,
"has no usable metedata or license attached... Please fix the license info file yourself!"
)
return undefined
}
let title = pageInfo.title
2021-11-07 16:34:51 +01:00
if (title.startsWith("File:")) {
title = title.substr("File:".length)
}
2021-11-07 16:34:51 +01:00
if (title.endsWith(".jpg") || title.endsWith(".png")) {
title = title.substring(0, title.length - 4)
}
2021-11-07 16:34:51 +01:00
licenseInfo.title = title
2022-09-08 21:40:48 +02:00
licenseInfo.artist = license.Artist?.value
licenseInfo.license = license.License?.value
licenseInfo.copyrighted = license.Copyrighted?.value
licenseInfo.attributionRequired = license.AttributionRequired?.value
licenseInfo.usageTerms = license.UsageTerms?.value
licenseInfo.licenseShortName = license.LicenseShortName?.value
licenseInfo.credit = license.Credit?.value
licenseInfo.description = license.ImageDescription?.value
licenseInfo.informationLocation = new URL("https://en.wikipedia.org/wiki/" + pageInfo.title)
return licenseInfo
}
2021-10-08 04:33:39 +02:00
private UrlForImage(image: string): ProvidedImage {
if (!image.startsWith("File:")) {
image = "File:" + image
}
2023-12-19 22:08:00 +01:00
return {
url: WikimediaImageProvider.PrepareUrl(image),
url_hd: WikimediaImageProvider.PrepareUrl(image, true),
2023-12-19 22:08:00 +01:00
key: undefined,
provider: this,
2024-04-13 02:40:21 +02:00
id: image,
2023-12-19 22:08:00 +01:00
}
}
}