| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  | import Script from "./Script" | 
					
						
							|  |  |  | import NameSuggestionIndex, { NSIItem } from "../src/Logic/Web/NameSuggestionIndex" | 
					
						
							|  |  |  | import * as nsiWD from "../node_modules/name-suggestion-index/dist/wikidata.min.json" | 
					
						
							| 
									
										
										
										
											2024-07-29 03:16:35 +02:00
										 |  |  | import { existsSync, readFileSync, unlinkSync, writeFileSync } from "fs" | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  | import ScriptUtils from "./ScriptUtils" | 
					
						
							|  |  |  | import { Utils } from "../src/Utils" | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-05-23 11:28:51 +02:00
										 |  |  | class DownloadNsiLogos extends Script { | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |     constructor() { | 
					
						
							|  |  |  |         super("Downloads all images of the NSI") | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     private async downloadLogo(nsiItem: NSIItem, type: string, basePath: string) { | 
					
						
							|  |  |  |         try { | 
					
						
							|  |  |  |             return await this.downloadLogoUnsafe(nsiItem, type, basePath) | 
					
						
							|  |  |  |         } catch (e) { | 
					
						
							|  |  |  |             console.error("Could not download", nsiItem.displayName, "due to", e) | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |             return "error" | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     private async downloadLogoUnsafe(nsiItem: NSIItem, type: string, basePath: string) { | 
					
						
							|  |  |  |         if (nsiItem === undefined) { | 
					
						
							|  |  |  |             return false | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         let path = basePath + nsiItem.id | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         const logos = nsiWD["wikidata"][nsiItem?.tags?.[type + ":wikidata"]]?.logos | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if (NameSuggestionIndex.isSvg(nsiItem, type)) { | 
					
						
							|  |  |  |             path = path + ".svg" | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if (existsSync(path)) { | 
					
						
							|  |  |  |             return false | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         if (!logos) { | 
					
						
							|  |  |  |             return false | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         if (logos.facebook) { | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |             // Facebook's logos are generally better and square
 | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |             await ScriptUtils.DownloadFileTo(logos.facebook, path) | 
					
						
							| 
									
										
										
										
											2024-07-29 03:16:35 +02:00
										 |  |  |             // Validate
 | 
					
						
							|  |  |  |             const content = readFileSync(path, "utf8") | 
					
						
							| 
									
										
										
										
											2024-08-09 16:55:08 +02:00
										 |  |  |             if (content.startsWith('{"error"')) { | 
					
						
							| 
									
										
										
										
											2024-07-29 03:16:35 +02:00
										 |  |  |                 unlinkSync(path) | 
					
						
							| 
									
										
										
										
											2024-08-09 16:55:08 +02:00
										 |  |  |                 console.error("Attempted to fetch", logos.facebook, " but this gave an error") | 
					
						
							|  |  |  |             } else { | 
					
						
							| 
									
										
										
										
											2024-07-29 03:16:35 +02:00
										 |  |  |                 return true | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |         } | 
					
						
							|  |  |  |         if (logos.wikidata) { | 
					
						
							|  |  |  |             let url: string = logos.wikidata | 
					
						
							|  |  |  |             console.log("Downloading", url) | 
					
						
							|  |  |  |             let ttl = 10 | 
					
						
							|  |  |  |             do { | 
					
						
							|  |  |  |                 ttl-- | 
					
						
							|  |  |  |                 const dloaded = await Utils.downloadAdvanced(url, { | 
					
						
							| 
									
										
										
										
											2024-06-16 16:06:26 +02:00
										 |  |  |                     "User-Agent": | 
					
						
							|  |  |  |                         "MapComplete NSI scraper/0.1 (https://github.com/pietervdvn/MapComplete; pietervdvn@posteo.net)", | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |                 }) | 
					
						
							|  |  |  |                 const redirect: string | undefined = dloaded["redirect"] | 
					
						
							|  |  |  |                 if (redirect) { | 
					
						
							|  |  |  |                     console.log("Got a redirect from", url, "to", redirect) | 
					
						
							|  |  |  |                     url = redirect | 
					
						
							|  |  |  |                     continue | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |                 if ((<string>logos.wikidata).toLowerCase().endsWith(".svg")) { | 
					
						
							|  |  |  |                     console.log("Written SVG", path) | 
					
						
							| 
									
										
										
										
											2024-05-23 11:28:51 +02:00
										 |  |  |                     if (!path.endsWith(".svg")) { | 
					
						
							|  |  |  |                         throw "Undetected svg path:" + logos.wikidata | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |                     } | 
					
						
							|  |  |  |                     writeFileSync(path, dloaded["content"], "utf8") | 
					
						
							|  |  |  |                     return true | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |                 console.log("Got data from", url, "-->", path) | 
					
						
							|  |  |  |                 await ScriptUtils.DownloadFileTo(url, path) | 
					
						
							|  |  |  |                 return true | 
					
						
							|  |  |  |             } while (ttl > 0) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             return false | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         return false | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2024-05-23 11:28:51 +02:00
										 |  |  |     async main(): Promise<void> { | 
					
						
							|  |  |  |         await this.downloadFor("operator") | 
					
						
							|  |  |  |         await this.downloadFor("brand") | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     async downloadFor(type: "brand" | "operator"): Promise<void> { | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |         const items = NameSuggestionIndex.allPossible(type) | 
					
						
							|  |  |  |         const basePath = "./public/assets/data/nsi/logos/" | 
					
						
							|  |  |  |         let downloadCount = 0 | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |         const stepcount = 5 | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |         for (let i = 0; i < items.length; i += stepcount) { | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |             if (downloadCount > 0 || i % 200 === 0) { | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |                 console.log(i + "/" + items.length, "downloaded " + downloadCount) | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |             const results = await Promise.all( | 
					
						
							| 
									
										
										
										
											2024-06-16 16:06:26 +02:00
										 |  |  |                 Utils.TimesT(stepcount, (j) => j).map(async (j) => { | 
					
						
							|  |  |  |                     const downloaded = await this.downloadLogo(items[i + j], type, basePath) | 
					
						
							|  |  |  |                     if (downloaded) { | 
					
						
							|  |  |  |                         downloadCount++ | 
					
						
							|  |  |  |                     } | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |                     return downloaded | 
					
						
							| 
									
										
										
										
											2024-06-16 16:06:26 +02:00
										 |  |  |                 }) | 
					
						
							|  |  |  |             ) | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |             for (let j = 0; j < results.length; j++) { | 
					
						
							|  |  |  |                 let didDownload = results[j] | 
					
						
							| 
									
										
										
										
											2024-07-09 13:42:08 +02:00
										 |  |  |                 if (didDownload !== "error") { | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |                     continue | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |                 console.log("Retrying", items[i + j].id, type) | 
					
						
							|  |  |  |                 didDownload = await this.downloadLogo(items[i + j], type, basePath) | 
					
						
							| 
									
										
										
										
											2024-07-09 13:42:08 +02:00
										 |  |  |                 if (didDownload === "error") { | 
					
						
							| 
									
										
										
										
											2024-07-08 23:13:57 +02:00
										 |  |  |                     console.log("Failed again:", items[i + j].id) | 
					
						
							|  |  |  |                 } | 
					
						
							|  |  |  |             } | 
					
						
							| 
									
										
										
										
											2024-05-16 00:12:50 +02:00
										 |  |  |         } | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							// Script entry point: instantiate the downloader and invoke run().
							// NOTE(review): run() is not defined in this file; presumably inherited from Script and expected to call main() - confirm.
							|  |  |  | new DownloadNsiLogos().run() |