2024-05-16 00:12:50 +02:00
|
|
|
import Script from "./Script"
|
|
|
|
import NameSuggestionIndex, { NSIItem } from "../src/Logic/Web/NameSuggestionIndex"
|
|
|
|
import * as nsiWD from "../node_modules/name-suggestion-index/dist/wikidata.min.json"
|
2024-07-29 03:16:35 +02:00
|
|
|
import { existsSync, readFileSync, unlinkSync, writeFileSync } from "fs"
|
2024-05-16 00:12:50 +02:00
|
|
|
import ScriptUtils from "./ScriptUtils"
|
|
|
|
import { Utils } from "../src/Utils"
|
|
|
|
|
2024-05-23 11:28:51 +02:00
|
|
|
/**
 * Script which downloads the logos of the items of the Name Suggestion Index (NSI)
 * to the local logo directory, for both the 'operator' and the 'brand' entries.
 *
 * Logos which already exist on disk are skipped, so the script can be re-run
 * to pick up only the missing files.
 */
class DownloadNsiLogos extends Script {
    /** Maximum number of requests (including followed redirects) for a single wikidata logo */
    private static readonly maxAttempts = 10

    constructor() {
        super("Downloads all images of the NSI")
    }

    /**
     * Error-tolerant wrapper around `downloadLogoUnsafe`.
     *
     * @param nsiItem the NSI item to fetch the logo for
     * @param type the tag prefix ('brand' or 'operator') used to look up the wikidata entry
     * @param basePath directory prefix (including trailing slash) the logo is written into
     * @returns `true` if a logo was written, `false` if nothing had to be (or could be) downloaded,
     *          or the string `"error"` if the download threw
     */
    private async downloadLogo(
        nsiItem: NSIItem,
        type: string,
        basePath: string
    ): Promise<boolean | "error"> {
        try {
            return await this.downloadLogoUnsafe(nsiItem, type, basePath)
        } catch (e) {
            console.error("Could not download", nsiItem?.displayName, "due to", e)
            return "error"
        }
    }

    /**
     * Downloads the logo of a single NSI item; exceptions are not caught here.
     *
     * The facebook logo is tried first; if it is absent or the response is an error document,
     * the wikidata logo is used instead.
     *
     * @param nsiItem the NSI item to fetch the logo for; `undefined` is tolerated and yields `false`
     * @param type the tag prefix ('brand' or 'operator') used to look up the wikidata entry
     * @param basePath directory prefix (including trailing slash) the logo is written into
     * @returns `true` if a logo was written to disk, `false` otherwise
     * @throws Error if the wikidata logo is an SVG but the target path has no `.svg` extension
     */
    private async downloadLogoUnsafe(
        nsiItem: NSIItem,
        type: string,
        basePath: string
    ): Promise<boolean> {
        if (nsiItem === undefined) {
            // Happens when the caller indexes past the end of the item list
            return false
        }

        let path = basePath + nsiItem.id
        const logos = nsiWD["wikidata"][nsiItem?.tags?.[type + ":wikidata"]]?.logos

        if (NameSuggestionIndex.isSvg(nsiItem, type)) {
            path = path + ".svg"
        }

        if (existsSync(path)) {
            // Already downloaded by an earlier run
            return false
        }

        if (!logos) {
            return false
        }

        if (logos.facebook) {
            // Facebook's logos are generally better and square
            await ScriptUtils.DownloadFileTo(logos.facebook, path)
            // Validate: a failed request leaves a JSON error document instead of an image
            const content = readFileSync(path, "utf8")
            if (content.startsWith('{"error"')) {
                unlinkSync(path)
                console.error("Attempted to fetch", logos.facebook, " but this gave an error")
                // Fall through to the wikidata logo, if any
            } else {
                return true
            }
        }

        if (logos.wikidata) {
            let url: string = logos.wikidata
            console.log("Downloading", url)

            for (let attempt = 0; attempt < DownloadNsiLogos.maxAttempts; attempt++) {
                const dloaded = await Utils.downloadAdvanced(url, {
                    "User-Agent":
                        "MapComplete NSI scraper/0.1 (https://github.com/pietervdvn/MapComplete; pietervdvn@posteo.net)",
                })
                const redirect: string | undefined = dloaded["redirect"]
                if (redirect) {
                    console.log("Got a redirect from", url, "to", redirect)
                    url = redirect
                    continue
                }

                if ((<string>logos.wikidata).toLowerCase().endsWith(".svg")) {
                    if (!path.endsWith(".svg")) {
                        // Throw a real Error (not a string) so that the stack trace is kept
                        throw new Error("Undetected svg path:" + logos.wikidata)
                    }
                    writeFileSync(path, dloaded["content"], "utf8")
                    console.log("Written SVG", path)
                    return true
                }

                console.log("Got data from", url, "-->", path)
                await ScriptUtils.DownloadFileTo(url, path)
                return true
            }

            // Too many redirects
            return false
        }

        return false
    }

    /**
     * Entry point of the script: downloads the operator logos, then the brand logos.
     */
    async main(): Promise<void> {
        await this.downloadFor("operator")
        await this.downloadFor("brand")
    }

    /**
     * Downloads the logos for all NSI items of the given type, in small parallel batches.
     * Items whose download threw are retried once, sequentially.
     *
     * @param type which NSI category to download the logos for
     */
    async downloadFor(type: "brand" | "operator"): Promise<void> {
        const items = NameSuggestionIndex.allPossible(type)
        const basePath = "./public/assets/data/nsi/logos/"
        let downloadCount = 0
        const stepcount = 5

        for (let i = 0; i < items.length; i += stepcount) {
            if (downloadCount > 0 || i % 200 === 0) {
                console.log(i + "/" + items.length, "downloaded " + downloadCount)
            }

            // The last batch may index past the end of `items`;
            // `downloadLogoUnsafe` returns `false` for those undefined entries
            const results = await Promise.all(
                Utils.TimesT(stepcount, (j) => j).map((j) =>
                    this.downloadLogo(items[i + j], type, basePath)
                )
            )

            for (let j = 0; j < results.length; j++) {
                let didDownload = results[j]
                if (didDownload === true) {
                    // Only genuine downloads are counted: "error" is truthy but not a success
                    downloadCount++
                }
                if (didDownload !== "error") {
                    continue
                }
                console.log("Retrying", items[i + j].id, type)
                didDownload = await this.downloadLogo(items[i + j], type, basePath)
                if (didDownload === "error") {
                    console.log("Failed again:", items[i + j].id)
                } else if (didDownload === true) {
                    downloadCount++
                }
            }
        }
    }
}
|
|
|
|
|
|
|
|
// Script entry point: instantiate the downloader and start it via `run()`, which is inherited from Script
const nsiLogoDownloader = new DownloadNsiLogos()
nsiLogoDownloader.run()
|