2022-09-08 21:40:48 +02:00
|
|
|
import { Utils } from "../../Utils"
|
2021-10-06 02:30:23 +02:00
|
|
|
|
|
|
|
export default class Wikimedia {
|
|
|
|
/**
|
|
|
|
* Recursively walks a wikimedia commons category in order to search for entries, which can be File: or Category: entries
|
|
|
|
* Returns (a promise of) a list of URLS
|
|
|
|
* @param categoryName The name of the wikimedia category
|
|
|
|
* @param maxLoad: the maximum amount of images to return
|
|
|
|
* @param continueParameter: if the page indicates that more pages should be loaded, this uses a token to continue. Provided by wikimedia
|
|
|
|
*/
|
2022-09-08 21:40:48 +02:00
|
|
|
public static async GetCategoryContents(
|
|
|
|
categoryName: string,
|
|
|
|
maxLoad = 10,
|
|
|
|
continueParameter: string = undefined
|
|
|
|
): Promise<string[]> {
|
2021-10-06 02:30:23 +02:00
|
|
|
if (categoryName === undefined || categoryName === null || categoryName === "") {
|
2022-09-08 21:40:48 +02:00
|
|
|
return []
|
2021-10-06 02:30:23 +02:00
|
|
|
}
|
|
|
|
if (!categoryName.startsWith("Category:")) {
|
2022-09-08 21:40:48 +02:00
|
|
|
categoryName = "Category:" + categoryName
|
2021-10-06 02:30:23 +02:00
|
|
|
}
|
|
|
|
|
2022-09-08 21:40:48 +02:00
|
|
|
let url =
|
|
|
|
"https://commons.wikimedia.org/w/api.php?" +
|
2021-10-06 02:30:23 +02:00
|
|
|
"action=query&list=categorymembers&format=json&" +
|
|
|
|
"&origin=*" +
|
2022-09-08 21:40:48 +02:00
|
|
|
"&cmtitle=" +
|
|
|
|
encodeURIComponent(categoryName)
|
2021-10-06 02:30:23 +02:00
|
|
|
if (continueParameter !== undefined) {
|
2022-09-08 21:40:48 +02:00
|
|
|
url = `${url}&cmcontinue=${continueParameter}`
|
2021-10-06 02:30:23 +02:00
|
|
|
}
|
|
|
|
const response = await Utils.downloadJson(url)
|
2022-09-08 21:40:48 +02:00
|
|
|
const members = response.query?.categorymembers ?? []
|
|
|
|
const imageOverview: string[] = members.map((member) => member.title)
|
2021-10-06 02:30:23 +02:00
|
|
|
|
|
|
|
if (response.continue === undefined) {
|
|
|
|
// We are done crawling through the category - no continuation in sight
|
2022-09-08 21:40:48 +02:00
|
|
|
return imageOverview
|
2021-10-06 02:30:23 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
if (maxLoad - imageOverview.length <= 0) {
|
|
|
|
console.debug(`Recursive wikimedia category load stopped for ${categoryName}`)
|
2022-09-08 21:40:48 +02:00
|
|
|
return imageOverview
|
2021-10-06 02:30:23 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
// We do have a continue token - let's load the next page
|
2022-09-08 21:40:48 +02:00
|
|
|
const recursive = await Wikimedia.GetCategoryContents(
|
|
|
|
categoryName,
|
|
|
|
maxLoad - imageOverview.length,
|
|
|
|
response.continue.cmcontinue
|
|
|
|
)
|
2021-10-06 02:30:23 +02:00
|
|
|
imageOverview.push(...recursive)
|
|
|
|
return imageOverview
|
|
|
|
}
|
2022-09-08 21:40:48 +02:00
|
|
|
}
|