Files
drop/server/internal/metadata/pcgamingwiki.ts
2025-06-09 13:52:42 +10:00

503 lines
14 KiB
TypeScript

import type { Company } from "~/prisma/client";
import { MetadataSource } from "~/prisma/client";
import type { MetadataProvider } from ".";
import type {
GameMetadataSearchResult,
_FetchGameMetadataParams,
GameMetadata,
_FetchCompanyMetadataParams,
CompanyMetadata,
GameMetadataRating,
} from "./types";
import type { AxiosRequestConfig } from "axios";
import axios from "axios";
import * as jdenticon from "jdenticon";
import { DateTime } from "luxon";
import * as cheerio from "cheerio";
import { type } from "arktype";
import type { TaskRunContext } from "../tasks";
interface PCGamingWikiParseRawPage {
parse: {
title: string;
pageid: number;
revid: number;
displaytitle: string;
// array of links
externallinks: string[];
// array of wiki file names
images: string[];
text: {
// rendered page contents
"*": string;
};
};
}
interface PCGamingWikiPage {
PageID: string;
PageName: string;
}
interface PCGamingWikiSearchStub extends PCGamingWikiPage {
"Cover URL": string | null;
Released: string | null;
Released__precision: string | null;
}
interface PCGamingWikiGame extends PCGamingWikiSearchStub {
Developers: string | string[] | null;
Publishers: string | string[] | null;
// TODO: save this somewhere, maybe a tag?
Series: string | null;
// tags
Perspectives: string | string[] | null; // ie: First-person
Genres: string | string[] | null; // ie: Action, FPS
"Art styles": string | string[] | null; // ie: Stylized
Themes: string | string[] | null; // ie: Post-apocalyptic, Sci-fi, Space
Modes: string | string[] | null; // ie: Singleplayer, Multiplayer
Pacing: string | string[] | null; // ie: Real-time
}
interface PCGamingWikiCompany extends PCGamingWikiPage {
Parent: string | null;
Founded: string | null;
Website: string | null;
Founded__precision: string | null;
Defunct__precision: string | null;
}
interface PCGamingWikiCargoResult<T> {
cargoquery: [
{
title: T;
},
];
error?: {
code?: string;
info?: string;
errorclass?: string;
"*"?: string;
};
}
type StringArrayKeys<T> = {
[K in keyof T]: T[K] extends string | string[] | null ? K : never;
}[keyof T];
const ratingProviderReview = type({
rating: "string.integer.parse",
});
// Api Docs: https://www.pcgamingwiki.com/wiki/PCGamingWiki:API
// Good tool for helping build cargo queries: https://www.pcgamingwiki.com/wiki/Special:CargoQuery
export class PCGamingWikiProvider implements MetadataProvider {
name() {
return "PCGamingWiki";
}
source() {
return MetadataSource.PCGamingWiki;
}
private async request<T>(
query: URLSearchParams,
options?: AxiosRequestConfig,
) {
const finalURL = `https://www.pcgamingwiki.com/w/api.php?${query.toString()}`;
const overlay: AxiosRequestConfig = {
url: finalURL,
baseURL: "",
};
const response = await axios.request<T>(
Object.assign({}, options, overlay),
);
if (response.status !== 200)
throw new Error(
`Error in pcgamingwiki \nStatus Code: ${response.status}\n${response.data}`,
);
return response;
}
private async cargoQuery<T>(
query: URLSearchParams,
options?: AxiosRequestConfig,
) {
const response = await this.request<PCGamingWikiCargoResult<T>>(
query,
options,
);
if (response.data.error !== undefined)
throw new Error(`Error in pcgamingwiki cargo query`);
return response;
}
/**
* Gets the raw wiki page for parsing,
* requested values are to be considered unstable as compared to cargo queries
* @param pageID
* @returns
*/
private async getPageContent(pageID: string) {
const searchParams = new URLSearchParams({
action: "parse",
format: "json",
pageid: pageID,
});
const res = await this.request<PCGamingWikiParseRawPage>(searchParams);
const $ = cheerio.load(res.data.parse.text["*"]);
// get intro based on 'introduction' class
const introductionEle = $(".introduction").first();
// remove citations from intro
introductionEle.find("sup").remove();
const infoBoxEle = $(".template-infobox").first();
const receptionEle = infoBoxEle
.find(".template-infobox-header")
.filter((_, el) => $(el).text().trim() === "Reception");
const receptionResults: (GameMetadataRating | undefined)[] = [];
if (receptionEle.length > 0) {
// we have a match!
const ratingElements = infoBoxEle.find(".template-infobox-type");
// TODO: cleanup this ratnest
const parseIdFromHref = (href: string): string | undefined => {
const url = new URL(href);
const opencriticRegex = /^\/game\/(\d+)\/.+$/;
switch (url.hostname.toLocaleLowerCase()) {
case "www.metacritic.com": {
// https://www.metacritic.com/game/elden-ring/critic-reviews/?platform=pc
return url.pathname
.replace("/game/", "")
.replace("/critic-reviews", "")
.replace(/\/$/, "");
}
case "opencritic.com": {
// https://opencritic.com/game/12090/elden-ring
let id = "unknown";
let matches;
if ((matches = opencriticRegex.exec(url.pathname)) !== null) {
matches.forEach((match, _groupIndex) => {
// console.log(`Found match, group ${_groupIndex}: ${match}`);
id = match;
});
}
if (id === "unknown") {
return undefined;
}
return id;
}
case "www.igdb.com": {
// https://www.igdb.com/games/elden-ring
return url.pathname.replace("/games/", "").replace(/\/$/, "");
}
default: {
console.warn("Pcgamingwiki, unknown host", url.hostname);
return undefined;
}
}
};
const getRating = (
source: MetadataSource,
): GameMetadataRating | undefined => {
const providerEle = ratingElements.filter(
(_, el) =>
$(el).text().trim().toLocaleLowerCase() ===
source.toLocaleLowerCase(),
);
if (providerEle.length > 0) {
// get info associated with provider
const reviewEle = providerEle
.first()
.parent()
.find(".template-infobox-info")
.find("a")
.first();
const href = reviewEle.attr("href");
if (!href) {
console.log(
`pcgamingwiki: failed to properly get review href for ${source}`,
);
return undefined;
}
const ratingObj = ratingProviderReview({
rating: reviewEle.text().trim(),
});
if (ratingObj instanceof type.errors) {
console.log(
"pcgamingwiki: failed to properly get review rating",
ratingObj.summary,
);
return undefined;
}
const id = parseIdFromHref(href);
if (!id) return undefined;
return {
mReviewHref: href,
metadataId: id,
metadataSource: source,
mReviewCount: 0,
// make float within 0 to 1
mReviewRating: ratingObj.rating / 100,
};
}
return undefined;
};
receptionResults.push(getRating(MetadataSource.Metacritic));
receptionResults.push(getRating(MetadataSource.IGDB));
receptionResults.push(getRating(MetadataSource.OpenCritic));
}
return {
shortIntro: introductionEle.find("p").first().text().trim(),
introduction: introductionEle.text().trim(),
reception: receptionResults,
};
}
async search(query: string) {
const searchParams = new URLSearchParams({
action: "cargoquery",
tables: "Infobox_game",
fields:
"Infobox_game._pageID=PageID,Infobox_game._pageName=PageName,Infobox_game.Cover_URL,Infobox_game.Released",
where: `Infobox_game._pageName="${query}"`,
format: "json",
});
const response =
await this.cargoQuery<PCGamingWikiSearchStub>(searchParams);
const results: GameMetadataSearchResult[] = [];
for (const result of response.data.cargoquery) {
const game = result.title;
const pageContent = await this.getPageContent(game.PageID);
results.push({
id: game.PageID,
name: game.PageName,
icon: game["Cover URL"] ?? "",
description: pageContent.shortIntro,
year:
game.Released !== null && game.Released.length > 0
? // sometimes will provide multiple dates
this.parseTS(game.Released).year
: 0,
});
}
return results;
}
/**
* Parses the specific format that the wiki returns when specifying an array
* @param input string or array
* @returns
*/
private parseWikiStringArray(input: string | string[]): string[] {
const cleanStr = (str: string): string => {
// remove any dumb prefixes we don't care about
return str.replace("Company:", "").trim();
};
// input can provides the string as a list
// ie: "Company:Digerati Distribution,Company:Greylock Studio"
// or as an array, sometimes the array has empty values
const results: string[] = [];
if (Array.isArray(input)) {
input.forEach((c) => {
const clean = cleanStr(c);
if (clean !== "") results.push(clean);
});
} else {
const items = input.split(",");
items.forEach((item) => {
const clean = cleanStr(item);
if (clean !== "") results.push(clean);
});
}
return results;
}
/**
* Parses the specific format that the wiki returns when specifying a iso timestamp
* @param isoStr
* @returns
*/
private parseTS(isoStr: string): DateTime {
return DateTime.fromISO(isoStr.split(";")[0]);
}
private parseWebsitesGetFirst(websiteStr?: string | null): string {
if (websiteStr === undefined || websiteStr === null) return "";
// string comes in format: "[https://www.gamesci.com.cn www.gamesci.com.cn]"
return websiteStr.replaceAll(/\[|]/g, "").split(" ")[0] ?? "";
}
private compileTags(game: PCGamingWikiGame): string[] {
const results: string[] = [];
const properties: StringArrayKeys<PCGamingWikiGame>[] = [
"Art styles",
"Genres",
"Modes",
"Pacing",
"Perspectives",
"Themes",
];
// loop through all above keys, get the tags they contain
properties.forEach((p) => {
if (game[p] === null) return;
results.push(...this.parseWikiStringArray(game[p]));
});
return results;
}
async fetchGame(
{ id, name, publisher, developer, createObject }: _FetchGameMetadataParams,
context?: TaskRunContext,
): Promise<GameMetadata> {
context?.log("Using PCGamingWiki provider");
context?.progress(0);
const searchParams = new URLSearchParams({
action: "cargoquery",
tables: "Infobox_game",
fields:
"Infobox_game._pageID=PageID,Infobox_game._pageName=PageName,Infobox_game.Cover_URL,Infobox_game.Developers,Infobox_game.Released,Infobox_game.Genres,Infobox_game.Publishers,Infobox_game.Themes,Infobox_game.Series,Infobox_game.Modes,Infobox_game.Perspectives,Infobox_game.Art_styles,Infobox_game.Pacing",
where: `Infobox_game._pageID="${id}"`,
format: "json",
});
const [res, pageContent] = await Promise.all([
this.cargoQuery<PCGamingWikiGame>(searchParams),
this.getPageContent(id),
]);
if (res.data.cargoquery.length < 1)
throw new Error("Error in pcgamingwiki, no game");
const game = res.data.cargoquery[0].title;
const publishers: Company[] = [];
if (game.Publishers !== null) {
context?.log("Found publishers, importing...");
const pubListClean = this.parseWikiStringArray(game.Publishers);
for (const pub of pubListClean) {
context?.log(`Importing "${pub}"...`);
const res = await publisher(pub);
if (res === undefined) continue;
publishers.push(res);
}
}
context?.progress(40);
const developers: Company[] = [];
if (game.Developers !== null) {
context?.log("Found developers, importing...");
const devListClean = this.parseWikiStringArray(game.Developers);
for (const dev of devListClean) {
context?.log(`Importing "${dev}"...`);
const res = await developer(dev);
if (res === undefined) continue;
developers.push(res);
}
}
context?.progress(80);
const icon = createObject(
game["Cover URL"] !== null
? game["Cover URL"]
: jdenticon.toPng(name, 512),
);
const released = game.Released
? DateTime.fromISO(game.Released.split(";")[0]).toJSDate()
: new Date();
const metadata: GameMetadata = {
id: game.PageID,
name: game.PageName,
shortDescription: pageContent.shortIntro,
description: pageContent.introduction,
released,
tags: this.compileTags(game),
reviews: pageContent.reception.filter((v) => typeof v !== "undefined"),
publishers,
developers,
icon: icon,
bannerId: icon,
coverId: icon,
images: [icon],
};
context?.log("PCGamingWiki provider finished.");
context?.progress(100);
return metadata;
}
async fetchCompany({
query,
createObject,
}: _FetchCompanyMetadataParams): Promise<CompanyMetadata> {
const searchParams = new URLSearchParams({
action: "cargoquery",
tables: "Company",
fields:
"Company.Parent,Company.Founded,Company.Defunct,Company.Website,Company._pageName=PageName,Company._pageID=PageID",
where: `Company._pageName="Company:${query}"`,
format: "json",
});
const res = await this.cargoQuery<PCGamingWikiCompany>(searchParams);
// TODO: replace with company logo
const icon = createObject(jdenticon.toPng(query, 512));
for (let i = 0; i < res.data.cargoquery.length; i++) {
const company = res.data.cargoquery[i].title;
const fixedCompanyName =
this.parseWikiStringArray(company.PageName)[0] ?? company.PageName;
const metadata: CompanyMetadata = {
id: company.PageID,
name: fixedCompanyName,
shortDescription: "",
description: "",
website: this.parseWebsitesGetFirst(company?.Website),
logo: icon,
banner: icon,
cover: icon,
};
return metadata;
}
throw new Error(`pcgamingwiki failed to find publisher/developer ${query}`);
}
}