/*
 * Files
 * Myrient-Search-Engine/lib/crawler/metadatamanager.js
 *
 * 326 lines
 * 9.4 KiB
 * JavaScript
 */

import {
twitchAccessToken,
igdb,
request,
multi,
} from "@phalcode/ts-igdb-client";
import {
fields,
or,
and,
where,
whereIn,
WhereFlags,
WhereInFlags,
sort,
limit,
offset,
} from "@phalcode/ts-igdb-client";
import { File, Metadata } from "../database/database.js";
import TaskQueue from "../utility/taskqueue.js";
import { singleLineStatus } from "../utility/printutils.js";
import { Timer } from "../utility/time.js";
import { readFileSync } from "fs";
/**
 * Pulls game metadata from IGDB into the local `Metadata` table and links
 * crawled `File` rows to the stored metadata records.
 *
 * Construction kicks off asynchronous client setup; the methods that talk to
 * IGDB wait for `this.ready` before using `this.client`.
 */
export default class MetadataManager {
  constructor() {
    this.twitchSecrets = {
      client_id: process.env.TWITCH_CLIENT_ID,
      client_secret: process.env.TWITCH_CLIENT_SECRET,
    };
    // Deliberately not awaited (constructors cannot be async). setupClient()
    // handles its own errors and flips `ready` when it is done.
    this.setupClient();
    this.queue = new TaskQueue();
  }

  /** IGDB fields requested for every game during a sync. */
  gameFields = [
    "name",
    "alternative_names.comment",
    "alternative_names.name",
    "cover.image_id",
    "total_rating",
    "first_release_date",
    "summary",
    "genres.name",
    "involved_companies.company.name",
    "involved_companies.developer",
    "involved_companies.publisher",
    "involved_companies.supporting",
    "game_modes.name",
    "game_localizations.name",
    "game_localizations.region",
    "game_localizations.region.name",
    "game_localizations.cover.image_id",
    "platforms.name",
    "game_type.type",
    "screenshots.image_id",
    "videos.video_id",
  ];

  /**
   * Obtains a Twitch access token, creates the IGDB client and loads the
   * platform-name map. Never rejects: on any failure the manager ends up
   * `ready` but not `authorized`.
   *
   * Sets `this.ready`, `this.authorized` and, when credentials are present,
   * `this.accessToken`, `this.client` and `this.platformMap`.
   *
   * @returns {Promise<void>}
   */
  async setupClient() {
    // Drop `ready` while (re-)authenticating so that callers polling it wait
    // for the new client instead of racing ahead with the old one.
    this.ready = false;
    let authorized = false;
    try {
      const { client_id: clientId, client_secret: clientSecret } =
        this.twitchSecrets;
      if (clientId && clientSecret) {
        this.accessToken = await twitchAccessToken(this.twitchSecrets);
        this.client = igdb(clientId, this.accessToken);
        // Path is resolved against the process working directory.
        const mapFilePath = "./lib/json/maps/igdb_platform.json";
        this.platformMap = JSON.parse(readFileSync(mapFilePath, "utf8"));
        authorized = Boolean(this.accessToken);
      }
    } catch (error) {
      authorized = false;
      // Previously swallowed silently, which hid e.g. a missing map file.
      console.error("Error setting up IGDB client:", error);
    } finally {
      this.authorized = authorized;
      this.ready = true;
    }
  }

  /**
   * Internal helper: resolves once `setupClient()` has finished.
   *
   * @returns {Promise<void>}
   */
  async waitUntilReady() {
    // hack to ensure the client is ready before we do anything
    while (!this.ready) {
      await this.sleep(500);
    }
  }

  /**
   * Reduces a file name to a bare title suitable for text search: strips the
   * file extension, punctuation (`. & - + ,`), version tags such as `v1.2`,
   * bracketed/parenthesised tags and the standalone words "the" and "usa",
   * then collapses whitespace.
   *
   * @param {string} filename - File name to normalise.
   * @returns {string|undefined} Normalised name, or `undefined` for an
   *   empty/missing `filename`.
   */
  normalizeName(filename) {
    if (!filename) return;
    return filename
      .replace(
        // - `\.[a-z0-9]{1,4}$` removes a trailing extension of any common
        //   length (".7z", ".gb"), not just three-letter ones.
        // - `[a-z]` instead of `[A-z]`, which also matched `[ \ ] ^ _` and backtick.
        // - "the"/"usa" are only removed when not embedded in a longer word,
        //   so "Panther" or "Crusade" are left intact.
        /\.[a-z0-9]{1,4}$|\.[a-z]{3}|\.|&|-|\+|,|v[0-9]+\.[0-9]+|\[.*?\]|\(.*?\)|(?<![a-z])(?:the|usa)(?![a-z])/gi,
        ""
      )
      .replace(/\s{2,}/g, " ")
      .trim();
  }

  /**
   * Asks IGDB how many games exist whose type is neither "Mod" nor "DLC".
   *
   * @param {boolean} [retrying=false] - Internal flag: `true` on the single
   *   retry made after re-running `setupClient()`.
   * @returns {Promise<number>} The count, or 0 when unauthorized or on error.
   */
  async getIGDBGamesCount(retrying = false) {
    try {
      await this.waitUntilReady();
      if (!this.authorized) return 0;
      const { data } = await this.client
        .request("games/count")
        .pipe(
          and(
            where("game_type.type", "!=", "Mod"),
            where("game_type.type", "!=", "DLC")
          )
        )
        .execute();
      return data.count;
    } catch (error) {
      if (error.code === "ERR_BAD_REQUEST" && !retrying) {
        // Presumably a rejected/expired token: re-authenticate, and wait for
        // it to finish, before the one retry.
        await this.setupClient();
        return this.getIGDBGamesCount(true);
      }
      console.error("Error getting IGDB games count:", error);
      return 0;
    }
  }

  /**
   * Internal helper: runs `search` against the "title" field and, only when
   * that yields an empty result, against "alternatetitles".
   *
   * @param {(field: string) => Promise<Array|undefined|null>} search
   * @returns {Promise<Array|undefined|null>} Whatever the last search returned.
   */
  async searchTitleThenAlternates(search) {
    let matches = await search("title");
    if (matches?.length === 0) {
      // repeat the search under one of the alternate titles
      matches = await search("alternatetitles");
    }
    return matches;
  }

  /**
   * Internal helper: associates a file row with the metadata record that has
   * the given primary key and persists both sides.
   *
   * @param {object} game - File model instance.
   * @param {*} metadataId - Primary key of the Metadata record.
   * @returns {Promise<void>}
   */
  async linkFileToMetadata(game, metadataId) {
    const md = await Metadata.findByPk(metadataId);
    await game.setDetails(md);
    await md.addFile(game);
    await game.save();
    await md.save();
  }

  /**
   * Tries to attach a metadata record to every game file that has none yet.
   * Each file name is normalised and looked up by title, then by alternate
   * titles; the first hit is linked.
   *
   * @param {boolean} [fuzzy=false] - Also try the (much slower) fuzzy search
   *   when the full-text search finds nothing.
   * @returns {Promise<void>}
   */
  async matchAllMetadata(fuzzy = false) {
    const games = await File.findAll({
      where: {
        nongame: false,
        detailsId: null,
      },
      // "category" must be selected: it is passed to every search below and
      // would otherwise always be undefined.
      // NOTE(review): assumes the File model has a `category` column - confirm.
      attributes: ["id", "filename", "category"],
      order: ["id", "filename"],
      include: { model: Metadata, as: "details" },
    });
    const count = games.length;
    const timer = new Timer();
    let found = 0;
    console.log(`Matching ${count} games to metadata.`);
    for (const [index, game] of games.entries()) {
      singleLineStatus(
        `Matching metadata: ${index} / ${count} ${(
          (index / count) *
          100
        ).toFixed(2)}% (${timer.elapsed()}) Total Matches: ${found}`
      );
      const name = this.normalizeName(game.filename);
      let matches = await this.searchTitleThenAlternates((field) =>
        Metadata.searchByText(field, name, game.category)
      );
      if (!(matches?.length >= 1) && fuzzy) {
        // this is much slower and should only be used if the faster full text
        // search can't find it. The alternate-title fallback now runs when the
        // title search is empty (the original condition was inverted).
        matches = await this.searchTitleThenAlternates((field) =>
          Metadata.fuzzySearchByText(field, name, 0.8, game.category)
        );
      }
      if (matches?.length >= 1) {
        await this.linkFileToMetadata(game, matches[0].id);
        found++;
      }
    }
    console.log(`\nFinished matching metadata to files in ${timer.elapsed()}`);
  }

  /**
   * Downloads game records from IGDB page by page (500 per request, sorted
   * by id) and upserts each one through `addMetadataToDb`.
   *
   * A page that fails with `ERR_BAD_RESPONSE` is retried after one second;
   * after five consecutive failures the sync is aborted. An
   * `ERR_BAD_REQUEST` triggers one re-authentication and a full restart.
   * Errors are logged, never thrown.
   *
   * @param {boolean} [retrying=false] - Internal flag: `true` on the restart
   *   made after re-running `setupClient()`.
   * @returns {Promise<void>}
   */
  async syncAllMetadata(retrying = false) {
    try {
      const timer = new Timer();
      await this.waitUntilReady();
      if (!this.authorized) {
        console.log(
          "Twitch credentials are unavailable or invalid; metadata sync is unavailable."
        );
        return;
      }
      console.log("Syncing all metadata...");
      // NOTE(review): this count excludes Mod/DLC entries while the "games"
      // request below is unfiltered, so the page total may be too small to
      // reach the highest ids - confirm which of the two is intended.
      const count = await this.getIGDBGamesCount();
      const pageSize = 500;
      const maxAttempts = 5;
      const pages = Math.ceil(count / pageSize);
      let retryCount = 0;
      let page = 0;
      while (page < pages) {
        const pageOffset = page * pageSize;
        singleLineStatus(
          `Syncing metadata: ${pageOffset} / ${count} ${(
            (pageOffset / count) *
            100
          ).toFixed(2)}% (${timer.elapsed()})`
        );
        try {
          const { data } = await this.client
            .request("games")
            .pipe(
              limit(pageSize),
              offset(pageOffset),
              fields(this.gameFields),
              sort("id")
            )
            .execute();
          for (const game of data ?? []) {
            await this.addMetadataToDb(game);
          }
        } catch (error) {
          if (error.code !== "ERR_BAD_RESPONSE") {
            throw error; //hoist it up
          }
          retryCount++;
          // Logged with the offset of the page that actually failed.
          console.log(
            `Retrieving metadata at offset ${pageOffset} failed. Retry count: ${retryCount}`
          );
          if (retryCount >= maxAttempts) {
            // The original silently skipped every remaining page here and
            // still reported success; stop explicitly instead.
            console.error(
              `\nAborting metadata sync after ${maxAttempts} consecutive failures at offset ${pageOffset}.`
            );
            return;
          }
          await this.sleep(1000);
          continue; // same page again
        }
        retryCount = 0;
        page++;
      }
      console.log(`\nFinished syncing metadata in ${timer.elapsed()}`);
    } catch (error) {
      if (error.code === "ERR_BAD_REQUEST" && !retrying) {
        // Wait for re-authentication before restarting, otherwise the restart
        // would run with the stale client.
        await this.setupClient();
        return this.syncAllMetadata(true);
      }
      console.error("Error syncing all metadata:", error);
    }
  }

  /**
   * Creates or updates the `Metadata` row for one IGDB game record.
   * Errors are logged and swallowed so one bad record does not stop a sync.
   *
   * @param {object} metadata - Game object as returned by IGDB for
   *   `this.gameFields`.
   * @returns {Promise<void>}
   */
  async addMetadataToDb(metadata) {
    try {
      let md = await Metadata.findByPk(metadata.id);
      if (!md) {
        md = await Metadata.build(
          {
            id: metadata.id,
          },
          {
            include: File,
          }
        );
      }
      const localizations = metadata.game_localizations ?? [];
      const alternativeNames = metadata.alternative_names ?? [];

      // Cover image ids keyed by region name, plus the "default" cover.
      const coverArt = {
        default: metadata.cover?.image_id,
      };
      for (const gl of localizations) {
        if (gl.region && gl.cover) {
          coverArt[gl.region.name] = gl.cover.image_id;
        }
      }

      md.title = metadata.name;
      md.description = metadata.summary;
      md.rating = metadata.total_rating;
      md.coverartid = JSON.stringify(coverArt);
      // first_release_date is multiplied by 1000 to get Date milliseconds.
      md.releasedate = metadata.first_release_date
        ? new Date(metadata.first_release_date * 1000)
        : null;
      md.genre = metadata.genres?.map((genre) => genre.name);
      md.gamemodes = metadata.game_modes?.map((gm) => gm.name);
      md.platforms = metadata.platforms?.map(
        (platform) => this.platformMap[platform.name] || platform.name
      );
      md.screenshots = metadata.screenshots?.map((ss) => ss.image_id);
      md.videos = metadata.videos?.map((v) => v.video_id);
      md.developers = metadata.involved_companies
        ?.filter((ic) => ic.developer)
        ?.map((ic) => ic.company.name);
      md.publishers = metadata.involved_companies
        ?.filter((ic) => ic.publisher)
        ?.map((ic) => ic.company.name);

      // Alternate titles keyed by their comment or region name.
      const alternates = {};
      for (const an of alternativeNames) {
        if (an.comment && an.name) {
          alternates[an.comment] = an.name;
        }
      }
      for (const gl of localizations) {
        // `region` may be absent; without `?.` this threw and the whole
        // record was discarded by the catch below.
        if (gl.region?.name && gl.name) {
          alternates[gl.region.name] = gl.name;
        }
      }
      //this needs to remain json as we want the keys to be retained
      md.alternatetitles = JSON.stringify(alternates);
      await md.save();
    } catch (error) {
      console.error("Error adding metadata:", error);
    }
  }

  /**
   * @param {number} delay - Milliseconds to wait.
   * @returns {Promise<void>} Resolves after `delay` ms.
   */
  sleep(delay) {
    return new Promise((resolve) => setTimeout(resolve, delay));
  }
}