diff options
Diffstat (limited to 'update')
-rw-r--r-- | update/episodes/index.js | 141 | ||||
-rw-r--r-- | update/episodes/series.json | 127 | ||||
-rw-r--r-- | update/ponies/dict.js (renamed from update/dict.js) | 0 | ||||
-rw-r--r-- | update/ponies/index.js (renamed from update/index.js) | 0 | ||||
-rw-r--r-- | update/ponies/infobox.js (renamed from update/infobox.js) | 0 | ||||
-rw-r--r-- | update/ponies/listgen.js (renamed from update/listgen.js) | 0 | ||||
-rw-r--r-- | update/ponies/pages.js (renamed from update/pages.js) | 0 | ||||
-rw-r--r-- | update/ponies/parse.js (renamed from update/parse.js) | 51 |
8 files changed, 309 insertions, 10 deletions
diff --git a/update/episodes/index.js b/update/episodes/index.js new file mode 100644 index 0000000..f071707 --- /dev/null +++ b/update/episodes/index.js @@ -0,0 +1,141 @@ +const config = require("./series.json"); +const axios = require('axios'); +const fs = require('fs'); +const WikiTextParser = require('parse-wikitext'); +const parser = new WikiTextParser("mlp.fandom.com"); + +(async () => { + let all = []; + + for (let series of config) { + let data = { + command: series.cmd, + title: series.title, + date: series.date, + link: series.page, + description: { + series: null, + plot: null, + }, + seasons: [] + }; + console.log(series.title + " (" + data.date + ")"); + + ddata = (await axios.get("https://mlp.fandom.com/api.php?format=json&action=query&prop=extracts&exlimit=max&explaintext&exintro&titles=" + encodeURI(series.page) + "&redirects=")).data; + data.description.series = ddata.query.pages[Object.keys(ddata.query.pages)[0]].extract.split("\n")[0]; + data.description.plot = ddata.query.pages[Object.keys(ddata.query.pages)[0]].extract.split("\n")[1]; + + for (let s of series.seasons) { + console.log(" Season " + s.id); + + let season = { + name: "Season " + s.id, + id: "s" + s.id, + date: null, + count: null, + episodes: [] + } + + let sdata = (await axios.get("https://mlp.fandom.com/api.php?action=query&prop=revisions&titles=" + s.table.page + "&rvslots=*&rvprop=content&formatversion=2&format=json")).data; + let sections = parser.pageToSectionObject(sdata.query.pages[0].revisions[0].slots.main.content); + let episodes = sections.Episodes[s.table.section].content + .filter(i => i.startsWith("|")) + .join("||") + .replace("|}", "") + .split("|-").map(i => { + return i.split("||").filter(i => i.trim() !== ""); + }) + .filter(i => i.length > 1) + .map(i => { + let index = 0; + return i.map(i => { + return i.replace(/^(\| |\|)(.*)/gm, "$2") + .replace(/^style="(.*)"( |)\|( |)(.*)/gm, "$4") + .replace(/\[\[((.*)\|(.*)|(.*))\]\]/gm, "$3$4"); + }).map(i => { + if (index === 0) { + index++; + return i.replace(/(.*) \((.*)\)/gm, "$1|$2"); + } else { + index++; + return i; + } + }) + }); + + index = 1; + for (let e of episodes) { + process.stdout.write(" S" + s.id + "E" + index); + + let episode = { + local: null, + global: null, + date: null, + name: null, + writer: null, + cover: null, + characters: [], + plot: null + } + + episode.local = e[s.table.fields.number].replace(/(.*)\|(.*)/gm, "$1").replace(/''(.*)''/gm, "$1").replace(/{{(.*)\|(.*)}}/gm, "$2").replace(/(.*)\|(.*)/gm, "$2"); + episode.global = e[s.table.fields.number].replace(/(.*)\|(.*)/gm, "$2"); + episode.date_pre = e[s.table.fields.date].replace(/{{(.*)\|(.*)\|(.*)\|link=(no|yes)}}/gm, "$3").replace(/{{(.*)\|(.*)}}/gm, "$2").replace(/(.*)\|(.*)/gm, "$2"); + try { + episode.date = new Date(e[s.table.fields.date].replace(/{{(.*)\|(.*)\|(.*)\|link=(no|yes)}}/gm, "$3").replace(/{{(.*)\|(.*)}}/gm, "$2").replace(/(.*)\|(.*)/gm, "$2")).toISOString(); + } catch (e) { + episode.date = null; + } + episode.name = e[s.table.fields.title]; + episode.writer = e[s.table.fields.writer].replace(/{{(.*)\|(.*)\|(.*)\|link=(no|yes)}}/gm, "$3").replace(/(]]|\[\[)/gm, "").replace(/(.*)\|(.*)/gm, "$2"); + + process.stdout.write(": " + episode.name + "\n"); + + if (episode.local.length !== 2 || episode.global.length > 3 || episode.global.length < 2 || episode.date_pre.length !== 10) { + console.log("FAILURE: " + JSON.stringify(episode)); + } + + let edata = (await axios.get("https://mlp.fandom.com/api.php?action=query&prop=revisions&titles=" + encodeURI(episode.name).replaceAll("?", "%3F").replaceAll("&", "%26") + "&rvslots=*&rvprop=content&formatversion=2&format=json")).data; + let eext = (await axios.get("https://mlp.fandom.com/api.php?format=json&action=query&prop=extracts&exlimit=max&explaintext&exintro&titles=" + encodeURI(episode.name).replaceAll("?", "%3F").replaceAll("&", "%26") + "&redirects=")).data; + + episode.plot = eext.query.pages[Object.keys(eext.query.pages)[0]].extract.replace(/(.*)\n(.*)/, "$2").replace(/(.*)\n\n(.*)/gm, "$2").replace(/([.?!])\s*(?=[A-Z])/g, "$1|").split("|").join(" "); + + let infobox = null; + try { + sections = parser.pageToSectionObject(edata.query.pages[0].revisions[0].slots.main.content); + box = parser.parseInfoBox(sections["content"]); + if (box.template === "Infobox episode") { + infobox = parser.parseInfoBox(sections["content"]).values; + } + } catch (e) { + console.log(edata); + throw e; + } + + if (infobox !== null) { + try { + if (typeof infobox.image !== "undefined") episode.cover = (await axios.head("https://mlp.fandom.com/Special:FilePath/" + encodeURI(infobox.image.replace(/<!--[\s\S]*?-->/g, "").trim()).replaceAll("?", "%3F").replaceAll("&", "%26"))).request.res.responseUrl; + } catch (e) { + try { + if (typeof infobox.image !== "undefined") episode.cover = e.request.res.responseUrl; + } catch (e2) { + console.error(e2); + throw e; + } + } + if (typeof infobox.featured !== "undefined") episode.characters = infobox.featured.replace(/\[\[(([a-zA-Z0-9 .\-# _\\\/]*)\|([a-zA-Z0-9 .\-_\\\/]*)|([a-zA-Z0-9 .\-#_\\\/]*))\]\]/gm, "$3$4").replace(/(<(\/| |)(\/| |)br(\/| |)(\/| |)>)/gm, "|||").split("|||") + } + + season.episodes.push(episode); + index++; + } + + season.count = season.episodes.length; + season.date = season.episodes[0].date; + data.seasons.push(season); + } + all.push(data); + } + + fs.writeFileSync("./data/series.json", JSON.stringify(all, null, 4)); +})();
\ No newline at end of file diff --git a/update/episodes/series.json b/update/episodes/series.json new file mode 100644 index 0000000..0935658 --- /dev/null +++ b/update/episodes/series.json @@ -0,0 +1,127 @@ +[ + { + "title": "Friendship is Magic", + "cmd": "FIM", + "page": "My Little Pony Friendship is Magic", + "date": "2010-2019", + "seasons": [ + { + "id": 1, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season one", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 2, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season two", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 3, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season three", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 4, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season four", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 5, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season five", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 6, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season six", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 7, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season seven", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 8, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season eight", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + }, + { + "id": 9, + "table": { + "page": "Friendship is Magic animated media", + "section": "Season nine", + "fields": { + "number": 0, + "title": 1, + "writer": 2, + "date": 3 + } + } + } + ] + } +]
\ No newline at end of file diff --git a/update/dict.js b/update/ponies/dict.js index 88ec568..88ec568 100644 --- a/update/dict.js +++ b/update/ponies/dict.js diff --git a/update/index.js b/update/ponies/index.js index 53acf34..53acf34 100644 --- a/update/index.js +++ b/update/ponies/index.js diff --git a/update/infobox.js b/update/ponies/infobox.js index f53be0e..f53be0e 100644 --- a/update/infobox.js +++ b/update/ponies/infobox.js diff --git a/update/listgen.js b/update/ponies/listgen.js index d9401f8..d9401f8 100644 --- a/update/listgen.js +++ b/update/ponies/listgen.js diff --git a/update/pages.js b/update/ponies/pages.js index 7f3a1c8..7f3a1c8 100644 --- a/update/pages.js +++ b/update/ponies/pages.js diff --git a/update/parse.js b/update/ponies/parse.js index 0b2baa9..bd06081 100644 --- a/update/parse.js +++ b/update/ponies/parse.js @@ -38,28 +38,59 @@ let ponies = {}; if (typeof box.kind !== "undefined") { kp = box.kind.replace(/<!--[\s\S]*?-->/g, "").replace(/[^a-zA-Z0-9-_ ]/gm, "").split(" ")[0]; - data.kind = kp.substr(kp.replace(/([A-Z])([a-z0-9]*)$/g, "").length); + data.kind = kp.substring(kp.replace(/([A-Z])([a-z0-9]*)$/g, "").length); } if (typeof box.sex !== "undefined") data.sex = box.sex.replace(/<!--[\s\S]*?-->/g, "").trim().startsWith("F") ? "F" : "M"; if (typeof box._extract !== "undefined") { data.extract = box._extract; } - if (typeof box._extract_fr !== "undefined") { - data.extract_fr = box._extract_fr.replace(/ma petite amitié de poney est la magie/gmi, "My Little Pony Friendship is Magic").replace(/Mon amitié avec mon petit poney est magique/gmi, "My Little Pony Friendship is Magic").replace(/Mon petit Poney/gmi, "My Little Pony").replace(/Mon Petit Poney Une Nouvelle Génération/gmi, "My Little Pony A New Generation").replace(/Mon petit poney : une nouvelle génération/gmi, "My Little Pony: A New Generation").replace(/pegasus/gmi, "pégase").replace(/alicorn[^e]/gmi, "alicorne").replace(/une poney/gmi, "une ponette").replace(/petite génération de poney 5/gmi, "Génération 5"); - } else { - data.extract_fr = data.extract; - } if (typeof box.coat !== "undefined") data.color = box.coat.replace(/<!--[\s\S]*?-->/g, "").trim().replace(/\[([a-z.\/ \nA-Z0-9:]*)\/(.{6})\/ (.*)\]/gm, "$2").replace(/{{perbang\|([0-9A-Fa-f].{5})(.*)/g, "$1"); - if (typeof box.main !== "undefined") data.image = "https://mlp.fandom.com/Special:FilePath/" + encodeURI(box.main.replace(/<!--[\s\S]*?-->/g, "").trim()); - if (typeof box.main1 !== "undefined") data.image = "https://mlp.fandom.com/Special:FilePath/" + encodeURI(box.main1.replace(/<!--[\s\S]*?-->/g, "").trim()); - if (typeof box.image !== "undefined") data.image = "https://mlp.fandom.com/Special:FilePath/" + encodeURI(box.image.replace(/<!--[\s\S]*?-->/g, "").trim()); + try { + if (typeof box.main !== "undefined") data.image = (await axios.head("https://mlp.fandom.com/Special:FilePath/" + encodeURI(box.main.replace(/<!--[\s\S]*?-->/g, "").trim()).replaceAll("?", "%3F").replaceAll("&", "%26"))).request.res.responseUrl; + } catch (e) { + try { + if (typeof box.main !== "undefined") data.image = e.request.res.responseUrl; + } catch (e2) { + console.error(e2); + throw e; + } + } + try { + if (typeof box.main1 !== "undefined") data.image = (await axios.head("https://mlp.fandom.com/Special:FilePath/" + encodeURI(box.main1.replace(/<!--[\s\S]*?-->/g, "").trim()).replaceAll("?", "%3F").replaceAll("&", "%26"))).request.res.responseUrl; + } catch (e) { + try { + if (typeof box.main1 !== "undefined") data.image = e.request.res.responseUrl; + } catch (e2) { + console.error(e2); + throw e; + } + } + try { + if (typeof box.image !== "undefined") data.image = (await axios.head("https://mlp.fandom.com/Special:FilePath/" + encodeURI(box.image.replace(/<!--[\s\S]*?-->/g, "").trim()).replaceAll("?", "%3F").replaceAll("&", "%26"))).request.res.responseUrl; + } catch (e) { + try { + if (typeof box.image !== "undefined") data.image = e.request.res.responseUrl; + } catch (e2) { + console.error(e2); + throw e; + } + } if (typeof box["cutie mark"] !== "undefined") { try { data.markimg = box["cutie mark"].replace(/<!--[\s\S]*?-->/g, "").trim().split("[[File:")[1].split("|")[0]; } catch (e) { data.markimg = box["cutie mark"].replace(/<!--[\s\S]*?-->/g, "").trim().split("[[File:")[0].split("|")[0]; } - data.mark = "https://mlp.fandom.com/Special:Redirect/file/" + encodeURI(data.markimg) + "?width=128"; + try { + data.mark = (await axios.head("https://mlp.fandom.com/Special:FilePath/" + encodeURI(data.markimg).replaceAll("?", "%3F").replaceAll("&", "%26"))).request.res.responseUrl; + } catch (e) { + try { + data.mark = e.request.res.responseUrl; + } catch (e2) { + console.error(e2); + throw e; + } + } } if (typeof box.occupation !== "undefined") { |