From 15b7b180306e0856da9b280c43396889644c5b93 Mon Sep 17 00:00:00 2001 From: Siddharth VP Date: Mon, 17 May 2021 00:54:06 +0530 Subject: [PATCH] move queryAuthors() to page object; fix its types Also added a test. --- CHANGELOG.md | 3 + package-lock.json | 4 +- package.json | 2 +- src/bot.ts | 76 +------------------------ src/page.ts | 120 ++++++++++++++++++++++++++++++++++------ src/static_utils.ts | 10 +--- tests/suppl.bot.test.js | 13 +++++ 7 files changed, 128 insertions(+), 100 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 172b681..46b61dc 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,8 @@ Only breaking changes, deprecations and the like are documented in this change log. +#### 0.11.0 +- mwn#queryAuthors() now requires `getSiteInfo()` to have run first. Also, it is deprecated in favour of using the `queryAuthors()` method on a page object. + #### 0.10.0 - `loginGetToken()` is now deprecated in favour of `login()` which will now fetch tokens as well. diff --git a/package-lock.json b/package-lock.json index a5db1fd..b3719a2 100644 --- a/package-lock.json +++ b/package-lock.json @@ -1,11 +1,11 @@ { "name": "mwn", - "version": "0.10.4", + "version": "0.11.0", "lockfileVersion": 2, "requires": true, "packages": { "": { - "version": "0.10.4", + "version": "0.11.0", "license": "LGPL-3.0-or-later", "dependencies": { "@types/eventsource": "^1.1.4", diff --git a/package.json b/package.json index 8cb9c1c..85adb1f 100644 --- a/package.json +++ b/package.json @@ -1,6 +1,6 @@ { "name": "mwn", - "version": "0.10.4", + "version": "0.11.0", "description": "JavaScript & TypeScript MediaWiki bot framework for Node.js", "main": "./build/bot.js", "types": "./build/bot.d.ts", diff --git a/src/bot.ts b/src/bot.ts index 4c257dd..2a15608 100644 --- a/src/bot.ts +++ b/src/bot.ts @@ -1917,84 +1917,12 @@ export class mwn { * This API has a throttling of 2000 requests a day. * Supported for EN, DE, ES, EU, TR Wikipedias only * @see https://api.wikiwho.net/ + * @deprecated Use queryAuthors on the page object directly instead */ async queryAuthors( title: string, ): Promise<{ totalBytes: number; users: { id: number; name: string; bytes: number; percent: number }[] }> { - let langcodematch = this.options.apiUrl.match(/([^/]*?)\.wikipedia\.org/); - if (!langcodematch || !langcodematch[1]) { - throw new Error('WikiWho API is not supported for bot API URL. Re-check.'); - } - - let json; - try { - json = await this.rawRequest({ - url: `https://api.wikiwho.net/${ - langcodematch[1] - }/api/v1.0.0-beta/latest_rev_content/${encodeURIComponent(title)}/?editor=true`, - }).then((response) => response.data); - } catch (err) { - throw new Error(err && err.response && err.response.data && err.response.data.Error); - } - - const tokens = Object.values(json.revisions[0])[0].tokens; - - let data = { - totalBytes: 0, - users: [], - }; - let userdata: { - [editor: string]: { - name?: number; - bytes: number; - percent?: number; - }; - } = {}; - - for (let token of tokens) { - data.totalBytes += token.str.length; - let editor = token['editor']; - if (!userdata[editor]) { - userdata[editor] = { bytes: 0 }; - } - userdata[editor].bytes += token.str.length; - if (editor.startsWith('0|')) { - // IP - userdata[editor].name = editor.slice(2); - } - } - - Object.entries(userdata).map(([userid, { bytes }]) => { - userdata[userid].percent = bytes / data.totalBytes; - if (userdata[userid].percent < 0.02) { - delete userdata[userid]; - } - }); - - await this.request({ - action: 'query', - list: 'users', - ususerids: Object.keys(userdata).filter((us) => !us.startsWith('0|')), // don't lookup IPs - }).then((json) => { - json.query.users.forEach((us: any) => { - userdata[String(us.userid)].name = us.name; - }); - }); - - data.users = Object.entries(userdata) - .map(([userid, { bytes, name, percent }]) => { - return { - id: userid, - name: name, - bytes: bytes, - percent: percent, - }; - }) - .sort((a, b) => { - return a.bytes < b.bytes ? 1 : -1; - }); - - return data; + return new this.page(title).queryAuthors(); } /** diff --git a/src/page.ts b/src/page.ts index 7cc5177..c0560aa 100644 --- a/src/page.ts +++ b/src/page.ts @@ -55,6 +55,16 @@ export interface PageViewData { views: number; } +export interface AuthorshipData { + totalBytes: number; + users: Array<{ + id: number; + name: string; + bytes: number; + percent: number; + }>; +} + export interface ApiPage { pageid: number; ns: number; @@ -153,6 +163,7 @@ export interface MwnPage extends MwnTitle { customOptions?: ApiQueryLogEventsParams, ): AsyncGenerator; pageViews(options?: PageViewOptions): Promise; + queryAuthors(): Promise; edit(transform: (rev: { content: string; timestamp: string }) => string | ApiEditPageParams): Promise; save(text: string, summary?: string, options?: ApiEditPageParams): Promise; newSection(header: string, message: string, additionalParams?: ApiEditPageParams): Promise; @@ -600,22 +611,9 @@ export default function (bot: mwn): MwnPageStatic { return bot .rawRequest({ - url: - 'https://wikimedia.org/api/rest_v1/metrics/pageviews/per-article' + - '/' + - project + - '/' + - access + - '/' + - agent + - '/' + - encodeURIComponent(this.toString()) + - '/' + - granularity + - '/' + - startString + - '/' + - endString, + url: `https://wikimedia.org/api/rest_v1/metrics/pageviews/per-article/${project}/${access}/${agent}/${encodeURIComponent( + this.toString(), + )}/${granularity}/${startString}/${endString}`, headers: { 'User-Agent': bot.options.userAgent, }, @@ -625,6 +623,96 @@ export default function (bot: mwn): MwnPageStatic { }); } + /** + * Query the top contributors to the article using the WikiWho API. + * This API has a throttling of 2000 requests a day. + * Supported for EN, DE, ES, EU, TR Wikipedias only + * @see https://api.wikiwho.net/ + */ + async queryAuthors(): Promise { + let langcodematch = bot.options.apiUrl.match(/([^/]*?)\.wikipedia\.org/); + if (!langcodematch || !langcodematch[1]) { + throw new Error('WikiWho API is not supported for bot API URL. Re-check.'); + } + + let json; + try { + json = await bot + .rawRequest({ + url: `https://api.wikiwho.net/${ + langcodematch[1] + }/api/v1.0.0-beta/latest_rev_content/${encodeURIComponent(this.toString())}/?editor=true`, + headers: { + 'User-Agent': bot.options.userAgent, + }, + }) + .then((response) => response.data); + } catch (err) { + throw new Error(err && err.response && err.response.data && err.response.data.Error); + } + + const tokens = Object.values(json.revisions[0])[0].tokens; + + let data: AuthorshipData = { + totalBytes: 0, + users: [], + }; + let userdata: { + [editor: string]: { + name?: string; + bytes: number; + percent?: number; + }; + } = {}; + + for (let token of tokens) { + data.totalBytes += token.str.length; + let editor = token['editor']; + if (!userdata[editor]) { + userdata[editor] = { bytes: 0 }; + } + userdata[editor].bytes += token.str.length; + if (editor.startsWith('0|')) { + // IP + userdata[editor].name = editor.slice(2); + } + } + + Object.entries(userdata).map(([userid, { bytes }]) => { + userdata[userid].percent = bytes / data.totalBytes; + if (userdata[userid].percent < 0.02) { + delete userdata[userid]; + } + }); + + await bot + .request({ + action: 'query', + list: 'users', + ususerids: Object.keys(userdata).filter((us) => !us.startsWith('0|')), // don't lookup IPs + }) + .then((json) => { + json.query.users.forEach((us: any) => { + userdata[us.userid].name = us.name; + }); + }); + + data.users = Object.entries(userdata) + .map(([userid, { bytes, name, percent }]) => { + return { + id: Number(userid), + name: name, + bytes: bytes, + percent: percent, + }; + }) + .sort((a, b) => { + return a.bytes < b.bytes ? 1 : -1; + }); + + return data; + } + /**** Post operations *****/ // Defined in bot.js diff --git a/src/static_utils.ts b/src/static_utils.ts index 010e385..8ed7ac8 100644 --- a/src/static_utils.ts +++ b/src/static_utils.ts @@ -29,6 +29,7 @@ export function link(target: string | MwnTitle, displaytext?: string): string { */ export function template(title: string | MwnTitle, parameters: { [parameter: string]: string } = {}): string { if (typeof title !== 'string') { + // title object provided if (title.namespace === 10) { title = title.getMainText(); // skip namespace name for templates } else if (title.namespace === 0) { @@ -41,13 +42,8 @@ export function template(title: string | MwnTitle, parameters: { [parameter: str '{{' + title + Object.entries(parameters) - .map(([key, val]) => { - if (!val) { - // skip parameter if no value provided - return ''; - } - return '|' + key + '=' + val; - }) + .filter(([, value]) => !!value) // ignore params with no value + .map(([name, value]) => `|${name}=${value}`) .join('') + '}}' ); diff --git a/tests/suppl.bot.test.js b/tests/suppl.bot.test.js index 72f4ee5..4ffe1c5 100644 --- a/tests/suppl.bot.test.js +++ b/tests/suppl.bot.test.js @@ -102,4 +102,17 @@ describe('supplementary functions', function () { expect(views[1]).to.be.an('object').with.property('timestamp').that.equals('2021020100'); }); + it('wikiwho', async function () { + this.timeout(10000); + await bot.getSiteInfo(); + let page = new bot.page('Dairy in India'); + let data = await page.queryAuthors(); + expect(data).to.be.an('object').with.property('totalBytes').that.is.a('number'); + expect(data).to.have.property('users').that.is.instanceOf(Array).of.length.greaterThan(1); + expect(data.users[0]).to.be.an('object').with.property('id').that.is.a('number'); + expect(data.users[0]).to.have.property('name').that.is.a('string'); + expect(data.users[0]).to.have.property('percent').that.is.a('number'); + expect(data.users[0]).to.have.property('bytes').that.is.a('number'); + }); + });