import * as fs from 'fs';
import * as path from 'path';
import * as Twitter from 'twitter';
import TwitterTypes from 'twitter-d';

import { getLogger } from './loggers';
import QQBot from './koishi';
import RedisSvc from './redis';
import { chainPromises, BigNumOps } from './utils';
import Webshot from './webshot';

/** Options accepted by the worker constructor. */
interface IWorkerOption {
  lock: ILock;
  lockfile: string;
  bot: QQBot;
  workInterval: number;
  webshotDelay: number;
  consumerKey: string;
  consumerSecret: string;
  accessTokenKey: string;
  accessTokenSecret: string;
  mode: number;
  wsUrl: string;
  redis?: IRedisConfig;
}

/**
 * Helpers for turning user-supplied screen names into a canonical form.
 */
export class ScreenNameNormalizer {

  /**
   * Live lookup hook. It is assigned by the worker constructor below; until
   * then it is undefined and `normalizeLive` falls back to `normalize`.
   */
  // tslint:disable-next-line: variable-name
  public static _queryUser: (username: string) => Promise<string>;

  /** Lower-cases the name and strips a single leading `@`. */
  public static normalize = (username: string) => username.toLowerCase().replace(/^@/, '');

  /**
   * Resolves a screen name through `_queryUser` when it is available.
   *
   * @param username screen name as typed by the user
   * @returns the looked-up screen name; `null` when the lookup fails with API
   *   error code 50; the unchanged input on any other lookup failure; or the
   *   offline-normalized name when no lookup hook is installed
   */
  public static async normalizeLive(username: string) {
    if (!this._queryUser) return this.normalize(username);
    try {
      return await this._queryUser(username);
    } catch (err) {
      // The Twitter client rejects with an array of {code, message}; anything
      // else (e.g. a network error) must not be dereferenced as such.
      const apiError: {code?: number, message?: string} | undefined =
        Array.isArray(err) ? err[0] : undefined;
      if (apiError?.code === 50) return null;
      logger.warn(`error looking up user: ${apiError?.message ?? err}`);
      return username;
    }
  }
}

/**
 * Sends a single tweet to a chat. This is a placeholder that throws until a
 * worker instance is constructed and replaces it.
 */
export let sendTweet = (id: string, receiver: IChat, forceRefresh: boolean): void => {
  throw Error();
};

/** Parameters understood by the timeline query methods. */
export interface ITimelineQueryConfig {
  username: string;
  count?: number;
  since?: string;
  until?: string;
  noreps?: boolean;
  norts?: boolean;
}

/**
 * Sends a timeline summary to a chat. This is a placeholder that throws until
 * a worker instance is constructed and replaces it.
 */
export let sendTimeline = (
  conf: {[key in keyof ITimelineQueryConfig]: string},
  receiver: IChat
): void => {
  throw Error();
};

const TWITTER_EPOCH = 1288834974657;

/**
 * Converts a millisecond timestamp into an ID string by shifting
 * `epoch - 1 - TWITTER_EPOCH` left by 22 bits; yields `undefined` for NaN.
 */
const snowflake = (epoch: number) => Number.isNaN(epoch) ? undefined :
  BigNumOps.lShift(String(epoch - 1 - TWITTER_EPOCH), 22);

const logger = getLogger('twitter');
const maxTrials = 3;
const retryInterval = 1500;

/** Formats `n` with its English ordinal suffix (1st, 2nd, 3rd, 4th, 11th, ...). */
const ordinal = (n: number) => {
  // A tens digit of 1 (11, 12, 13, 111, ...) always takes "th".
  const lastDigit = Math.trunc(n / 10) % 10 === 1 ? 0 : n % 10;
  switch (lastDigit) {
    case 1:
      return `${n}st`;
    case 2:
      return `${n}nd`;
    case 3:
      return `${n}rd`;
    default:
      return `${n}th`;
  }
};

/**
 * Runs `doWork`, retrying after `retryInterval` milliseconds on each failure.
 *
 * Before every retry `onRetry` is invoked with the failure reason and the
 * 1-based retry count. If it calls `terminate(value)`, retrying stops and the
 * returned promise resolves with `value` instead.
 *
 * @param doWork the operation to attempt
 * @param onRetry hook called before each retry; may call `terminate`
 * @returns a promise for the result of `doWork`, or for the terminate value
 */
const retryOnError = <T, U>(
  doWork: () => Promise<T>,
  onRetry: (error: unknown, count: number, terminate: (defaultValue: U) => void) => void
) => new Promise<T | U>(resolve => {
  const retry = (reason: unknown, count: number) => {
    setTimeout(() => {
      let terminate = false;
      onRetry(reason, count, defaultValue => { terminate = true; resolve(defaultValue); });
      if (!terminate) doWork().then(resolve).catch(error => retry(error, count + 1));
    }, retryInterval);
  };
  doWork().then(resolve).catch(error => retry(error, 1));
});

export type FullUser = TwitterTypes.FullUser;
export type Entities = TwitterTypes.Entities;
export type ExtendedEntities = TwitterTypes.ExtendedEntities;
export type MediaEntity = TwitterTypes.MediaEntity;

export interface Tweet extends TwitterTypes.Status {
  user: FullUser;
  retweeted_status?: Tweet;
}

/**
 * Worker that polls the feeds listed in the lock object, renders new tweets
 * through `Webshot` and pushes them to subscribers via the bot. Constructing
 * an instance also installs the module-level `sendTweet` / `sendTimeline`
 * implementations and `ScreenNameNormalizer._queryUser`.
 */
export default class {

  private client: Twitter;
  private lock: ILock;
  private lockfile: string;
  private workInterval: number;
  private bot: QQBot;
  private webshotDelay: number;
  private webshot: Webshot;
  private mode: number;
  private wsUrl: string;
  private redis: RedisSvc;

  constructor(opt: IWorkerOption) {
    this.client = new Twitter({
      consumer_key: opt.consumerKey,
      consumer_secret: opt.consumerSecret,
      access_token_key: opt.accessTokenKey,
      access_token_secret: opt.accessTokenSecret,
    });
    this.lockfile = opt.lockfile;
    this.lock = opt.lock;
    this.workInterval = opt.workInterval;
    this.bot = opt.bot;
    this.webshotDelay = opt.webshotDelay;
    this.mode = opt.mode;
    this.wsUrl = opt.wsUrl;
    if (opt.redis) this.redis = new RedisSvc(opt.redis);
    ScreenNameNormalizer._queryUser = this.queryUser;

    sendTweet = (idOrQuery, receiver, forceRefresh) => {
      // "last@user", "last-N@user", optionally followed by ",noreps=..." / ",norts=..."
      const match = /^last(|-\d+)@([^\/?#,]+)((?:,no.*?=[^,]*)*)$/.exec(idOrQuery);

      const reportMissingTweet = () =>
        this.bot.sendTo(receiver, '找不到请求的推文,它可能已被删除。');

      const send = (id: string) => this.getTweet(
        id,
        this.sendTweets({sourceInfo: `tweet ${id}`, reportOnSkip: true, force: forceRefresh}, receiver),
        forceRefresh
      );

      // Resolves the tweet ID to send; undefined when a timeline query came back empty.
      const resolveId = (): Promise<string | undefined> => {
        if (!match) return Promise.resolve(idOrQuery);
        return this.queryTimeline({
          username: match[2],
          count: 1 - Number(match[1]),
          noreps: {on: true, off: false}[match[3].replace(/.*,noreps=([^,]*).*/, '$1')],
          norts: {on: true, off: false}[match[3].replace(/.*,norts=([^,]*).*/, '$1')],
        }).then(tweets => tweets.slice(-1)[0]?.id_str);
      };

      const handleError = (err: unknown) => {
        // The Twitter client rejects with an array of {code, message}.
        const apiError: {code?: number, message?: string} | undefined =
          Array.isArray(err) ? err[0] : undefined;
        // Code 34 is only attributed to a missing user when a user was actually queried.
        if (apiError?.code === 34 && match) {
          return this.bot.sendTo(receiver, `找不到用户 ${match[2].replace(/^@?(.*)$/, '@$1')}。`);
        }
        if (apiError?.code === 144) return reportMissingTweet();
        const message = apiError?.message ?? String(err);
        logger.warn(`error retrieving tweet: ${message}`);
        return this.bot.sendTo(receiver, `获取推文时出现错误:${message}`);
      };

      // One handler for the whole chain, so timeline-query failures are reported too.
      resolveId()
        .then(id => id === undefined ? reportMissingTweet() : send(id))
        .catch(handleError);
    };

    sendTimeline = ({username, count, since, until, noreps, norts}, receiver) => {
      const countNum = Number(count) || 10;
      // A negative count selects the reverse (oldest-first) query.
      (countNum > 0 ? this.queryTimeline : this.queryTimelineReverse)({
        username,
        count: Math.abs(countNum),
        since: BigNumOps.parse(since) || snowflake(new Date(since).getTime()),
        until: BigNumOps.parse(until) || snowflake(new Date(until).getTime()),
        noreps: {on: true, off: false}[noreps],
        norts: {on: true, off: false}[norts],
      })
        .then(tweets => chainPromises(
          tweets.map(tweet => () => this.bot.sendTo(
            receiver,
            // One field per line; the body is truncated to 50 characters, keeping a trailing t.co link.
            `编号:${tweet.id_str}\n时间:${tweet.created_at}\n媒体:${tweet.extended_entities ? '有' : '无'}\n正文:\n${tweet.full_text.replace(/^([\s\S\n]{50})[\s\S\n]+?( https:\/\/t.co\/.*)?$/, '$1…$2')}`
          ))
            .concat(() => this.bot.sendTo(receiver, tweets.length ?
              '时间线查询完毕,使用 /twitter_view <编号> 查看推文详细内容。' :
              '时间线查询完毕,没有找到符合条件的推文。'
            ))
        ))
        .catch((err: {code: number, message: string}[]) => {
          if (err[0]?.code !== 34) {
            logger.warn(`error retrieving timeline: ${err[0]?.message || err}`);
            return this.bot.sendTo(receiver, `获取时间线时出现错误:${err[0]?.message || err}`);
          }
          return this.bot.sendTo(receiver, `找不到用户 ${username.replace(/^@?(.*)$/, '@$1')}。`);
        });
    };
  }

  /**
   * Creates the `Webshot` instance. The third constructor argument schedules
   * the first `work` run after `workInterval` seconds.
   * NOTE(review): presumably Webshot invokes that callback once it is ready; confirm in ./webshot.
   */
  public launch = () => {
    this.webshot = new Webshot(
      this.wsUrl,
      this.mode,
      () => setTimeout(this.work, this.workInterval * 1000)
    );
  };

  /** Looks up a user via `users/show` and resolves with the returned `screen_name`. */
  public queryUser = (username: string) => this.client.get('users/show', {screen_name: username})
    .then((user: FullUser) => user.screen_name);

  /**
   * Queries a timeline forward from `conf.since`, one window at a time, until
   * `conf.count` tweets are collected or the window reaches `conf.until`.
   * Falls back to `queryTimeline` when `conf.since` is not set.
   *
   * Note: `conf` is mutated (`count`, `since` and `until` are overwritten).
   *
   * @returns the collected tweets, trimmed to the last `count` entries
   */
  public queryTimelineReverse = (conf: ITimelineQueryConfig) => {
    if (!conf.since) return this.queryTimeline(conf);
    const count = conf.count;
    const maxID = conf.until;
    conf.count = undefined;
    // Window end: 7 days' worth of milliseconds shifted left by 22 bits, added to
    // `since` and capped via BigNumOps.min against the requested upper bound.
    const until = () =>
      BigNumOps.min(maxID, BigNumOps.plus(conf.since, String(7 * 24 * 3600 * 1000 * 2 ** 22)));
    conf.until = until();
    const promise = (tweets: Tweet[]): Promise<Tweet[]> =>
      this.queryTimeline(conf).then(newTweets => {
        tweets = newTweets.concat(tweets);
        // Slide the window forward.
        conf.since = conf.until;
        conf.until = until();
        if (
          tweets.length >= count ||
          BigNumOps.compare(conf.since, conf.until) >= 0
        ) {
          return tweets.slice(-count);
        }
        return promise(tweets);
      });
    return promise([]);
  };

  /**
   * Fetches a user's timeline via `statuses/user_timeline`, paging with
   * `max_id` until `count` tweets are collected or a page comes back empty.
   *
   * @returns the fetched tweets, truncated to `count` when it is set
   */
  public queryTimeline = (
    { username, count, since, until, noreps, norts }: ITimelineQueryConfig
  ) => {
    username = username.replace(/^@?(.*)$/, '@$1');

    logger.info(`querying timeline of ${username} with config: ${
      JSON.stringify({
        ...(count && {count}),
        ...(since && {since}),
        ...(until && {until}),
        ...(noreps && {noreps}),
        ...(norts && {norts}),
      })}`);

    const fetchTimeline = (
      config = {
        screen_name: username.slice(1),
        trim_user: true,
        exclude_replies: noreps ?? true,
        include_rts: !(norts ?? false),
        since_id: since,
        max_id: until,
        tweet_mode: 'extended',
      },
      tweets: Tweet[] = []
    ): Promise<Tweet[]> => this.client.get('statuses/user_timeline', config)
      .then((newTweets: Tweet[]) => {
        if (newTweets.length) {
          logger.debug(`fetched tweets: ${JSON.stringify(newTweets)}`);
          // Continue just below the last tweet of this page.
          config.max_id = BigNumOps.plus('-1', newTweets[newTweets.length - 1].id_str);
          logger.info(`timeline query of ${username} yielded ${
            newTweets.length
          } new tweets, next query will start at offset ${config.max_id}`);
          tweets.push(...newTweets);
        }
        if (!newTweets.length || tweets.length >= count) {
          logger.info(`timeline query of ${username} finished successfully, ${
            tweets.length
          } tweets have been fetched`);
          return tweets.slice(0, count);
        }
        return fetchTimeline(config, tweets);
      });
    return fetchTimeline();
  };

  /**
   * Delivers each tweet through `sendTweets`, using the cached webshot from
   * Redis when one exists and rendering the remaining tweets with `Webshot`.
   *
   * @param tweets tweets to deliver
   * @param sendTweets delivery callback `(cacheId, msg, text, author)`
   * @param refresh when true, the Redis cache is not consulted
   */
  private workOnTweets = (
    tweets: Tweet[],
    sendTweets: (cacheId: string, msg: string, text: string, author: string) => void,
    refresh = false
  ) => Promise.all(tweets.map(tweet =>
    ((this.redis && !refresh) ?
      this.redis.waitForProcess(`webshot/${tweet.id_str}`, this.webshotDelay * 4)
        .then(() => this.redis.getContent(`webshot/${tweet.id_str}`)) :
      Promise.reject())
      .then(content => {
        if (content === null) throw Error();
        logger.info(`retrieved cached webshot of tweet ${tweet.id_str} from redis database`);
        const {msg, text, author} = JSON.parse(content) as {[key: string]: string};
        let cacheId = tweet.id_str;
        if (tweet.retweeted_status) cacheId += `,rt:${tweet.retweeted_status.id_str}`;
        sendTweets(cacheId, msg, text, author);
        // Already delivered from cache; null entries are filtered out below.
        return null as Tweet;
      })
      .catch(() => {
        // Cache miss, forced refresh, or no Redis at all: render this tweet.
        // Redis is optional, so only mark the process when it is configured.
        if (this.redis) this.redis.startProcess(`webshot/${tweet.id_str}`);
        return tweet;
      })
  )).then(tweets =>
    this.webshot(
      tweets.filter(t => t),
      (cacheId: string, msg: string, text: string, author: string) => {
        Promise.resolve()
          .then(() => {
            if (!this.redis) return;
            const [twid, rtid] = cacheId.split(',rt:');
            logger.info(`caching webshot of tweet ${twid} to redis database`);
            // Not awaited: delivery below does not wait for the cache write.
            this.redis.cacheContent(`webshot/${twid}`, JSON.stringify({msg, text, author, rtid}))
              .then(() => this.redis.finishProcess(`webshot/${twid}`));
          })
          .then(() => sendTweets(cacheId, msg, text, author));
      },
      this.webshotDelay
    )
  );

  /**
   * Delivers a single tweet by ID. When Redis holds a cached webshot for the
   * ID, a stub tweet is built from the cache and the API is not queried;
   * otherwise the tweet is fetched from `statuses/show`.
   *
   * @param id tweet ID
   * @param sender delivery callback `(cacheId, msg, text, author)`
   * @param refresh when true, the Redis cache is not consulted
   */
  public getTweet = (
    id: string,
    sender: (cacheId: string, msg: string, text: string, author: string) => void,
    refresh = false
  ) => {
    const endpoint = 'statuses/show';
    const config = {
      id,
      tweet_mode: 'extended',
    };
    return ((this.redis && !refresh) ?
      this.redis.waitForProcess(`webshot/${id}`, this.webshotDelay * 4)
        .then(() => this.redis.getContent(`webshot/${id}`))
        .then(content => {
          if (content === null) throw Error();
          const {rtid} = JSON.parse(content);
          return {id_str: id, retweeted_status: rtid ? {id_str: rtid} : undefined} as Tweet;
        }) :
      Promise.reject())
      .catch(() => this.client.get(endpoint, config))
      .then((tweet: Tweet) => {
        // The stub built from the cache carries only id_str, so `id` is unset for it.
        if (tweet.id) {
          logger.debug(`api returned tweet ${JSON.stringify(tweet)} for query id=${id}`);
        } else {
          logger.debug(`skipped querying api as this tweet has been cached`);
        }
        return this.workOnTweets([tweet], sender, refresh);
      });
  };

  /**
   * Builds a delivery callback that pushes a rendered tweet to every chat in
   * `to`, skipping chats that Redis reports as already served unless
   * `config.force` is set.
   *
   * @param config `sourceInfo` is used in log output; `reportOnSkip` sends a
   *   short notice instead of silently skipping; `force` bypasses the check
   * @param to chats to deliver to
   */
  private sendTweets = (
    config: {sourceInfo?: string, reportOnSkip?: boolean, force?: boolean}
      = {reportOnSkip: false, force: false},
    ...to: IChat[]
  ) => (id: string, msg: string, text: string, author: string) => {
    to.forEach(subscriber => {
      const [twid, rtid] = id.split(',rt:');
      const {sourceInfo: source, reportOnSkip, force} = config;
      const targetStr = JSON.stringify(subscriber);

      // The payload is passed in explicitly so a notice produced for one
      // subscriber can never leak into what another subscriber receives.
      const send = (message: string, plainText: string) => retryOnError(
        () => this.bot.sendTo(subscriber, message),
        (_, count, terminate: (doNothing: Promise<void>) => void) => {
          if (count <= maxTrials) {
            logger.warn(`retry sending to ${subscriber.chatID} for the ${ordinal(count)} time...`);
          } else {
            logger.warn(`${count - 1} consecutive failures while sending message chain, trying plain text instead...`);
            terminate(this.bot.sendTo(subscriber, author + plainText, true));
          }
        }
      ).then(() => {
        if (this.redis) {
          logger.info(`caching push status of tweet ${rtid ? `${rtid} (RTed as ${twid})` : twid} for ${targetStr}...`);
          return this.redis.cacheForChat(rtid || twid, subscriber);
        }
      });

      ((this.redis && !force) ? this.redis.isCachedForChat(rtid || twid, subscriber) : Promise.resolve(false))
        .then(isCached => {
          let message = msg;
          let plainText = text;
          if (isCached) {
            logger.info(`skipped subscriber ${targetStr} as tweet ${rtid ? `${rtid} (or its RT)` : twid} has been sent already`);
            if (!reportOnSkip) return;
            plainText = `[最近发送过的推文:${rtid || twid}]`;
            message = author + plainText;
          }
          logger.info(`pushing data${source ? ` of ${source}` : ''} to ${targetStr}`);
          return send(message, plainText);
        });
    });
  };

  /**
   * Processes one feed from the lock object and then schedules itself again.
   *
   * Feeds without subscribers are removed. New tweets are fetched, delivered
   * to the subscribers, and the thread's offset and update time are recorded.
   * The lock object is written to the lock file after each pass.
   */
  public work = () => {
    const lock = this.lock;
    if (this.workInterval < 1) this.workInterval = 1;
    if (lock.feed.length === 0) {
      setTimeout(() => {
        this.work();
      }, this.workInterval * 1000);
      return;
    }
    if (lock.workon >= lock.feed.length) lock.workon = 0;

    const currentFeed = lock.feed[lock.workon];
    if (!lock.threads[currentFeed]?.subscribers?.length) {
      logger.warn(`nobody subscribes thread ${currentFeed}, removing from feed`);
      delete lock.threads[currentFeed];
      lock.feed.splice(lock.workon, 1);
      fs.writeFileSync(path.resolve(this.lockfile), JSON.stringify(lock));
      this.work();
      return;
    }

    logger.debug(`pulling feed ${currentFeed}`);

    const promise = new Promise<Tweet[]>(resolve => {
      let match = /https:\/\/twitter.com\/([^\/]+)\/lists\/([^\/]+)/.exec(currentFeed);
      let config: {[key: string]: any};
      let endpoint: string;
      if (match) {
        if (match[1] === 'i') {
          config = {
            list_id: match[2],
            tweet_mode: 'extended',
          };
        } else {
          config = {
            owner_screen_name: match[1],
            slug: match[2],
            tweet_mode: 'extended',
          };
        }
        endpoint = 'lists/statuses';
      } else {
        match = /https:\/\/twitter.com\/([^\/]+)/.exec(currentFeed);
        if (match) {
          config = {
            screen_name: match[1],
            exclude_replies: false,
            tweet_mode: 'extended',
          };
          endpoint = 'statuses/user_timeline';
        }
      }

      if (!endpoint) {
        // Resolve anyway: an unrecognised URL must not stall the polling loop.
        logger.warn(`unrecognized feed url ${currentFeed}, skipping`);
        return resolve([]);
      }

      const offset = lock.threads[currentFeed].offset;
      if (offset as unknown as number > 0) config.since_id = offset;

      const getMore = (gotTweets: Tweet[] = []) => this.client.get(
        endpoint, config, (error: {[key: string]: any}[], tweets: Tweet[]
      ) => {
        if (error) {
          if (error instanceof Array && error.length > 0 && error[0].code === 34) {
            logger.warn(`error on fetching tweets for ${currentFeed}: ${JSON.stringify(error)}`);
            lock.threads[currentFeed].subscribers.forEach(subscriber => {
              logger.info(`sending notfound message of ${currentFeed} to ${JSON.stringify(subscriber)}`);
              this.bot.sendTo(subscriber, `链接 ${currentFeed} 指向的用户或列表不存在,请退订。`)
                .catch((err: unknown) => {
                  logger.warn(`failed to send notfound message of ${currentFeed}: ${err}`);
                });
            });
          } else {
            logger.error(`unhandled error on fetching tweets for ${currentFeed}: ${JSON.stringify(error)}`);
          }
        }
        // An empty (or failed) page ends pagination.
        if (!tweets || tweets.length === 0) return resolve(gotTweets);
        // max_id is inclusive, so continue strictly below the last tweet of this
        // page; otherwise it would be fetched again and a page holding a single
        // new tweet could not be told apart from "nothing new".
        config.max_id = BigNumOps.plus('-1', tweets[tweets.length - 1].id_str);
        getMore(gotTweets.concat(tweets));
      });
      getMore();
    });

    promise.then((tweets: Tweet[]) => {
      logger.debug(`api returned ${JSON.stringify(tweets)} for feed ${currentFeed}`);
      const currentThread = lock.threads[currentFeed];

      const updateDate = () => currentThread.updatedAt = new Date().toString();
      if (!tweets || tweets.length === 0) { updateDate(); return; }

      const topOfFeed = tweets[0].id_str;
      const updateOffset = () => currentThread.offset = topOfFeed;

      // Offset '-1': only record the newest ID, deliver nothing.
      if (currentThread.offset === '-1') { updateOffset(); return; }
      // Offset '0': deliver just the newest tweet.
      if (currentThread.offset === '0') tweets.splice(1);

      return this.workOnTweets(tweets, this.sendTweets({sourceInfo: `thread ${currentFeed}`}, ...currentThread.subscribers))
        .then(updateDate).then(updateOffset);
    })
      .catch((err: unknown) => {
        // Keep polling: the offset was not advanced, so this feed is retried on its next turn.
        const detail = err instanceof Error ? (err.stack ?? err.message) : JSON.stringify(err);
        logger.error(`unhandled error while processing feed ${currentFeed}: ${detail}`);
      })
      .then(() => {
        lock.workon++;
        let timeout = this.workInterval * 1000 / lock.feed.length;
        if (timeout < 1000) timeout = 1000;
        fs.writeFileSync(path.resolve(this.lockfile), JSON.stringify(lock));
        setTimeout(() => {
          this.work();
        }, timeout);
      });
  };
}