import * as crypto from 'crypto';
import * as fs from 'fs';
import * as http from 'http';
import * as path from 'path';
import { parse as parseUrl } from 'url';
import { promisify } from 'util';

import {
  instagramIdToUrlSegment as idToUrlSegment,
  urlSegmentToInstagramId as urlSegmentToId
} from 'instagram-id-to-url-segment';
import {
  IgApiClient,
  IgClientError, IgExactUserNotFoundError, IgLoginTwoFactorRequiredError, IgResponseError,
  MediaInfoResponseItemsItem, UserFeedResponseItemsItem
} from 'instagram-private-api';
import { SocksProxyAgent } from 'socks-proxy-agent';

import { getLogger } from './loggers';
import QQBot from './koishi';
import { BigNumOps } from './utils';
import Webshot, { Cookies, Page } from './webshot';

/**
 * Extracts either a post URL segment or a user name from a link.
 *
 * A `/p/<segment>` link yields `postUrlSegment`; any other instagram.com link,
 * or a bare string without `/`, `?` or `#`, yields a normalized `userName`.
 * Returns `undefined` when nothing matches.
 */
const parseLink = (link: string): { userName?: string, postUrlSegment?: string } => {
  let match =
    /instagram\.com\/p\/([A-Za-z0-9\-_]+)/.exec(link);
  if (match) return { postUrlSegment: match[1] };
  match =
    /instagram\.com\/([^\/?#]+)/.exec(link) ||
    /^([^\/?#]+)$/.exec(link);
  // normalize() appends a trailing ':' (the "name:id" separator); keep only the name part.
  if (match) return { userName: ScreenNameNormalizer.normalize(match[1]).split(':')[0] };
  return;
};

/** Tests whether `input` consists solely of characters allowed in a post URL segment. */
const isValidUrlSegment = (input: string) => /^[A-Za-z0-9\-_]+$/.test(input);

/**
 * Inverse of {@link parseLink}: builds a profile URL when `userName` is set,
 * otherwise a post URL when `postUrlSegment` is set, otherwise `undefined`.
 */
const linkBuilder = (config: ReturnType<typeof parseLink>): string => {
  if (config.userName) return `https://www.instagram.com/${config.userName}/`;
  if (config.postUrlSegment) return `https://www.instagram.com/p/${config.postUrlSegment}/`;
};

export { linkBuilder, parseLink, isValidUrlSegment, idToUrlSegment, urlSegmentToId };

/** Options accepted by the default-exported worker class. */
interface IWorkerOption {
  sessionLockfile: string;
  credentials: [string, string];
  codeServicePort: number;
  proxyUrl: string;
  lock: ILock;
  lockfile: string;
  webshotCookiesLockfile: string;
  bot: QQBot;
  inactiveHours: string[];
  workInterval: number;
  webshotDelay: number;
  mode: number;
  wsUrl: string;
}

/**
 * Manages the private-API client session: restoring it from / saving it to a
 * file, logging in, and collecting two-factor codes over a local HTTP endpoint.
 */
export class SessionManager {
  private ig: IgApiClient;
  private username: string;
  private password: string;
  private lockfile: string;
  private codeServicePort: number;

  constructor(client: IgApiClient, file: string, credentials: [string, string], codeServicePort: number) {
    this.ig = client;
    this.lockfile = file;
    [this.username, this.password] = credentials;
    this.codeServicePort = codeServicePort;
  }

  /**
   * Restores the serialized client state from the session file if it exists,
   * otherwise logs in. A failed login is logged, any session file is removed,
   * and `init` is re-run after one minute (the retry is not awaited by the
   * returned promise).
   */
  public init = () => {
    this.ig.state.generateDevice(this.username);
    // Persist the client state after every completed request.
    this.ig.request.end$.subscribe(() => { this.save(); });
    const filePath = path.resolve(this.lockfile);
    if (fs.existsSync(filePath)) {
      try {
        const serialized = JSON.parse(fs.readFileSync(filePath, 'utf8')) as { [key: string]: any };
        return this.ig.state.deserialize(serialized).then(() => {
          logger.info(`successfully loaded client session cookies for user ${this.username}`);
        });
      } catch (err) {
        logger.error(`failed to load client session cookies from file ${this.lockfile}: `, err);
        return Promise.resolve();
      }
    } else {
      return this.login().catch((err: IgClientError) => {
        logger.error(`error while trying to log in as user ${this.username}, error: ${err}`);
        logger.warn('attempting to retry after 1 minute...');
        if (fs.existsSync(filePath)) fs.unlinkSync(filePath);
        promisify(setTimeout)(60000).then(this.init);
      });
    }
  };

  /**
   * Starts a temporary HTTP server on `codeServicePort` and waits for a request
   * to `/confirm-2fa?code=<6 digits>&token=<one-time token>`; the token is
   * printed to the log. The received code is passed to `submitter`.
   *
   * @param submitter consumes the verification code.
   * @returns a promise resolving with the submitter's result once the server
   *   has closed, or rejecting if the submitter rejects or the server emits an
   *   error (e.g. the port is already in use).
   */
  public handle2FA = <T>(submitter: (code: string) => Promise<T>) => new Promise<T>((resolve, reject) => {
    const token = crypto.randomBytes(20).toString('hex');
    logger.info('please submit the code with a one-time token from your browser with this path:');
    logger.info(`/confirm-2fa?code=<the code you received>&token=${token}`);
    let working = false;
    const server = http.createServer((req, res) => {
      const {pathname, query} = parseUrl(req.url, true);
      if (!working && pathname === '/confirm-2fa' && query.token === token &&
        typeof(query.code) === 'string' && /^\d{6}$/.test(query.code)) {
        const code = query.code;
        logger.debug(`received code: ${code}`);
        working = true;
        submitter(code)
          .then(response => { res.write('OK'); res.end(); server.close(() => resolve(response)); })
          .catch(err => {
            res.write('Error');
            res.end();
            // The promise settles here, so the server is of no further use. Release the
            // port; otherwise the next handle2FA() call would fail to listen on it.
            server.close();
            reject(err);
          })
          .finally(() => { working = false; });
        return;
      }
      // Always answer, so that malformed or concurrent requests do not hang on an open socket.
      res.statusCode = 400;
      res.end('Bad Request');
    });
    // Without a listener, a listen failure would surface as an uncaught exception.
    server.on('error', reject);
    server.listen(this.codeServicePort);
  });

  /**
   * Runs the pre-login flow and logs in with the stored credentials. When the
   * API demands two-factor authentication, the code is collected through
   * {@link handle2FA}. Resolves with the logged-in user after the post-login flow.
   */
  public login = () =>
    this.ig.simulate.preLoginFlow()
      .then(() => this.ig.account.login(this.username, this.password))
      .catch((err: IgClientError) => {
        if (err instanceof IgLoginTwoFactorRequiredError) {
          const {two_factor_identifier, totp_two_factor_on} = err.response.body.two_factor_info;
          logger.debug(`2FA info: ${JSON.stringify(err.response.body.two_factor_info)}`);
          logger.info(`login is requesting two-factor authentication via ${totp_two_factor_on ? 'TOTP' : 'SMS'}`);
          return this.handle2FA(code => this.ig.account.twoFactorLogin({
            username: this.username,
            verificationCode: code,
            twoFactorIdentifier: two_factor_identifier,
            verificationMethod: totp_two_factor_on ? '0' : '1',
          }));
        }
        throw err;
      })
      .then(user => new Promise<typeof user>(resolve => {
        logger.info(`successfully logged in as ${this.username}`);
        process.nextTick(() => resolve(this.ig.simulate.postLoginFlow().then(() => user)));
      }));

  /** Serializes the client state (minus `constants`) and writes it to the session file. */
  public save = () =>
    this.ig.state.serialize()
      .then((serialized: { [key: string]: any }) => {
        delete serialized.constants;
        return fs.writeFileSync(path.resolve(this.lockfile), JSON.stringify(serialized, null, 2), 'utf-8');
      });
}

/** Helpers for turning user input into the `name:id` form used elsewhere in this module. */
export class ScreenNameNormalizer {

  /** User lookup hook; assigned by the worker's constructor. */
  // tslint:disable-next-line: variable-name
  public static _queryUser: (username: string) => Promise<string>;

  /** Lowercases the name, strips one leading `@` and appends `:`. */
  public static normalize = (username: string) => `${username.toLowerCase().replace(/^@/, '')}:`;

  /**
   * Resolves a user name through `_queryUser` when it is set.
   *
   * @returns the lookup result; `null` when the lookup fails with
   *   `IgExactUserNotFoundError`; `${username}:` on any other lookup error;
   *   the offline `normalize` result when no lookup hook is installed.
   */
  public static async normalizeLive(username: string) {
    if (this._queryUser) {
      return await this._queryUser(username)
        .catch((err: IgClientError) => {
          if (!(err instanceof IgExactUserNotFoundError)) {
            logger.warn(`error looking up user: ${err.message}`);
            return `${username}:`;
          }
          return null;
        });
    }
    return this.normalize(username);
  }
}

// Placeholders that reject until a worker instance installs the real implementations.
let browserLogin = (page: Page): Promise<void> => Promise.reject();
let browserSaveCookies = browserLogin;

// True from the moment the login form has been filled in until the login flow finishes or times out.
let isWaitingForLogin = false;

/**
 * Clicks the cookie consent button (Japanese label, "allow all") if it shows up
 * within 5 seconds; a timeout is ignored, any other error is rethrown.
 */
const acceptCookieConsent = (page: Page) =>
  page.click('button:has-text("すべて許可")', { timeout: 5000 })
    .then(() => logger.info('accepted cookie consent'))
    .catch((err: Error) => { if (err.name !== 'TimeoutError') throw err; });

/** Browser-side helpers; `handleLogin` is replaced by the worker's constructor. */
export const WebshotHelpers = {
  handleLogin: browserLogin,
  handleCookieConsent: acceptCookieConsent,
  get isWaitingForLogin() { return isWaitingForLogin; },
};

// Module-level hooks; both are replaced by the worker's constructor.
export let getPostOwner = (segmentId: string): Promise<string> => Promise.reject();

export let sendPost = (segmentId: string, receiver: IChat): void => {
  throw Error();
};

export type MediaItem = MediaInfoResponseItemsItem & UserFeedResponseItemsItem;
export type LazyMediaItem = {
  pk: string,
  item: () => Promise<MediaItem>,
};

const logger = getLogger('instagram');
const maxTrials = 3;
const retryInterval = 1500;

/** Formats `n` with its English ordinal suffix (1st, 2nd, 3rd, 4th, 11th, ...). */
const ordinal = (n: number) => {
  // A tens digit of 1 (11, 12, 13, 111, ...) always takes "th".
  switch ((Math.trunc(n / 10) % 10 === 1) ? 0 : n % 10) {
    case 1:
      return `${n}st`;
    case 2:
      return `${n}nd`;
    case 3:
      return `${n}rd`;
    default:
      return `${n}th`;
  }
};

/**
 * Runs `doWork`, retrying after `retryInterval` ms on every rejection.
 *
 * Before each retry `onRetry` receives the error, the 1-based retry count and a
 * `terminate` callback; calling `terminate(value)` stops retrying and resolves
 * the returned promise with `value`. The returned promise never rejects by itself.
 */
const retryOnError = <T, U>(
  doWork: () => Promise<T>,
  onRetry: (error, count: number, terminate: (defaultValue: U) => void) => void
) => new Promise<T | U>(resolve => {
  const retry = (reason, count: number) => {
    setTimeout(() => {
      let terminate = false;
      onRetry(reason, count, defaultValue => { terminate = true; resolve(defaultValue); });
      if (!terminate) doWork().then(resolve).catch(error => retry(error, count + 1));
    }, retryInterval);
  };
  doWork().then(resolve).catch(error => retry(error, 1));
});

/**
 * Worker that polls the profile pages of subscribed feeds in a browser, resolves
 * new posts through the private API and pushes them to subscribers via the bot.
 */
export default class {

  private client: IgApiClient;
  private lock: ILock;
  private lockfile: string;
  private inactiveHours: string[];
  private workInterval: number;
  private bot: QQBot;
  private webshotDelay: number;
  private webshotCookies: Cookies = [];
  private webshotCookiesLockfile: string;
  private webshot: Webshot;
  private mode: number;
  private wsUrl: string;

  public session: SessionManager;

  /**
   * Sets up the API client (optionally behind a SOCKS proxy), the session
   * manager and the browser cookies, and installs the module-level hooks
   * (`browserLogin`, `browserSaveCookies`, `WebshotHelpers.handleLogin`,
   * `ScreenNameNormalizer._queryUser`, `getPostOwner`, `sendPost`).
   */
  constructor(opt: IWorkerOption) {
    this.client = new IgApiClient();
    if (opt.proxyUrl) {
      try {
        const url = new URL(opt.proxyUrl);
        if (!/^socks(?:4a?|5h?)?:$/.test(url.protocol)) throw Error();
        if (!url.port) url.port = '1080';
        this.client.request.defaults.agent = new SocksProxyAgent({
          hostname: url.hostname,
          port: url.port,
          userId: url.username,
          password: url.password,
        });
      } catch (e) {
        logger.warn(`invalid socks proxy url: ${opt.proxyUrl}, ignoring`);
      }
    }
    this.session = new SessionManager(this.client, opt.sessionLockfile, opt.credentials, opt.codeServicePort);
    this.lockfile = opt.lockfile;
    this.webshotCookiesLockfile = opt.webshotCookiesLockfile;
    this.lock = opt.lock;
    this.inactiveHours = opt.inactiveHours;
    this.workInterval = opt.workInterval;
    this.bot = opt.bot;
    this.webshotDelay = opt.webshotDelay;
    this.mode = opt.mode;
    this.wsUrl = opt.wsUrl;

    const cookiesFilePath = path.resolve(this.webshotCookiesLockfile);

    try {
      this.webshotCookies = JSON.parse(fs.readFileSync(cookiesFilePath, 'utf8')) as Cookies;
      logger.info(`loaded webshot cookies from file ${this.webshotCookiesLockfile}`);
    } catch (err) {
      logger.warn(
        `failed to load webshot cookies from file ${this.webshotCookiesLockfile}: `,
        (err as Error).message
      );
      logger.warn('cookies will be saved to this file when needed');
    }

    // Fills in and submits the web login form. All waits use `timeout: 0`, i.e. no timeout.
    // After submitting, three outcomes race: a two-factor prompt, an HTTP 429 response
    // (which terminates the process), or the "save info" button of a completed login.
    browserLogin = page =>
      page.fill('input[name="username"]', opt.credentials[0], {timeout: 0})
        .then(() => { isWaitingForLogin = true; logger.warn('blocked by login dialog, trying to log in manually...'); })
        .then(() => page.fill('input[name="password"]', opt.credentials[1], {timeout: 0}))
        .then(() => page.click('button[type="submit"]', {timeout: 0}))
        .then(() =>
          (next => Promise.race([
            page.waitForSelector('#verificationCodeDescription', {timeout: 0}).then(handle => handle.innerText()).then(text => {
              logger.info(`login is requesting two-factor authentication via ${/認証アプリ/.test(text) ? 'TOTP' : 'SMS'}`);
              return this.session.handle2FA(code => page.fill('input[name="verificationCode"]', code, {timeout: 0}))
                .then(() => page.click('button:has-text("実行")', {timeout: 0}))
                .then(next);
            }),
            page.waitForResponse(res => res.status() === 429, {timeout: 0})
              .then(() => { logger.error('fatal error: login restricted: code 429, exiting'); process.exit(1); }),
            next(),
          ]))(() => page.click('button:has-text("情報を保存")', {timeout: 0}).then(() => { isWaitingForLogin = false; }))
        );

    // Stores the browser context's cookies in memory and in the cookies file.
    browserSaveCookies = page =>
      page.context().cookies()
        .then(cookies => {
          this.webshotCookies = cookies;
          logger.info('successfully logged in, saving cookies to file...');
          fs.writeFileSync(path.resolve(this.webshotCookiesLockfile), JSON.stringify(cookies, null, 2), 'utf-8');
        });

    WebshotHelpers.handleLogin = page =>
      browserLogin(page)
        .then(() => page.waitForSelector('img[data-testid="user-avatar"]', { timeout: this.webshotDelay }))
        .then(() => browserSaveCookies(page))
        .catch((err: Error) => {
          if (err.name === 'TimeoutError') { logger.warn('navigation timed out, assuming login has failed'); isWaitingForLogin = false; }
          throw err;
        });

    ScreenNameNormalizer._queryUser = this.queryUser;

    // Maps an API error to the (Chinese) message shown to chat users.
    const parseMediaError = (err: IgClientError) => {
      if (!(err instanceof IgResponseError && err.text === 'Media not found or unavailable')) {
        logger.warn(`error retrieving instagram media: ${err.message}`);
        return `获取媒体时出现错误:${err.message}`;
      }
      return '找不到请求的媒体,它可能已被删除。';
    };

    getPostOwner = (segmentId) =>
      this.client.media.info(urlSegmentToId(segmentId))
        .then(media => media.items[0].user)
        .then(user => `${user.username}:${user.pk}`)
        .catch((err: IgClientError) => { throw Error(parseMediaError(err)); });

    sendPost = (segmentId, receiver) => {
      this.getMedia(segmentId, this.sendMedia(`instagram media ${segmentId}`, receiver))
        .catch((err: IgClientError) => { this.bot.sendTo(receiver, parseMediaError(err)); });
    };
  }

  /**
   * Creates the Webshot instance. Its last constructor argument is a callback
   * that receives `doOnNewPage`; inside it `queryUserMedia` is installed and
   * the first `work` run is scheduled.
   */
  public launch = () => {
    this.webshot = new Webshot(
      this.wsUrl,
      this.mode,
      () => this.webshotCookies,
      doOnNewPage => {
        this.queryUserMedia = ((userName, targetId) => {
          let page: Page;
          const url = linkBuilder({ userName });
          logger.debug(`pulling ${targetId !== '0' ? `feed ${url} up to ${targetId}` : `top of feed ${url}`}...`);
          return doOnNewPage(newPage => {
            page = newPage;
            let timeout = this.workInterval * 1000;
            const startTime = new Date().getTime();
            const getTimerTime = () => new Date().getTime() - startTime;
            // 0 (no timeout) while a manual login is pending, otherwise the remaining budget, at least 90 s.
            const getTimeout = () => isWaitingForLogin ? 0 : Math.max(90000, timeout - getTimerTime());
            return page.context().addCookies(this.webshotCookies)
              .then(() => page.goto(url, { waitUntil: 'load', timeout: getTimeout() }))
              .then(response => {
                if (response.status() !== 200) {
                  const err = new Error(
                    `error navigating to user page, error was: ${response.status()} ${response.statusText()}`
                  );
                  throw Object.defineProperty(err, 'name', {
                    value: 'ResponseError',
                  });
                }
              }).then(() => acceptCookieConsent(page))
              .then(() =>
                // Race the login path (if a login form appears) against the feed simply showing up.
                (next => Promise.race([
                  browserLogin(page)
                    .catch((err: Error) => {
                      if (err.name === 'TimeoutError') { logger.warn('navigation timed out, assuming login has failed'); isWaitingForLogin = false; }
                      throw err;
                    })
                    .then(() => browserSaveCookies(page))
                    .then(() => page.goto(url)).then(next),
                  next(),
                ]))(() => promisify(setTimeout)(2000).then(() => page.waitForSelector('article', {timeout: getTimeout()})))
              ).then(handle => {
                // Collects ids of posts newer than targetId from the anchors currently loaded.
                // Resolves with null when every loaded post is newer, i.e. more must be loaded.
                const postHandler = () => {
                  const toId = (href: string) => urlSegmentToId((/\/p\/(.*)\/$/.exec(href) ?? [,''])[1]);
                  if (targetId === '0') {
                    return handle.$$eval('a', as => {
                      // A profile without any qualifying anchor must yield "no posts", not a TypeError.
                      const first = as.filter(a => !a.querySelector('[aria-label="IGTV"]'))[0];
                      return first ? first.href : '';
                    }).then(href => Number(toId(href)) > 0 ? [toId(href)] : []);
                  }
                  return handle.$$eval('a', as =>
                    as.filter(a => !a.querySelector('[aria-label="IGTV"]')).map(a => a.href)
                  ).then(hrefs => {
                    let id: string;
                    const itemIds: string[] = [];
                    for (const href of hrefs) {
                      id = toId(href);
                      if (id && BigNumOps.compare(id, targetId) > 0) itemIds.push(id);
                      else return itemIds;
                    }
                    logger.info('unable to find a smaller id than target, trying on next page...');
                    return null; // has more
                  });
                };
                return postHandler().then(itemIds => {
                  if (itemIds) return itemIds;
                  timeout += this.workInterval * 500;
                  return handle.$$('a')
                    // pop() removes the last handle, so length + 1 is the number of anchors loaded so far.
                    .then(as => { as.pop().scrollIntoViewIfNeeded(); return as.length + 1; })
                    .then(loadedCount => page.waitForFunction(count =>
                      document.querySelectorAll('article a').length > count
                    , loadedCount))
                    .then(postHandler)
                    .then(moreIds => {
                      if (moreIds) return moreIds;
                      // Only one extra page is loaded per run; a second null must not reach `.map` below.
                      logger.warn('still unable to find a smaller id than target after loading more posts, giving up for now');
                      return [] as string[];
                    });
                });
              }).catch((err: Error) => {
                if (err.name !== 'TimeoutError' && err.name !== 'ResponseError') throw err;
                if (err.name === 'ResponseError') {
                  logger.warn(`error while fetching tweets for ${userName}: ${err.message}`);
                } else logger.warn(`navigation timed out at ${getTimerTime()} ms`);
                return [] as string[];
              }).then(itemIds => promisify(setTimeout)(getTimeout()).then(() =>
                itemIds.map(id => this.lazyGetMediaById(id))
              ));
          // `page` is still unset if doOnNewPage failed before invoking the callback.
          }).finally(() => { if (page) page.close(); });
        });
        setTimeout(this.work, this.workInterval * 1000);
      }
    );
  };

  /** Scrapes a profile page for posts newer than `targetId`; installed by `launch`. */
  public queryUserMedia: (username: string, targetId?: string) => Promise<LazyMediaItem[]>;

  /** Looks up a user by exact name and resolves with `username:pk`. */
  public queryUser = (username: string) => this.client.user.searchExact(username)
    .then(user => `${user.username}:${user.pk}`);

  /** Hands the media items to the Webshot instance together with the sender callback. */
  private workOnMedia = (
    lazyMediaItems: LazyMediaItem[],
    sendMedia: (msg: string, text: string, author: string) => void
  ) => this.webshot(lazyMediaItems, sendMedia, this.webshotDelay);

  public urlSegmentToId = urlSegmentToId;

  /** Wraps a media id into a lazy item whose `item()` fetches it through the API on demand. */
  public lazyGetMediaById = (id: string): LazyMediaItem => ({
    pk: id,
    item: () => this.client.media.info(id).then(media => {
      const mediaItem = media.items[0] as MediaItem;
      logger.debug(`api returned media post ${JSON.stringify(mediaItem)} for query id=${id}`);
      return mediaItem;
    }),
  });

  /** Processes the single post identified by a URL segment. */
  private getMedia = (segmentId: string, sender: (msg: string, text: string, author: string) => void) =>
    this.workOnMedia([this.lazyGetMediaById(urlSegmentToId(segmentId))], sender);

  /**
   * Builds a sender callback that pushes a message to every chat in `to`.
   * Sending is retried; once the retry count exceeds `maxTrials`, `author + text`
   * is sent instead with the bot's third argument set to `true`.
   */
  private sendMedia = (source?: string, ...to: IChat[]) => (msg: string, text: string, author: string) => {
    to.forEach(subscriber => {
      logger.info(`pushing data${source ? ` of ${source}` : ''} to ${JSON.stringify(subscriber)}`);
      retryOnError(
        () => this.bot.sendTo(subscriber, msg),
        (_, count, terminate: (doNothing: Promise<void>) => void) => {
          if (count <= maxTrials) {
            logger.warn(`retry sending to ${subscriber.chatID} for the ${ordinal(count)} time...`);
          } else {
            logger.warn(`${count - 1} consecutive failures while sending message chain, trying plain text instead...`);
            terminate(this.bot.sendTo(subscriber, author + text, true));
          }
        });
    });
  };

  /**
   * Whether the current local time falls into one of the `inactiveHours` ranges,
   * each given as `H:M-H:M`. Both ends are resolved against today's date, so a
   * range only matches when its start precedes its end.
   */
  public get isInactiveTime() {
    const timeToEpoch = (h = 0, m = 0) => new Date().setHours(h, m, 0, 0);
    return this.inactiveHours
      .map(rangeStr => ((start, end) => ({start, end}))(
        ...rangeStr.split('-', 2).map(timeStr => timeToEpoch(...timeStr.split(':', 2).map(Number))) as [number, number?]
      ))
      .some(range => (now => now >= range.start && now < range.end)(Date.now()));
  }

  /**
   * One iteration of the polling loop: picks the feed at `lock.workon`, scrapes
   * it, pushes new media to its subscribers, persists the lock and schedules
   * the next iteration. Feeds without subscribers are dropped.
   */
  public work = () => {
    const lock = this.lock;
    if (this.workInterval < 1) this.workInterval = 1;
    if (this.isInactiveTime || lock.feed.length === 0) {
      setTimeout(this.work, this.workInterval * 1000);
      return;
    }
    if (lock.workon >= lock.feed.length) lock.workon = 0;
    if (!lock.threads[lock.feed[lock.workon]] ||
      !lock.threads[lock.feed[lock.workon]].subscribers ||
      lock.threads[lock.feed[lock.workon]].subscribers.length === 0) {
      logger.warn(`nobody subscribes thread ${lock.feed[lock.workon]}, removing from feed`);
      delete lock.threads[lock.feed[lock.workon]];
      lock.feed.splice(lock.workon, 1);
      fs.writeFileSync(path.resolve(this.lockfile), JSON.stringify(lock));
      this.work();
      return;
    }

    const currentFeed = lock.feed[lock.workon];

    // Never rejects: scraping failures are logged and treated as "no new media".
    const promise = new Promise<LazyMediaItem[]>(resolve => {
      const match = /https:\/\/www\.instagram\.com\/([^\/]+)/.exec(currentFeed);
      if (!match) {
        logger.error(`current feed "${currentFeed}" is invalid, please remove this feed manually`);
        return resolve([]);
      }
      this.queryUserMedia(match[1], this.lock.threads[currentFeed].offset)
        .then(resolve)
        .catch((error: Error) => {
          logger.error(`error scraping media off profile page of ${match[1]}, error: ${error}`);
          resolve([]);
        });
    });

    promise.then((mediaItems: LazyMediaItem[]) => {
      const currentThread = lock.threads[currentFeed];

      const updateDate = () => currentThread.updatedAt = new Date().toString();
      if (!mediaItems || mediaItems.length === 0) { updateDate(); return; }

      const topOfFeed = mediaItems[0].pk;
      const updateOffset = () => currentThread.offset = topOfFeed;

      // Offset '-1': only record the newest post without sending anything.
      if (currentThread.offset === '-1') { updateOffset(); return; }
      // Offset '0': send just the newest post.
      if (currentThread.offset === '0') mediaItems.splice(1);

      return this.workOnMedia(mediaItems, this.sendMedia(`thread ${currentFeed}`, ...currentThread.subscribers))
        .then(updateDate).then(updateOffset);
    })
      // A failure while processing one feed must not prevent the next run from being scheduled.
      .catch((error: Error) => {
        logger.error(`error processing media of thread ${currentFeed}, error: ${error}`);
      })
      .then(() => {
        lock.workon++;
        let timeout = this.workInterval * 1000 / lock.feed.length;
        if (timeout < 1000) timeout = 1000;
        fs.writeFileSync(path.resolve(this.lockfile), JSON.stringify(lock));
        setTimeout(() => {
          this.work();
        }, timeout);
      });
  };
}