1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471 |
- // @ts-check
- const fs = require('fs');
- const http = require('http');
- const url = require('url');
- const dotenv = require('dotenv');
- const express = require('express');
- const Redis = require('ioredis');
- const { JSDOM } = require('jsdom');
- const log = require('npmlog');
- const pg = require('pg');
- const dbUrlToConfig = require('pg-connection-string').parse;
- const metrics = require('prom-client');
- const uuid = require('uuid');
- const WebSocket = require('ws');
- const environment = process.env.NODE_ENV || 'development';
- dotenv.config({
- path: environment === 'production' ? '.env.production' : '.env',
- });
- log.level = process.env.LOG_LEVEL || 'verbose';
- /**
- * @param {Object.<string, any>} config
- */
- const createRedisClient = async (config) => {
- const { redisParams, redisUrl } = config;
- const client = new Redis(redisUrl, redisParams);
- client.on('error', (err) => log.error('Redis Client Error!', err));
- return client;
- };
- /**
- * Attempts to safely parse a string as JSON, used when both receiving a message
- * from redis and when receiving a message from a client over a websocket
- * connection, this is why it accepts a `req` argument.
- * @param {string} json
- * @param {any?} req
- * @returns {Object.<string, any>|null}
- */
- const parseJSON = (json, req) => {
- try {
- return JSON.parse(json);
- } catch (err) {
- /* FIXME: This logging isn't great, and should probably be done at the
- * call-site of parseJSON, not in the method, but this would require changing
- * the signature of parseJSON to return something akin to a Result type:
- * [Error|null, null|Object<string,any}], and then handling the error
- * scenarios.
- */
- if (req) {
- if (req.accountId) {
- log.warn(req.requestId, `Error parsing message from user ${req.accountId}: ${err}`);
- } else {
- log.silly(req.requestId, `Error parsing message from ${req.remoteAddress}: ${err}`);
- }
- } else {
- log.warn(`Error parsing message from redis: ${err}`);
- }
- return null;
- }
- };
- /**
- * @param {Object.<string, any>} env the `process.env` value to read configuration from
- * @returns {Object.<string, any>} the configuration for the PostgreSQL connection
- */
- const pgConfigFromEnv = (env) => {
- const pgConfigs = {
- development: {
- user: env.DB_USER || pg.defaults.user,
- password: env.DB_PASS || pg.defaults.password,
- database: env.DB_NAME || 'mastodon_development',
- host: env.DB_HOST || pg.defaults.host,
- port: env.DB_PORT || pg.defaults.port,
- },
- production: {
- user: env.DB_USER || 'mastodon',
- password: env.DB_PASS || '',
- database: env.DB_NAME || 'mastodon_production',
- host: env.DB_HOST || 'localhost',
- port: env.DB_PORT || 5432,
- },
- };
- let baseConfig;
- if (env.DATABASE_URL) {
- baseConfig = dbUrlToConfig(env.DATABASE_URL);
- // Support overriding the database password in the connection URL
- if (!baseConfig.password && env.DB_PASS) {
- baseConfig.password = env.DB_PASS;
- }
- } else {
- baseConfig = pgConfigs[environment];
- if (env.DB_SSLMODE) {
- switch(env.DB_SSLMODE) {
- case 'disable':
- case '':
- baseConfig.ssl = false;
- break;
- case 'no-verify':
- baseConfig.ssl = { rejectUnauthorized: false };
- break;
- default:
- baseConfig.ssl = {};
- break;
- }
- }
- }
- return {
- ...baseConfig,
- max: env.DB_POOL || 10,
- connectionTimeoutMillis: 15000,
- application_name: '',
- };
- };
- /**
- * @param {Object.<string, any>} env the `process.env` value to read configuration from
- * @returns {Object.<string, any>} configuration for the Redis connection
- */
- const redisConfigFromEnv = (env) => {
- // ioredis *can* transparently add prefixes for us, but it doesn't *in some cases*,
- // which means we can't use it. But this is something that should be looked into.
- const redisPrefix = env.REDIS_NAMESPACE ? `${env.REDIS_NAMESPACE}:` : '';
- const redisParams = {
- host: env.REDIS_HOST || '127.0.0.1',
- port: env.REDIS_PORT || 6379,
- db: env.REDIS_DB || 0,
- password: env.REDIS_PASSWORD || undefined,
- };
- // redisParams.path takes precedence over host and port.
- if (env.REDIS_URL && env.REDIS_URL.startsWith('unix://')) {
- redisParams.path = env.REDIS_URL.slice(7);
- }
- return {
- redisParams,
- redisPrefix,
- redisUrl: env.REDIS_URL,
- };
- };
- const startServer = async () => {
- const app = express();
- app.set('trust proxy', process.env.TRUSTED_PROXY_IP ? process.env.TRUSTED_PROXY_IP.split(/(?:\s*,\s*|\s+)/) : 'loopback,uniquelocal');
- const pgPool = new pg.Pool(pgConfigFromEnv(process.env));
- const server = http.createServer(app);
- /**
- * @type {Object.<string, Array.<function(Object<string, any>): void>>}
- */
- const subs = {};
- const redisConfig = redisConfigFromEnv(process.env);
- const redisSubscribeClient = await createRedisClient(redisConfig);
- const redisClient = await createRedisClient(redisConfig);
- const { redisPrefix } = redisConfig;
- // Collect metrics from Node.js
- metrics.collectDefaultMetrics();
- new metrics.Gauge({
- name: 'pg_pool_total_connections',
- help: 'The total number of clients existing within the pool',
- collect() {
- this.set(pgPool.totalCount);
- },
- });
- new metrics.Gauge({
- name: 'pg_pool_idle_connections',
- help: 'The number of clients which are not checked out but are currently idle in the pool',
- collect() {
- this.set(pgPool.idleCount);
- },
- });
- new metrics.Gauge({
- name: 'pg_pool_waiting_queries',
- help: 'The number of queued requests waiting on a client when all clients are checked out',
- collect() {
- this.set(pgPool.waitingCount);
- },
- });
- const connectedClients = new metrics.Gauge({
- name: 'connected_clients',
- help: 'The number of clients connected to the streaming server',
- labelNames: ['type'],
- });
- connectedClients.set({ type: 'websocket' }, 0);
- connectedClients.set({ type: 'eventsource' }, 0);
- const connectedChannels = new metrics.Gauge({
- name: 'connected_channels',
- help: 'The number of channels the streaming server is streaming to',
- labelNames: [ 'type', 'channel' ]
- });
- const redisSubscriptions = new metrics.Gauge({
- name: 'redis_subscriptions',
- help: 'The number of Redis channels the streaming server is subscribed to',
- });
- // When checking metrics in the browser, the favicon is requested this
- // prevents the request from falling through to the API Router, which would
- // error for this endpoint:
- app.get('/favicon.ico', (req, res) => res.status(404).end());
- app.get('/api/v1/streaming/health', (req, res) => {
- res.writeHead(200, { 'Content-Type': 'text/plain' });
- res.end('OK');
- });
- app.get('/metrics', async (req, res) => {
- try {
- res.set('Content-Type', metrics.register.contentType);
- res.end(await metrics.register.metrics());
- } catch (ex) {
- log.error(ex);
- res.status(500).end();
- }
- });
- /**
- * @param {string[]} channels
- * @returns {function(): void}
- */
- const subscriptionHeartbeat = channels => {
- const interval = 6 * 60;
- const tellSubscribed = () => {
- channels.forEach(channel => redisClient.set(`${redisPrefix}subscribed:${channel}`, '1', 'EX', interval * 3));
- };
- tellSubscribed();
- const heartbeat = setInterval(tellSubscribed, interval * 1000);
- return () => {
- clearInterval(heartbeat);
- };
- };
- /**
- * @param {string} channel
- * @param {string} message
- */
- const onRedisMessage = (channel, message) => {
- const callbacks = subs[channel];
- log.silly(`New message on channel ${redisPrefix}${channel}`);
- if (!callbacks) {
- return;
- }
- const json = parseJSON(message, null);
- if (!json) return;
- callbacks.forEach(callback => callback(json));
- };
- redisSubscribeClient.on("message", onRedisMessage);
- /**
- * @callback SubscriptionListener
- * @param {ReturnType<parseJSON>} json of the message
- * @returns void
- */
- /**
- * @param {string} channel
- * @param {SubscriptionListener} callback
- */
- const subscribe = (channel, callback) => {
- log.silly(`Adding listener for ${channel}`);
- subs[channel] = subs[channel] || [];
- if (subs[channel].length === 0) {
- log.verbose(`Subscribe ${channel}`);
- redisSubscribeClient.subscribe(channel, (err, count) => {
- if (err) {
- log.error(`Error subscribing to ${channel}`);
- }
- else {
- redisSubscriptions.set(count);
- }
- });
- }
- subs[channel].push(callback);
- };
- /**
- * @param {string} channel
- * @param {SubscriptionListener} callback
- */
- const unsubscribe = (channel, callback) => {
- log.silly(`Removing listener for ${channel}`);
- if (!subs[channel]) {
- return;
- }
- subs[channel] = subs[channel].filter(item => item !== callback);
- if (subs[channel].length === 0) {
- log.verbose(`Unsubscribe ${channel}`);
- redisSubscribeClient.unsubscribe(channel, (err, count) => {
- if (err) {
- log.error(`Error unsubscribing to ${channel}`);
- }
- else {
- redisSubscriptions.set(count);
- }
- });
- delete subs[channel];
- }
- };
- const FALSE_VALUES = [
- false,
- 0,
- '0',
- 'f',
- 'F',
- 'false',
- 'FALSE',
- 'off',
- 'OFF',
- ];
- /**
- * @param {any} value
- * @returns {boolean}
- */
- const isTruthy = value =>
- value && !FALSE_VALUES.includes(value);
- /**
- * @param {any} req
- * @param {any} res
- * @param {function(Error=): void} next
- */
- const allowCrossDomain = (req, res, next) => {
- res.header('Access-Control-Allow-Origin', '*');
- res.header('Access-Control-Allow-Headers', 'Authorization, Accept, Cache-Control');
- res.header('Access-Control-Allow-Methods', 'GET, OPTIONS');
- next();
- };
- /**
- * @param {any} req
- * @param {any} res
- * @param {function(Error=): void} next
- */
- const setRequestId = (req, res, next) => {
- req.requestId = uuid.v4();
- res.header('X-Request-Id', req.requestId);
- next();
- };
- /**
- * @param {any} req
- * @param {any} res
- * @param {function(Error=): void} next
- */
- const setRemoteAddress = (req, res, next) => {
- req.remoteAddress = req.connection.remoteAddress;
- next();
- };
- /**
- * @param {any} req
- * @param {string[]} necessaryScopes
- * @returns {boolean}
- */
- const isInScope = (req, necessaryScopes) =>
- req.scopes.some(scope => necessaryScopes.includes(scope));
- /**
- * @param {string} token
- * @param {any} req
- * @returns {Promise.<void>}
- */
- const accountFromToken = (token, req) => new Promise((resolve, reject) => {
- pgPool.connect((err, client, done) => {
- if (err) {
- reject(err);
- return;
- }
- client.query('SELECT oauth_access_tokens.id, oauth_access_tokens.resource_owner_id, users.account_id, users.chosen_languages, oauth_access_tokens.scopes, devices.device_id FROM oauth_access_tokens INNER JOIN users ON oauth_access_tokens.resource_owner_id = users.id LEFT OUTER JOIN devices ON oauth_access_tokens.id = devices.access_token_id WHERE oauth_access_tokens.token = $1 AND oauth_access_tokens.revoked_at IS NULL LIMIT 1', [token], (err, result) => {
- done();
- if (err) {
- reject(err);
- return;
- }
- if (result.rows.length === 0) {
- err = new Error('Invalid access token');
- err.status = 401;
- reject(err);
- return;
- }
- req.accessTokenId = result.rows[0].id;
- req.scopes = result.rows[0].scopes.split(' ');
- req.accountId = result.rows[0].account_id;
- req.chosenLanguages = result.rows[0].chosen_languages;
- req.deviceId = result.rows[0].device_id;
- resolve();
- });
- });
- });
- /**
- * @param {any} req
- * @returns {Promise.<void>}
- */
- const accountFromRequest = (req) => new Promise((resolve, reject) => {
- const authorization = req.headers.authorization;
- const location = url.parse(req.url, true);
- const accessToken = location.query.access_token || req.headers['sec-websocket-protocol'];
- if (!authorization && !accessToken) {
- const err = new Error('Missing access token');
- err.status = 401;
- reject(err);
- return;
- }
- const token = authorization ? authorization.replace(/^Bearer /, '') : accessToken;
- resolve(accountFromToken(token, req));
- });
- /**
- * @param {any} req
- * @returns {string|undefined}
- */
- const channelNameFromPath = req => {
- const { path, query } = req;
- const onlyMedia = isTruthy(query.only_media);
- switch (path) {
- case '/api/v1/streaming/user':
- return 'user';
- case '/api/v1/streaming/user/notification':
- return 'user:notification';
- case '/api/v1/streaming/public':
- return onlyMedia ? 'public:media' : 'public';
- case '/api/v1/streaming/public/local':
- return onlyMedia ? 'public:local:media' : 'public:local';
- case '/api/v1/streaming/public/remote':
- return onlyMedia ? 'public:remote:media' : 'public:remote';
- case '/api/v1/streaming/hashtag':
- return 'hashtag';
- case '/api/v1/streaming/hashtag/local':
- return 'hashtag:local';
- case '/api/v1/streaming/direct':
- return 'direct';
- case '/api/v1/streaming/list':
- return 'list';
- default:
- return undefined;
- }
- };
- const PUBLIC_CHANNELS = [
- 'public',
- 'public:media',
- 'public:local',
- 'public:local:media',
- 'public:remote',
- 'public:remote:media',
- 'hashtag',
- 'hashtag:local',
- ];
- /**
- * @param {any} req
- * @param {string|undefined} channelName
- * @returns {Promise.<void>}
- */
- const checkScopes = (req, channelName) => new Promise((resolve, reject) => {
- log.silly(req.requestId, `Checking OAuth scopes for ${channelName}`);
- // When accessing public channels, no scopes are needed
- if (PUBLIC_CHANNELS.includes(channelName)) {
- resolve();
- return;
- }
- // The `read` scope has the highest priority, if the token has it
- // then it can access all streams
- const requiredScopes = ['read'];
- // When accessing specifically the notifications stream,
- // we need a read:notifications, while in all other cases,
- // we can allow access with read:statuses. Mind that the
- // user stream will not contain notifications unless
- // the token has either read or read:notifications scope
- // as well, this is handled separately.
- if (channelName === 'user:notification') {
- requiredScopes.push('read:notifications');
- } else {
- requiredScopes.push('read:statuses');
- }
- if (req.scopes && requiredScopes.some(requiredScope => req.scopes.includes(requiredScope))) {
- resolve();
- return;
- }
- const err = new Error('Access token does not cover required scopes');
- err.status = 401;
- reject(err);
- });
- /**
- * @param {any} info
- * @param {function(boolean, number, string): void} callback
- */
- const wsVerifyClient = (info, callback) => {
- // When verifying the websockets connection, we no longer pre-emptively
- // check OAuth scopes and drop the connection if they're missing. We only
- // drop the connection if access without token is not allowed by environment
- // variables. OAuth scope checks are moved to the point of subscription
- // to a specific stream.
- accountFromRequest(info.req).then(() => {
- callback(true, undefined, undefined);
- }).catch(err => {
- log.error(info.req.requestId, err.toString());
- callback(false, 401, 'Unauthorized');
- });
- };
- /**
- * @typedef SystemMessageHandlers
- * @property {function(): void} onKill
- */
- /**
- * @param {any} req
- * @param {SystemMessageHandlers} eventHandlers
- * @returns {function(object): void}
- */
- const createSystemMessageListener = (req, eventHandlers) => {
- return message => {
- const { event } = message;
- log.silly(req.requestId, `System message for ${req.accountId}: ${event}`);
- if (event === 'kill') {
- log.verbose(req.requestId, `Closing connection for ${req.accountId} due to expired access token`);
- eventHandlers.onKill();
- } else if (event === 'filters_changed') {
- log.verbose(req.requestId, `Invalidating filters cache for ${req.accountId}`);
- req.cachedFilters = null;
- }
- };
- };
- /**
- * @param {any} req
- * @param {any} res
- */
- const subscribeHttpToSystemChannel = (req, res) => {
- const accessTokenChannelId = `timeline:access_token:${req.accessTokenId}`;
- const systemChannelId = `timeline:system:${req.accountId}`;
- const listener = createSystemMessageListener(req, {
- onKill() {
- res.end();
- },
- });
- res.on('close', () => {
- unsubscribe(`${redisPrefix}${accessTokenChannelId}`, listener);
- unsubscribe(`${redisPrefix}${systemChannelId}`, listener);
- connectedChannels.labels({ type: 'eventsource', channel: 'system' }).dec(2);
- });
- subscribe(`${redisPrefix}${accessTokenChannelId}`, listener);
- subscribe(`${redisPrefix}${systemChannelId}`, listener);
- connectedChannels.labels({ type: 'eventsource', channel: 'system' }).inc(2);
- };
- /**
- * @param {any} req
- * @param {any} res
- * @param {function(Error=): void} next
- */
- const authenticationMiddleware = (req, res, next) => {
- if (req.method === 'OPTIONS') {
- next();
- return;
- }
- const channelName = channelNameFromPath(req);
- // If no channelName can be found for the request, then we should terminate
- // the connection, as there's nothing to stream back
- if (!channelName) {
- const err = new Error('Unknown channel requested');
- err.status = 400;
- next(err);
- return;
- }
- accountFromRequest(req).then(() => checkScopes(req, channelName)).then(() => {
- subscribeHttpToSystemChannel(req, res);
- }).then(() => {
- next();
- }).catch(err => {
- next(err);
- });
- };
- /**
- * @param {Error} err
- * @param {any} req
- * @param {any} res
- * @param {function(Error=): void} next
- */
- const errorMiddleware = (err, req, res, next) => {
- log.error(req.requestId, err.toString());
- if (res.headersSent) {
- next(err);
- return;
- }
- res.writeHead(err.status || 500, { 'Content-Type': 'application/json' });
- res.end(JSON.stringify({ error: err.status ? err.toString() : 'An unexpected error occurred' }));
- };
- /**
- * @param {array} arr
- * @param {number=} shift
- * @returns {string}
- */
- const placeholders = (arr, shift = 0) => arr.map((_, i) => `$${i + 1 + shift}`).join(', ');
- /**
- * @param {string} listId
- * @param {any} req
- * @returns {Promise.<void>}
- */
- const authorizeListAccess = (listId, req) => new Promise((resolve, reject) => {
- const { accountId } = req;
- pgPool.connect((err, client, done) => {
- if (err) {
- reject();
- return;
- }
- client.query('SELECT id, account_id FROM lists WHERE id = $1 LIMIT 1', [listId], (err, result) => {
- done();
- if (err || result.rows.length === 0 || result.rows[0].account_id !== accountId) {
- reject();
- return;
- }
- resolve();
- });
- });
- });
- /**
- * @param {string[]} ids
- * @param {any} req
- * @param {function(string, string): void} output
- * @param {undefined | function(string[], SubscriptionListener): void} attachCloseHandler
- * @param {boolean=} needsFiltering
- * @returns {SubscriptionListener}
- */
- const streamFrom = (ids, req, output, attachCloseHandler, needsFiltering = false) => {
- const accountId = req.accountId || req.remoteAddress;
- log.verbose(req.requestId, `Starting stream from ${ids.join(', ')} for ${accountId}`);
- const transmit = (event, payload) => {
- // TODO: Replace "string"-based delete payloads with object payloads:
- const encodedPayload = typeof payload === 'object' ? JSON.stringify(payload) : payload;
- log.silly(req.requestId, `Transmitting for ${accountId}: ${event} ${encodedPayload}`);
- output(event, encodedPayload);
- };
- // The listener used to process each message off the redis subscription,
- // message here is an object with an `event` and `payload` property. Some
- // events also include a queued_at value, but this is being removed shortly.
- /** @type {SubscriptionListener} */
- const listener = message => {
- const { event, payload } = message;
- // Streaming only needs to apply filtering to some channels and only to
- // some events. This is because majority of the filtering happens on the
- // Ruby on Rails side when producing the event for streaming.
- //
- // The only events that require filtering from the streaming server are
- // `update` and `status.update`, all other events are transmitted to the
- // client as soon as they're received (pass-through).
- //
- // The channels that need filtering are determined in the function
- // `channelNameToIds` defined below:
- if (!needsFiltering || (event !== 'update' && event !== 'status.update')) {
- transmit(event, payload);
- return;
- }
- // The rest of the logic from here on in this function is to handle
- // filtering of statuses:
- // Filter based on language:
- if (Array.isArray(req.chosenLanguages) && payload.language !== null && req.chosenLanguages.indexOf(payload.language) === -1) {
- log.silly(req.requestId, `Message ${payload.id} filtered by language (${payload.language})`);
- return;
- }
- // When the account is not logged in, it is not necessary to confirm the block or mute
- if (!req.accountId) {
- transmit(event, payload);
- return;
- }
- // Filter based on domain blocks, blocks, mutes, or custom filters:
- const targetAccountIds = [payload.account.id].concat(payload.mentions.map(item => item.id));
- const accountDomain = payload.account.acct.split('@')[1];
- // TODO: Move this logic out of the message handling loop
- pgPool.connect((err, client, releasePgConnection) => {
- if (err) {
- log.error(err);
- return;
- }
- const queries = [
- client.query(`SELECT 1
- FROM blocks
- WHERE (account_id = $1 AND target_account_id IN (${placeholders(targetAccountIds, 2)}))
- OR (account_id = $2 AND target_account_id = $1)
- UNION
- SELECT 1
- FROM mutes
- WHERE account_id = $1
- AND target_account_id IN (${placeholders(targetAccountIds, 2)})`, [req.accountId, payload.account.id].concat(targetAccountIds)),
- ];
- if (accountDomain) {
- queries.push(client.query('SELECT 1 FROM account_domain_blocks WHERE account_id = $1 AND domain = $2', [req.accountId, accountDomain]));
- }
- if (!payload.filtered && !req.cachedFilters) {
- queries.push(client.query('SELECT filter.id AS id, filter.phrase AS title, filter.context AS context, filter.expires_at AS expires_at, filter.action AS filter_action, keyword.keyword AS keyword, keyword.whole_word AS whole_word FROM custom_filter_keywords keyword JOIN custom_filters filter ON keyword.custom_filter_id = filter.id WHERE filter.account_id = $1 AND (filter.expires_at IS NULL OR filter.expires_at > NOW())', [req.accountId]));
- }
- Promise.all(queries).then(values => {
- releasePgConnection();
- // Handling blocks & mutes and domain blocks: If one of those applies,
- // then we don't transmit the payload of the event to the client
- if (values[0].rows.length > 0 || (accountDomain && values[1].rows.length > 0)) {
- return;
- }
- // If the payload already contains the `filtered` property, it means
- // that filtering has been applied on the ruby on rails side, as
- // such, we don't need to construct or apply the filters in streaming:
- if (Object.prototype.hasOwnProperty.call(payload, "filtered")) {
- transmit(event, payload);
- return;
- }
- // Handling for constructing the custom filters and caching them on the request
- // TODO: Move this logic out of the message handling lifecycle
- if (!req.cachedFilters) {
- const filterRows = values[accountDomain ? 2 : 1].rows;
- req.cachedFilters = filterRows.reduce((cache, filter) => {
- if (cache[filter.id]) {
- cache[filter.id].keywords.push([filter.keyword, filter.whole_word]);
- } else {
- cache[filter.id] = {
- keywords: [[filter.keyword, filter.whole_word]],
- expires_at: filter.expires_at,
- filter: {
- id: filter.id,
- title: filter.title,
- context: filter.context,
- expires_at: filter.expires_at,
- // filter.filter_action is the value from the
- // custom_filters.action database column, it is an integer
- // representing a value in an enum defined by Ruby on Rails:
- //
- // enum { warn: 0, hide: 1 }
- filter_action: ['warn', 'hide'][filter.filter_action],
- },
- };
- }
- return cache;
- }, {});
- // Construct the regular expressions for the custom filters: This
- // needs to be done in a separate loop as the database returns one
- // filterRow per keyword, so we need all the keywords before
- // constructing the regular expression
- Object.keys(req.cachedFilters).forEach((key) => {
- req.cachedFilters[key].regexp = new RegExp(req.cachedFilters[key].keywords.map(([keyword, whole_word]) => {
- let expr = keyword.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
- if (whole_word) {
- if (/^[\w]/.test(expr)) {
- expr = `\\b${expr}`;
- }
- if (/[\w]$/.test(expr)) {
- expr = `${expr}\\b`;
- }
- }
- return expr;
- }).join('|'), 'i');
- });
- }
- // Apply cachedFilters against the payload, constructing a
- // `filter_results` array of FilterResult entities
- if (req.cachedFilters) {
- const status = payload;
- // TODO: Calculate searchableContent in Ruby on Rails:
- const searchableContent = ([status.spoiler_text || '', status.content].concat((status.poll && status.poll.options) ? status.poll.options.map(option => option.title) : [])).concat(status.media_attachments.map(att => att.description)).join('\n\n').replace(/<br\s*\/?>/g, '\n').replace(/<\/p><p>/g, '\n\n');
- const searchableTextContent = JSDOM.fragment(searchableContent).textContent;
- const now = new Date();
- const filter_results = Object.values(req.cachedFilters).reduce((results, cachedFilter) => {
- // Check the filter hasn't expired before applying:
- if (cachedFilter.expires_at !== null && cachedFilter.expires_at < now) {
- return results;
- }
- // Just in-case JSDOM fails to find textContent in searchableContent
- if (!searchableTextContent) {
- return results;
- }
- const keyword_matches = searchableTextContent.match(cachedFilter.regexp);
- if (keyword_matches) {
- // results is an Array of FilterResult; status_matches is always
- // null as we only are only applying the keyword-based custom
- // filters, not the status-based custom filters.
- // https://docs.joinmastodon.org/entities/FilterResult/
- results.push({
- filter: cachedFilter.filter,
- keyword_matches,
- status_matches: null
- });
- }
- return results;
- }, []);
- // Send the payload + the FilterResults as the `filtered` property
- // to the streaming connection. To reach this code, the `event` must
- // have been either `update` or `status.update`, meaning the
- // `payload` is a Status entity, which has a `filtered` property:
- //
- // filtered: https://docs.joinmastodon.org/entities/Status/#filtered
- transmit(event, {
- ...payload,
- filtered: filter_results
- });
- } else {
- transmit(event, payload);
- }
- }).catch(err => {
- log.error(err);
- releasePgConnection();
- });
- });
- };
- ids.forEach(id => {
- subscribe(`${redisPrefix}${id}`, listener);
- });
- if (typeof attachCloseHandler === 'function') {
- attachCloseHandler(ids.map(id => `${redisPrefix}${id}`), listener);
- }
- return listener;
- };
- /**
- * @param {any} req
- * @param {any} res
- * @returns {function(string, string): void}
- */
- const streamToHttp = (req, res) => {
- const accountId = req.accountId || req.remoteAddress;
- const channelName = channelNameFromPath(req);
- connectedClients.labels({ type: 'eventsource' }).inc();
- // In theory we'll always have a channel name, but channelNameFromPath can return undefined:
- if (typeof channelName === 'string') {
- connectedChannels.labels({ type: 'eventsource', channel: channelName }).inc();
- }
- res.setHeader('Content-Type', 'text/event-stream');
- res.setHeader('Cache-Control', 'no-store');
- res.setHeader('Transfer-Encoding', 'chunked');
- res.write(':)\n');
- const heartbeat = setInterval(() => res.write(':thump\n'), 15000);
- req.on('close', () => {
- log.verbose(req.requestId, `Ending stream for ${accountId}`);
- // We decrement these counters here instead of in streamHttpEnd as in that
- // method we don't have knowledge of the channel names
- connectedClients.labels({ type: 'eventsource' }).dec();
- // In theory we'll always have a channel name, but channelNameFromPath can return undefined:
- if (typeof channelName === 'string') {
- connectedChannels.labels({ type: 'eventsource', channel: channelName }).dec();
- }
- clearInterval(heartbeat);
- });
- return (event, payload) => {
- res.write(`event: ${event}\n`);
- res.write(`data: ${payload}\n\n`);
- };
- };
- /**
- * @param {any} req
- * @param {function(): void} [closeHandler]
- * @returns {function(string[], SubscriptionListener): void}
- */
- const streamHttpEnd = (req, closeHandler = undefined) => (ids, listener) => {
- req.on('close', () => {
- ids.forEach(id => {
- unsubscribe(id, listener);
- });
- if (closeHandler) {
- closeHandler();
- }
- });
- };
- /**
- * @param {any} req
- * @param {any} ws
- * @param {string[]} streamName
- * @returns {function(string, string): void}
- */
- const streamToWs = (req, ws, streamName) => (event, payload) => {
- if (ws.readyState !== ws.OPEN) {
- log.error(req.requestId, 'Tried writing to closed socket');
- return;
- }
- ws.send(JSON.stringify({ stream: streamName, event, payload }), (err) => {
- if (err) {
- log.error(req.requestId, `Failed to send to websocket: ${err}`);
- }
- });
- };
- /**
- * @param {any} res
- */
- const httpNotFound = res => {
- res.writeHead(404, { 'Content-Type': 'application/json' });
- res.end(JSON.stringify({ error: 'Not found' }));
- };
- const api = express.Router();
- app.use(api);
- api.use(setRequestId);
- api.use(setRemoteAddress);
- api.use(allowCrossDomain);
- api.use(authenticationMiddleware);
- api.use(errorMiddleware);
- api.get('/api/v1/streaming/*', (req, res) => {
- channelNameToIds(req, channelNameFromPath(req), req.query).then(({ channelIds, options }) => {
- const onSend = streamToHttp(req, res);
- const onEnd = streamHttpEnd(req, subscriptionHeartbeat(channelIds));
- streamFrom(channelIds, req, onSend, onEnd, options.needsFiltering);
- }).catch(err => {
- log.verbose(req.requestId, 'Subscription error:', err.toString());
- httpNotFound(res);
- });
- });
- const wss = new WebSocket.Server({ server, verifyClient: wsVerifyClient });
- /**
- * @typedef StreamParams
- * @property {string} [tag]
- * @property {string} [list]
- * @property {string} [only_media]
- */
- /**
- * @param {any} req
- * @returns {string[]}
- */
- const channelsForUserStream = req => {
- const arr = [`timeline:${req.accountId}`];
- if (isInScope(req, ['crypto']) && req.deviceId) {
- arr.push(`timeline:${req.accountId}:${req.deviceId}`);
- }
- if (isInScope(req, ['read', 'read:notifications'])) {
- arr.push(`timeline:${req.accountId}:notifications`);
- }
- return arr;
- };
- /**
- * See app/lib/ascii_folder.rb for the canon definitions
- * of these constants
- */
- const NON_ASCII_CHARS = 'ÀÁÂÃÄÅàáâãäåĀāĂ㥹ÇçĆćĈĉĊċČčÐðĎďĐđÈÉÊËèéêëĒēĔĕĖėĘęĚěĜĝĞğĠġĢģĤĥĦħÌÍÎÏìíîïĨĩĪīĬĭĮįİıĴĵĶķĸĹĺĻļĽľĿŀŁłÑñŃńŅņŇňʼnŊŋÒÓÔÕÖØòóôõöøŌōŎŏŐőŔŕŖŗŘřŚśŜŝŞşŠšſŢţŤťŦŧÙÚÛÜùúûüŨũŪūŬŭŮůŰűŲųŴŵÝýÿŶŷŸŹźŻżŽž';
- const EQUIVALENT_ASCII_CHARS = 'AAAAAAaaaaaaAaAaAaCcCcCcCcCcDdDdDdEEEEeeeeEeEeEeEeEeGgGgGgGgHhHhIIIIiiiiIiIiIiIiIiJjKkkLlLlLlLlLlNnNnNnNnnNnOOOOOOooooooOoOoOoRrRrRrSsSsSsSssTtTtTtUUUUuuuuUuUuUuUuUuUuWwYyyYyYZzZzZz';
- /**
- * @param {string} str
- * @returns {string}
- */
- const foldToASCII = str => {
- const regex = new RegExp(NON_ASCII_CHARS.split('').join('|'), 'g');
- return str.replace(regex, match => {
- const index = NON_ASCII_CHARS.indexOf(match);
- return EQUIVALENT_ASCII_CHARS[index];
- });
- };
- /**
- * @param {string} str
- * @returns {string}
- */
- const normalizeHashtag = str => {
- return foldToASCII(str.normalize('NFKC').toLowerCase()).replace(/[^\p{L}\p{N}_\u00b7\u200c]/gu, '');
- };
- /**
- * @param {any} req
- * @param {string} name
- * @param {StreamParams} params
- * @returns {Promise.<{ channelIds: string[], options: { needsFiltering: boolean } }>}
- */
- const channelNameToIds = (req, name, params) => new Promise((resolve, reject) => {
- switch (name) {
- case 'user':
- resolve({
- channelIds: channelsForUserStream(req),
- options: { needsFiltering: false },
- });
- break;
- case 'user:notification':
- resolve({
- channelIds: [`timeline:${req.accountId}:notifications`],
- options: { needsFiltering: false },
- });
- break;
- case 'public':
- resolve({
- channelIds: ['timeline:public'],
- options: { needsFiltering: true },
- });
- break;
- case 'public:local':
- resolve({
- channelIds: ['timeline:public:local'],
- options: { needsFiltering: true },
- });
- break;
- case 'public:remote':
- resolve({
- channelIds: ['timeline:public:remote'],
- options: { needsFiltering: true },
- });
- break;
- case 'public:media':
- resolve({
- channelIds: ['timeline:public:media'],
- options: { needsFiltering: true },
- });
- break;
- case 'public:local:media':
- resolve({
- channelIds: ['timeline:public:local:media'],
- options: { needsFiltering: true },
- });
- break;
- case 'public:remote:media':
- resolve({
- channelIds: ['timeline:public:remote:media'],
- options: { needsFiltering: true },
- });
- break;
- case 'direct':
- resolve({
- channelIds: [`timeline:direct:${req.accountId}`],
- options: { needsFiltering: false },
- });
- break;
- case 'hashtag':
- if (!params.tag || params.tag.length === 0) {
- reject('No tag for stream provided');
- } else {
- resolve({
- channelIds: [`timeline:hashtag:${normalizeHashtag(params.tag)}`],
- options: { needsFiltering: true },
- });
- }
- break;
- case 'hashtag:local':
- if (!params.tag || params.tag.length === 0) {
- reject('No tag for stream provided');
- } else {
- resolve({
- channelIds: [`timeline:hashtag:${normalizeHashtag(params.tag)}:local`],
- options: { needsFiltering: true },
- });
- }
- break;
- case 'list':
- authorizeListAccess(params.list, req).then(() => {
- resolve({
- channelIds: [`timeline:list:${params.list}`],
- options: { needsFiltering: false },
- });
- }).catch(() => {
- reject('Not authorized to stream this list');
- });
- break;
- default:
- reject('Unknown stream type');
- }
- });
- /**
- * @param {string} channelName
- * @param {StreamParams} params
- * @returns {string[]}
- */
- const streamNameFromChannelName = (channelName, params) => {
- if (channelName === 'list') {
- return [channelName, params.list];
- } else if (['hashtag', 'hashtag:local'].includes(channelName)) {
- return [channelName, params.tag];
- } else {
- return [channelName];
- }
- };
- /**
- * @typedef WebSocketSession
- * @property {any} socket
- * @property {any} request
- * @property {Object.<string, { channelName: string, listener: SubscriptionListener, stopHeartbeat: function(): void }>} subscriptions
- */
- /**
- * @param {WebSocketSession} session
- * @param {string} channelName
- * @param {StreamParams} params
- * @returns {void}
- */
- const subscribeWebsocketToChannel = ({ socket, request, subscriptions }, channelName, params) => {
- checkScopes(request, channelName).then(() => channelNameToIds(request, channelName, params)).then(({
- channelIds,
- options,
- }) => {
- if (subscriptions[channelIds.join(';')]) {
- return;
- }
- const onSend = streamToWs(request, socket, streamNameFromChannelName(channelName, params));
- const stopHeartbeat = subscriptionHeartbeat(channelIds);
- const listener = streamFrom(channelIds, request, onSend, undefined, options.needsFiltering);
- connectedChannels.labels({ type: 'websocket', channel: channelName }).inc();
- subscriptions[channelIds.join(';')] = {
- channelName,
- listener,
- stopHeartbeat,
- };
- }).catch(err => {
- log.verbose(request.requestId, 'Subscription error:', err.toString());
- socket.send(JSON.stringify({ error: err.toString() }));
- });
- }
- const removeSubscription = (subscriptions, channelIds, request) => {
- log.verbose(request.requestId, `Ending stream from ${channelIds.join(', ')} for ${request.accountId}`);
- const subscription = subscriptions[channelIds.join(';')];
- if (!subscription) {
- return;
- }
- channelIds.forEach(channelId => {
- unsubscribe(`${redisPrefix}${channelId}`, subscription.listener);
- });
- connectedChannels.labels({ type: 'websocket', channel: subscription.channelName }).dec();
- subscription.stopHeartbeat();
- delete subscriptions[channelIds.join(';')];
- }
- /**
- * @param {WebSocketSession} session
- * @param {string} channelName
- * @param {StreamParams} params
- * @returns {void}
- */
- const unsubscribeWebsocketFromChannel = ({ socket, request, subscriptions }, channelName, params) => {
- channelNameToIds(request, channelName, params).then(({ channelIds }) => {
- removeSubscription(subscriptions, channelIds, request);
- }).catch(err => {
- log.verbose(request.requestId, 'Unsubscribe error:', err);
- // If we have a socket that is alive and open still, send the error back to the client:
- // FIXME: In other parts of the code ws === socket
- if (socket.isAlive && socket.readyState === socket.OPEN) {
- socket.send(JSON.stringify({ error: "Error unsubscribing from channel" }));
- }
- });
- }
- /**
- * @param {WebSocketSession} session
- */
- const subscribeWebsocketToSystemChannel = ({ socket, request, subscriptions }) => {
- const accessTokenChannelId = `timeline:access_token:${request.accessTokenId}`;
- const systemChannelId = `timeline:system:${request.accountId}`;
- const listener = createSystemMessageListener(request, {
- onKill() {
- socket.close();
- },
- });
- subscribe(`${redisPrefix}${accessTokenChannelId}`, listener);
- subscribe(`${redisPrefix}${systemChannelId}`, listener);
- subscriptions[accessTokenChannelId] = {
- channelName: 'system',
- listener,
- stopHeartbeat: () => {
- },
- };
- subscriptions[systemChannelId] = {
- channelName: 'system',
- listener,
- stopHeartbeat: () => {
- },
- };
- connectedChannels.labels({ type: 'websocket', channel: 'system' }).inc(2);
- };
- /**
- * @param {string|string[]} arrayOrString
- * @returns {string}
- */
- const firstParam = arrayOrString => {
- if (Array.isArray(arrayOrString)) {
- return arrayOrString[0];
- } else {
- return arrayOrString;
- }
- };
- wss.on('connection', (ws, req) => {
- const location = url.parse(req.url, true);
- req.requestId = uuid.v4();
- req.remoteAddress = ws._socket.remoteAddress;
- ws.isAlive = true;
- ws.on('pong', () => {
- ws.isAlive = true;
- });
- connectedClients.labels({ type: 'websocket' }).inc();
- /**
- * @type {WebSocketSession}
- */
- const session = {
- socket: ws,
- request: req,
- subscriptions: {},
- };
- const onEnd = () => {
- const subscriptions = Object.keys(session.subscriptions);
- subscriptions.forEach(channelIds => {
- removeSubscription(session.subscriptions, channelIds.split(';'), req)
- });
- // ensure garbage collection:
- session.socket = null;
- session.request = null;
- session.subscriptions = {};
- connectedClients.labels({ type: 'websocket' }).dec();
- };
- ws.on('close', onEnd);
- ws.on('error', onEnd);
- ws.on('message', (data, isBinary) => {
- if (isBinary) {
- log.warn('socket', 'Received binary data, closing connection');
- ws.close(1003, 'The mastodon streaming server does not support binary messages');
- return;
- }
- const message = data.toString('utf8');
- const json = parseJSON(message, session.request);
- if (!json) return;
- const { type, stream, ...params } = json;
- if (type === 'subscribe') {
- subscribeWebsocketToChannel(session, firstParam(stream), params);
- } else if (type === 'unsubscribe') {
- unsubscribeWebsocketFromChannel(session, firstParam(stream), params);
- } else {
- // Unknown action type
- }
- });
- subscribeWebsocketToSystemChannel(session);
- if (location.query.stream) {
- subscribeWebsocketToChannel(session, firstParam(location.query.stream), location.query);
- }
- });
- setInterval(() => {
- wss.clients.forEach(ws => {
- if (ws.isAlive === false) {
- ws.terminate();
- return;
- }
- ws.isAlive = false;
- ws.ping('', false);
- });
- }, 30000);
- attachServerWithConfig(server, address => {
- log.warn(`Streaming API now listening on ${address}`);
- });
- const onExit = () => {
- server.close();
- process.exit(0);
- };
- const onError = (err) => {
- log.error(err);
- server.close();
- process.exit(0);
- };
- process.on('SIGINT', onExit);
- process.on('SIGTERM', onExit);
- process.on('exit', onExit);
- process.on('uncaughtException', onError);
- };
- /**
- * @param {any} server
- * @param {function(string): void} [onSuccess]
- */
- const attachServerWithConfig = (server, onSuccess) => {
- if (process.env.SOCKET || process.env.PORT && isNaN(+process.env.PORT)) {
- server.listen(process.env.SOCKET || process.env.PORT, () => {
- if (onSuccess) {
- fs.chmodSync(server.address(), 0o666);
- onSuccess(server.address());
- }
- });
- } else {
- server.listen(+process.env.PORT || 4000, process.env.BIND || '127.0.0.1', () => {
- if (onSuccess) {
- onSuccess(`${server.address().address}:${server.address().port}`);
- }
- });
- }
- };
- startServer();
|