umami/lib/clickhouse.js

234 lines
5.2 KiB
JavaScript
Raw Normal View History

2022-08-26 07:04:32 +02:00
import { ClickHouse } from 'clickhouse';
import dateFormat from 'dateformat';
2022-08-28 06:38:35 +02:00
import debug from 'debug';
2022-08-26 07:04:32 +02:00
import { FILTER_IGNORED } from 'lib/constants';
2022-08-28 06:38:35 +02:00
import { CLICKHOUSE } from 'lib/db';
/**
 * Format strings, keyed by time unit, that getDateStringQuery passes to
 * ClickHouse's `formatDateTime`.
 */
export const CLICKHOUSE_DATE_FORMATS = {
  minute: '%Y-%m-%d %H:%M:00',
  hour: '%Y-%m-%d %H:00:00',
  day: '%Y-%m-%d',
  month: '%Y-%m-01',
  year: '%Y-01-01',
};
2022-08-29 05:20:54 +02:00
// Logger created by the `debug` package under the 'umami:clickhouse' namespace.
const log = debug('umami:clickhouse');
2022-08-26 07:04:32 +02:00
2022-10-07 00:00:16 +02:00
// Module-level ClickHouse client; stays undefined until connect() assigns it.
let clickhouse;
// True when the CLICKHOUSE_URL environment variable holds a non-empty value.
const enabled = Boolean(process.env.CLICKHOUSE_URL);
2022-08-26 07:04:32 +02:00
/**
 * Creates a ClickHouse client from the connection URL in
 * `process.env.CLICKHOUSE_URL`.
 *
 * The URL's hostname and port locate the server, its path (minus the leading
 * slash) is used as the database name, and basic auth is configured only when
 * the URL carries a password. Outside production the client is also stored on
 * `global[CLICKHOUSE]`.
 *
 * @returns {ClickHouse} The newly created client.
 * @throws {TypeError} If `CLICKHOUSE_URL` cannot be parsed by `new URL`.
 */
function getClient() {
  const { hostname, port, pathname, username, password } = new URL(process.env.CLICKHOUSE_URL);

  const client = new ClickHouse({
    url: hostname,
    port: Number(port),
    format: 'json',
    config: {
      database: pathname.replace('/', ''),
    },
    // URL#username is '' (never undefined) when the URL has no user part, so a
    // destructuring default would never kick in; fall back explicitly instead.
    basicAuth: password ? { username: username || 'default', password } : null,
  });

  if (process.env.NODE_ENV !== 'production') {
    global[CLICKHOUSE] = client;
  }

  log('Clickhouse initialized');

  return client;
}
2022-08-26 07:04:32 +02:00
2022-08-26 07:43:22 +02:00
/**
 * Builds a `formatDateTime(...)` SQL expression for the given time unit.
 *
 * @param {string} data - SQL expression to format; inserted verbatim.
 * @param {string} unit - Key of CLICKHOUSE_DATE_FORMATS selecting the format string.
 * @returns {string} The `formatDateTime` call as SQL text.
 */
function getDateStringQuery(data, unit) {
  const format = CLICKHOUSE_DATE_FORMATS[unit];

  return `formatDateTime(${data}, '${format}')`;
}
2022-08-26 07:43:22 +02:00
/**
 * Builds a `date_trunc(...)` SQL expression.
 *
 * @param {string} field - Column or expression to truncate; inserted verbatim.
 * @param {string} unit - Truncation unit; emitted as a quoted string.
 * @param {string} [timezone] - When truthy, appended as a third quoted argument.
 * @returns {string} The `date_trunc` call as SQL text.
 */
function getDateQuery(field, unit, timezone) {
  // The timezone argument is optional; omit it entirely when not supplied.
  const timezoneArg = timezone ? `, '${timezone}'` : '';

  return `date_trunc('${unit}', ${field}${timezoneArg})`;
}
2022-08-26 07:43:22 +02:00
/**
 * Formats a date with the `UTC:yyyy-mm-dd HH:MM:ss` mask of the `dateformat`
 * package and wraps the result in single quotes for use in SQL text.
 *
 * @param {Date|string|number} date - Value handed to `dateFormat`.
 * @returns {string} The quoted, formatted date.
 */
function getDateFormat(date) {
  const formatted = dateFormat(date, 'UTC:yyyy-mm-dd HH:MM:ss');

  return `'${formatted}'`;
}
2022-10-11 02:01:48 +02:00
/**
 * Renders an array as a comma-separated list of single-quoted values.
 *
 * Values are interpolated as-is (no escaping), so callers must only pass
 * values that are safe to embed in a quoted string.
 *
 * @param {Array<*>} data - Values to quote and join.
 * @returns {string} e.g. `'a','b'`; the empty string for an empty array.
 */
function getCommaSeparatedStringFormat(data) {
  // join() already yields '' for an empty array, so no fallback is needed.
  return data.map(a => `'${a}'`).join(',');
}
2022-08-26 07:43:22 +02:00
/**
 * Builds a `<field> between <start> and <end>` SQL condition, with both
 * bounds rendered by getDateFormat.
 *
 * @param {string} field - Column or expression to compare; inserted verbatim.
 * @param {Date|string|number} start_at - Lower bound.
 * @param {Date|string|number} end_at - Upper bound.
 * @returns {string} The condition as SQL text.
 */
function getBetweenDates(field, start_at, end_at) {
  const lowerBound = getDateFormat(start_at);
  const upperBound = getDateFormat(end_at);

  return `${field} between ${lowerBound} and ${upperBound}`;
}
/**
 * Joins a column name and a property name with a dot.
 *
 * @param {string} column - Column name.
 * @param {string} property - Property name within the column.
 * @returns {string} `column.property`.
 */
function getJsonField(column, property) {
  const path = ''.concat(column, '.', property);

  return path;
}
/**
 * Builds the select-list fragment for event-data columns.
 *
 * Each entry of `columns` maps a property name to a function name; the
 * output applies that function to `column.property` and aliases it as
 * `"fn(property)"`. Entries whose value is `undefined` are skipped.
 *
 * @param {string} column - Column that holds the event data.
 * @param {Object<string, string|undefined>} columns - Property name -> function name.
 * @returns {string} Select expressions joined by `,\n` ('' when none apply).
 */
function getEventDataColumnsQuery(column, columns) {
  return Object.entries(columns)
    .filter(([, fn]) => fn !== undefined)
    .map(([key, fn]) => `${fn}(${getJsonField(column, key)}) as "${fn}(${key})"`)
    .join(',\n');
}
/**
 * Builds equality conditions on event-data properties.
 *
 * Each entry of `filters` becomes `column.property = value`. String values are
 * emitted as single-quoted literals with backslashes and single quotes
 * escaped; any other value is interpolated as-is. Entries whose value is
 * `undefined` are skipped.
 *
 * @param {string} column - Column that holds the event data.
 * @param {Object<string, *>} filters - Property name -> required value.
 * @returns {string} Conditions joined by `\nand ` ('' when none apply).
 */
function getEventDataFilterQuery(column, filters) {
  // Escape backslash first so the backslash added for quotes is not doubled.
  const toLiteral = value =>
    typeof value === 'string'
      ? `'${value.replace(/\\/g, '\\\\').replace(/'/g, "\\'")}'`
      : value;

  return Object.entries(filters)
    .filter(([, value]) => value !== undefined)
    .map(([key, value]) => `${getJsonField(column, key)} = ${toLiteral(value)}`)
    .join('\nand ');
}
2022-09-12 18:55:34 +02:00
/**
 * Builds `and ...` filter clauses with numbered placeholders.
 *
 * For each recognised filter key a clause is emitted and, where the clause
 * uses a `$n` placeholder, the matching value is appended to `params` (the
 * array is mutated so numbering continues across successive calls). Filters
 * that are `undefined` or equal to FILTER_IGNORED, and unrecognised keys, are
 * skipped.
 *
 * @param {string} column - Not used by this implementation.
 * @param {Object<string, *>} [filters={}] - Filter name -> value.
 * @param {Array<*>} [params=[]] - Parameter list to append to.
 * @returns {string} Clauses joined by newlines ('' when none apply).
 * @throws {URIError} If a value passed to `decodeURIComponent` is malformed.
 */
function getFilterQuery(column, filters = {}, params = []) {
  const clauses = [];

  for (const [key, filter] of Object.entries(filters)) {
    if (filter === undefined || filter === FILTER_IGNORED) {
      continue;
    }

    switch (key) {
      case 'url':
      case 'os':
      case 'browser':
      case 'device':
      case 'country':
      case 'event_name':
        clauses.push(`and ${key}=$${params.length + 1}`);
        params.push(decodeURIComponent(filter));
        break;
      case 'referrer':
        clauses.push(`and referrer like $${params.length + 1}`);
        params.push(`%${decodeURIComponent(filter)}%`);
        break;
      case 'domain':
        // Both clauses are emitted before the single parameter is pushed, so
        // the placeholder number is computed from the pre-push length.
        clauses.push(`and referrer not like $${params.length + 1}`);
        clauses.push(`and referrer not like '/%'`);
        params.push(`%://${filter}/%`);
        break;
      case 'query':
        clauses.push(`and url like '%?%'`);
        break;
      default:
        break;
    }
  }

  return clauses.join('\n');
}
2022-09-12 18:55:34 +02:00
/**
 * Splits a flat filter object into pageview, session and event filter groups
 * and builds the SQL clause string for each group via getFilterQuery.
 *
 * All three queries share `params`, so their placeholders are numbered
 * consecutively in the order pageview -> session -> event.
 *
 * @param {string} column - Forwarded to getFilterQuery.
 * @param {Object<string, *>} [filters={}] - Flat filter object.
 * @param {Array<*>} [params=[]] - Parameter list, appended to by getFilterQuery.
 * @returns {{pageviewFilters: Object, sessionFilters: Object, eventFilters: Object,
 *   event: Object, pageviewQuery: string, sessionQuery: string, eventQuery: string}}
 */
function parseFilters(column, filters = {}, params = []) {
  const { domain, url, event_url, referrer, os, browser, device, country, event_name, query } =
    filters;

  const pageviewFilters = { domain, url, referrer, query };
  const sessionFilters = { os, browser, device, country };
  // Event filters match on `url`, but the incoming key is `event_url`.
  const eventFilters = { url: event_url, event_name };

  // Call order matters: each call appends to the shared `params` array.
  const pageviewQuery = getFilterQuery(column, pageviewFilters, params);
  const sessionQuery = getFilterQuery(column, sessionFilters, params);
  const eventQuery = getFilterQuery(column, eventFilters, params);

  return {
    pageviewFilters,
    sessionFilters,
    eventFilters,
    event: { event_name },
    pageviewQuery,
    sessionQuery,
    eventQuery,
  };
}
2022-08-29 05:20:54 +02:00
/**
 * Substitutes `$1`, `$2`, ... placeholders in a query with parameter values.
 *
 * String parameters are emitted as single-quoted literals with backslashes
 * and single quotes escaped; every other value is converted with `String()`.
 * Placeholders without a corresponding parameter are left untouched.
 *
 * The substitution is done in a single pass with a function replacer, so
 * `$10` is never mistaken for `$1` followed by `0`, `$`-sequences inside a
 * parameter value are inserted literally, and placeholder-looking text inside
 * one parameter is never replaced by a later parameter.
 *
 * @param {string} str - Query text containing `$n` placeholders (1-based).
 * @param {Array<*>} [params=[]] - Values for the placeholders.
 * @returns {string} The query with placeholders replaced.
 */
function formatQuery(str, params = []) {
  return str.replace(/\$(\d+)/g, (placeholder, position) => {
    const index = Number(position) - 1;

    if (index < 0 || index >= params.length) {
      return placeholder;
    }

    const param = params[index];

    if (typeof param === 'string' || param instanceof String) {
      // Escape backslash first so the backslash added for quotes is not doubled.
      const escaped = String(param).replace(/\\/g, '\\\\').replace(/'/g, "\\'");

      return `'${escaped}'`;
    }

    return String(param);
  });
}
2022-08-29 05:20:54 +02:00
/**
 * Formats a query with its parameters and runs it on the ClickHouse client.
 *
 * The formatted query is logged first when `process.env.LOG_QUERY` is set.
 *
 * @param {string} query - Query text with `$n` placeholders.
 * @param {Array<*>} [params=[]] - Values for the placeholders.
 * @returns {Promise<*>} Result of `client.query(...).toPromise()`.
 */
async function rawQuery(query, params = []) {
  const formattedQuery = formatQuery(query, params);

  if (process.env.LOG_QUERY) {
    log(formattedQuery);
  }

  // connect() returns the module-level client, creating it on first use.
  const client = await connect();

  return client.query(formattedQuery).toPromise();
}
2022-08-26 07:43:22 +02:00
/**
 * Returns the single record of a result set.
 *
 * @param {Array<*>} data - Result rows.
 * @returns {Promise<*>} The first row, or `null` when it is missing or nullish.
 * @throws {Error} When `data` contains more than one row.
 */
async function findUnique(data) {
  if (data.length > 1) {
    // Throw a real Error (not a bare string) so callers get a stack trace.
    throw new Error(`${data.length} records found when expecting 1.`);
  }

  return data[0] ?? null;
}
2022-08-26 07:20:30 +02:00
2022-08-26 07:43:22 +02:00
/**
 * Returns the first record of a result set.
 *
 * @param {Array<*>} data - Result rows.
 * @returns {Promise<*>} The first row, or `null` when it is missing or nullish.
 */
async function findFirst(data) {
  const [first] = data;

  return first ?? null;
}
2022-08-26 07:43:22 +02:00
2022-10-07 00:00:16 +02:00
/**
 * Returns the module-level ClickHouse client, initialising it on first use.
 *
 * When no client is set yet, it is taken from `global[CLICKHOUSE]` if present
 * or created with getClient(), but only when `CLICKHOUSE_URL` is set;
 * otherwise the falsy `CLICKHOUSE_URL` value itself is stored and returned.
 *
 * @returns {Promise<*>} The client, or a falsy value when `CLICKHOUSE_URL` is unset.
 */
async function connect() {
  if (clickhouse) {
    return clickhouse;
  }

  clickhouse = process.env.CLICKHOUSE_URL && (global[CLICKHOUSE] || getClient());

  return clickhouse;
}
2022-08-28 06:38:35 +02:00
2022-08-26 07:43:22 +02:00
/**
 * Public API of the ClickHouse helper module.
 */
export default {
  enabled,
  // `clickhouse` is only assigned inside connect(), so a plain
  // `client: clickhouse` property would capture `undefined` at module load.
  // A getter always reflects the current client.
  get client() {
    return clickhouse;
  },
  log,
  connect,
  getDateStringQuery,
  getDateQuery,
  getDateFormat,
  getCommaSeparatedStringFormat,
  getBetweenDates,
  getEventDataColumnsQuery,
  getEventDataFilterQuery,
  getFilterQuery,
  parseFilters,
  findUnique,
  findFirst,
  rawQuery,
};