import clickhouse from '@/lib/clickhouse';
import { EVENT_COLUMNS, EVENT_TYPE, FILTER_COLUMNS, SESSION_COLUMNS } from '@/lib/constants';
import { CLICKHOUSE, PRISMA, runQuery } from '@/lib/db';
import prisma from '@/lib/prisma';
import { QueryFilters } from '@/lib/types';

/** Options selecting which metric to aggregate and how to page the result. */
export interface PageviewMetricsParameters {
  /** Metric name; mapped through `FILTER_COLUMNS` to a column when a mapping exists. */
  type: string;
  /** Maximum number of rows to return (defaults to 500). */
  limit?: number | string;
  /** Number of rows to skip (defaults to 0). */
  offset?: number | string;
}

/** One aggregated row: `x` is the grouped value, `y` the distinct session count. */
export interface PageviewMetricsData {
  x: string;
  y: number;
}

/**
 * Coerces a paging value to a non-negative safe integer so that it can be
 * interpolated into raw SQL without carrying arbitrary text along.
 *
 * @param value - Caller-supplied limit/offset (may arrive as a string).
 * @param fallback - Value used when `value` is missing, empty, or not a
 *   non-negative safe integer.
 * @returns The validated integer, or `fallback`.
 */
function toPagingInteger(value: number | string | undefined, fallback: number): number {
  let parsed: unknown = value;

  if (typeof value === 'string') {
    const trimmed = value.trim();

    // Number('') is 0, which would silently turn an empty limit into "limit 0".
    parsed = trimmed === '' ? undefined : Number(trimmed);
  }

  return typeof parsed === 'number' && Number.isSafeInteger(parsed) && parsed >= 0
    ? parsed
    : fallback;
}

/**
 * Returns distinct-session counts grouped by the requested metric column.
 *
 * The call is handed to `runQuery` with one handler keyed by `PRISMA` and one
 * keyed by `CLICKHOUSE`; both handlers receive the same arguments.
 *
 * @param args - `websiteId`, the metric `parameters`, and the query `filters`.
 * @returns Whatever `runQuery` yields for the selected handler.
 */
export async function getPageviewMetrics(
  ...args: [websiteId: string, parameters: PageviewMetricsParameters, filters: QueryFilters]
) {
  return runQuery({
    [PRISMA]: () => relationalQuery(...args),
    [CLICKHOUSE]: () => clickhouseQuery(...args),
  });
}

/**
 * Builds and runs the metric query through the Prisma raw-query helper.
 *
 * @param websiteId - Website whose events are aggregated.
 * @param parameters - Metric type plus optional paging.
 * @param filters - Filters forwarded to `parseFilters`.
 * @returns Rows of `{ x, y }` ordered by `y` descending.
 */
async function relationalQuery(
  websiteId: string,
  parameters: PageviewMetricsParameters,
  filters: QueryFilters,
): Promise<PageviewMetricsData[]> {
  const { type } = parameters;
  // limit/offset are spliced into the SQL text, so force them to plain integers.
  const limit = toPagingInteger(parameters.limit, 500);
  const offset = toPagingInteger(parameters.offset, 0);

  // NOTE(review): when `type` has no FILTER_COLUMNS entry it is used verbatim as
  // a column expression — confirm callers validate `type` before reaching here.
  let column = FILTER_COLUMNS[type] || type;
  const { rawQuery, parseFilters } = prisma;
  const { filterQuery, joinSessionQuery, cohortQuery, queryParams } = parseFilters(
    {
      ...filters,
      websiteId,
      eventType: column === 'event_name' ? EVENT_TYPE.customEvent : EVENT_TYPE.pageView,
    },
    { joinSession: SESSION_COLUMNS.includes(type) },
  );

  let entryExitQuery = '';
  let excludeDomain = '';

  if (column === 'referrer_domain') {
    // Drop self-referrals and empty referrers.
    excludeDomain = `and website_event.referrer_domain != website_event.hostname
      and website_event.referrer_domain != ''`;
  }

  if (type === 'entry' || type === 'exit') {
    // First event per visit (asc) for entry, last event per visit (desc) for exit.
    const order = type === 'entry' ? 'asc' : 'desc';
    column = `x.${column}`;

    entryExitQuery = `
      join (
        select distinct on (visit_id)
          visit_id,
          url_path
        from website_event
        where website_event.website_id = {{websiteId::uuid}}
          and website_event.created_at between {{startDate}} and {{endDate}}
          and event_type = {{eventType}}
        order by visit_id, created_at ${order}
      ) x
      on x.visit_id = website_event.visit_id
    `;
  }

  return rawQuery(
    `
    select ${column} x,
      count(distinct website_event.session_id) as y
    from website_event
    ${cohortQuery}
    ${joinSessionQuery}
    ${entryExitQuery}
    where website_event.website_id = {{websiteId::uuid}}
      and website_event.created_at between {{startDate}} and {{endDate}}
      ${excludeDomain}
      ${filterQuery}
    group by 1
    order by 2 desc
    limit ${limit}
    offset ${offset}
    `,
    { ...queryParams, ...parameters },
  );
}

/**
 * Builds and runs the metric query through the ClickHouse raw-query helper.
 *
 * When any key of `filters` appears in `EVENT_COLUMNS` the query reads
 * `website_event`; otherwise it reads `website_event_stats_hourly`.
 *
 * @param websiteId - Website whose events are aggregated.
 * @param parameters - Metric type plus optional paging.
 * @param filters - Filters forwarded to `parseFilters`.
 * @returns Rows of `{ x, y }` ordered by `y` descending.
 */
async function clickhouseQuery(
  websiteId: string,
  parameters: PageviewMetricsParameters,
  filters: QueryFilters,
): Promise<PageviewMetricsData[]> {
  const { type } = parameters;
  // limit/offset are spliced into the SQL text, so force them to plain integers.
  const limit = toPagingInteger(parameters.limit, 500);
  const offset = toPagingInteger(parameters.offset, 0);

  // NOTE(review): when `type` has no FILTER_COLUMNS entry it is used verbatim as
  // a column expression — confirm callers validate `type` before reaching here.
  let column = FILTER_COLUMNS[type] || type;
  const { rawQuery, parseFilters } = clickhouse;
  const { filterQuery, cohortQuery, queryParams } = parseFilters({
    ...filters,
    websiteId,
    eventType: column === 'event_name' ? EVENT_TYPE.customEvent : EVENT_TYPE.pageView,
  });

  let sql = '';
  let excludeDomain = '';

  if (EVENT_COLUMNS.some(item => Object.keys(filters).includes(item))) {
    let entryExitQuery = '';

    if (column === 'referrer_domain') {
      // Drop self-referrals and empty referrers.
      excludeDomain = `and referrer_domain != hostname and referrer_domain != ''`;
    }

    if (type === 'entry' || type === 'exit') {
      // url_path at the earliest created_at (entry) or latest created_at (exit) per visit.
      const aggregate = type === 'entry' ? 'argMin' : 'argMax';
      column = `x.${column}`;

      entryExitQuery = `
      JOIN (select visit_id,
          ${aggregate}(url_path, created_at) url_path
        from website_event
        where website_id = {websiteId:UUID}
          and created_at between {startDate:DateTime64} and {endDate:DateTime64}
          and event_type = {eventType:UInt32}
        group by visit_id) x
      ON x.visit_id = website_event.visit_id`;
    }

    sql = `
    select ${column} x,
      uniq(website_event.session_id) as y
    from website_event
    ${cohortQuery}
    ${entryExitQuery}
    where website_id = {websiteId:UUID}
      and created_at between {startDate:DateTime64} and {endDate:DateTime64}
      ${excludeDomain}
      ${filterQuery}
    group by x
    order by y desc
    limit ${limit}
    offset ${offset}
    `;
  } else {
    let groupByQuery = '';
    let columnQuery = `arrayJoin(${column})`;

    if (column === 'referrer_domain') {
      // `t` is the alias given to the selected column in the inner query below.
      excludeDomain = `and t != ''`;
    }

    if (type === 'entry') {
      columnQuery = `argMinMerge(entry_url)`;
    }

    if (type === 'exit') {
      columnQuery = `argMaxMerge(exit_url)`;
    }

    if (type === 'entry' || type === 'exit') {
      // The merge aggregates above need a per-session grouping.
      groupByQuery = 'group by s';
    }

    sql = `
    select g.t as x,
      uniq(s) as y
    from (
      select session_id s,
        ${columnQuery} as t
      from website_event_stats_hourly as website_event
      ${cohortQuery}
      where website_id = {websiteId:UUID}
        and created_at between {startDate:DateTime64} and {endDate:DateTime64}
        ${excludeDomain}
        ${filterQuery}
      ${groupByQuery}) as g
    group by x
    order by y desc
    limit ${limit}
    offset ${offset}
    `;
  }

  return rawQuery(sql, { ...queryParams, ...parameters });
}