import clickhouse from '@/lib/clickhouse';
import { EVENT_COLUMNS, EVENT_TYPE, FILTER_COLUMNS, SESSION_COLUMNS } from '@/lib/constants';
import { CLICKHOUSE, PRISMA, runQuery } from '@/lib/db';
import prisma from '@/lib/prisma';
import { QueryFilters } from '@/lib/types';

/** Row limit applied when the caller supplies none (or an unusable one). */
const DEFAULT_LIMIT = 500;

/** Row offset applied when the caller supplies none (or an unusable one). */
const DEFAULT_OFFSET = 0;

/** Options selecting which metric to aggregate and how to page the result. */
export interface PageviewMetricsParameters {
  /**
   * Metric key. It is looked up in `FILTER_COLUMNS` to obtain the column to
   * group by; when there is no mapping the key itself is used as the column.
   * The values `'entry'` and `'exit'` additionally restrict the result to the
   * first / last event of each visit.
   */
  type: string;
  /** Maximum number of rows to return; defaults to 500. */
  limit?: number | string;
  /** Number of rows to skip; defaults to 0. */
  offset?: number | string;
}

/** One aggregated row: `x` is the grouped value, `y` is its count. */
export interface PageviewMetricsData {
  x: string;
  y: number;
}

/**
 * Returns per-value counts for the requested metric of a website.
 *
 * Both a relational (Prisma) and a ClickHouse implementation are handed to
 * `runQuery`, keyed by `PRISMA` and `CLICKHOUSE`; `runQuery` decides which one
 * runs (presumably based on the configured database — confirm in `@/lib/db`).
 *
 * @param args - `websiteId`, the metric `parameters`, and the query `filters`,
 *   forwarded unchanged to the selected implementation.
 * @returns Whatever `runQuery` resolves to for the selected implementation.
 */
export async function getPageviewMetrics(
  ...args: [websiteId: string, parameters: PageviewMetricsParameters, filters: QueryFilters]
) {
  return runQuery({
    [PRISMA]: () => relationalQuery(...args),
    [CLICKHOUSE]: () => clickhouseQuery(...args),
  });
}

/**
 * Coerces a caller-supplied paging value to a non-negative safe integer.
 *
 * `limit` / `offset` are spliced into the SQL text rather than bound as
 * parameters, so anything that is not a plain non-negative integer is replaced
 * by `fallback` instead of reaching the database.
 */
function toPagingInt(value: number | string | undefined, fallback: number): number {
  if (value == null || String(value).trim() === '') {
    return fallback;
  }

  const parsed = Number(value);

  return Number.isSafeInteger(parsed) && parsed >= 0 ? parsed : fallback;
}

/**
 * Relational (Prisma raw SQL) implementation of the pageview metrics query.
 *
 * @param websiteId - Website whose events are aggregated.
 * @param parameters - Metric type plus optional paging.
 * @param filters - Query filters passed through `prisma.parseFilters`.
 * @returns Rows of `{ x, y }` ordered by `y` descending.
 */
async function relationalQuery(
  websiteId: string,
  parameters: PageviewMetricsParameters,
  filters: QueryFilters,
): Promise<PageviewMetricsData[]> {
  const { type } = parameters;
  const limit = toPagingInt(parameters.limit, DEFAULT_LIMIT);
  const offset = toPagingInt(parameters.offset, DEFAULT_OFFSET);
  // NOTE(review): `column` is interpolated into the SQL text below; this assumes
  // `type` has been validated against an allow-list upstream — TODO confirm.
  const column = FILTER_COLUMNS[type] || type;
  const { rawQuery, parseFilters } = prisma;
  const { filterQuery, joinSessionQuery, cohortQuery, queryParams } = parseFilters(
    {
      ...filters,
      websiteId,
      // Event names only exist on custom events; everything else counts page views.
      eventType: column === 'event_name' ? EVENT_TYPE.customEvent : EVENT_TYPE.pageView,
    },
    {
      joinSession: SESSION_COLUMNS.includes(type) || column === 'referrer_domain',
    },
  );

  let entryExitQuery = '';
  let excludeDomain = '';

  if (column === 'referrer_domain') {
    // Drop self-referrals (referrer equals the site's own hostname) and empty referrers.
    excludeDomain = `
      and website_event.referrer_domain != website_event.hostname
      and website_event.referrer_domain != ''`;
  }

  if (type === 'entry' || type === 'exit') {
    // Entry = earliest event of a visit, exit = latest event of a visit.
    const aggregate = type === 'entry' ? 'min' : 'max';

    // Joining on the per-visit min/max timestamp keeps only that one event per visit.
    entryExitQuery = `
      join (
        select visit_id,
          ${aggregate}(created_at) target_created_at
        from website_event
        where website_event.website_id = {{websiteId::uuid}}
          and website_event.created_at between {{startDate}} and {{endDate}}
          and event_type = {{eventType}}
        group by visit_id
      ) x
      on x.visit_id = website_event.visit_id
        and x.target_created_at = website_event.created_at
    `;
  }

  // Referrer domains are counted once per session; every other metric counts rows.
  const countExpression =
    column === 'referrer_domain' ? 'count(distinct website_event.session_id)' : 'count(*)';

  return rawQuery(
    `
    select ${column} x,
      ${countExpression} as y
    from website_event
    ${joinSessionQuery}
    ${cohortQuery}
    ${entryExitQuery}
    where website_event.website_id = {{websiteId::uuid}}
      and website_event.created_at between {{startDate}} and {{endDate}}
      and event_type = {{eventType}}
      ${excludeDomain}
      ${filterQuery}
    group by 1
    order by 2 desc
    limit ${limit}
    offset ${offset}
    `,
    queryParams,
  );
}

/**
 * ClickHouse implementation of the pageview metrics query.
 *
 * When any key of `filters` is listed in `EVENT_COLUMNS` the raw
 * `website_event` table is queried; otherwise the query runs against
 * `website_event_stats_hourly` (presumably a pre-aggregated rollup, given the
 * `arrayJoin` / `-Merge` combinators it requires — confirm against the schema).
 *
 * @param websiteId - Website whose events are aggregated.
 * @param parameters - Metric type plus optional paging.
 * @param filters - Query filters passed through `clickhouse.parseFilters`.
 * @returns Rows of `{ x, y }` ordered by `y` descending.
 */
async function clickhouseQuery(
  websiteId: string,
  parameters: PageviewMetricsParameters,
  filters: QueryFilters,
): Promise<PageviewMetricsData[]> {
  const { type } = parameters;
  const limit = toPagingInt(parameters.limit, DEFAULT_LIMIT);
  const offset = toPagingInt(parameters.offset, DEFAULT_OFFSET);
  // NOTE(review): `column` is interpolated into the SQL text below; this assumes
  // `type` has been validated against an allow-list upstream — TODO confirm.
  const column = FILTER_COLUMNS[type] || type;
  const { rawQuery, parseFilters } = clickhouse;
  const { filterQuery, cohortQuery, queryParams } = parseFilters({
    ...filters,
    websiteId,
    // Event names only exist on custom events; everything else counts page views.
    eventType: column === 'event_name' ? EVENT_TYPE.customEvent : EVENT_TYPE.pageView,
  });

  // Computed once instead of once per EVENT_COLUMNS entry.
  const filterKeys = Object.keys(filters);
  const usesEventColumns = EVENT_COLUMNS.some(item => filterKeys.includes(item));

  let sql = '';
  let excludeDomain = '';

  if (usesEventColumns) {
    let entryExitQuery = '';

    if (column === 'referrer_domain') {
      // Drop self-referrals and empty referrers.
      excludeDomain = `and referrer_domain != hostname and referrer_domain != ''`;
    }

    if (type === 'entry' || type === 'exit') {
      // Entry = earliest event of a visit, exit = latest event of a visit.
      const aggregate = type === 'entry' ? 'min' : 'max';

      // Joining on the per-visit min/max timestamp keeps only that one event per visit.
      entryExitQuery = `
        JOIN (select visit_id,
            ${aggregate}(created_at) target_created_at
          from website_event
          where website_id = {websiteId:UUID}
            and created_at between {startDate:DateTime64} and {endDate:DateTime64}
            and event_type = {eventType:UInt32}
          group by visit_id) x
        ON x.visit_id = website_event.visit_id
          and x.target_created_at = website_event.created_at`;
    }

    // NOTE(review): unlike the rollup branch below, this statement does not
    // include `cohortQuery`; confirm whether cohort filters are meant to be
    // ignored when event-column filters are present.
    sql = `
      select ${column} x,
        ${column === 'referrer_domain' ? 'uniq(session_id)' : 'count(*)'} as y
      from website_event
      ${entryExitQuery}
      where website_id = {websiteId:UUID}
        and created_at between {startDate:DateTime64} and {endDate:DateTime64}
        and event_type = {eventType:UInt32}
        ${excludeDomain}
        ${filterQuery}
      group by x
      order by y desc
      limit ${limit}
      offset ${offset}
    `;
  } else {
    let groupByQuery = '';
    // The selected expression is aliased to `t` inside the subquery below.
    let columnQuery = `arrayJoin(${column})`;

    if (column === 'referrer_domain') {
      // `t` is the alias given to the expanded referrer domain in the subquery.
      excludeDomain = `and t != hostname and t != ''`;
      // Carry the session id out as `s` so the outer query can count distinct sessions.
      columnQuery = `session_id s, arrayJoin(${column})`;
    }

    if (type === 'entry') {
      columnQuery = `visit_id x, argMinMerge(entry_url)`;
    }

    if (type === 'exit') {
      columnQuery = `visit_id x, argMaxMerge(exit_url)`;
    }

    if (type === 'entry' || type === 'exit') {
      // The -Merge combinators are aggregates, so the subquery groups by visit (`x`).
      groupByQuery = 'group by x';
    }

    sql = `
      select g.t as x,
        ${column === 'referrer_domain' ? 'uniq(s)' : 'count(*)'} as y
      from (
        select ${columnQuery} as t
        from website_event_stats_hourly as website_event
        ${cohortQuery}
        where website_id = {websiteId:UUID}
          and created_at between {startDate:DateTime64} and {endDate:DateTime64}
          and event_type = {eventType:UInt32}
          ${excludeDomain}
          ${filterQuery}
        ${groupByQuery}) as g
      group by x
      order by y desc
      limit ${limit}
      offset ${offset}
    `;
  }

  return rawQuery(sql, queryParams);
}