update funnels relational query

This commit is contained in:
Francis Cao 2023-07-20 21:13:29 -07:00
parent 25feee662b
commit 94967d45e1
2 changed files with 46 additions and 31 deletions

View file

@ -44,6 +44,18 @@ function getAddMinutesQuery(field: string, minutes: number) {
} }
} }
function getDropoffQuery() {
const db = getDatabaseType(process.env.DATABASE_URL);
if (db === POSTGRESQL) {
return `round((1.0 - count::numeric/lag(count, 1) over ()),2)`;
}
if (db === MYSQL) {
return `round((1.0 - count/LAG(count, 1) OVER (ORDER BY level)),2)`;
}
}
function getDateQuery(field: string, unit: string, timezone?: string): string { function getDateQuery(field: string, unit: string, timezone?: string): string {
const db = getDatabaseType(process.env.DATABASE_URL); const db = getDatabaseType(process.env.DATABASE_URL);
@ -147,29 +159,27 @@ function getFunnelQuery(
return urls.reduce( return urls.reduce(
(pv, cv, i) => { (pv, cv, i) => {
const levelNumber = i + 1; const levelNumber = i + 1;
const start = i > 0 ? ',' : ''; const startSum = i > 0 ? 'union ' : '';
const startFilter = i > 0 ? ', ' : '';
if (levelNumber >= 2) { if (levelNumber >= 2) {
pv.levelQuery += `\n pv.levelQuery += `\n
, level${levelNumber} AS ( , level${levelNumber} AS (
select cl.*, select distinct l.session_id, we.created_at
l0.created_at level_${levelNumber}_created_at, from level${i} l
l0.url_path as level_${levelNumber}_url join website_event we
from level${i} cl on l.session_id = we.session_id
left join website_event l0 where we.created_at between l.created_at
on cl.session_id = l0.session_id and ${getAddMinutesQuery(`l.created_at `, windowMinutes)}
and l0.created_at between cl.level_${i}_created_at and we.referrer_path = $${i + initParamLength}
and ${getAddMinutesQuery(`cl.level_${i}_created_at`, windowMinutes)} and we.url_path = $${levelNumber + initParamLength}
and l0.referrer_path = $${i + initParamLength} and we.website_id = $1${toUuid()}
and l0.url_path = $${levelNumber + initParamLength}
and created_at between $2 and $3
and website_id = $1${toUuid()}
)`; )`;
} }
pv.sumQuery += `\n${start}SUM(CASE WHEN level_${levelNumber}_url is not null THEN 1 ELSE 0 END) AS level${levelNumber}`; pv.sumQuery += `\n${startSum}select ${levelNumber} as level, count(distinct(session_id)) as count from level${levelNumber}`;
pv.urlFilterQuery += `\n${start}$${levelNumber + initParamLength} `; pv.urlFilterQuery += `${startFilter}$${levelNumber + initParamLength} `;
return pv; return pv;
}, },
@ -212,6 +222,7 @@ async function rawQuery(query: string, params: never[] = []): Promise<any> {
export default { export default {
...prisma, ...prisma,
getAddMinutesQuery, getAddMinutesQuery,
getDropoffQuery,
getDateQuery, getDateQuery,
getTimestampInterval, getTimestampInterval,
getFilterQuery, getFilterQuery,

View file

@ -34,7 +34,7 @@ async function relationalQuery(
}[] }[]
> { > {
const { windowMinutes, startDate, endDate, urls } = criteria; const { windowMinutes, startDate, endDate, urls } = criteria;
const { rawQuery, getFunnelQuery, toUuid } = prisma; const { rawQuery, getFunnelQuery, toUuid, getDropoffQuery } = prisma;
const { levelQuery, sumQuery, urlFilterQuery } = getFunnelQuery(urls, windowMinutes); const { levelQuery, sumQuery, urlFilterQuery } = getFunnelQuery(urls, windowMinutes);
const params: any = [websiteId, startDate, endDate, ...urls]; const params: any = [websiteId, startDate, endDate, ...urls];
@ -47,14 +47,18 @@ async function relationalQuery(
and website_id = $1${toUuid()} and website_id = $1${toUuid()}
and created_at between $2 and $3 and created_at between $2 and $3
),level1 AS ( ),level1 AS (
select distinct session_id, url_path as level_1_url, created_at as level_1_created_at select distinct session_id, created_at
from level0 from level0
where url_path = $4 where url_path = $4
)${levelQuery} )${levelQuery}, levelCount as (
${sumQuery}
SELECT ${sumQuery} order by level)
from level${urls.length}; select
`, level,
count,
${getDropoffQuery()} as drop_off
from levelCount;
`,
params, params,
).then((a: { [key: string]: number }) => { ).then((a: { [key: string]: number }) => {
return urls.map((b, i) => ({ x: b, y: a[0][`level${i + 1}`] || 0 })); return urls.map((b, i) => ({ x: b, y: a[0][`level${i + 1}`] || 0 }));
@ -77,7 +81,7 @@ async function clickhouseQuery(
> { > {
const { windowMinutes, startDate, endDate, urls } = criteria; const { windowMinutes, startDate, endDate, urls } = criteria;
const { rawQuery, getBetweenDates, getFunnelQuery } = clickhouse; const { rawQuery, getBetweenDates, getFunnelQuery } = clickhouse;
const { columnsQuery, conditionQuery, urlParams } = getFunnelQuery(urls); const { columnsQuery, urlParams } = getFunnelQuery(urls);
const params = { const params = {
websiteId, websiteId,
@ -87,22 +91,22 @@ async function clickhouseQuery(
return rawQuery<{ level: number; count: number }[]>( return rawQuery<{ level: number; count: number }[]>(
` `
SELECT level, select level,
count(*) AS count count(*) AS count
FROM ( from (
SELECT session_id, select session_id,
windowFunnel({window:UInt32}, 'strict_increase') windowFunnel({window:UInt32}, 'strict_increase')
( (
created_at created_at
${columnsQuery} ${columnsQuery}
) AS level ) AS level
FROM website_event from website_event
WHERE website_id = {websiteId:UUID} where website_id = {websiteId:UUID}
and ${getBetweenDates('created_at', startDate, endDate)} and ${getBetweenDates('created_at', startDate, endDate)}
GROUP BY 1 group by 1
) )
GROUP BY level group by level
ORDER BY level ASC; order by level asc;
`, `,
params, params,
).then(results => { ).then(results => {