Merge pull request #2149 from umami-software/bug/um-362-relational-funnels-query

Bug/um 362 relational funnels query
This commit is contained in:
Mike Cao 2023-07-28 18:20:26 -07:00 committed by GitHub
commit 200e9b8bfa
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
5 changed files with 132 additions and 118 deletions

View file

@ -161,6 +161,7 @@ export const labels = defineMessages({
overview: { id: 'labels.overview', defaultMessage: 'Overview' }, overview: { id: 'labels.overview', defaultMessage: 'Overview' },
totalRecords: { id: 'labels.total-records', defaultMessage: 'Total records' }, totalRecords: { id: 'labels.total-records', defaultMessage: 'Total records' },
insights: { id: 'label.insights', defaultMessage: 'Insights' }, insights: { id: 'label.insights', defaultMessage: 'Insights' },
dropoff: { id: 'label.dropoff', defaultMessage: 'Dropoff' },
}); });
export const messages = defineMessages({ export const messages = defineMessages({

View file

@ -6,13 +6,12 @@ import { ReportContext } from '../Report';
export function FunnelTable() { export function FunnelTable() {
const { report } = useContext(ReportContext); const { report } = useContext(ReportContext);
const { formatMessage, labels } = useMessages(); const { formatMessage, labels } = useMessages();
return ( return (
<DataTable <DataTable
data={report?.data} data={report?.data}
title={formatMessage(labels.url)} title={formatMessage(labels.url)}
metric={formatMessage(labels.visitors)} metric={formatMessage(labels.visitors)}
showPercentage={false} showPercentage={true}
/> />
); );
} }

View file

@ -77,29 +77,6 @@ function getFilterQuery(filters = {}, params = {}) {
return query.join('\n'); return query.join('\n');
} }
/**
 * Builds the ClickHouse query fragments and named parameters for a URL funnel.
 *
 * For the URL at index `i` the result contains:
 * - `columnsQuery`: a `,url_path = {url<i>:String}` line; for every step after
 *   the first, an additional `AND referrer_path = {url<i-1>:String}` condition
 *   is appended when the previous URL is non-empty.
 * - `conditionQuery`: the comma-separated list of `{url<i>:String}` placeholders.
 * - `urlParams`: the `url<i>` -> URL lookup for those placeholders.
 *
 * @param urls Funnel steps in order.
 * @returns The two SQL fragments and the placeholder values.
 */
function getFunnelQuery(urls: string[]): {
  columnsQuery: string;
  conditionQuery: string;
  urlParams: { [key: string]: string };
} {
  let columnsQuery = '';
  let conditionQuery = '';
  const urlParams: { [key: string]: string } = {};

  urls.forEach((url, index) => {
    const previous = index - 1;

    let column = `\n,url_path = {url${index}:String}`;
    // Only chain to the previous step when there is one and it is non-empty.
    if (index > 0 && urls[previous]) {
      column += ` AND referrer_path = {url${previous}:String}`;
    }
    columnsQuery += column;

    const separator = index > 0 ? ',' : '';
    conditionQuery += `${separator} {url${index}:String}`;

    urlParams[`url${index}`] = url;
  });

  return { columnsQuery, conditionQuery, urlParams };
}
function parseFilters(filters: WebsiteMetricFilter = {}, params: any = {}) { function parseFilters(filters: WebsiteMetricFilter = {}, params: any = {}) {
return { return {
filterQuery: getFilterQuery(filters, params), filterQuery: getFilterQuery(filters, params),
@ -146,7 +123,6 @@ export default {
getDateQuery, getDateQuery,
getDateFormat, getDateFormat,
getFilterQuery, getFilterQuery,
getFunnelQuery,
parseFilters, parseFilters,
findUnique, findUnique,
findFirst, findFirst,

View file

@ -19,8 +19,8 @@ const POSTGRESQL_DATE_FORMATS = {
year: 'YYYY-01-01', year: 'YYYY-01-01',
}; };
function getAddMinutesQuery(field: string, minutes: number) { function getAddMinutesQuery(field: string, minutes: number): string {
const db = getDatabaseType(); const db = getDatabaseType(process.env.DATABASE_URL);
if (db === POSTGRESQL) { if (db === POSTGRESQL) {
return `${field} + interval '${minutes} minute'`; return `${field} + interval '${minutes} minute'`;
@ -80,53 +80,6 @@ function getFilterQuery(filters = {}, params = []): string {
return query.join('\n'); return query.join('\n');
} }
/**
 * Assembles the SQL fragments for a relational funnel query that uses
 * positional (`$n`) parameters.
 *
 * For the URL at index `i` (level `i + 1`):
 * - `levelQuery` gains, for every level from 2 upwards, a `level<n>` CTE that
 *   left-joins the previous level to `website_event` on the session, limited to
 *   events inside the time window computed by `getAddMinutesQuery`.
 * - `sumQuery` gains a `SUM(CASE ...) AS level<n>` column.
 * - `urlFilterQuery` gains the `$n` placeholder for that URL.
 *
 * @param urls Funnel steps in order; only their positions are used here.
 * @param windowMinutes Window length forwarded to `getAddMinutesQuery`.
 * @returns The three SQL fragments.
 */
function getFunnelQuery(
  urls: string[],
  windowMinutes: number,
): {
  levelQuery: string;
  sumQuery: string;
  urlFilterQuery: string;
} {
  // The generated SQL uses $1 for website_id and $2/$3 for the date range,
  // so the URL placeholders start at $4.
  const initParamLength = 3;

  let levelQuery = '';
  let sumQuery = '';
  let urlFilterQuery = '';

  urls.forEach((_url, index) => {
    const level = index + 1;
    const separator = index === 0 ? '' : ',';
    const urlParam = level + initParamLength;

    // The first level has no predecessor to join against.
    if (index >= 1) {
      const referrerParam = index + initParamLength;
      const windowEnd = getAddMinutesQuery(`cl.level_${index}_created_at`, windowMinutes);

      levelQuery += `\n
, level${level} AS (
select cl.*,
l0.created_at level_${level}_created_at,
l0.url_path as level_${level}_url
from level${index} cl
left join website_event l0
on cl.session_id = l0.session_id
and l0.created_at between cl.level_${index}_created_at
and ${windowEnd}
and l0.referrer_path = $${referrerParam}
and l0.url_path = $${urlParam}
and created_at between $2 and $3
and website_id = $1
)`;
    }

    sumQuery += `\n${separator}SUM(CASE WHEN level_${level}_url is not null THEN 1 ELSE 0 END) AS level${level}`;
    urlFilterQuery += `\n${separator}$${urlParam} `;
  });

  return { levelQuery, sumQuery, urlFilterQuery };
}
function parseFilters( function parseFilters(
filters: { [key: string]: any } = {}, filters: { [key: string]: any } = {},
params = [], params = [],
@ -150,10 +103,8 @@ async function rawQuery(sql: string, data: object): Promise<any> {
if (db !== POSTGRESQL && db !== MYSQL) { if (db !== POSTGRESQL && db !== MYSQL) {
return Promise.reject(new Error('Unknown database.')); return Promise.reject(new Error('Unknown database.'));
} }
const query = sql?.replaceAll(/\{\{\s*(\w+)(::\w+)?\s*}}/g, (...args) => { const query = sql?.replaceAll(/\{\{\s*(\w+)(::\w+)?\s*}}/g, (...args) => {
const [, name, type] = args; const [, name, type] = args;
params.push(data[name]); params.push(data[name]);
return db === MYSQL ? '?' : `$${params.length}${type ?? ''}`; return db === MYSQL ? '?' : `$${params.length}${type ?? ''}`;
@ -168,7 +119,6 @@ export default {
getDateQuery, getDateQuery,
getTimestampIntervalQuery, getTimestampIntervalQuery,
getFilterQuery, getFilterQuery,
getFunnelQuery,
parseFilters, parseFilters,
rawQuery, rawQuery,
}; };

View file

@ -31,31 +31,74 @@ async function relationalQuery(
{ {
x: string; x: string;
y: number; y: number;
z: number;
}[] }[]
> { > {
const { windowMinutes, startDate, endDate, urls } = criteria; const { windowMinutes, startDate, endDate, urls } = criteria;
const { rawQuery, getFunnelQuery } = prisma; const { rawQuery, getAddMinutesQuery } = prisma;
const { levelQuery, sumQuery, urlFilterQuery } = getFunnelQuery(urls, windowMinutes); const { levelQuery, sumQuery } = getFunnelQuery(urls, windowMinutes);
/**
 * Builds the per-level CTEs and the per-level count selects for the
 * relational funnel query.
 *
 * For the URL at index `i` (level `i + 1`):
 * - `levelQuery` gains, for every level from 2 upwards, a `level<n>` CTE that
 *   joins the previous level to `website_event` on the session and keeps
 *   events whose referrer is the previous URL (`{{i-1}}`), whose path is the
 *   current URL (`{{i}}`), and that fall inside the time window computed by
 *   `getAddMinutesQuery`.
 * - `sumQuery` gains a select counting distinct sessions in that level; the
 *   selects after the first are prefixed with `union `.
 *
 * @param urls Funnel steps in order; placeholders are keyed by URL index.
 * @param windowMinutes Window length forwarded to `getAddMinutesQuery`.
 * @returns The CTE fragment and the count fragment.
 */
function getFunnelQuery(
  urls: string[],
  windowMinutes: number,
): {
  levelQuery: string;
  sumQuery: string;
} {
  let levelQuery = '';
  let sumQuery = '';

  urls.forEach((_url, index) => {
    const level = index + 1;

    // The first level is defined by the caller's base query, not here.
    if (index >= 1) {
      const windowEnd = getAddMinutesQuery(`l.created_at `, windowMinutes);

      levelQuery += `
, level${level} AS (
select distinct we.session_id, we.created_at
from level${index} l
join website_event we
on l.session_id = we.session_id
where we.created_at between l.created_at
and ${windowEnd}
and we.referrer_path = {{${index - 1}}}
and we.url_path = {{${index}}}
and we.created_at <= {{endDate}}
and we.website_id = {{websiteId::uuid}}
)`;
    }

    const unionPrefix = index === 0 ? '' : 'union ';
    sumQuery += `\n${unionPrefix}select ${level} as level, count(distinct(session_id)) as count from level${level}`;
  });

  return { levelQuery, sumQuery };
}
return rawQuery( return rawQuery(
`WITH level0 AS ( `WITH level1 AS (
select distinct session_id, url_path, referrer_path, created_at select distinct session_id, created_at
from website_event from website_event
where url_path in (${urlFilterQuery}) where website_id = {{websiteId::uuid}}
and website_id = {{websiteId::uuid}} and created_at between {{startDate}} and {{endDate}}
and created_at between {{startDate}} and {{endDate}} and url_path = {{0}})
),level1 AS ( ${levelQuery}
select distinct session_id, url_path as level_1_url, created_at as level_1_created_at ${sumQuery}
from level0 ORDER BY level;`,
where url_path = $4 {
)${levelQuery} websiteId,
startDate,
SELECT ${sumQuery} endDate,
from level${urls.length}; ...urls,
`, },
{ websiteId, startDate, endDate, ...urls }, ).then(results => {
).then((a: { [key: string]: number }) => { return urls.map((a, i) => ({
return urls.map((b, i) => ({ x: b, y: a[0][`level${i + 1}`] || 0 })); x: a,
y: results[i]?.count || 0,
z: (1 - (Number(results[i]?.count) * 1.0) / Number(results[i - 1]?.count)) * 100 || 0, // drop off
}));
}); });
} }
@ -71,42 +114,87 @@ async function clickhouseQuery(
{ {
x: string; x: string;
y: number; y: number;
z: number;
}[] }[]
> { > {
const { windowMinutes, startDate, endDate, urls } = criteria; const { windowMinutes, startDate, endDate, urls } = criteria;
const { rawQuery, getFunnelQuery } = clickhouse; const { rawQuery } = clickhouse;
const { columnsQuery, urlParams } = getFunnelQuery(urls); const { levelQuery, sumQuery, urlFilterQuery, urlParams } = getFunnelQuery(urls, windowMinutes);
/**
 * Builds the ClickHouse CTEs, count selects, URL filter list and named
 * parameters for a URL funnel.
 *
 * For the URL at index `i` (level `i + 1`):
 * - `levelQuery` gains, for every level from 2 upwards, a `level<n>` CTE that
 *   joins the previous level to `level0` on the session and keeps rows whose
 *   referrer is `{url<i-1>:String}`, whose path is `{url<i>:String}`, and whose
 *   timestamp lies within `windowMinutes` minutes of the previous level's.
 * - `sumQuery` gains a select counting distinct sessions in that level; the
 *   selects after the first are prefixed with `union all `.
 * - `urlFilterQuery` gains the `{url<i>:String}` placeholder.
 * - `urlParams` maps `url<i>` to the URL itself.
 *
 * NOTE(review): `windowMinutes` is interpolated directly into the SQL text
 * rather than bound as a parameter — confirm callers validate it as a number.
 *
 * @param urls Funnel steps in order.
 * @param windowMinutes Maximum gap, in minutes, between consecutive steps.
 * @returns The SQL fragments and the placeholder values.
 */
function getFunnelQuery(
  urls: string[],
  windowMinutes: number,
): {
  levelQuery: string;
  sumQuery: string;
  urlFilterQuery: string;
  urlParams: { [key: string]: string };
} {
  let levelQuery = '';
  let sumQuery = '';
  let urlFilterQuery = '';
  const urlParams: { [key: string]: string } = {};

  urls.forEach((url, index) => {
    const level = index + 1;
    const isFirst = index === 0;

    // level1 is defined by the caller's base query, so CTEs start at level2.
    if (!isFirst) {
      levelQuery += `\n
, level${level} AS (
select distinct y.session_id as session_id,
y.url_path as url_path,
y.referrer_path as referrer_path,
y.created_at as created_at
from level${index} x
join level0 y
on x.session_id = y.session_id
where y.created_at between x.created_at and x.created_at + interval ${windowMinutes} minute
and y.referrer_path = {url${index - 1}:String}
and y.url_path = {url${index}:String}
)`;
    }

    const unionPrefix = isFirst ? '' : 'union all ';
    sumQuery += `\n${unionPrefix}select ${level} as level, count(distinct(session_id)) as count from level${level}`;

    const listSeparator = isFirst ? '' : ', ';
    urlFilterQuery += `${listSeparator}{url${index}:String} `;

    urlParams[`url${index}`] = url;
  });

  return { levelQuery, sumQuery, urlFilterQuery, urlParams };
}
return rawQuery<{ level: number; count: number }[]>( return rawQuery<{ level: number; count: number }[]>(
` `
SELECT level, WITH level0 AS (
count(*) AS count select distinct session_id, url_path, referrer_path, created_at
FROM ( from umami.website_event
SELECT session_id, where url_path in (${urlFilterQuery})
windowFunnel({window:UInt32}, 'strict_increase') and website_id = {websiteId:UUID}
( and created_at between {startDate:DateTime64} and {endDate:DateTime64}
created_at ), level1 AS (
${columnsQuery} select *
) AS level from level0
FROM website_event where url_path = {url0:String})
WHERE website_id = {websiteId:UUID} ${levelQuery}
AND created_at BETWEEN {startDate:DateTime} AND {endDate:DateTime} select *
GROUP BY 1 from (
) ${sumQuery}
GROUP BY level ) ORDER BY level;`,
ORDER BY level ASC;
`,
{ {
websiteId, websiteId,
startDate, startDate,
endDate, endDate,
window: windowMinutes * 60,
...urlParams, ...urlParams,
}, },
).then(results => { ).then(results => {
return urls.map((a, i) => ({ return urls.map((a, i) => ({
x: a, x: a,
y: results[i + 1]?.count || 0, y: results[i]?.count || 0,
z: (1 - (Number(results[i]?.count) * 1.0) / Number(results[i - 1]?.count)) * 100 || 0, // drop off
})); }));
}); });
} }