fix: importer 2..

This commit is contained in:
Carl-Gerhard Lindesvärd
2026-03-03 23:54:53 +01:00
parent 227d629dc5
commit 00f6cd6f50

View File

@@ -226,16 +226,27 @@ export async function createSessionsStartEndEvents(
"name NOT IN ('session_start', 'session_end')",
].join(' AND ');
const sessionBatchSubquery = `
(SELECT DISTINCT session_id
FROM ${TABLE_NAMES.events_imports}
WHERE ${baseWhere}
AND session_id > {lastSessionId:String}
ORDER BY session_id
LIMIT {limit:UInt32})
`;
while (true) {
const idsResult = await ch.query({
query: `
SELECT DISTINCT session_id
FROM ${TABLE_NAMES.events_imports}
WHERE ${baseWhere}
AND session_id > {lastSessionId:String}
ORDER BY session_id
LIMIT {limit:UInt32}
`,
query_params: { importId, lastSessionId, limit: SESSION_BATCH_SIZE },
format: 'JSONEachRow',
});
const idRows = (await idsResult.json()) as Array<{ session_id: string }>;
if (idRows.length === 0) {
break;
}
const maxSessionId = idRows.at(-1)!.session_id;
const sessionEventsQuery = `
SELECT
device_id,
@@ -252,13 +263,14 @@ export async function createSessionsStartEndEvents(
max(created_at) AS last_timestamp
FROM ${TABLE_NAMES.events_imports}
WHERE ${baseWhere}
AND session_id IN ${sessionBatchSubquery}
AND session_id > {lastSessionId:String}
AND session_id <= {maxSessionId:String}
GROUP BY session_id, device_id, project_id
`;
const sessionEventsResult = await ch.query({
query: sessionEventsQuery,
query_params: { importId, lastSessionId, limit: SESSION_BATCH_SIZE },
query_params: { importId, lastSessionId, maxSessionId },
format: 'JSONEachRow',
});
@@ -411,11 +423,8 @@ export async function createSessionsStartEndEvents(
await insertImportBatch(sessionEvents, importId);
}
if (sessionData.length === 0) {
break;
}
lastSessionId = sessionData.at(-1)!.session_id;
if (sessionData.length < SESSION_BATCH_SIZE) {
lastSessionId = maxSessionId;
if (idRows.length < SESSION_BATCH_SIZE) {
break;
}
}
@@ -476,15 +485,6 @@ export async function backfillSessionsToProduction(
const SESSION_BATCH_SIZE = 5000;
let lastSessionId = '';
const baseWhere = 'import_id = {importId:String} AND session_id > {lastSessionId:String}';
const sessionBatchSubquery = `
(SELECT DISTINCT session_id
FROM ${TABLE_NAMES.events_imports}
WHERE ${baseWhere}
ORDER BY session_id
LIMIT {limit:UInt32})
`;
while (true) {
const idsResult = await ch.query({
query: `
@@ -504,6 +504,8 @@ export async function backfillSessionsToProduction(
break;
}
const maxSessionId = idRows.at(-1)!.session_id;
const sessionsInsertQuery = `
INSERT INTO ${TABLE_NAMES.sessions} (
id, project_id, profile_id, device_id, created_at, ended_at,
@@ -560,13 +562,14 @@ export async function backfillSessionsToProduction(
FROM ${TABLE_NAMES.events_imports} e
WHERE
e.import_id = {importId:String}
AND e.session_id IN ${sessionBatchSubquery}
AND e.session_id > {lastSessionId:String}
AND e.session_id <= {maxSessionId:String}
GROUP BY e.session_id
`;
await ch.command({
query: sessionsInsertQuery,
query_params: { importId, lastSessionId, limit: SESSION_BATCH_SIZE },
query_params: { importId, lastSessionId, maxSessionId },
clickhouse_settings: {
wait_end_of_query: 1,
send_progress_in_http_headers: 1,
@@ -574,7 +577,7 @@ export async function backfillSessionsToProduction(
},
});
lastSessionId = idRows.at(-1)!.session_id;
lastSessionId = maxSessionId;
if (idRows.length < SESSION_BATCH_SIZE) {
break;
}