ditto/src/stats.ts

177 lines
5.6 KiB
TypeScript
Raw Normal View History

2023-12-10 23:42:44 +00:00
import { type AuthorStatsRow, db, type DittoDB, type EventStatsRow } from '@/db.ts';
import * as eventsDB from '@/db/events.ts';
import { type Event, findReplyTag, type InsertQueryBuilder } from '@/deps.ts';
2023-12-08 00:43:24 +00:00
2023-12-10 22:04:52 +00:00
/** Name of a counter column on an `author_stats` row, i.e. every key of the row except `pubkey`. */
type AuthorStat = keyof Omit<AuthorStatsRow, 'pubkey'>;
/** Name of a counter column on an `event_stats` row, i.e. every key of the row except `event_id`. */
type EventStat = keyof Omit<EventStatsRow, 'event_id'>;
2023-12-08 00:43:24 +00:00
2023-12-10 22:04:52 +00:00
/** A pending change to one author counter: table name, author pubkey, counter name, amount to add. */
type AuthorStatDiff = ['author_stats', pubkey: string, stat: AuthorStat, diff: number];
/** A pending change to one event counter: table name, event ID, counter name, amount to add. */
type EventStatDiff = ['event_stats', eventId: string, stat: EventStat, diff: number];
2023-12-10 22:04:52 +00:00
/** Any pending counter change; the first tuple element says which table it targets. */
type StatDiff = AuthorStatDiff | EventStatDiff;
2023-12-08 00:43:24 +00:00
/**
 * Update the `author_stats` and `event_stats` tables to account for a new event.
 *
 * The counter changes are computed up front by `getStatsDiff` and then written with at
 * most one upsert per table. All queries are started together and awaited with
 * `Promise.all`; nothing is executed when the event affects no counters.
 *
 * Kind 3 (follow list) events are handled specially: the author's `following_count` is
 * replaced with the size of the new list, and follower counts are adjusted by diffing
 * the new list against the previously stored one.
 *
 * @param event The event whose effect on the stats should be recorded.
 */
async function updateStats<K extends number>(event: Event<K>): Promise<void> {
  let prev: Event<K> | undefined;
  const queries: InsertQueryBuilder<DittoDB, any, unknown>[] = [];

  // Kind 3 is a special case - replace the count with the new list.
  if (event.kind === 3) {
    prev = await maybeGetPrev(event);

    // A follow list older than the one already stored is stale. Diffing it against the
    // newer list would apply the follow changes in reverse, so it must not touch any
    // counter at all.
    if (prev && event.created_at < prev.created_at) {
      return;
    }

    queries.push(updateFollowingCountQuery(event as Event<3>));
  }

  const statDiffs = getStatsDiff(event, prev);

  // Split the diffs by target table so each table gets a single batched upsert.
  const pubkeyDiffs = statDiffs.filter((diff): diff is AuthorStatDiff => diff[0] === 'author_stats');
  const eventDiffs = statDiffs.filter((diff): diff is EventStatDiff => diff[0] === 'event_stats');

  if (pubkeyDiffs.length) queries.push(authorStatsQuery(pubkeyDiffs));
  if (eventDiffs.length) queries.push(eventStatsQuery(eventDiffs));

  if (queries.length) {
    await Promise.all(queries.map((query) => query.execute()));
  }
}
/**
 * Work out, without touching the database, which counters an event changes.
 *
 * - Kind 1: the author's `notes_count` goes up by one, and so does `replies_count` of the
 *   event named by the reply tag (when `findReplyTag` finds one).
 * - Kind 3: whatever `getFollowDiff` reports for the new list versus `prev`.
 * - Kind 6: `reposts_count` of the first "e"-tagged event goes up by one.
 * - Kind 7: `reactions_count` of the first "e"-tagged event goes up by one.
 *
 * Every other kind produces an empty list.
 *
 * @param event The incoming event.
 * @param prev The previously stored version of the event, if known (only used for kind 3).
 * @returns The counter changes to apply.
 */
function getStatsDiff<K extends number>(event: Event<K>, prev: Event<K> | undefined): StatDiff[] {
  const taggedEventId = event.tags.find((tag) => tag[0] === 'e')?.[1];
  const parentId = findReplyTag(event as Event<1>)?.[1];

  if (event.kind === 1) {
    const diffs: StatDiff[] = [['author_stats', event.pubkey, 'notes_count', 1]];
    if (parentId) {
      diffs.push(['event_stats', parentId, 'replies_count', 1]);
    }
    return diffs;
  }

  if (event.kind === 3) {
    return [...getFollowDiff(event as Event<3>, prev as Event<3> | undefined)];
  }

  if (event.kind === 6 && taggedEventId) {
    return [['event_stats', taggedEventId, 'reposts_count', 1]];
  }

  if (event.kind === 7 && taggedEventId) {
    return [['event_stats', taggedEventId, 'reactions_count', 1]];
  }

  return [];
}
2023-12-10 23:42:44 +00:00
/**
 * Build one upsert against `author_stats` that applies every diff in the list.
 *
 * Each diff becomes a row whose counters are all zero except the one being changed.
 * When a row for the `pubkey` already exists, the incoming (`excluded`) counters are
 * added onto the stored ones, so a negative diff decrements.
 *
 * @param diffs The author counter changes to apply.
 * @returns The insert query, not yet executed.
 */
function authorStatsQuery(diffs: AuthorStatDiff[]) {
  const rows: AuthorStatsRow[] = [];

  for (const [, pubkey, stat, amount] of diffs) {
    const row: AuthorStatsRow = { pubkey, followers_count: 0, following_count: 0, notes_count: 0 };
    row[stat] = amount;
    rows.push(row);
  }

  return db
    .insertInto('author_stats')
    .values(rows)
    .onConflict((conflict) =>
      conflict.column('pubkey').doUpdateSet((eb) => ({
        followers_count: eb('followers_count', '+', eb.ref('excluded.followers_count')),
        following_count: eb('following_count', '+', eb.ref('excluded.following_count')),
        notes_count: eb('notes_count', '+', eb.ref('excluded.notes_count')),
      }))
    );
}
2023-12-10 23:42:44 +00:00
/**
 * Build one upsert against `event_stats` that applies every diff in the list.
 *
 * Each diff becomes a row whose counters are all zero except the one being changed.
 * When a row for the `event_id` already exists, the incoming (`excluded`) counters are
 * added onto the stored ones.
 *
 * @param diffs The event counter changes to apply.
 * @returns The insert query, not yet executed.
 */
function eventStatsQuery(diffs: EventStatDiff[]) {
  const rows: EventStatsRow[] = [];

  for (const [, event_id, stat, amount] of diffs) {
    const row: EventStatsRow = { event_id, replies_count: 0, reposts_count: 0, reactions_count: 0 };
    row[stat] = amount;
    rows.push(row);
  }

  return db
    .insertInto('event_stats')
    .values(rows)
    .onConflict((conflict) =>
      conflict.column('event_id').doUpdateSet((eb) => ({
        replies_count: eb('replies_count', '+', eb.ref('excluded.replies_count')),
        reposts_count: eb('reposts_count', '+', eb.ref('excluded.reposts_count')),
        reactions_count: eb('reactions_count', '+', eb.ref('excluded.reactions_count')),
      }))
    );
}
2023-12-10 23:48:21 +00:00
/**
 * Get the last version of the event, if any.
 *
 * Asks the events database for a single event with the same kind and author as `event`.
 * NOTE(review): which event comes back first depends on the ordering `getFilters`
 * applies - presumably newest first; confirm against its implementation.
 *
 * @param event The event whose stored counterpart should be looked up.
 * @returns The stored event, or `undefined` when the query returns no rows.
 */
async function maybeGetPrev<K extends number>(event: Event<K>): Promise<Event<K> | undefined> {
  // Destructuring an empty result leaves `prev` undefined, hence the optional return type.
  const [prev] = await eventsDB.getFilters([
    { kinds: [event.kind], authors: [event.pubkey], limit: 1 },
  ]);

  return prev;
}
/**
 * Set the following count to the total number of unique "p" tags in the follow list.
 *
 * Builds an upsert against `author_stats`: a new row is inserted with the other counters
 * at zero, while an existing row only has its `following_count` overwritten.
 *
 * @param event The kind 3 event; only its `pubkey` and `tags` are read.
 * @returns The insert query, not yet executed.
 */
function updateFollowingCountQuery({ pubkey, tags }: Event<3>) {
  const followed = new Set<string>();

  for (const [name, value] of tags) {
    // A "p" tag without a value does not name anyone, so it must not be counted.
    if (name === 'p' && value) {
      followed.add(value);
    }
  }

  const following_count = followed.size;

  return db.insertInto('author_stats')
    .values({
      pubkey,
      following_count,
      followers_count: 0,
      notes_count: 0,
    })
    .onConflict((oc) =>
      oc
        .column('pubkey')
        .doUpdateSet({ following_count })
    );
}
/**
 * Compare the old and new follow events (if any), and return a diff array.
 *
 * Pubkeys present only in the new list gain a follower (`+1`); pubkeys present only in
 * the previous list lose one (`-1`). Pubkeys in both lists produce no entry. Additions
 * are listed before removals, each in tag order.
 *
 * @param event The new kind 3 event.
 * @param prev The previously stored kind 3 event; treated as an empty list when omitted.
 * @returns One `followers_count` diff per pubkey that was added or removed.
 */
function getFollowDiff(event: Event<3>, prev?: Event<3>): AuthorStatDiff[] {
  /** Collect the unique pubkeys named by the "p" tags of a tag list. */
  const followedPubkeys = (tags: Event<3>['tags']): Set<string> => {
    const result = new Set<string>();
    for (const [name, value] of tags) {
      // Skip malformed "p" tags with a missing or empty value: they would otherwise
      // produce a diff (and later a stats row) for a pubkey that does not exist.
      if (name === 'p' && value) {
        result.add(value);
      }
    }
    return result;
  };

  const prevPubkeys = followedPubkeys(prev?.tags ?? []);
  const pubkeys = followedPubkeys(event.tags);

  const added = [...pubkeys].filter((pubkey) => !prevPubkeys.has(pubkey));
  const removed = [...prevPubkeys].filter((pubkey) => !pubkeys.has(pubkey));

  return [
    ...added.map((pubkey): AuthorStatDiff => ['author_stats', pubkey, 'followers_count', 1]),
    ...removed.map((pubkey): AuthorStatDiff => ['author_stats', pubkey, 'followers_count', -1]),
  ];
}
2023-12-10 17:10:11 +00:00
export { updateStats };