feat: add Telegram integration with forum topic support and creator tracking

Adds full Telegram ZIP ingestion pipeline: TDLib worker service scans source
channels for archive files, deduplicates by content hash, extracts metadata,
uploads to archive channel, and indexes in Postgres. Forum supergroups are
scanned per-topic with topic names used as creator. Filename-based creator
extraction (e.g. "Mammoth Factory - 2026-01.zip") serves as fallback.

Includes admin UI for managing accounts/channels, simplified account setup
(API credentials via env vars), auth code/password submission dialog,
package browser with creator column, and live ingestion activity tracking.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
xCyanGrizzly
2026-02-24 16:02:06 +01:00
parent beb9cfb312
commit b427193d17
70 changed files with 8627 additions and 2 deletions

314
src/lib/telegram/queries.ts Normal file
View File

@@ -0,0 +1,314 @@
import { prisma } from "@/lib/prisma";
import type {
PackageListItem,
PackageDetail,
PackageFileItem,
IngestionAccountStatus,
} from "./types";
export async function listPackages(options: {
page: number;
limit: number;
channelId?: string;
creator?: string;
sortBy: "indexedAt" | "fileName" | "fileSize";
order: "asc" | "desc";
}) {
const where: Record<string, unknown> = {};
if (options.channelId) where.sourceChannelId = options.channelId;
if (options.creator) where.creator = options.creator;
const [items, total] = await Promise.all([
prisma.package.findMany({
where,
orderBy: { [options.sortBy]: options.order },
skip: (options.page - 1) * options.limit,
take: options.limit,
select: {
id: true,
fileName: true,
fileSize: true,
contentHash: true,
archiveType: true,
fileCount: true,
isMultipart: true,
indexedAt: true,
creator: true,
previewMsgId: true, // cheap null check — avoids loading blob
sourceChannel: { select: { id: true, title: true } },
},
}),
prisma.package.count({ where }),
]);
const mapped: PackageListItem[] = items.map((pkg) => ({
id: pkg.id,
fileName: pkg.fileName,
fileSize: pkg.fileSize.toString(),
contentHash: pkg.contentHash,
archiveType: pkg.archiveType,
fileCount: pkg.fileCount,
isMultipart: pkg.isMultipart,
hasPreview: pkg.previewMsgId !== null,
creator: pkg.creator,
indexedAt: pkg.indexedAt.toISOString(),
sourceChannel: pkg.sourceChannel,
}));
return {
items: mapped,
pagination: {
page: options.page,
limit: options.limit,
total,
totalPages: Math.ceil(total / options.limit),
},
};
}
export async function getPackageById(
id: string
): Promise<PackageDetail | null> {
const pkg = await prisma.package.findUnique({
where: { id },
include: {
sourceChannel: { select: { id: true, title: true } },
ingestionRun: { select: { id: true, startedAt: true } },
},
});
if (!pkg) return null;
let destChannel: { id: string; title: string } | null = null;
if (pkg.destChannelId) {
const ch = await prisma.telegramChannel.findUnique({
where: { id: pkg.destChannelId },
select: { id: true, title: true },
});
destChannel = ch;
}
return {
id: pkg.id,
fileName: pkg.fileName,
fileSize: pkg.fileSize.toString(),
contentHash: pkg.contentHash,
archiveType: pkg.archiveType,
fileCount: pkg.fileCount,
isMultipart: pkg.isMultipart,
hasPreview: pkg.previewMsgId !== null,
creator: pkg.creator,
partCount: pkg.partCount,
indexedAt: pkg.indexedAt.toISOString(),
sourceChannel: pkg.sourceChannel,
destChannel,
destMessageId: pkg.destMessageId?.toString() ?? null,
sourceMessageId: pkg.sourceMessageId.toString(),
ingestionRun: pkg.ingestionRun
? {
id: pkg.ingestionRun.id,
startedAt: pkg.ingestionRun.startedAt.toISOString(),
}
: null,
};
}
export async function listPackageFiles(options: {
packageId: string;
page: number;
limit: number;
extension?: string;
}) {
const where: { packageId: string; extension?: string } = {
packageId: options.packageId,
};
if (options.extension) {
where.extension = options.extension;
}
const [items, total] = await Promise.all([
prisma.packageFile.findMany({
where,
orderBy: { path: "asc" },
skip: (options.page - 1) * options.limit,
take: options.limit,
}),
prisma.packageFile.count({ where }),
]);
const mapped: PackageFileItem[] = items.map((f) => ({
id: f.id,
path: f.path,
fileName: f.fileName,
extension: f.extension,
compressedSize: f.compressedSize.toString(),
uncompressedSize: f.uncompressedSize.toString(),
crc32: f.crc32,
}));
return {
items: mapped,
pagination: {
page: options.page,
limit: options.limit,
total,
totalPages: Math.ceil(total / options.limit),
},
};
}
export async function searchPackages(options: {
query: string;
page: number;
limit: number;
searchIn: "packages" | "files" | "both";
}) {
const q = options.query;
if (options.searchIn === "files" || options.searchIn === "both") {
// Search in package files, return parent packages
const fileMatches = await prisma.packageFile.findMany({
where: {
OR: [
{ fileName: { contains: q, mode: "insensitive" } },
{ path: { contains: q, mode: "insensitive" } },
],
},
select: { packageId: true },
distinct: ["packageId"],
});
const packageIds = fileMatches.map((f) => f.packageId);
const packageNameIds =
options.searchIn === "both"
? (
await prisma.package.findMany({
where: { fileName: { contains: q, mode: "insensitive" } },
select: { id: true },
})
).map((p) => p.id)
: [];
const allIds = [...new Set([...packageIds, ...packageNameIds])];
const [items, total] = await Promise.all([
prisma.package.findMany({
where: { id: { in: allIds } },
orderBy: { indexedAt: "desc" },
skip: (options.page - 1) * options.limit,
take: options.limit,
select: {
id: true,
fileName: true,
fileSize: true,
contentHash: true,
archiveType: true,
fileCount: true,
isMultipart: true,
indexedAt: true,
creator: true,
previewMsgId: true,
sourceChannel: { select: { id: true, title: true } },
},
}),
Promise.resolve(allIds.length),
]);
const mapped: PackageListItem[] = items.map((pkg) => ({
id: pkg.id,
fileName: pkg.fileName,
fileSize: pkg.fileSize.toString(),
contentHash: pkg.contentHash,
archiveType: pkg.archiveType,
fileCount: pkg.fileCount,
isMultipart: pkg.isMultipart,
hasPreview: pkg.previewMsgId !== null,
creator: pkg.creator,
indexedAt: pkg.indexedAt.toISOString(),
sourceChannel: pkg.sourceChannel,
}));
return {
items: mapped,
pagination: {
page: options.page,
limit: options.limit,
total,
totalPages: Math.ceil(total / options.limit),
},
};
}
// Search packages only
return listPackages({
page: options.page,
limit: options.limit,
sortBy: "indexedAt",
order: "desc",
});
}
export async function getIngestionStatus(): Promise<IngestionAccountStatus[]> {
const accounts = await prisma.telegramAccount.findMany({
orderBy: { createdAt: "asc" },
});
const statuses: IngestionAccountStatus[] = [];
for (const account of accounts) {
const lastRun = await prisma.ingestionRun.findFirst({
where: { accountId: account.id, status: { not: "RUNNING" } },
orderBy: { startedAt: "desc" },
});
const currentRun = await prisma.ingestionRun.findFirst({
where: { accountId: account.id, status: "RUNNING" },
orderBy: { startedAt: "desc" },
});
statuses.push({
id: account.id,
displayName: account.displayName,
phone: account.phone,
isActive: account.isActive,
authState: account.authState,
lastSeenAt: account.lastSeenAt?.toISOString() ?? null,
lastRun: lastRun
? {
id: lastRun.id,
status: lastRun.status,
startedAt: lastRun.startedAt.toISOString(),
finishedAt: lastRun.finishedAt?.toISOString() ?? null,
messagesScanned: lastRun.messagesScanned,
zipsFound: lastRun.zipsFound,
zipsDuplicate: lastRun.zipsDuplicate,
zipsIngested: lastRun.zipsIngested,
}
: null,
currentRun: currentRun
? {
id: currentRun.id,
startedAt: currentRun.startedAt.toISOString(),
messagesScanned: currentRun.messagesScanned,
zipsFound: currentRun.zipsFound,
zipsDuplicate: currentRun.zipsDuplicate,
zipsIngested: currentRun.zipsIngested,
// Live activity tracking
currentActivity: currentRun.currentActivity,
currentStep: currentRun.currentStep,
currentChannel: currentRun.currentChannel,
currentFile: currentRun.currentFile,
currentFileNum: currentRun.currentFileNum,
totalFiles: currentRun.totalFiles,
downloadedBytes: currentRun.downloadedBytes?.toString() ?? null,
totalBytes: currentRun.totalBytes?.toString() ?? null,
downloadPercent: currentRun.downloadPercent,
lastActivityAt: currentRun.lastActivityAt?.toISOString() ?? null,
}
: null,
});
}
return statuses;
}