Files
AFFiNE-Mirror/packages/backend/server/src/models/doc.ts
fengmk2 346c0df800 chore(server): support disable indexer plugin (#12408)
close CLOUD-220

<!-- This is an auto-generated comment: release notes by coderabbit.ai -->

## Summary by CodeRabbit

- **New Features**
  - Introduced a new service to handle indexing-related events and scheduled tasks, improving the management of document and workspace indexing.
  - Added support for configuring the indexer feature via the AFFINE_INDEXER_ENABLED environment variable.

- **Bug Fixes**
  - Ensured that indexing and deletion jobs are only enqueued when the indexer feature is enabled.

- **Tests**
  - Added comprehensive tests for the new indexing event service, covering various configuration scenarios.
  - Removed obsolete test related to auto-indexing scheduling.

- **Chores**
  - Updated configuration descriptions and mappings to improve clarity and environment variable support.

<!-- end of auto-generated comment: release notes by coderabbit.ai -->
2025-05-21 13:19:02 +00:00

641 lines
16 KiB
TypeScript

import { Injectable } from '@nestjs/common';
import { Transactional } from '@nestjs-cls/transactional';
import type { Update } from '@prisma/client';
import { Prisma } from '@prisma/client';
import { EventBus, PaginationInput } from '../base';
import { DocIsNotPublic } from '../base/error';
import { BaseModel } from './base';
import { Doc, DocRole, PublicDocMode, publicUserSelect } from './common';
// Augments the global `Events` interface with the payload types of the
// doc-related events.
declare global {
interface Events {
// Payload of the 'doc.created' event.
// NOTE(review): `editor` is presumably the id of the creating user — confirm.
'doc.created': {
workspaceId: string;
docId: string;
editor?: string;
};
// Payload of the 'doc.updated' event; `DocModel.upsertMeta` emits it after
// every doc meta upsert.
'doc.updated': {
workspaceId: string;
docId: string;
};
}
}
/**
* Input accepted by `DocModel.upsertMeta`: the unchecked create input of a
* workspace doc without `workspaceId` and `docId`, which are passed to the
* method as separate arguments.
*/
export type DocMetaUpsertInput = Omit<
Prisma.WorkspaceDocUncheckedCreateInput,
'workspaceId' | 'docId'
>;
/**
* Workspace Doc Model
*
* This model is responsible for managing the workspace docs, including:
* - Updates: the changes made to the doc.
* - History: the doc history of the doc.
* - Doc: the doc itself.
* - DocMeta: the doc meta.
*/
@Injectable()
export class DocModel extends BaseModel {
// `event` is the bus used by `upsertMeta` to emit 'doc.updated'.
constructor(private readonly event: EventBus) {
super();
}
// #region Update
/**
 * Map a row of the updates table to a `Doc` record.
 * A falsy `createdBy` becomes an `undefined` editor id.
 */
private updateToDocRecord(row: Update): Doc {
  const { workspaceId, id, blob, createdAt, createdBy } = row;
  return {
    spaceId: workspaceId,
    docId: id,
    blob,
    timestamp: createdAt.getTime(),
    editorId: createdBy || undefined,
  };
}
/**
 * Map a `Doc` record to a row of the updates table.
 * A falsy `editorId` is stored as `null`; `seq` is always `null`.
 */
private docRecordToUpdate(record: Doc): Update {
  const { spaceId, docId, blob, timestamp, editorId } = record;
  return {
    workspaceId: spaceId,
    id: docId,
    blob,
    createdAt: new Date(timestamp),
    createdBy: editorId || null,
    seq: null,
  };
}
/**
 * Insert the given doc records as rows of the updates table in one batch.
 */
async createUpdates(updates: Doc[]) {
  const data = updates.map(record => this.docRecordToUpdate(record));
  return await this.db.update.createMany({ data });
}
/**
 * Find the updates of a doc by workspaceId and docId, ordered by creation
 * time ascending. At most 100 updates are returned per call.
 */
async findUpdates(workspaceId: string, docId: string): Promise<Doc[]> {
  const rows = await this.db.update.findMany({
    where: { workspaceId, id: docId },
    orderBy: { createdAt: 'asc' },
    take: 100,
  });
  const records: Doc[] = [];
  for (const row of rows) {
    records.push(this.updateToDocRecord(row));
  }
  return records;
}
/**
 * Count the rows in the updates table for the given workspaceId and docId.
 */
async getUpdateCount(workspaceId: string, docId: string) {
  const where = { workspaceId, id: docId };
  const total = await this.db.update.count({ where });
  return total;
}
/**
 * Count all rows in the updates table, across every workspace and doc.
 */
async getGlobalUpdateCount() {
  const total = await this.db.update.count();
  return total;
}
/**
 * Count the rows in the updates table grouped by (workspaceId, id).
 */
async groupedUpdatesCount() {
  const groups = await this.db.update.groupBy({
    by: ['workspaceId', 'id'],
    _count: true,
  });
  return groups;
}
/**
 * Delete the updates of a doc whose `createdAt` matches one of the given
 * timestamps (epoch milliseconds).
 *
 * @returns the number of deleted updates
 */
async deleteUpdates(
  workspaceId: string,
  docId: string,
  timestamps: number[]
) {
  const createdAts = timestamps.map(ts => new Date(ts));
  const deleted = await this.db.update.deleteMany({
    where: { workspaceId, id: docId, createdAt: { in: createdAts } },
  });
  const count = deleted.count;
  // stay silent when nothing was removed
  if (count <= 0) {
    return count;
  }
  this.logger.log(
    `Deleted ${count} updates for workspace ${workspaceId} doc ${docId}`
  );
  return count;
}
// #endregion
// #region Doc
/**
* Insert a doc snapshot, or overwrite the existing one when the stored
* snapshot is not newer than the incoming one.
*
* @param doc The doc to persist; `timestamp` is written as `updated_at` and
* `editorId` as `created_by` (insert only) and `updated_by`.
* @returns The first row returned by the statement, or `undefined` when no
* row was returned because the stored snapshot is newer than `doc`.
*/
async upsert(doc: Doc) {
const { spaceId, docId, blob, timestamp, editorId } = doc;
const updatedAt = new Date(timestamp);
// CONCERNS:
// i. Because we save the real user's last seen action time as `updatedAt`,
// we can simply compare `updatedAt` values to determine whether the stored snapshot is older than the one we are going to save.
//
// ii. Prisma doesn't support `upsert` with an additional `where` condition alongside the unique constraint.
// In our case, we need to check `updatedAt` manually to avoid overriding a newer snapshot.
// where: { workspaceId_id: {}, updatedAt: { lt: updatedAt } }
// ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
// That is why the statement below is raw SQL: the conflict update only applies
// when the stored `updated_at` is less than or equal to the incoming one.
const result: { updatedAt: Date }[] = await this.db.$queryRaw`
INSERT INTO "snapshots" ("workspace_id", "guid", "blob", "created_at", "updated_at", "created_by", "updated_by")
VALUES (${spaceId}, ${docId}, ${blob}, DEFAULT, ${updatedAt}, ${editorId}, ${editorId})
ON CONFLICT ("workspace_id", "guid")
DO UPDATE SET "blob" = ${blob}, "updated_at" = ${updatedAt}, "updated_by" = ${editorId}
WHERE "snapshots"."workspace_id" = ${spaceId} AND "snapshots"."guid" = ${docId} AND "snapshots"."updated_at" <= ${updatedAt}
RETURNING "snapshots"."workspace_id" as "workspaceId", "snapshots"."guid" as "id", "snapshots"."updated_at" as "updatedAt"
`;
// If `snapshot.updatedAt > updatedAt` holds, the snapshot has already been updated by another process,
// and the updates that were applied to the current `doc` must have been seen by that process as well.
// No row is returned in that case, so the value returned below is `undefined`.
return result.at(0);
}
/**
 * Load the snapshot of a doc and convert it to a `Doc` record.
 *
 * @returns the doc, or `null` when no snapshot exists
 */
async get(workspaceId: string, docId: string): Promise<Doc | null> {
  const snapshot = await this.getSnapshot(workspaceId, docId);
  return snapshot
    ? {
        spaceId: snapshot.workspaceId,
        docId: snapshot.id,
        blob: snapshot.blob,
        timestamp: snapshot.updatedAt.getTime(),
        editorId: snapshot.updatedBy || undefined,
      }
    : null;
}
/**
 * Find the snapshot row of a doc by its (workspaceId, id) unique key.
 *
 * @param options.select optional Prisma select that narrows the returned fields
 * @returns the snapshot payload, or `null` when it does not exist
 */
async getSnapshot<Select extends Prisma.SnapshotSelect>(
  workspaceId: string,
  docId: string,
  options?: { select?: Select }
) {
  const snapshot = await this.db.snapshot.findUnique({
    where: { workspaceId_id: { workspaceId, id: docId } },
    select: options?.select,
  });
  return snapshot as Prisma.SnapshotGetPayload<{ select: Select }> | null;
}
/**
 * Get the creation/update times of a doc snapshot together with the public
 * info of the users who created and last updated it.
 *
 * @returns the selected fields, or `null` when the snapshot does not exist
 */
async getAuthors(workspaceId: string, docId: string) {
  const authors = await this.db.snapshot.findUnique({
    where: { workspaceId_id: { workspaceId, id: docId } },
    select: {
      createdAt: true,
      updatedAt: true,
      createdByUser: { select: publicUserSelect },
      updatedByUser: { select: publicUserSelect },
    },
  });
  return authors;
}
/**
 * Check whether every given doc has a snapshot in the workspace.
 * Pending updates are ignored: only the snapshots table is queried.
 *
 * Duplicate ids in `docIds` are counted once. The database counts each
 * matching row once, so comparing against the raw array length would report
 * `false` for e.g. `['a', 'a']` even though doc `a` exists.
 *
 * @returns `true` when all (distinct) docs exist; an empty list yields `true`
 */
async existsAll(workspaceId: string, docIds: string[]) {
  const uniqueDocIds = Array.from(new Set(docIds));
  const count = await this.db.snapshot.count({
    where: {
      workspaceId,
      id: { in: uniqueDocIds },
    },
  });
  return count === uniqueDocIds.length;
}
/**
 * Detect whether a doc exists, either as a snapshot or as pending updates.
 */
async exists(workspaceId: string, docId: string) {
  const snapshotCount = await this.db.snapshot.count({
    where: { workspaceId, id: docId },
  });
  // the updates table is only queried when no snapshot was found
  return (
    snapshotCount > 0 || (await this.getUpdateCount(workspaceId, docId)) > 0
  );
}
/**
 * Delete a doc together with its snapshots, updates and snapshot histories.
 */
@Transactional()
async delete(workspaceId: string, docId: string) {
  const where = { workspaceId, id: docId };
  const removedSnapshots = await this.db.snapshot.deleteMany({ where });
  const removedUpdates = await this.db.update.deleteMany({ where });
  const removedHistories = await this.db.snapshotHistory.deleteMany({ where });
  const snapshots = removedSnapshots.count;
  const updates = removedUpdates.count;
  const histories = removedHistories.count;
  this.logger.log(
    `Deleted workspace ${workspaceId} doc ${docId}, including ${snapshots} snapshots, ${updates} updates, and ${histories} histories`
  );
}
/**
 * Delete every doc of a workspace: its snapshots, updates and snapshot
 * histories.
 *
 * @returns the number of deleted snapshots
 */
@Transactional()
async deleteAllByWorkspaceId(workspaceId: string) {
  const where = { workspaceId };
  const removedSnapshots = await this.db.snapshot.deleteMany({ where });
  const removedUpdates = await this.db.update.deleteMany({ where });
  const removedHistories = await this.db.snapshotHistory.deleteMany({ where });
  const snapshots = removedSnapshots.count;
  const updates = removedUpdates.count;
  const histories = removedHistories.count;
  this.logger.log(
    `Deleted workspace ${workspaceId} all docs, including ${snapshots} snapshots, ${updates} updates, and ${histories} histories`
  );
  return snapshots;
}
/**
 * Build a `docId -> timestamp` map (epoch milliseconds) for the docs of a
 * workspace.
 *
 * The map is first filled from each snapshot's `updatedAt`; then, for every
 * doc that has rows in the updates table, the entry is overwritten with the
 * greatest `createdAt` of those rows.
 *
 * @param after Only consider snapshots/updates newer than this timestamp.
 */
async findTimestampsByWorkspaceId(workspaceId: string, after?: number) {
  // a falsy `after` (undefined or 0) means "no lower bound"
  const afterDate = after ? new Date(after) : undefined;

  const snapshots = await this.db.snapshot.findMany({
    select: { id: true, updatedAt: true },
    where: {
      workspaceId,
      ...(afterDate ? { updatedAt: { gt: afterDate } } : {}),
    },
  });

  const updates = await this.db.update.groupBy({
    where: {
      workspaceId,
      // [createdAt] in updates table is indexed, so it's fast
      ...(afterDate ? { createdAt: { gt: afterDate } } : {}),
    },
    by: ['id'],
    _max: { createdAt: true },
  });

  const timestamps: Record<string, number> = {};
  for (const snapshot of snapshots) {
    timestamps[snapshot.id] = snapshot.updatedAt.getTime();
  }
  for (const update of updates) {
    const latest = update._max.createdAt;
    if (latest) {
      timestamps[update.id] = latest.getTime();
    }
  }
  return timestamps;
}
// #endregion
// #region DocMeta
/**
 * Create the doc meta, or update it when it already exists, then emit a
 * 'doc.updated' event for the doc.
 *
 * @param data optional meta fields to write; omitted fields are left to the
 * database defaults on create and untouched on update
 * @returns the stored doc meta
 */
async upsertMeta(
  workspaceId: string,
  docId: string,
  data?: DocMetaUpsertInput
) {
  const meta = await this.db.workspaceDoc.upsert({
    where: { workspaceId_docId: { workspaceId, docId } },
    update: { ...data },
    create: { ...data, workspaceId, docId },
  });

  this.event.emit('doc.updated', { workspaceId, docId });

  return meta;
}
/**
 * Find the doc meta by its (workspaceId, docId) unique key.
 *
 * @param options.select optional Prisma select that narrows the returned fields
 * @returns the doc meta payload, or `null` when it does not exist
 */
async getMeta<Select extends Prisma.WorkspaceDocSelect>(
  workspaceId: string,
  docId: string,
  options?: {
    select?: Select;
  }
) {
  const meta = await this.db.workspaceDoc.findUnique({
    where: { workspaceId_docId: { workspaceId, docId } },
    select: options?.select,
  });
  return meta as Prisma.WorkspaceDocGetPayload<{ select: Select }> | null;
}
/**
 * Set the default role of a doc by upserting its meta.
 */
async setDefaultRole(workspaceId: string, docId: string, role: DocRole) {
  const meta: DocMetaUpsertInput = { defaultRole: role };
  return await this.upsertMeta(workspaceId, docId, meta);
}
/**
 * Resolve the default roles of the given docs, in the same order as `docIds`.
 *
 * For each doc, `external` is `DocRole.External` when the doc is public and
 * `null` otherwise; `workspace` is the doc's default role, falling back to
 * `DocRole.Manager` when the doc has no meta.
 */
async findDefaultRoles(workspaceId: string, docIds: string[]) {
  const ids = docIds.map(docId => ({ workspaceId, docId }));
  const metas = await this.findMetas(ids, {
    select: {
      defaultRole: true,
      public: true,
    },
  });

  return metas.map(meta => {
    const external = meta?.public ? DocRole.External : null;
    const workspace = meta?.defaultRole ?? DocRole.Manager;
    return { external, workspace };
  });
}
/**
 * Batch version of `getAuthors`: load the creation/update times and the
 * public creator/updater info for several docs at once.
 *
 * @param ids the (workspaceId, docId) pairs to look up
 * @returns one entry per input pair, in input order; `null` for pairs that
 * have no snapshot
 */
async findAuthors(ids: { workspaceId: string; docId: string }[]) {
  // The query below matches the cross product of all workspace ids and doc
  // ids, so rows of pairs that were not requested may come back. The lookup
  // key must therefore be unambiguous: a plain `${workspaceId}-${docId}`
  // collides for ('a', 'b-c') and ('a-b', 'c').
  const keyOf = (workspaceId: string, docId: string) =>
    JSON.stringify([workspaceId, docId]);

  const rows = await this.db.snapshot.findMany({
    where: {
      // de-duplicate to keep the IN lists as short as possible
      workspaceId: { in: Array.from(new Set(ids.map(id => id.workspaceId))) },
      id: { in: Array.from(new Set(ids.map(id => id.docId))) },
    },
    select: {
      workspaceId: true,
      id: true,
      createdAt: true,
      updatedAt: true,
      createdByUser: { select: publicUserSelect },
      updatedByUser: { select: publicUserSelect },
    },
  });

  const resultMap = new Map(
    rows.map(row => [keyOf(row.workspaceId, row.id), row])
  );

  return ids.map(
    id => resultMap.get(keyOf(id.workspaceId, id.docId)) ?? null
  );
}
/**
 * Batch version of `getMeta`: load the metas of several docs at once.
 *
 * @param ids the (workspaceId, docId) pairs to look up
 * @param options.select optional Prisma select; `workspaceId` and `docId`
 * are always added to it because they are needed to match rows to `ids`
 * @returns one entry per input pair, in input order; `null` for pairs that
 * have no meta
 */
async findMetas<Select extends Prisma.WorkspaceDocSelect>(
  ids: { workspaceId: string; docId: string }[],
  options?: { select?: Select }
) {
  // The query below matches the cross product of all workspace ids and doc
  // ids, so rows of pairs that were not requested may come back. The lookup
  // key must therefore be unambiguous: a plain `${workspaceId}-${docId}`
  // collides for ('a', 'b-c') and ('a-b', 'c').
  const keyOf = (workspaceId: string, docId: string) =>
    JSON.stringify([workspaceId, docId]);

  let select = options?.select;
  if (select) {
    // add workspaceId and docId to the select
    select = {
      ...select,
      workspaceId: true,
      docId: true,
    };
  }

  const rows = (await this.db.workspaceDoc.findMany({
    where: {
      // de-duplicate to keep the IN lists as short as possible
      workspaceId: { in: Array.from(new Set(ids.map(id => id.workspaceId))) },
      docId: { in: Array.from(new Set(ids.map(id => id.docId))) },
    },
    select,
  })) as (Prisma.WorkspaceDocGetPayload<{ select: Select }> & {
    workspaceId: string;
    docId: string;
  })[];

  const resultMap = new Map(
    rows.map(row => [keyOf(row.workspaceId, row.docId), row])
  );

  return ids.map(
    id => resultMap.get(keyOf(id.workspaceId, id.docId)) ?? null
  );
}
/**
 * List the metas of all public docs in the workspace.
 */
async findPublics(workspaceId: string) {
  const where = { workspaceId, public: true };
  const publicDocs = await this.db.workspaceDoc.findMany({ where });
  return publicDocs;
}
/**
 * Count the public docs in the workspace.
 */
async getPublicsCount(workspaceId: string) {
  const where = { workspaceId, public: true };
  const total = await this.db.workspaceDoc.count({ where });
  return total;
}
/**
 * Tell whether the workspace has at least one public doc.
 */
async hasPublic(workspaceId: string) {
  return (await this.getPublicsCount(workspaceId)) > 0;
}
/**
 * Mark a doc as public by upserting its meta.
 *
 * @param mode the public mode to store; defaults to `PublicDocMode.Page`
 */
async publish(
  workspaceId: string,
  docId: string,
  mode: PublicDocMode = PublicDocMode.Page
) {
  const meta: DocMetaUpsertInput = { public: true, mode };
  return await this.upsertMeta(workspaceId, docId, meta);
}
/**
 * Mark a public doc as no longer public.
 *
 * @throws DocIsNotPublic when the doc has no meta or is not public
 */
@Transactional()
async unpublish(workspaceId: string, docId: string) {
  const current = await this.getMeta(workspaceId, docId);
  if (current?.public) {
    return await this.upsertMeta(workspaceId, docId, {
      public: false,
    });
  }
  throw new DocIsNotPublic();
}
/**
 * Tell whether the doc is public. A doc without meta is not public.
 */
async isPublic(workspaceId: string, docId: string) {
  const meta = await this.getMeta(workspaceId, docId, {
    select: { public: true },
  });
  const published = meta?.public;
  return published ?? false;
}
/**
* Get the info of a single doc: its meta (mode, public, defaultRole) from
* "workspace_pages" combined with the creation/update times and
* creator/updater ids from "snapshots".
*
* The two tables are INNER JOINed, so a doc that has a meta row but no
* snapshot (or the other way round) yields no result.
*
* @returns the doc info, or `null` when no joined row exists
*/
async getDocInfo(workspaceId: string, docId: string) {
// Raw SQL is used for the join; column aliases map to the camelCase fields
// of the row type declared below.
const rows = await this.db.$queryRaw<
{
workspaceId: string;
docId: string;
mode: PublicDocMode;
public: boolean;
defaultRole: DocRole;
createdAt: Date;
updatedAt: Date;
creatorId?: string;
lastUpdaterId?: string;
}[]
>`
SELECT
"workspace_pages"."workspace_id" as "workspaceId",
"workspace_pages"."page_id" as "docId",
"workspace_pages"."mode" as "mode",
"workspace_pages"."public" as "public",
"workspace_pages"."defaultRole" as "defaultRole",
"snapshots"."created_at" as "createdAt",
"snapshots"."updated_at" as "updatedAt",
"snapshots"."created_by" as "creatorId",
"snapshots"."updated_by" as "lastUpdaterId"
FROM "workspace_pages"
INNER JOIN "snapshots"
ON "workspace_pages"."workspace_id" = "snapshots"."workspace_id"
AND "workspace_pages"."page_id" = "snapshots"."guid"
WHERE
"workspace_pages"."workspace_id" = ${workspaceId}
AND "workspace_pages"."page_id" = ${docId}
LIMIT 1;
`;
// The query is limited to one row; map "no row" to `null`.
return rows.at(0) ?? null;
}
/**
* Get one page of doc infos of a workspace, ordered by snapshot creation
* time ascending.
*
* Each row combines the doc meta from "workspace_pages" with the
* creation/update times and creator/updater ids from "snapshots" (INNER
* JOIN, so docs without a snapshot are not listed).
*
* @param pagination `after` (optional) keeps only docs whose snapshot was
* created after that time; `first` is the page size and `offset` the number
* of rows to skip.
* @returns a `[count, rows]` tuple. `count` is the number of doc metas in the
* workspace; it is computed from the doc meta table alone and is not affected
* by `after` or by the join.
*/
async paginateDocInfo(workspaceId: string, pagination: PaginationInput) {
const count = await this.db.workspaceDoc.count({
where: {
workspaceId,
},
});
// Optional extra condition, spliced into the WHERE clause below; an empty
// fragment is used when no `after` cursor was given.
const after = pagination.after
? Prisma.sql`AND "snapshots"."created_at" > ${new Date(pagination.after)}`
: Prisma.sql``;
const rows = await this.db.$queryRaw<
{
workspaceId: string;
docId: string;
mode: PublicDocMode;
public: boolean;
defaultRole: DocRole;
createdAt: Date;
updatedAt: Date;
creatorId?: string;
lastUpdaterId?: string;
}[]
>`
SELECT
"workspace_pages"."workspace_id" as "workspaceId",
"workspace_pages"."page_id" as "docId",
"workspace_pages"."mode" as "mode",
"workspace_pages"."public" as "public",
"workspace_pages"."defaultRole" as "defaultRole",
"snapshots"."created_at" as "createdAt",
"snapshots"."updated_at" as "updatedAt",
"snapshots"."created_by" as "creatorId",
"snapshots"."updated_by" as "lastUpdaterId"
FROM "workspace_pages"
INNER JOIN "snapshots"
ON "workspace_pages"."workspace_id" = "snapshots"."workspace_id"
AND "workspace_pages"."page_id" = "snapshots"."guid"
WHERE
"workspace_pages"."workspace_id" = ${workspaceId}
${after}
ORDER BY
"snapshots"."created_at" ASC
LIMIT ${pagination.first}
OFFSET ${pagination.offset}
`;
return [count, rows] as const;
}
// #endregion
}