Spaces:
Running
Running
import { MONGODB_URL, MONGODB_DB_NAME, MONGODB_DIRECT_CONNECTION } from "$env/static/private"; | |
import { GridFSBucket, MongoClient } from "mongodb"; | |
import type { Conversation } from "$lib/types/Conversation"; | |
import type { SharedConversation } from "$lib/types/SharedConversation"; | |
import type { AbortedGeneration } from "$lib/types/AbortedGeneration"; | |
import type { Settings } from "$lib/types/Settings"; | |
import type { User } from "$lib/types/User"; | |
import type { MessageEvent } from "$lib/types/MessageEvent"; | |
import type { Session } from "$lib/types/Session"; | |
import type { Assistant } from "$lib/types/Assistant"; | |
import type { Report } from "$lib/types/Report"; | |
import type { ConversationStats } from "$lib/types/ConversationStats"; | |
import type { MigrationResult } from "$lib/types/MigrationResult"; | |
import type { Semaphore } from "$lib/types/Semaphore"; | |
import type { AssistantStats } from "$lib/types/AssistantStats"; | |
if (!MONGODB_URL) { | |
throw new Error( | |
"Please specify the MONGODB_URL environment variable inside .env.local. Set it to mongodb://localhost:27017 if you are running MongoDB locally, or to a MongoDB Atlas free instance for example." | |
); | |
} | |
export const CONVERSATION_STATS_COLLECTION = "conversations.stats"; | |
const client = new MongoClient(MONGODB_URL, { | |
directConnection: MONGODB_DIRECT_CONNECTION === "true", | |
}); | |
export const connectPromise = client.connect().catch(console.error); | |
export function getCollections(mongoClient: MongoClient) { | |
const db = mongoClient.db(MONGODB_DB_NAME + (import.meta.env.MODE === "test" ? "-test" : "")); | |
const conversations = db.collection<Conversation>("conversations"); | |
const conversationStats = db.collection<ConversationStats>(CONVERSATION_STATS_COLLECTION); | |
const assistants = db.collection<Assistant>("assistants"); | |
const assistantStats = db.collection<AssistantStats>("assistants.stats"); | |
const reports = db.collection<Report>("reports"); | |
const sharedConversations = db.collection<SharedConversation>("sharedConversations"); | |
const abortedGenerations = db.collection<AbortedGeneration>("abortedGenerations"); | |
const settings = db.collection<Settings>("settings"); | |
const users = db.collection<User>("users"); | |
const sessions = db.collection<Session>("sessions"); | |
const messageEvents = db.collection<MessageEvent>("messageEvents"); | |
const bucket = new GridFSBucket(db, { bucketName: "files" }); | |
const migrationResults = db.collection<MigrationResult>("migrationResults"); | |
const semaphores = db.collection<Semaphore>("semaphores"); | |
return { | |
conversations, | |
conversationStats, | |
assistants, | |
assistantStats, | |
reports, | |
sharedConversations, | |
abortedGenerations, | |
settings, | |
users, | |
sessions, | |
messageEvents, | |
bucket, | |
migrationResults, | |
semaphores, | |
}; | |
} | |
const db = client.db(MONGODB_DB_NAME + (import.meta.env.MODE === "test" ? "-test" : "")); | |
const collections = getCollections(client); | |
const { | |
conversations, | |
conversationStats, | |
assistants, | |
assistantStats, | |
reports, | |
sharedConversations, | |
abortedGenerations, | |
settings, | |
users, | |
sessions, | |
messageEvents, | |
semaphores, | |
} = collections; | |
export { client, db, collections }; | |
client.on("open", () => { | |
conversations | |
.createIndex( | |
{ sessionId: 1, updatedAt: -1 }, | |
{ partialFilterExpression: { sessionId: { $exists: true } } } | |
) | |
.catch(console.error); | |
conversations | |
.createIndex( | |
{ userId: 1, updatedAt: -1 }, | |
{ partialFilterExpression: { userId: { $exists: true } } } | |
) | |
.catch(console.error); | |
conversations | |
.createIndex( | |
{ "message.id": 1, "message.ancestors": 1 }, | |
{ partialFilterExpression: { userId: { $exists: true } } } | |
) | |
.catch(console.error); | |
// To do stats on conversations | |
conversations.createIndex({ updatedAt: 1 }).catch(console.error); | |
// Not strictly necessary, could use _id, but more convenient. Also for stats | |
conversations.createIndex({ createdAt: 1 }).catch(console.error); | |
// To do stats on conversation messages | |
conversations.createIndex({ "messages.createdAt": 1 }, { sparse: true }).catch(console.error); | |
// Unique index for stats | |
conversationStats | |
.createIndex( | |
{ | |
type: 1, | |
"date.field": 1, | |
"date.span": 1, | |
"date.at": 1, | |
distinct: 1, | |
}, | |
{ unique: true } | |
) | |
.catch(console.error); | |
// Allow easy check of last computed stat for given type/dateField | |
conversationStats | |
.createIndex({ | |
type: 1, | |
"date.field": 1, | |
"date.at": 1, | |
}) | |
.catch(console.error); | |
abortedGenerations.createIndex({ updatedAt: 1 }, { expireAfterSeconds: 30 }).catch(console.error); | |
abortedGenerations.createIndex({ conversationId: 1 }, { unique: true }).catch(console.error); | |
sharedConversations.createIndex({ hash: 1 }, { unique: true }).catch(console.error); | |
settings.createIndex({ sessionId: 1 }, { unique: true, sparse: true }).catch(console.error); | |
settings.createIndex({ userId: 1 }, { unique: true, sparse: true }).catch(console.error); | |
settings.createIndex({ assistants: 1 }).catch(console.error); | |
users.createIndex({ hfUserId: 1 }, { unique: true }).catch(console.error); | |
users.createIndex({ sessionId: 1 }, { unique: true, sparse: true }).catch(console.error); | |
// No unicity because due to renames & outdated info from oauth provider, there may be the same username on different users | |
users.createIndex({ username: 1 }).catch(console.error); | |
messageEvents.createIndex({ createdAt: 1 }, { expireAfterSeconds: 60 }).catch(console.error); | |
sessions.createIndex({ expiresAt: 1 }, { expireAfterSeconds: 0 }).catch(console.error); | |
sessions.createIndex({ sessionId: 1 }, { unique: true }).catch(console.error); | |
assistants.createIndex({ createdById: 1, userCount: -1 }).catch(console.error); | |
assistants.createIndex({ userCount: 1 }).catch(console.error); | |
assistants.createIndex({ featured: 1, userCount: -1 }).catch(console.error); | |
assistants.createIndex({ modelId: 1, userCount: -1 }).catch(console.error); | |
assistants.createIndex({ searchTokens: 1 }).catch(console.error); | |
assistants.createIndex({ last24HoursCount: 1 }).catch(console.error); | |
assistantStats | |
// Order of keys is important for the queries | |
.createIndex({ "date.span": 1, "date.at": 1, assistantId: 1 }, { unique: true }) | |
.catch(console.error); | |
reports.createIndex({ assistantId: 1 }).catch(console.error); | |
reports.createIndex({ createdBy: 1, assistantId: 1 }).catch(console.error); | |
// Unique index for semaphore and migration results | |
semaphores.createIndex({ key: 1 }, { unique: true }).catch(console.error); | |
semaphores.createIndex({ createdAt: 1 }, { expireAfterSeconds: 60 }).catch(console.error); | |
}); | |