docs(ocr): update provider schema comments with more details

Add more context about the ID format for custom providers and clarify name usage for built-in providers. Explain JSON config validation requirements and mark timestamps as potentially unused.
2025-12-24 18:50:56 +08:00 · 2025-10-20 00:48:40 +08:00 · 2025-10-20 00:48:40 +08:00 · ab7fed8907
commit ab7fed8907
parent ec68886e4a
1 changed files with 6 additions and 2 deletions
--- a/src/main/data/db/schemas/ocr/provider.ts
+++ b/src/main/data/db/schemas/ocr/provider.ts
@@ -9,13 +9,14 @@ export const ocrProviderTable = sqliteTable(
    /**
     * Unique identifier for the provider.
     * For built-in providers, it's 'tesseract', 'system', etc.
-     * For custom providers, it can be any unique string.
+     * For custom providers, it can be any unique string (we typically use UUID v4).
     * As the primary key, it ensures the uniqueness of each provider.
     */
    id: text('id').primaryKey(),

    /**
     * Display name of the provider, e.g., "Tesseract OCR".
+     * For built-in providers, this value is used internally and is not exposed to users; the display name shown in the UI is localized via i18n.
     * Cannot be null.
     */
    name: text('name').notNull(),
@@ -32,11 +33,14 @@ export const ocrProviderTable = sqliteTable(
     * Provider-specific configuration. This is a polymorphic field, its structure varies by provider type.
     * For example, Tesseract's configuration is entirely different from PaddleOCR's.
     * Storing it as JSON is the most flexible approach to accommodate any configuration structure.
+     * Since this is a polymorphic field, both frontend and backend must validate
+     * that the structure matches the expected schema for the corresponding provider type
+     * before saving.
     * This field is nullable because `config` in the `OcrProvider` type is optional.
     */
    config: text('config', { mode: 'json' }).$type<OcrProviderConfig>(),

-    /** Timestamps. */
+    /** Timestamps. May not be useful. */
    ...createUpdateTimestamps
  },
  (t) => [index('name').on(t.name)]