Files
lcbp3/specs/03-Data-and-Storage/deltas/2026-06-03-update-ai-available-models-typhoon.sql
admin 3274dede7a
CI / CD Pipeline / build (push) Failing after 4m28s
CI / CD Pipeline / deploy (push) Has been skipped
690603:2041 ADR-034-134 #01
2026-06-03 20:41:42 +07:00

50 lines
1.7 KiB
SQL

-- Delta: Update ai_available_models for Thai-Optimized Model Stack (ADR-034)
-- Date: 2026-06-03
-- Author: AI Assistant
-- Related: ADR-034 — Thai-Optimized AI Model Stack, supersedes ADR-023A Section 2.1
-- Rollback: 2026-06-03-update-ai-available-models-typhoon.rollback.sql
-- 1. Make typhoon2.5-np-dms the default main model and demote the old defaults.
--    Both statements run inside one transaction so the switch is committed as a
--    single unit: if either statement fails, the previous default stays in place
--    (requires a transactional storage engine such as InnoDB).
--    NOTE(review): START TRANSACTION implicitly commits any transaction the
--    calling tool already has open — confirm this delta is applied in autocommit mode.
START TRANSACTION;

-- Demote the previous defaults first so that two rows never carry
-- is_default = TRUE at the same time, not even inside the transaction.
-- NOTE(review): 'typhoon2.1-gemma3-4b' has no ':tag' suffix, unlike the other
-- model names in this file — confirm it matches the stored model_name exactly.
UPDATE ai_available_models
SET
    is_default = FALSE,
    updated_at = NOW()
WHERE model_name IN ('gemma4:e2b', 'gemma4:e4b', 'typhoon2.1-gemma3-4b');

-- Upsert the new main model as active and default.
-- On a duplicate key the existing row is refreshed in place; VALUES(col) refers
-- to the value this INSERT would have written. model_version is not part of the
-- update list, so an existing row keeps its stored version.
-- NOTE(review): presumably a unique key covers model_name — verify against the schema.
INSERT INTO ai_available_models (
    model_name,
    model_version,
    description,
    vram_gb,
    is_active,
    is_default
)
VALUES (
    'typhoon2.5-np-dms:latest',
    'latest',
    'Thai-optimized main AI model based on typhoon2.5-qwen3-4b (~2.5GB VRAM, standby mode) — ADR-034',
    2.50,
    TRUE,
    TRUE
)
ON DUPLICATE KEY UPDATE
    description = VALUES(description),
    vram_gb = VALUES(vram_gb),
    is_active = TRUE,
    is_default = TRUE,
    updated_at = NOW();

COMMIT;
-- 2. Upsert the OCR model (typhoon-np-dms-ocr) as active but NOT default.
--    The original note records keep_alive=0 (unload after each job); this
--    statement does not store that value in ai_available_models.
--    On a duplicate key the existing row is refreshed in place; VALUES(col)
--    refers to the value this INSERT would have written.
INSERT INTO ai_available_models (
    model_name,
    model_version,
    description,
    vram_gb,
    is_active,
    is_default
)
VALUES (
    'typhoon-np-dms-ocr:latest',
    'latest',
    'Thai OCR model based on typhoon-ocr1.5-3b (~3.2GB VRAM, unloads after each job) — ADR-034',
    3.20,
    TRUE,
    FALSE
)
ON DUPLICATE KEY UPDATE
    description = VALUES(description),
    vram_gb = VALUES(vram_gb),
    is_active = TRUE,
    -- Reset the flag explicitly: without this, a pre-existing OCR row that was
    -- marked default would stay default, contradicting the "not default" intent.
    is_default = FALSE,
    updated_at = NOW();
-- 3. Point the AI_ACTIVE_MODEL system setting at the new main model.
--    This is a plain UPDATE: only a row whose setting_key already equals
--    'AI_ACTIVE_MODEL' is changed; no row is inserted when the key is absent.
UPDATE system_settings
SET
    setting_value = 'typhoon2.5-np-dms:latest',
    updated_at = NOW()
WHERE
    setting_key = 'AI_ACTIVE_MODEL';