diff --git a/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/ocr-sidecar/app.py b/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/ocr-sidecar/app.py index 2238a17f..5eb62be9 100644 --- a/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/ocr-sidecar/app.py +++ b/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/ocr-sidecar/app.py @@ -238,7 +238,7 @@ def process_with_typhoon_ocr(pil_image: Image.Image, options_override: dict = {} "top_p": 0.1, "repeat_penalty": 1.1, "num_gpu": 99, # บังคับ GPU layers สูงสุด — ป้องกัน Ollama fallback ไป CPU โดยไม่จำเป็น - "num_ctx": 2048, # ลด KV cache + compute graph จาก 6.7 GiB → ~1.7 GiB เพื่อให้ model fit ใน VRAM 8GB + "num_ctx": 4096, # image tokens ~2772 → ต้องการ context > 2048; 4096 รองรับ image + output โดยไม่ truncate **options_override, } payload = { diff --git a/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/typhoon-np-dms-ocr.model.md b/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/typhoon-np-dms-ocr.model.md index 7fbaee81..a82b6364 100644 --- a/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/typhoon-np-dms-ocr.model.md +++ b/specs/04-Infrastructure-OPS/04-00-docker-compose/Desk-5439/typhoon-np-dms-ocr.model.md @@ -1,6 +1,6 @@ FROM scb10x/typhoon-ocr1.5-3b:latest -PARAMETER num_ctx 2048 +PARAMETER num_ctx 4096 PARAMETER num_predict 2048 PARAMETER temperature 0.1 PARAMETER top_p 0.1