Update src/model_loader.py
Browse files
- src/model_loader.py +0 -10
src/model_loader.py
CHANGED
|
@@ -1,14 +1,4 @@
|
|
| 1 |
# src/model_loader.py
|
| 2 |
-
# -----------------------------------------------------------------------------
|
| 3 |
-
# Why this change
|
| 4 |
-
# -----------------------------------------------------------------------------
|
| 5 |
-
# - Fix fallback model id → 'google/medgemma-4b-text-it' (previous typo caused
|
| 6 |
-
# CPU-only runs to fail).
|
| 7 |
-
# - Keep primary on GPU in 4-bit (bnb, nf4) when available; otherwise fallback.
|
| 8 |
-
# - Provide a single generate_chat(messages, **gen_kwargs) entry point with
|
| 9 |
-
# consistent logging and without relying on chat templates (manual prompt).
|
| 10 |
-
# - Lightweight logs show model choice, cache path, and generation time.
|
| 11 |
-
# -----------------------------------------------------------------------------
|
| 12 |
|
| 13 |
from __future__ import annotations
|
| 14 |
|
|
|
|
| 1 |
# src/model_loader.py
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
|
| 3 |
from __future__ import annotations
|
| 4 |
|