Upload Healthcare-SLM v2
Browse files
config.py
CHANGED
|
@@ -43,8 +43,8 @@ class SLMConfig:
|
|
| 43 |
ffn_multiplier: float = 2.667
|
| 44 |
|
| 45 |
# ── RoPE ───────────────────────────────────────────────────────
|
| 46 |
-
max_position_embeddings: int =
|
| 47 |
-
rope_theta: float =
|
| 48 |
|
| 49 |
# ── Sliding Window ─────────────────────────────────────────────
|
| 50 |
sliding_window: Optional[int] = None
|
|
@@ -64,7 +64,7 @@ class SLMConfig:
|
|
| 64 |
device: str = "auto"
|
| 65 |
|
| 66 |
# ── Generation ─────────────────────────────────────────────────
|
| 67 |
-
max_new_tokens: int =
|
| 68 |
temperature: float = 0.8
|
| 69 |
top_k: int = 50
|
| 70 |
top_p: float = 0.9
|
|
|
|
| 43 |
ffn_multiplier: float = 2.667
|
| 44 |
|
| 45 |
# ── RoPE ───────────────────────────────────────────────────────
|
| 46 |
+
max_position_embeddings: int = 100_000_000_000 # 100B tokens via RoPE
|
| 47 |
+
rope_theta: float = 50_000_000_000.0 # Scaled for 100B context
|
| 48 |
|
| 49 |
# ── Sliding Window ─────────────────────────────────────────────
|
| 50 |
sliding_window: Optional[int] = None
|
|
|
|
| 64 |
device: str = "auto"
|
| 65 |
|
| 66 |
# ── Generation ─────────────────────────────────────────────────
|
| 67 |
+
max_new_tokens: int = 1_000_000 # 1M output tokens
|
| 68 |
temperature: float = 0.8
|
| 69 |
top_k: int = 50
|
| 70 |
top_p: float = 0.9
|