sathishphdai committed on
Commit
8cf7869
·
verified ·
1 Parent(s): 2a36c8b

Upload Healthcare-SLM v2

Browse files
Files changed (1) hide show
  1. config.py +3 -3
config.py CHANGED
@@ -43,8 +43,8 @@ class SLMConfig:
43
  ffn_multiplier: float = 2.667
44
 
45
  # ── RoPE ───────────────────────────────────────────────────────
46
- max_position_embeddings: int = 1_000_000
47
- rope_theta: float = 500000.0
48
 
49
  # ── Sliding Window ─────────────────────────────────────────────
50
  sliding_window: Optional[int] = None
@@ -64,7 +64,7 @@ class SLMConfig:
64
  device: str = "auto"
65
 
66
  # ── Generation ─────────────────────────────────────────────────
67
- max_new_tokens: int = 1024
68
  temperature: float = 0.8
69
  top_k: int = 50
70
  top_p: float = 0.9
 
43
  ffn_multiplier: float = 2.667
44
 
45
  # ── RoPE ───────────────────────────────────────────────────────
46
+ max_position_embeddings: int = 100_000_000_000 # 100B tokens via RoPE
47
+ rope_theta: float = 50_000_000_000.0 # Scaled for 100B context
48
 
49
  # ── Sliding Window ─────────────────────────────────────────────
50
  sliding_window: Optional[int] = None
 
64
  device: str = "auto"
65
 
66
  # ── Generation ─────────────────────────────────────────────────
67
+ max_new_tokens: int = 1_000_000 # 1M output tokens
68
  temperature: float = 0.8
69
  top_k: int = 50
70
  top_p: float = 0.9