fix
This commit is contained in:
@@ -5,7 +5,7 @@ from transformers import AutoConfig
|
||||
@dataclass
|
||||
class Config:
|
||||
model: str = ''
|
||||
- max_num_batched_tokens: int = 16384
|
||||
+ max_num_batched_tokens: int = 32768
|
||||
max_num_seqs: int = 512
|
||||
max_model_len: int = 4096
|
||||
gpu_memory_utilization: float = 0.95
|
||||
|
||||
Reference in New Issue
Block a user