mirror of
https://github.com/datalab-to/chandra.git
synced 2025-11-29 08:33:13 +00:00
Compare commits
1 Commits
v0.1.2
...
settings-f
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
eaa31d169d |
```diff
@@ -73,7 +73,7 @@ def load_model():
         "dtype": settings.TORCH_DTYPE,
         "device_map": device_map,
     }
-    if settings.TORCH_ATTN:
+    if settings.TORCH_ATTN_IMPLEMENTATION:
         kwargs["attn_implementation"] = settings.TORCH_ATTN_IMPLEMENTATION
 
     model = Qwen3VLForConditionalGeneration.from_pretrained(
```
```diff
@@ -13,7 +13,7 @@ class Settings(BaseSettings):
     MODEL_CHECKPOINT: str = "datalab-to/chandra"
     TORCH_DEVICE: str | None = None
     MAX_OUTPUT_TOKENS: int = 8192
-    TORCH_ATTN: str | None = None
+    TORCH_ATTN_IMPLEMENTATION: str | None = None
 
     # vLLM server settings
     VLLM_API_KEY: str = "EMPTY"
```
Reference in New Issue
Block a user