File tree Expand file tree Collapse file tree 1 file changed +3
-3
lines changed
src/lighteval/models/vllm Expand file tree Collapse file tree 1 file changed +3
-3
lines changed Original file line number Diff line number Diff line change 37
37
GenerativeResponse ,
38
38
LoglikelihoodResponse ,
39
39
)
40
- from lighteval .models .utils import _get_dtype , _simplify_name
40
+ from lighteval .models .utils import _simplify_name
41
41
from lighteval .tasks .requests import (
42
42
GreedyUntilRequest ,
43
43
LoglikelihoodRequest ,
@@ -78,7 +78,7 @@ class VLLMModelConfig:
78
78
pretrained : str
79
79
gpu_memory_utilization : float = 0.9 # lower this if you are running out of memory
80
80
revision : str = "main" # revision of the model
81
- dtype : str | None = None
81
+ dtype : str = "bfloat16"
82
82
tensor_parallel_size : int = 1 # how many GPUs to use for tensor parallelism
83
83
pipeline_parallel_size : int = 1 # how many GPUs to use for pipeline parallelism
84
84
data_parallel_size : int = 1 # how many GPUs to use for data parallelism
@@ -128,7 +128,7 @@ def __init__(
128
128
129
129
self .model_name = _simplify_name (config .pretrained )
130
130
self .model_sha = "" # config.get_model_sha()
131
- self .precision = _get_dtype ( config .dtype , config = self . _config )
131
+ self .precision = config .dtype
132
132
133
133
self .model_info = ModelInfo (model_name = self .model_name , model_sha = self .model_sha )
134
134
self .pairwise_tokenization = config .pairwise_tokenization
You can’t perform that action at this time.
0 commit comments