Skip to content

Commit 9bf8cf4

Browse files
Added revision parameter for Inference Endpoint deployment (#127)
1 parent 8f7c59d commit 9bf8cf4

File tree

3 files changed

+4
-0
lines changed

3 files changed

+4
-0
lines changed

run_evals_accelerate.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -71,6 +71,7 @@ def get_parser():
7171
parser.add_argument("--inference_server_auth", type=str, default=None)
7272
# Model type 3) Inference endpoints
7373
task_type_group.add_argument("--endpoint_model_name", type=str)
74+
parser.add_argument("--revision", type=str)
7475
parser.add_argument("--accelerator", type=str, default=None)
7576
parser.add_argument("--vendor", type=str, default=None)
7677
parser.add_argument("--region", type=str, default=None)

src/lighteval/models/endpoint_model.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -70,6 +70,7 @@ def __init__(
7070
self.endpoint: InferenceEndpoint = create_inference_endpoint(
7171
name=config.name,
7272
repository=config.repository,
73+
revision=config.revision,
7374
framework=config.framework,
7475
task="text-generation",
7576
accelerator=config.accelerator,

src/lighteval/models/model_config.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -238,6 +238,7 @@ class InferenceEndpointModelConfig:
238238
endpoint_type: str = "protected"
239239
should_reuse_existing: bool = False
240240
add_special_tokens: bool = True
241+
revision: str = "main"
241242

242243
def get_dtype_args(self) -> Dict[str, str]:
243244
model_dtype = self.model_dtype.lower()
@@ -296,6 +297,7 @@ def create_model_config(args: Namespace, accelerator: Union["Accelerator", None]
296297
instance_type=args.instance_type,
297298
should_reuse_existing=args.reuse_existing,
298299
model_dtype=args.model_dtype,
300+
revision=args.revision or "main",
299301
)
300302
return InferenceModelConfig(model=args.endpoint_model_name)
301303

0 commit comments

Comments
 (0)