From 99b023d195f0cbd0f848f2a609452bfc86517ac8 Mon Sep 17 00:00:00 2001 From: William Pietri Date: Thu, 14 Nov 2024 05:13:42 -0800 Subject: [PATCH] A Huggingface endpoint broke; this uses the replacement endpoint. (#686) --- .../huggingface/modelgauge/suts/huggingface_chat_completion.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/plugins/huggingface/modelgauge/suts/huggingface_chat_completion.py b/plugins/huggingface/modelgauge/suts/huggingface_chat_completion.py index 378be005..12e1add4 100644 --- a/plugins/huggingface/modelgauge/suts/huggingface_chat_completion.py +++ b/plugins/huggingface/modelgauge/suts/huggingface_chat_completion.py @@ -1,5 +1,6 @@ from dataclasses import asdict from typing import Dict, List, Optional + from huggingface_hub import get_inference_endpoint, InferenceClient, InferenceEndpointStatus # type: ignore from huggingface_hub.utils import HfHubHTTPError # type: ignore from pydantic import BaseModel @@ -128,7 +129,7 @@ def translate_response( SUTS.register( HuggingFaceChatCompletionSUT, "gemma-2-9b-it-hf", - "gemma-2-9b-it-qfa", + "gemma-2-9b-it-plf", HF_SECRET, )