Spaces:
Runtime error
Runtime error
Added option to name an inference endpoint so it is human readable
Browse files- src/architectures.py +4 -2
src/architectures.py
CHANGED
@@ -369,8 +369,9 @@ class HFInferenceEndpoint(ArchitectureComponent):
|
|
369 |
A concrete pipeline component which sends the user text to a given llama chat based
|
370 |
inference endpoint on HuggingFace
|
371 |
"""
|
372 |
-
def __init__(self, endpoint_url: str, system_prompt: str, max_new_tokens: int, temperature: float = 1.0):
|
373 |
self.endpoint_url: str = endpoint_url
|
|
|
374 |
self.system_prompt: str = system_prompt
|
375 |
self.max_new_tokens = max_new_tokens
|
376 |
self.api_token = hf_api_token()
|
@@ -380,7 +381,8 @@ class HFInferenceEndpoint(ArchitectureComponent):
|
|
380 |
"""
|
381 |
Custom config details as markdown
|
382 |
"""
|
383 |
-
desc = ""
|
|
|
384 |
desc += f"Max tokens: {self.max_new_tokens}; "
|
385 |
desc += f"Temperature: {self.temperature}; "
|
386 |
desc += f"System prompt: {self.system_prompt}"
|
|
|
369 |
A concrete pipeline component which sends the user text to a given llama chat based
|
370 |
inference endpoint on HuggingFace
|
371 |
"""
|
372 |
+
def __init__(self, endpoint_url: str, model_name: str, system_prompt: str, max_new_tokens: int, temperature: float = 1.0):
|
373 |
self.endpoint_url: str = endpoint_url
|
374 |
+
self.model_name: str = model_name
|
375 |
self.system_prompt: str = system_prompt
|
376 |
self.max_new_tokens = max_new_tokens
self.temperature: float = temperature
|
377 |
self.api_token = hf_api_token()
|
|
|
381 |
"""
|
382 |
Custom config details as markdown
|
383 |
"""
|
384 |
+
desc = f"Model: {self.model_name}; "
|
385 |
+
desc += f"Endpoint: {self.endpoint_url}; "
|
386 |
desc += f"Max tokens: {self.max_new_tokens}; "
|
387 |
desc += f"Temperature: {self.temperature}; "
|
388 |
desc += f"System prompt: {self.system_prompt}"
|