Spaces:
Runtime error
Runtime error
import os
from typing import Any, List, Mapping, Optional

import requests
import urllib3
from langchain.callbacks.manager import CallbackManagerForLLMRun
from langchain.llms.base import LLM
from pydantic import Extra

# Requests below are sent with verify=False; silence the warning urllib3
# would otherwise emit for each unverified HTTPS request.
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
class URALLM(LLM):
    """LangChain ``LLM`` wrapper that forwards prompts to a remote HTTP endpoint.

    The endpoint URL is read from the ``URL`` environment variable when the
    class body is evaluated. The ``Authorization`` header value is read from
    the ``TOKEN`` environment variable on every call.
    """

    # Explicit annotation: when ``URL`` is unset the default is ``None`` and
    # pydantic cannot infer a field type from an un-annotated ``None``.
    llm_url: Optional[str] = os.environ.get("URL")

    class Config:
        # Reject any constructor keyword that is not a declared field.
        extra = Extra.forbid

    @property
    def _llm_type(self) -> str:
        """Return the type tag of this LLM implementation."""
        return "URALLM"

    def _call(
        self,
        inputs: str,
        stop: Optional[List[str]] = None,
        run_manager: Optional[CallbackManagerForLLMRun] = None,
        **kwargs: Any,
    ) -> str:
        """POST the prompt to ``llm_url`` and return the generated text.

        Args:
            inputs: Prompt text, sent as the ``"inputs"`` field of the payload.
            stop: Must be ``None``; stop sequences are not supported.
            run_manager: Accepted for interface compatibility; not used.
            **kwargs: Accepted for interface compatibility; not used.

        Returns:
            The ``"generated_text"`` entry of the JSON response body.

        Raises:
            ValueError: If ``stop`` is not ``None``.
            requests.HTTPError: If the endpoint answers with an error status.
        """
        if stop is not None:
            raise ValueError("stop kwargs are not permitted.")

        payload = {
            "inputs": inputs,
            "parameters": {
                "max_new_tokens": 512,
                "temperature": 0.01,
                "repetition_penalty": 1.1,
                "do_sample": True,
                "top_k": 10,
            },
        }
        headers = {
            "Content-Type": "application/json",
            "Authorization": os.environ.get("TOKEN"),
        }

        # NOTE(review): verify=False disables TLS certificate verification, and
        # no timeout is passed, so a stalled endpoint blocks this call
        # indefinitely. Both are kept as in the original; confirm they are
        # intentional for this deployment.
        response = requests.post(
            self.llm_url, json=payload, headers=headers, verify=False
        )
        response.raise_for_status()

        # The response body is indexed as a JSON object with a
        # "generated_text" key.
        return response.json()["generated_text"]

    @property
    def _identifying_params(self) -> Mapping[str, Any]:
        """Get the identifying parameters."""
        return {"llmUrl": self.llm_url}