Spaces:

johann22
/

idefics-stream

Runtime error

idefics-stream / app.py

Update app.py

ed0e96f 12 months ago

931 Bytes

	from text_generation import Client
	import os

	# --- Configuration -------------------------------------------------------
	# API_TOKEN comes from the environment; os.environ.get returns None when the
	# variable is not set.
	API_TOKEN = os.environ.get("API_TOKEN")
	API_URL = "https://api-inference.huggingface.co/models/HuggingFaceM4/idefics-9b-instruct"
	# Selects which sampling arguments are added below. The two values handled
	# by this script are "Greedy" and "Top P Sampling"; any other value leaves
	# the sampling arguments unset.
	DECODING_STRATEGY = "Greedy"
	# Prompt sent to the model: a user turn with an inline markdown image link,
	# terminated by <end_of_utterance>, followed by the "Assistant:" cue.
	QUERY = "User: What is in this image?![](https://upload.wikimedia.org/wikipedia/commons/8/86/Id%C3%A9fix.JPG)<end_of_utterance>\nAssistant:"

	# --- Client setup --------------------------------------------------------
	# NOTE(review): "x-use-cache: 0" presumably disables the hosted API's
	# response cache -- confirm against the Inference API documentation.
	request_headers = {"x-use-cache": "0"}
	if API_TOKEN:
	    # Only attach credentials when a token is configured; otherwise the
	    # header would be the literal string "Bearer None".
	    request_headers["Authorization"] = f"Bearer {API_TOKEN}"

	client = Client(base_url=API_URL, headers=request_headers)

	# --- Generation arguments ------------------------------------------------
	generation_args = {
	    "max_new_tokens": 256,
	    "repetition_penalty": 1.0,
	    # Stop at the end of the assistant turn or if a new user turn starts.
	    "stop_sequences": ["<end_of_utterance>", "\nUser:"],
	}

	if DECODING_STRATEGY == "Greedy":
	    generation_args["do_sample"] = False
	elif DECODING_STRATEGY == "Top P Sampling":
	    generation_args["temperature"] = 1.0
	    generation_args["do_sample"] = True
	    generation_args["top_p"] = 0.95

	# --- Run the request -----------------------------------------------------
	# client.generate returns a response object; the generated string is its
	# `generated_text` attribute, so extract it instead of printing the object.
	response = client.generate(prompt=QUERY, **generation_args)
	generated_text = response.generated_text
	print(generated_text)