from text_generation import Client import os API_TOKEN = os.environ.get("API_TOKEN") API_URL = "https://api-inference.huggingface.co/models/HuggingFaceM4/idefics-9b-instruct" DECODING_STRATEGY = "Greedy" QUERY = "User: What is in this image?![](https://upload.wikimedia.org/wikipedia/commons/8/86/Id%C3%A9fix.JPG)\nAssistant:" client = Client( base_url=API_URL, headers={"x-use-cache": "0", "Authorization": f"Bearer {API_TOKEN}"}, ) generation_args = { "max_new_tokens": 256, "repetition_penalty": 1.0, "stop_sequences": ["", "\nUser:"], } if DECODING_STRATEGY == "Greedy": generation_args["do_sample"] = False elif DECODING_STRATEGY == "Top P Sampling": generation_args["temperature"] = 1. generation_args["do_sample"] = True generation_args["top_p"] = 0.95 generated_text = client.generate(prompt=QUERY, **generation_args) print(generated_text)