johann22 committed on
Commit
b34cc6a
1 Parent(s): 9ee0176

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +26 -39
app.py CHANGED
@@ -1,39 +1,26 @@
1
- import torch
2
- from transformers import IdeficsForVisionText2Text, AutoProcessor
3
-
4
- device = "cuda" if torch.cuda.is_available() else "cpu"
5
-
6
- checkpoint = "HuggingFaceM4/idefics-9b-instruct"
7
- model = IdeficsForVisionText2Text.from_pretrained(checkpoint, torch_dtype=torch.bfloat16).to(device)
8
- processor = AutoProcessor.from_pretrained(checkpoint)
9
-
10
- # We feed to the model an arbitrary sequence of text strings and images. Images can be either URLs or PIL Images.
11
- prompts = [
12
- [
13
- "User: What is in this image?",
14
- "https://upload.wikimedia.org/wikipedia/commons/8/86/Id%C3%A9fix.JPG",
15
- "<end_of_utterance>",
16
-
17
- "\nAssistant: This picture depicts Idefix, the dog of Obelix in Asterix and Obelix. Idefix is running on the ground.<end_of_utterance>",
18
-
19
- "\nUser:",
20
- "https://static.wikia.nocookie.net/asterix/images/2/25/R22b.gif/revision/latest?cb=20110815073052",
21
- "And who is that?<end_of_utterance>",
22
-
23
- "\nAssistant:",
24
- ],
25
- ]
26
-
27
- # --batched mode
28
- inputs = processor(prompts, add_end_of_utterance_token=False, return_tensors="pt").to(device)
29
- # --single sample mode
30
- # inputs = processor(prompts[0], return_tensors="pt").to(device)
31
-
32
- # Generation args
33
- exit_condition = processor.tokenizer("<end_of_utterance>", add_special_tokens=False).input_ids
34
- bad_words_ids = processor.tokenizer(["<image>", "<fake_token_around_image>"], add_special_tokens=False).input_ids
35
-
36
- generated_ids = model.generate(**inputs, eos_token_id=exit_condition, bad_words_ids=bad_words_ids, max_length=100)
37
- generated_text = processor.batch_decode(generated_ids, skip_special_tokens=True)
38
- for i, t in enumerate(generated_text):
39
- print(f"{i}:\n{t}\n")
 
1
from text_generation import Client

# NOTE(review): API_TOKEN is an empty placeholder — supply a valid Hugging Face
# token before running, or the Inference API request will be rejected.
API_TOKEN = ""
API_URL = "https://api-inference.huggingface.co/models/HuggingFaceM4/idefics-80b-instruct"
DECODING_STRATEGY = "Greedy"
# Prompt follows the IDEFICS instruct chat format: image given as a markdown
# image link, turn closed with the model's <end_of_utterance> token.
QUERY = "User: What is in this image?![](https://upload.wikimedia.org/wikipedia/commons/8/86/Id%C3%A9fix.JPG)<end_of_utterance>\nAssistant:"

client = Client(
    base_url=API_URL,
    # x-use-cache: 0 disables the Inference API response cache so every call
    # actually hits the model.
    headers={"x-use-cache": "0", "Authorization": f"Bearer {API_TOKEN}"},
)

# Arguments shared by both decoding strategies.
generation_args = {
    "max_new_tokens": 256,
    "repetition_penalty": 1.0,
    # Stop at end-of-utterance, or if the model starts hallucinating a new
    # user turn.
    "stop_sequences": ["<end_of_utterance>", "\nUser:"],
}

if DECODING_STRATEGY == "Greedy":
    generation_args["do_sample"] = False
elif DECODING_STRATEGY == "Top P Sampling":
    generation_args["temperature"] = 1.
    generation_args["do_sample"] = True
    generation_args["top_p"] = 0.95

# FIX: Client.generate returns a Response dataclass, not a string. Printing
# the response object dumps the whole dataclass repr (generation details,
# tokens, seed, ...); the generated text lives in its .generated_text field.
response = client.generate(prompt=QUERY, **generation_args)
generated_text = response.generated_text
print(generated_text)