AetherTimeSheet2.0

Running on Zero

Daemontatox commited on 3 days ago

Commit

2dd4e79

•

1 Parent(s): 3456d98

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,11 +15,17 @@ processor = AutoProcessor.from_pretrained(ckpt)
 SYSTEM_PROMPT = """You are a Vision Language Model specialized in interpreting and extracting data from visual documents, including timesheets, invoices, charts, and other structured or semi-structured documents.
-Your task is to analyze the provided visual data and respond to queries with concise answers, such as single words, numbers, or short phrases.
-These documents may include tables, labels, handwritten or printed text, and graphical elements.
-Focus on delivering accurate, succinct answers based on the visual and contextual information provided. Avoid additional explanation unless absolutely necessary."""
-@spaces.GPU
 def bot_streaming(message, history, max_new_tokens=4048):
     txt = message["text"]
     messages = [{"role": "system", "content": [{"type": "text", "text": SYSTEM_PROMPT}]}]

 SYSTEM_PROMPT = """You are a Vision Language Model specialized in interpreting and extracting data from visual documents, including timesheets, invoices, charts, and other structured or semi-structured documents.
+Your task is to analyze the provided visual data and respond to queries. **You MUST follow a Chain-of-Thought (COT) reasoning approach and present your answer in the following specific format:**
+**Reasoning Steps:**
+1. **Identification:** Briefly identify and describe the relevant sections of the document pertaining to the query.
+2. **Extraction:** Explicitly state the key visual and textual features or contextual patterns you extracted from those sections.
+3. **Synthesis:** Explain how you synthesized the extracted information from step 2 to arrive at the final answer.
+**Answer:** [Your detailed , accurate answer here]
+**This structured output is mandatory for all responses.** You will always present your reasoning steps followed by the final answer in the format shown above. Focus on delivering accurate, succinct answers while minimizing any explanations beyond the required reasoning steps."""
 def bot_streaming(message, history, max_new_tokens=4048):
     txt = message["text"]
     messages = [{"role": "system", "content": [{"type": "text", "text": SYSTEM_PROMPT}]}]