DEADLOCK007X committed on
Commit
dc037ee
·
1 Parent(s): ec5407e

Reinitialize repository at backend level with ai_evaluator and services

Browse files
Files changed (2) hide show
  1. .gitattributes +0 -35
  2. tinyllama_inference.py +16 -14
.gitattributes DELETED
@@ -1,35 +0,0 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tinyllama_inference.py CHANGED
@@ -14,15 +14,27 @@ def load_model():
14
  model = AutoModelForCausalLM.from_pretrained(model_name)
15
  return tokenizer, model
16
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  def evaluate_code(question, code):
18
- # Revised prompt with explicit instructions about arithmetic correctness.
19
  prompt = f"""You are an expert code evaluator.
20
  Evaluate the following solution for the given problem.
21
  The problem asks for a function that returns the square of a number.
22
  A correct solution must multiply the number by itself (using x*x or x**2).
23
  If the solution uses any other operation (such as addition), it is completely incorrect.
24
  Rate the solution as follows:
25
- - 5 stars: Perfect solution; the solution is correct, efficient, and follows best practices.
26
  - 4 stars: Correct solution with minor issues.
27
  - 3 stars: Partially correct solution with noticeable issues.
28
  - 2 stars: Incorrect solution with some correct elements.
@@ -49,22 +61,12 @@ Your response:"""
49
  response_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
50
  print("Raw model response:", response_text) # Debug output
51
 
52
- # Extract JSON: use regex to capture all JSON blocks and select one with expected keys
53
- matches = re.findall(r'\{.*?\}', response_text, re.DOTALL)
54
- result = None
55
- for m in reversed(matches):
56
- try:
57
- temp = json.loads(m)
58
- if isinstance(temp, dict) and "stars" in temp and "feedback" in temp:
59
- result = temp
60
- break
61
- except Exception:
62
- continue
63
  if result is None:
64
  result = {"stars": 0, "feedback": "Evaluation failed. Unable to extract valid JSON from AI response."}
65
-
66
  return result
67
 
 
68
  if __name__ == "__main__":
69
  import sys
70
  if len(sys.argv) < 3:
 
14
  model = AutoModelForCausalLM.from_pretrained(model_name)
15
  return tokenizer, model
16
 
17
+ def extract_json(response_text):
18
+ # Attempt to extract all JSON blocks (non-greedy, with DOTALL)
19
+ matches = re.findall(r'\{.*?\}', response_text, re.DOTALL)
20
+ for m in reversed(matches):
21
+ try:
22
+ temp = json.loads(m)
23
+ if isinstance(temp, dict) and "stars" in temp and "feedback" in temp:
24
+ return temp
25
+ except Exception:
26
+ continue
27
+ return None
28
+
29
  def evaluate_code(question, code):
30
+ # Revised prompt that explicitly states the expected arithmetic operation for square.
31
  prompt = f"""You are an expert code evaluator.
32
  Evaluate the following solution for the given problem.
33
  The problem asks for a function that returns the square of a number.
34
  A correct solution must multiply the number by itself (using x*x or x**2).
35
  If the solution uses any other operation (such as addition), it is completely incorrect.
36
  Rate the solution as follows:
37
+ - 5 stars: Perfect solution; correct, efficient, and follows best practices.
38
  - 4 stars: Correct solution with minor issues.
39
  - 3 stars: Partially correct solution with noticeable issues.
40
  - 2 stars: Incorrect solution with some correct elements.
 
61
  response_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
62
  print("Raw model response:", response_text) # Debug output
63
 
64
+ result = extract_json(response_text)
 
 
 
 
 
 
 
 
 
 
65
  if result is None:
66
  result = {"stars": 0, "feedback": "Evaluation failed. Unable to extract valid JSON from AI response."}
 
67
  return result
68
 
69
+ # For direct command-line testing.
70
  if __name__ == "__main__":
71
  import sys
72
  if len(sys.argv) < 3: