artarif/llm-course-hw2-reward-model-trainer
Browse files- README.md +1 -1
- model.safetensors +1 -1
- training_args.bin +1 -1
README.md
CHANGED
@@ -35,7 +35,7 @@ This model was trained with Reward.
|
|
35 |
|
36 |
### Framework versions
|
37 |
|
38 |
-
- TRL: 0.
|
39 |
- Transformers: 4.49.0
|
40 |
- Pytorch: 2.6.0+cu124
|
41 |
- Datasets: 3.4.1
|
|
|
35 |
|
36 |
### Framework versions
|
37 |
|
38 |
+
- TRL: 0.16.0
|
39 |
- Transformers: 4.49.0
|
40 |
- Pytorch: 2.6.0+cu124
|
41 |
- Datasets: 3.4.1
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 538092792
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:844bd0aa41ab1475af0c5ddab41b720d93891db452f2654ad0e4c2539497c69c
|
3 |
size 538092792
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5368
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08ab124f486b4e119a41d214d5dae2296647e5dffeb189f2fb2ad7e2cbc000d5
|
3 |
size 5368
|