Training in progress, step 200
Browse files- model.safetensors +1 -1
- reward_data/all_rewards.csv +2 -2
- reward_plots/advantage_plot_step_150.png +0 -0
- reward_plots/advantage_plot_step_160.png +0 -0
- reward_plots/advantage_plot_step_170.png +0 -0
- reward_plots/advantage_plot_step_180.png +0 -0
- reward_plots/advantage_plot_step_190.png +0 -0
- reward_plots/reward_comparison_step_150.png +0 -0
- reward_plots/reward_comparison_step_160.png +0 -0
- reward_plots/reward_comparison_step_170.png +0 -0
- reward_plots/reward_comparison_step_180.png +0 -0
- reward_plots/reward_comparison_step_190.png +0 -0
- training_args.bin +1 -1
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3554214752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bd5edfcc9cd8360d40be777e38400fbb09142ebfeebe305d37dfac3dd5ef29f
|
| 3 |
size 3554214752
|
reward_data/all_rewards.csv
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:201db9aeafea34bffbbed038550d9ee9c0601060d195574adcaff84f32fc9e38
|
| 3 |
+
size 162266208
|
reward_plots/advantage_plot_step_150.png
ADDED
|
reward_plots/advantage_plot_step_160.png
ADDED
|
reward_plots/advantage_plot_step_170.png
ADDED
|
reward_plots/advantage_plot_step_180.png
ADDED
|
reward_plots/advantage_plot_step_190.png
ADDED
|
reward_plots/reward_comparison_step_150.png
ADDED
|
reward_plots/reward_comparison_step_160.png
ADDED
|
reward_plots/reward_comparison_step_170.png
ADDED
|
reward_plots/reward_comparison_step_180.png
ADDED
|
reward_plots/reward_comparison_step_190.png
ADDED
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 8504
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c35427105f08dd66e4f9765e50c93467db2ad339acfa5baa425376f928e85763
|
| 3 |
size 8504
|