Jerry Ji committed on
Commit
8f9976c
·
1 Parent(s): a71693c

Training in progress, epoch 1

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c4851d0fda021876b9eb5ecbd6ec0d108d643bb4b81a517a68af72134d8b407
3
  size 218138576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9dcafb75e33763bcbb1dcac4844987b4bc4804afc8cd5a98e4c454d0a897ab4
3
  size 218138576
all_results.json CHANGED
@@ -1,21 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "eval_logits/chosen": -2.0658671855926514,
4
- "eval_logits/rejected": -1.9411793947219849,
5
- "eval_logps/chosen": -266.13037109375,
6
- "eval_logps/rejected": -228.2694091796875,
7
- "eval_loss": 0.5265706777572632,
8
- "eval_rewards/accuracies": 0.7459999918937683,
9
- "eval_rewards/chosen": -0.1469534933567047,
10
- "eval_rewards/margins": 0.7515553832054138,
11
- "eval_rewards/rejected": -0.8985088467597961,
12
- "eval_runtime": 453.4186,
13
- "eval_samples": 2000,
14
- "eval_samples_per_second": 4.411,
15
- "eval_steps_per_second": 0.276,
16
- "train_loss": 0.5642705829018732,
17
- "train_runtime": 71197.0849,
18
  "train_samples": 61966,
19
- "train_samples_per_second": 2.611,
20
- "train_steps_per_second": 0.041
21
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "train_loss": 0.3465735912322998,
4
+ "train_runtime": 29.428,
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "train_samples": 61966,
6
+ "train_samples_per_second": 0.34,
7
+ "train_steps_per_second": 0.034
8
  }
runs/Dec10_15-50-15_uclaml03.cs.ucla.edu/events.out.tfevents.1702252337.uclaml03.cs.ucla.edu.2934315.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a95af9f0d4bdb525ac33ddcad00eac1c6938a94f290dd586076e256e29c9d409
3
+ size 6089
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 3.0,
3
- "train_loss": 0.5642705829018732,
4
- "train_runtime": 71197.0849,
5
  "train_samples": 61966,
6
- "train_samples_per_second": 2.611,
7
- "train_steps_per_second": 0.041
8
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "train_loss": 0.3465735912322998,
4
+ "train_runtime": 29.428,
5
  "train_samples": 61966,
6
+ "train_samples_per_second": 0.34,
7
+ "train_steps_per_second": 0.034
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff