Spaces:
Running
Running
Upload 3 files
Browse files
DeepLearning/w9-qna/results/round3/training_logs.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
[{"loss": 0.5258, "grad_norm": 18.963003158569336, "learning_rate": 3.3374896093100582e-06, "epoch": 1.0, "step": 401}, {"eval_loss": 1.0631824731826782, "eval_exact_match": 73.66003062787136, "eval_f1": 82.79254847168508, "eval_runtime": 4.8928, "eval_samples_per_second": 133.461, "eval_steps_per_second": 8.38, "epoch": 1.0, "step": 401}, {"loss": 0.4471, "grad_norm": 23.054668426513672, "learning_rate": 1.6708229426433918e-06, "epoch": 2.0, "step": 802}, {"eval_loss": 1.107834815979004, "eval_exact_match": 73.20061255742726, "eval_f1": 82.10420088525576, "eval_runtime": 4.9337, "eval_samples_per_second": 132.356, "eval_steps_per_second": 8.31, "epoch": 2.0, "step": 802}, {"loss": 0.408, "grad_norm": 7.869227886199951, "learning_rate": 4.156275976724855e-09, "epoch": 3.0, "step": 1203}, {"eval_loss": 1.1187056303024292, "eval_exact_match": 73.20061255742726, "eval_f1": 82.10358379374121, "eval_runtime": 4.9137, "eval_samples_per_second": 132.894, "eval_steps_per_second": 8.344, "epoch": 3.0, "step": 1203}, {"train_runtime": 451.6812, "train_samples_per_second": 42.568, "train_steps_per_second": 2.663, "total_flos": 1884050365736448.0, "train_loss": 0.460304228544037, "epoch": 3.0, "step": 1203}]
|
DeepLearning/w9-qna/results/round4/training_logs.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
[{"loss": 0.5764, "grad_norm": 16.149080276489258, "learning_rate": 2.5341629505209035e-05, "epoch": 1.0, "step": 401}, {"eval_loss": 1.0490880012512207, "eval_exact_match": 70.44410413476264, "eval_f1": 79.7864129562234, "eval_runtime": 5.0132, "eval_samples_per_second": 130.255, "eval_steps_per_second": 8.178, "epoch": 1.0, "step": 401}, {"loss": 0.3658, "grad_norm": 16.622486114501953, "learning_rate": 9.109201741722674e-06, "epoch": 2.0, "step": 802}, {"eval_loss": 1.2295763492584229, "eval_exact_match": 69.67840735068913, "eval_f1": 79.44645919529016, "eval_runtime": 5.0933, "eval_samples_per_second": 128.207, "eval_steps_per_second": 8.05, "epoch": 2.0, "step": 802}, {"loss": 0.2119, "grad_norm": 7.273800849914551, "learning_rate": 6.322752502396778e-11, "epoch": 3.0, "step": 1203}, {"eval_loss": 1.3621764183044434, "eval_exact_match": 70.59724349157733, "eval_f1": 80.07283157510818, "eval_runtime": 5.0306, "eval_samples_per_second": 129.805, "eval_steps_per_second": 8.15, "epoch": 3.0, "step": 1203}, {"train_runtime": 461.2654, "train_samples_per_second": 41.683, "train_steps_per_second": 2.608, "total_flos": 1884050365736448.0, "train_loss": 0.38471311345659287, "epoch": 3.0, "step": 1203}]
|
DeepLearning/w9-qna/results/training_logs.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
[{"loss": 0.
|
|
|
|
| 1 |
+
[{"loss": 0.5764, "grad_norm": 16.149080276489258, "learning_rate": 2.5341629505209035e-05, "epoch": 1.0, "step": 401}, {"eval_loss": 1.0490880012512207, "eval_exact_match": 70.44410413476264, "eval_f1": 79.7864129562234, "eval_runtime": 5.0132, "eval_samples_per_second": 130.255, "eval_steps_per_second": 8.178, "epoch": 1.0, "step": 401}, {"loss": 0.3658, "grad_norm": 16.622486114501953, "learning_rate": 9.109201741722674e-06, "epoch": 2.0, "step": 802}, {"eval_loss": 1.2295763492584229, "eval_exact_match": 69.67840735068913, "eval_f1": 79.44645919529016, "eval_runtime": 5.0933, "eval_samples_per_second": 128.207, "eval_steps_per_second": 8.05, "epoch": 2.0, "step": 802}, {"loss": 0.2119, "grad_norm": 7.273800849914551, "learning_rate": 6.322752502396778e-11, "epoch": 3.0, "step": 1203}, {"eval_loss": 1.3621764183044434, "eval_exact_match": 70.59724349157733, "eval_f1": 80.07283157510818, "eval_runtime": 5.0306, "eval_samples_per_second": 129.805, "eval_steps_per_second": 8.15, "epoch": 3.0, "step": 1203}, {"train_runtime": 461.2654, "train_samples_per_second": 41.683, "train_steps_per_second": 2.608, "total_flos": 1884050365736448.0, "train_loss": 0.38471311345659287, "epoch": 3.0, "step": 1203}]
|