flan-t5-small-compression-v2 / trainer_log_history.csv
dotslashderek's picture
Training in progress, epoch 1
af48b5e verified
loss,grad_norm,learning_rate,epoch,step,eval_loss,eval_rouge1,eval_rouge2,eval_rougeL,eval_rougeLsum,eval_comp_ratio_mean,eval_comp_ratio_p90,eval_pct_violations,eval_runtime,eval_samples_per_second,eval_steps_per_second,train_runtime,train_samples_per_second,train_steps_per_second,total_flos,train_loss
1.2576,4.137552261352539,9.993726474278545e-05,1.0,1594,,,,,,,,,,,,,,,,
,,,1.0,1594,0.6456611752510071,0.8528364838438867,0.6586661877158779,0.819669484356327,0.8199279895987595,0.6625529499788416,0.7735849056603774,0.0,346.9901,6.484,0.813,,,,,
0.7688,2.573607921600342,8.889585947302385e-05,2.0,3188,,,,,,,,,,,,,,,,
,,,2.0,3188,0.5727154016494751,0.8689474874470693,0.6851048712818919,0.8344968972913525,0.8348697620320389,0.6647169049402463,0.7693568726355614,0.0,353.1245,6.372,0.799,,,,,
0.6591,2.8348424434661865,7.778474836191274e-05,3.0,4782,,,,,,,,,,,,,,,,
,,,3.0,4782,0.540533185005188,0.8750090385391008,0.6962724429732516,0.8413137437626381,0.8416859973545814,0.6684329676796582,0.7692307692307693,0.0,348.9787,6.447,0.808,,,,,
0.5957,3.485762357711792,6.667363725080162e-05,4.0,6376,,,,,,,,,,,,,,,,
,,,4.0,6376,0.5332812666893005,0.8771052673801956,0.7001549309721768,0.8437587332299845,0.8440177737862178,0.6599911370905979,0.7659574468085106,0.0,350.5534,6.418,0.804,,,,,
0.548,3.5571165084838867,5.5562526139690505e-05,5.0,7970,,,,,,,,,,,,,,,,
,,,5.0,7970,0.5211982727050781,0.8791677438074604,0.705867129952528,0.8467215753256596,0.8470289702216209,0.6616752445040748,0.7647977941176471,0.00044444444444444447,351.9587,6.393,0.801,,,,,
0.5139,2.7198104858398438,4.4451415028579393e-05,6.0,9564,,,,,,,,,,,,,,,,
,,,6.0,9564,0.519557535648346,0.8798753890192361,0.7063785492018196,0.8472026138402767,0.8473323428755936,0.659716430748814,0.7636363636363637,0.0,350.8448,6.413,0.804,,,,,
0.4862,3.862455129623413,3.334030391746828e-05,7.0,11158,,,,,,,,,,,,,,,,
,,,7.0,11158,0.5143899917602539,0.8804832259801447,0.7076066408588376,0.8472581234680618,0.8474001918954426,0.6656473506268799,0.7704918032786885,0.00044444444444444447,352.5406,6.382,0.8,,,,,
0.466,3.4800119400024414,2.2229192806357174e-05,8.0,12752,,,,,,,,,,,,,,,,
,,,8.0,12752,0.5157203674316406,0.8819074337590058,0.709796994728016,0.848893205872066,0.8492418483342343,0.6622329738091887,0.7674418604651163,0.0,350.3672,6.422,0.805,,,,,
0.4499,2.951266288757324,1.1118081695246062e-05,9.0,14346,,,,,,,,,,,,,,,,
,,,9.0,14346,0.5155828595161438,0.8816110197232148,0.7095513359852312,0.8486239346338051,0.8488813378849979,0.6603841749226899,0.7659574468085106,0.0,351.7325,6.397,0.802,,,,,
0.4393,2.2352824211120605,6.97058413495051e-09,10.0,15940,,,,,,,,,,,,,,,,
,,,10.0,15940,0.5180955529212952,0.88198348953885,0.7104253099452262,0.848536449353483,0.8488333749106418,0.6611201077120823,0.7674418604651163,0.0,352.9325,6.375,0.799,,,,,
,,,10.0,15940,,,,,,,,,,,,7097.2826,17.965,2.246,2976335712768000.0,0.6184487030527074