WebWatcher-7B / trainer_log.jsonl
oriuta's picture
Upload folder using huggingface_hub
ec5b221 verified
{"current_steps": 10, "total_steps": 576, "loss": 1.1038, "lr": 7.758620689655173e-07, "epoch": 0.05194805194805195, "percentage": 1.74, "elapsed_time": "0:04:03", "remaining_time": "3:49:51"}
{"current_steps": 20, "total_steps": 576, "loss": 0.992, "lr": 1.6379310344827587e-06, "epoch": 0.1038961038961039, "percentage": 3.47, "elapsed_time": "0:07:56", "remaining_time": "3:40:48"}
{"current_steps": 30, "total_steps": 576, "loss": 0.84, "lr": 2.5e-06, "epoch": 0.15584415584415584, "percentage": 5.21, "elapsed_time": "0:11:49", "remaining_time": "3:35:08"}
{"current_steps": 40, "total_steps": 576, "loss": 0.7842, "lr": 3.362068965517242e-06, "epoch": 0.2077922077922078, "percentage": 6.94, "elapsed_time": "0:16:00", "remaining_time": "3:34:29"}
{"current_steps": 50, "total_steps": 576, "loss": 0.7462, "lr": 4.224137931034483e-06, "epoch": 0.2597402597402597, "percentage": 8.68, "elapsed_time": "0:20:01", "remaining_time": "3:30:35"}
{"current_steps": 60, "total_steps": 576, "loss": 0.7281, "lr": 4.999954022123679e-06, "epoch": 0.3116883116883117, "percentage": 10.42, "elapsed_time": "0:24:04", "remaining_time": "3:27:06"}
{"current_steps": 70, "total_steps": 576, "loss": 0.7182, "lr": 4.994438722989841e-06, "epoch": 0.36363636363636365, "percentage": 12.15, "elapsed_time": "0:27:55", "remaining_time": "3:21:52"}
{"current_steps": 80, "total_steps": 576, "loss": 0.71, "lr": 4.979751088147192e-06, "epoch": 0.4155844155844156, "percentage": 13.89, "elapsed_time": "0:32:02", "remaining_time": "3:18:41"}
{"current_steps": 90, "total_steps": 576, "loss": 0.7064, "lr": 4.955945125704375e-06, "epoch": 0.4675324675324675, "percentage": 15.62, "elapsed_time": "0:36:05", "remaining_time": "3:14:52"}
{"current_steps": 100, "total_steps": 576, "loss": 0.677, "lr": 4.923108372900683e-06, "epoch": 0.5194805194805194, "percentage": 17.36, "elapsed_time": "0:40:08", "remaining_time": "3:11:03"}
{"current_steps": 110, "total_steps": 576, "loss": 0.6915, "lr": 4.881361574221648e-06, "epoch": 0.5714285714285714, "percentage": 19.1, "elapsed_time": "0:44:14", "remaining_time": "3:07:23"}
{"current_steps": 120, "total_steps": 576, "loss": 0.6861, "lr": 4.830858237407799e-06, "epoch": 0.6233766233766234, "percentage": 20.83, "elapsed_time": "0:48:29", "remaining_time": "3:04:15"}
{"current_steps": 130, "total_steps": 576, "loss": 0.6975, "lr": 4.771784068989186e-06, "epoch": 0.6753246753246753, "percentage": 22.57, "elapsed_time": "0:52:54", "remaining_time": "3:01:31"}
{"current_steps": 140, "total_steps": 576, "loss": 0.6799, "lr": 4.7043562914212915e-06, "epoch": 0.7272727272727273, "percentage": 24.31, "elapsed_time": "0:57:02", "remaining_time": "2:57:38"}
{"current_steps": 150, "total_steps": 576, "loss": 0.6913, "lr": 4.6288228443332786e-06, "epoch": 0.7792207792207793, "percentage": 26.04, "elapsed_time": "1:01:10", "remaining_time": "2:53:44"}
{"current_steps": 160, "total_steps": 576, "loss": 0.6805, "lr": 4.5454614728256995e-06, "epoch": 0.8311688311688312, "percentage": 27.78, "elapsed_time": "1:05:20", "remaining_time": "2:49:53"}
{"current_steps": 170, "total_steps": 576, "loss": 0.6643, "lr": 4.454578706170075e-06, "epoch": 0.8831168831168831, "percentage": 29.51, "elapsed_time": "1:09:35", "remaining_time": "2:46:11"}
{"current_steps": 180, "total_steps": 576, "loss": 0.658, "lr": 4.356508730665804e-06, "epoch": 0.935064935064935, "percentage": 31.25, "elapsed_time": "1:13:38", "remaining_time": "2:42:00"}
{"current_steps": 190, "total_steps": 576, "loss": 0.6886, "lr": 4.251612160799017e-06, "epoch": 0.987012987012987, "percentage": 32.99, "elapsed_time": "1:18:03", "remaining_time": "2:38:34"}
{"current_steps": 200, "total_steps": 576, "loss": 0.6175, "lr": 4.140274713221985e-06, "epoch": 1.0415584415584416, "percentage": 34.72, "elapsed_time": "1:38:15", "remaining_time": "3:04:43"}
{"current_steps": 210, "total_steps": 576, "loss": 0.5921, "lr": 4.022905788428984e-06, "epoch": 1.0935064935064935, "percentage": 36.46, "elapsed_time": "1:42:31", "remaining_time": "2:58:41"}
{"current_steps": 220, "total_steps": 576, "loss": 0.6058, "lr": 3.899936965343989e-06, "epoch": 1.1454545454545455, "percentage": 38.19, "elapsed_time": "1:46:33", "remaining_time": "2:52:26"}
{"current_steps": 230, "total_steps": 576, "loss": 0.6233, "lr": 3.7718204143557337e-06, "epoch": 1.1974025974025975, "percentage": 39.93, "elapsed_time": "1:50:40", "remaining_time": "2:46:29"}
{"current_steps": 240, "total_steps": 576, "loss": 0.6183, "lr": 3.6390272346356225e-06, "epoch": 1.2493506493506494, "percentage": 41.67, "elapsed_time": "1:54:35", "remaining_time": "2:40:26"}
{"current_steps": 250, "total_steps": 576, "loss": 0.5841, "lr": 3.5020457218523407e-06, "epoch": 1.3012987012987014, "percentage": 43.4, "elapsed_time": "1:58:44", "remaining_time": "2:34:50"}
{"current_steps": 260, "total_steps": 576, "loss": 0.6015, "lr": 3.3613795726529795e-06, "epoch": 1.3532467532467534, "percentage": 45.14, "elapsed_time": "2:02:55", "remaining_time": "2:29:23"}
{"current_steps": 270, "total_steps": 576, "loss": 0.5974, "lr": 3.2175460325130176e-06, "epoch": 1.4051948051948053, "percentage": 46.88, "elapsed_time": "2:06:51", "remaining_time": "2:23:46"}
{"current_steps": 280, "total_steps": 576, "loss": 0.586, "lr": 3.0710739937657035e-06, "epoch": 1.457142857142857, "percentage": 48.61, "elapsed_time": "2:11:22", "remaining_time": "2:18:52"}
{"current_steps": 290, "total_steps": 576, "loss": 0.6151, "lr": 2.9225020508046233e-06, "epoch": 1.509090909090909, "percentage": 50.35, "elapsed_time": "2:15:21", "remaining_time": "2:13:29"}
{"current_steps": 300, "total_steps": 576, "loss": 0.5882, "lr": 2.7723765196106773e-06, "epoch": 1.561038961038961, "percentage": 52.08, "elapsed_time": "2:19:23", "remaining_time": "2:08:14"}
{"current_steps": 310, "total_steps": 576, "loss": 0.6164, "lr": 2.621249428885908e-06, "epoch": 1.612987012987013, "percentage": 53.82, "elapsed_time": "2:23:39", "remaining_time": "2:03:16"}
{"current_steps": 320, "total_steps": 576, "loss": 0.5999, "lr": 2.4696764901809926e-06, "epoch": 1.664935064935065, "percentage": 55.56, "elapsed_time": "2:27:45", "remaining_time": "1:58:12"}
{"current_steps": 330, "total_steps": 576, "loss": 0.588, "lr": 2.3182150544804878e-06, "epoch": 1.716883116883117, "percentage": 57.29, "elapsed_time": "2:31:43", "remaining_time": "1:53:06"}
{"current_steps": 340, "total_steps": 576, "loss": 0.5786, "lr": 2.1674220627596814e-06, "epoch": 1.7688311688311689, "percentage": 59.03, "elapsed_time": "2:35:52", "remaining_time": "1:48:11"}
{"current_steps": 350, "total_steps": 576, "loss": 0.5822, "lr": 2.017851998049107e-06, "epoch": 1.8207792207792208, "percentage": 60.76, "elapsed_time": "2:39:56", "remaining_time": "1:43:16"}
{"current_steps": 360, "total_steps": 576, "loss": 0.5837, "lr": 1.8700548465371877e-06, "epoch": 1.8727272727272726, "percentage": 62.5, "elapsed_time": "2:44:00", "remaining_time": "1:38:24"}
{"current_steps": 370, "total_steps": 576, "loss": 0.5871, "lr": 1.7245740752082901e-06, "epoch": 1.9246753246753245, "percentage": 64.24, "elapsed_time": "2:48:07", "remaining_time": "1:33:36"}
{"current_steps": 380, "total_steps": 576, "loss": 0.5838, "lr": 1.5819446334526363e-06, "epoch": 1.9766233766233765, "percentage": 65.97, "elapsed_time": "2:52:28", "remaining_time": "1:28:57"}
{"current_steps": 390, "total_steps": 576, "loss": 0.5697, "lr": 1.4426909859963716e-06, "epoch": 2.031168831168831, "percentage": 67.71, "elapsed_time": "3:00:56", "remaining_time": "1:26:17"}
{"current_steps": 400, "total_steps": 576, "loss": 0.5431, "lr": 1.3073251843849503e-06, "epoch": 2.083116883116883, "percentage": 69.44, "elapsed_time": "3:05:06", "remaining_time": "1:21:26"}
{"current_steps": 410, "total_steps": 576, "loss": 0.5016, "lr": 1.1763449841111906e-06, "epoch": 2.135064935064935, "percentage": 71.18, "elapsed_time": "3:09:14", "remaining_time": "1:16:37"}
{"current_steps": 420, "total_steps": 576, "loss": 0.5098, "lr": 1.05023201431156e-06, "epoch": 2.187012987012987, "percentage": 72.92, "elapsed_time": "3:13:31", "remaining_time": "1:11:52"}
{"current_steps": 430, "total_steps": 576, "loss": 0.5287, "lr": 9.294500067608941e-07, "epoch": 2.238961038961039, "percentage": 74.65, "elapsed_time": "3:17:39", "remaining_time": "1:07:06"}
{"current_steps": 440, "total_steps": 576, "loss": 0.516, "lr": 8.144430906777756e-07, "epoch": 2.290909090909091, "percentage": 76.39, "elapsed_time": "3:21:34", "remaining_time": "1:02:18"}
{"current_steps": 450, "total_steps": 576, "loss": 0.5143, "lr": 7.056341596107299e-07, "epoch": 2.342857142857143, "percentage": 78.12, "elapsed_time": "3:25:33", "remaining_time": "0:57:33"}
{"current_steps": 460, "total_steps": 576, "loss": 0.5239, "lr": 6.034233164104184e-07, "epoch": 2.394805194805195, "percentage": 79.86, "elapsed_time": "3:29:36", "remaining_time": "0:52:51"}
{"current_steps": 470, "total_steps": 576, "loss": 0.5196, "lr": 5.081864020058125e-07, "epoch": 2.446753246753247, "percentage": 81.6, "elapsed_time": "3:33:43", "remaining_time": "0:48:12"}
{"current_steps": 480, "total_steps": 576, "loss": 0.5272, "lr": 4.20273613394232e-07, "epoch": 2.498701298701299, "percentage": 83.33, "elapsed_time": "3:38:03", "remaining_time": "0:43:36"}
{"current_steps": 490, "total_steps": 576, "loss": 0.5169, "lr": 3.400082159270418e-07, "epoch": 2.5506493506493504, "percentage": 85.07, "elapsed_time": "3:42:18", "remaining_time": "0:39:01"}
{"current_steps": 500, "total_steps": 576, "loss": 0.5253, "lr": 2.676853546260791e-07, "epoch": 2.602597402597403, "percentage": 86.81, "elapsed_time": "3:46:22", "remaining_time": "0:34:24"}
{"current_steps": 510, "total_steps": 576, "loss": 0.5277, "lr": 2.0357096890174482e-07, "epoch": 2.6545454545454543, "percentage": 88.54, "elapsed_time": "3:50:42", "remaining_time": "0:29:51"}
{"current_steps": 520, "total_steps": 576, "loss": 0.5381, "lr": 1.4790081466345863e-07, "epoch": 2.7064935064935067, "percentage": 90.28, "elapsed_time": "3:54:42", "remaining_time": "0:25:16"}
{"current_steps": 530, "total_steps": 576, "loss": 0.5028, "lr": 1.0087959741828607e-07, "epoch": 2.7584415584415583, "percentage": 92.01, "elapsed_time": "3:58:42", "remaining_time": "0:20:43"}
{"current_steps": 540, "total_steps": 576, "loss": 0.525, "lr": 6.268021954544095e-08, "epoch": 2.8103896103896107, "percentage": 93.75, "elapsed_time": "4:02:59", "remaining_time": "0:16:11"}
{"current_steps": 550, "total_steps": 576, "loss": 0.5231, "lr": 3.3443144514516965e-08, "epoch": 2.862337662337662, "percentage": 95.49, "elapsed_time": "4:06:57", "remaining_time": "0:11:40"}
{"current_steps": 560, "total_steps": 576, "loss": 0.5317, "lr": 1.3275880385284767e-08, "epoch": 2.914285714285714, "percentage": 97.22, "elapsed_time": "4:11:10", "remaining_time": "0:07:10"}
{"current_steps": 570, "total_steps": 576, "loss": 0.5093, "lr": 2.252584488296461e-09, "epoch": 2.966233766233766, "percentage": 98.96, "elapsed_time": "4:15:11", "remaining_time": "0:02:41"}
{"current_steps": 576, "total_steps": 576, "epoch": 2.9974025974025973, "percentage": 100.0, "elapsed_time": "4:21:34", "remaining_time": "0:00:00"}