| { | |
| "global_steps": 27050, | |
| "loss": { | |
| "train": [ | |
| { | |
| "step": 50, | |
| "logs": { | |
| "loss": 1.2091, | |
| "epoch": 0.018484288354898338, | |
| "learning_rate": 1.0584432680980562e-05 | |
| } | |
| }, | |
| { | |
| "step": 100, | |
| "logs": { | |
| "loss": 1.1315, | |
| "epoch": 0.036968576709796676, | |
| "learning_rate": 1.2459822860720352e-05 | |
| } | |
| }, | |
| { | |
| "step": 150, | |
| "logs": { | |
| "loss": 1.1118, | |
| "epoch": 0.05545286506469501, | |
| "learning_rate": 1.355685579689696e-05 | |
| } | |
| }, | |
| { | |
| "step": 200, | |
| "logs": { | |
| "loss": 1.1091, | |
| "epoch": 0.07393715341959335, | |
| "learning_rate": 1.4335213053988223e-05 | |
| } | |
| }, | |
| { | |
| "step": 250, | |
| "logs": { | |
| "loss": 1.1063, | |
| "epoch": 0.09242144177449169, | |
| "learning_rate": 1.4938953847726847e-05 | |
| } | |
| }, | |
| { | |
| "step": 300, | |
| "logs": { | |
| "loss": 1.1012, | |
| "epoch": 0.11090573012939002, | |
| "learning_rate": 1.5432245994674192e-05 | |
| } | |
| }, | |
| { | |
| "step": 350, | |
| "logs": { | |
| "loss": 1.0844, | |
| "epoch": 0.12939001848428835, | |
| "learning_rate": 1.5849318562425815e-05 | |
| } | |
| }, | |
| { | |
| "step": 400, | |
| "logs": { | |
| "loss": 1.0911, | |
| "epoch": 0.1478743068391867, | |
| "learning_rate": 1.6210603254020138e-05 | |
| } | |
| }, | |
| { | |
| "step": 450, | |
| "logs": { | |
| "loss": 1.0816, | |
| "epoch": 0.16635859519408502, | |
| "learning_rate": 1.652927893686328e-05 | |
| } | |
| }, | |
| { | |
| "step": 500, | |
| "logs": { | |
| "loss": 1.0819, | |
| "epoch": 0.18484288354898337, | |
| "learning_rate": 1.6814344049111566e-05 | |
| } | |
| }, | |
| { | |
| "step": 550, | |
| "logs": { | |
| "loss": 1.0757, | |
| "epoch": 0.2033271719038817, | |
| "learning_rate": 1.70722168104602e-05 | |
| } | |
| }, | |
| { | |
| "step": 600, | |
| "logs": { | |
| "loss": 1.0706, | |
| "epoch": 0.22181146025878004, | |
| "learning_rate": 1.7307636196960783e-05 | |
| } | |
| }, | |
| { | |
| "step": 650, | |
| "logs": { | |
| "loss": 1.0698, | |
| "epoch": 0.24029574861367836, | |
| "learning_rate": 1.7524201039271304e-05 | |
| } | |
| }, | |
| { | |
| "step": 700, | |
| "logs": { | |
| "loss": 1.0632, | |
| "epoch": 0.2587800369685767, | |
| "learning_rate": 1.7724708765356604e-05 | |
| } | |
| }, | |
| { | |
| "step": 750, | |
| "logs": { | |
| "loss": 1.0601, | |
| "epoch": 0.27726432532347506, | |
| "learning_rate": 1.7911376992503148e-05 | |
| } | |
| }, | |
| { | |
| "step": 800, | |
| "logs": { | |
| "loss": 1.0582, | |
| "epoch": 0.2957486136783734, | |
| "learning_rate": 1.808599345743407e-05 | |
| } | |
| }, | |
| { | |
| "step": 850, | |
| "logs": { | |
| "loss": 1.0512, | |
| "epoch": 0.3142329020332717, | |
| "learning_rate": 1.825002041317456e-05 | |
| } | |
| }, | |
| { | |
| "step": 900, | |
| "logs": { | |
| "loss": 1.0544, | |
| "epoch": 0.33271719038817005, | |
| "learning_rate": 1.840466914065299e-05 | |
| } | |
| }, | |
| { | |
| "step": 950, | |
| "logs": { | |
| "loss": 1.043, | |
| "epoch": 0.3512014787430684, | |
| "learning_rate": 1.855095428760744e-05 | |
| } | |
| }, | |
| { | |
| "step": 1000, | |
| "logs": { | |
| "loss": 1.047, | |
| "epoch": 0.36968576709796674, | |
| "learning_rate": 1.8689734253201903e-05 | |
| } | |
| }, | |
| { | |
| "step": 1050, | |
| "logs": { | |
| "loss": 1.0408, | |
| "epoch": 0.38817005545286504, | |
| "learning_rate": 1.8821741709263542e-05 | |
| } | |
| }, | |
| { | |
| "step": 1100, | |
| "logs": { | |
| "loss": 1.0431, | |
| "epoch": 0.4066543438077634, | |
| "learning_rate": 1.89476070147965e-05 | |
| } | |
| }, | |
| { | |
| "step": 1150, | |
| "logs": { | |
| "loss": 1.0431, | |
| "epoch": 0.42513863216266173, | |
| "learning_rate": 1.9067876421445012e-05 | |
| } | |
| }, | |
| { | |
| "step": 1200, | |
| "logs": { | |
| "loss": 1.034, | |
| "epoch": 0.4436229205175601, | |
| "learning_rate": 1.9183026401502057e-05 | |
| } | |
| }, | |
| { | |
| "step": 1250, | |
| "logs": { | |
| "loss": 1.039, | |
| "epoch": 0.46210720887245843, | |
| "learning_rate": 1.9293475049105016e-05 | |
| } | |
| }, | |
| { | |
| "step": 1300, | |
| "logs": { | |
| "loss": 1.0304, | |
| "epoch": 0.4805914972273567, | |
| "learning_rate": 1.9399591243986016e-05 | |
| } | |
| }, | |
| { | |
| "step": 1350, | |
| "logs": { | |
| "loss": 1.0385, | |
| "epoch": 0.49907578558225507, | |
| "learning_rate": 1.950170208484624e-05 | |
| } | |
| }, | |
| { | |
| "step": 1400, | |
| "logs": { | |
| "loss": 1.027, | |
| "epoch": 0.5175600739371534, | |
| "learning_rate": 1.9600098970219974e-05 | |
| } | |
| }, | |
| { | |
| "step": 1450, | |
| "logs": { | |
| "loss": 1.0281, | |
| "epoch": 0.5360443622920518, | |
| "learning_rate": 1.9695042611797287e-05 | |
| } | |
| }, | |
| { | |
| "step": 1500, | |
| "logs": { | |
| "loss": 1.0282, | |
| "epoch": 0.5545286506469501, | |
| "learning_rate": 1.978676719749536e-05 | |
| } | |
| }, | |
| { | |
| "step": 1550, | |
| "logs": { | |
| "loss": 1.0186, | |
| "epoch": 0.5730129390018485, | |
| "learning_rate": 1.9875483871657987e-05 | |
| } | |
| }, | |
| { | |
| "step": 1600, | |
| "logs": { | |
| "loss": 1.0237, | |
| "epoch": 0.5914972273567468, | |
| "learning_rate": 1.9961383662539012e-05 | |
| } | |
| }, | |
| { | |
| "step": 1650, | |
| "logs": { | |
| "loss": 1.0176, | |
| "epoch": 0.609981515711645, | |
| "learning_rate": 1.9978762732528416e-05 | |
| } | |
| }, | |
| { | |
| "step": 1700, | |
| "logs": { | |
| "loss": 1.4539, | |
| "epoch": 0.6284658040665434, | |
| "learning_rate": 1.9939434459432887e-05 | |
| } | |
| }, | |
| { | |
| "step": 1750, | |
| "logs": { | |
| "loss": 1.2593, | |
| "epoch": 0.6469500924214417, | |
| "learning_rate": 1.990010618633736e-05 | |
| } | |
| }, | |
| { | |
| "step": 1800, | |
| "logs": { | |
| "loss": 1.5937, | |
| "epoch": 0.6654343807763401, | |
| "learning_rate": 1.986077791324183e-05 | |
| } | |
| }, | |
| { | |
| "step": 1850, | |
| "logs": { | |
| "loss": 1.0165, | |
| "epoch": 0.6839186691312384, | |
| "learning_rate": 1.9821449640146302e-05 | |
| } | |
| }, | |
| { | |
| "step": 1900, | |
| "logs": { | |
| "loss": 1.4354, | |
| "epoch": 0.7024029574861368, | |
| "learning_rate": 1.9782121367050776e-05 | |
| } | |
| }, | |
| { | |
| "step": 1950, | |
| "logs": { | |
| "loss": 1.021, | |
| "epoch": 0.7208872458410351, | |
| "learning_rate": 1.9742793093955247e-05 | |
| } | |
| }, | |
| { | |
| "step": 2000, | |
| "logs": { | |
| "loss": 1.0078, | |
| "epoch": 0.7393715341959335, | |
| "learning_rate": 1.9703464820859717e-05 | |
| } | |
| }, | |
| { | |
| "step": 2050, | |
| "logs": { | |
| "loss": 1.0057, | |
| "epoch": 0.7578558225508318, | |
| "learning_rate": 1.966413654776419e-05 | |
| } | |
| }, | |
| { | |
| "step": 2100, | |
| "logs": { | |
| "loss": 1.0001, | |
| "epoch": 0.7763401109057301, | |
| "learning_rate": 1.9624808274668662e-05 | |
| } | |
| }, | |
| { | |
| "step": 2150, | |
| "logs": { | |
| "loss": 1.006, | |
| "epoch": 0.7948243992606284, | |
| "learning_rate": 1.9585480001573133e-05 | |
| } | |
| }, | |
| { | |
| "step": 2200, | |
| "logs": { | |
| "loss": 1.0103, | |
| "epoch": 0.8133086876155268, | |
| "learning_rate": 1.9546151728477603e-05 | |
| } | |
| }, | |
| { | |
| "step": 2250, | |
| "logs": { | |
| "loss": 1.0046, | |
| "epoch": 0.8317929759704251, | |
| "learning_rate": 1.9506823455382077e-05 | |
| } | |
| }, | |
| { | |
| "step": 2300, | |
| "logs": { | |
| "loss": 0.9941, | |
| "epoch": 0.8502772643253235, | |
| "learning_rate": 1.9467495182286548e-05 | |
| } | |
| }, | |
| { | |
| "step": 2350, | |
| "logs": { | |
| "loss": 0.9963, | |
| "epoch": 0.8687615526802218, | |
| "learning_rate": 1.942816690919102e-05 | |
| } | |
| }, | |
| { | |
| "step": 2400, | |
| "logs": { | |
| "loss": 0.9926, | |
| "epoch": 0.8872458410351202, | |
| "learning_rate": 1.938883863609549e-05 | |
| } | |
| }, | |
| { | |
| "step": 2450, | |
| "logs": { | |
| "loss": 0.9918, | |
| "epoch": 0.9057301293900185, | |
| "learning_rate": 1.934951036299996e-05 | |
| } | |
| }, | |
| { | |
| "step": 2500, | |
| "logs": { | |
| "loss": 0.9899, | |
| "epoch": 0.9242144177449169, | |
| "learning_rate": 1.9310182089904434e-05 | |
| } | |
| }, | |
| { | |
| "step": 2550, | |
| "logs": { | |
| "loss": 0.9887, | |
| "epoch": 0.9426987060998152, | |
| "learning_rate": 1.9270853816808904e-05 | |
| } | |
| }, | |
| { | |
| "step": 2600, | |
| "logs": { | |
| "loss": 0.9942, | |
| "epoch": 0.9611829944547134, | |
| "learning_rate": 1.9231525543713375e-05 | |
| } | |
| }, | |
| { | |
| "step": 2650, | |
| "logs": { | |
| "loss": 0.9817, | |
| "epoch": 0.9796672828096118, | |
| "learning_rate": 1.919219727061785e-05 | |
| } | |
| }, | |
| { | |
| "step": 2700, | |
| "logs": { | |
| "loss": 0.9811, | |
| "epoch": 0.9981515711645101, | |
| "learning_rate": 1.915286899752232e-05 | |
| } | |
| }, | |
| { | |
| "step": 2750, | |
| "logs": { | |
| "loss": 0.8466, | |
| "epoch": 1.0166358595194085, | |
| "learning_rate": 1.911354072442679e-05 | |
| } | |
| }, | |
| { | |
| "step": 2800, | |
| "logs": { | |
| "loss": 0.8316, | |
| "epoch": 1.0351201478743068, | |
| "learning_rate": 1.9074212451331264e-05 | |
| } | |
| }, | |
| { | |
| "step": 2850, | |
| "logs": { | |
| "loss": 0.8363, | |
| "epoch": 1.0536044362292052, | |
| "learning_rate": 1.9034884178235735e-05 | |
| } | |
| }, | |
| { | |
| "step": 2900, | |
| "logs": { | |
| "loss": 0.8378, | |
| "epoch": 1.0720887245841035, | |
| "learning_rate": 1.8995555905140205e-05 | |
| } | |
| }, | |
| { | |
| "step": 2950, | |
| "logs": { | |
| "loss": 0.8386, | |
| "epoch": 1.0905730129390019, | |
| "learning_rate": 1.895622763204468e-05 | |
| } | |
| }, | |
| { | |
| "step": 3000, | |
| "logs": { | |
| "loss": 0.8465, | |
| "epoch": 1.1090573012939002, | |
| "learning_rate": 1.891689935894915e-05 | |
| } | |
| }, | |
| { | |
| "step": 3050, | |
| "logs": { | |
| "loss": 0.8375, | |
| "epoch": 1.1275415896487986, | |
| "learning_rate": 1.887757108585362e-05 | |
| } | |
| }, | |
| { | |
| "step": 3100, | |
| "logs": { | |
| "loss": 0.8379, | |
| "epoch": 1.146025878003697, | |
| "learning_rate": 1.8838242812758095e-05 | |
| } | |
| }, | |
| { | |
| "step": 3150, | |
| "logs": { | |
| "loss": 0.836, | |
| "epoch": 1.1645101663585953, | |
| "learning_rate": 1.8798914539662565e-05 | |
| } | |
| }, | |
| { | |
| "step": 3200, | |
| "logs": { | |
| "loss": 0.8411, | |
| "epoch": 1.1829944547134936, | |
| "learning_rate": 1.8759586266567036e-05 | |
| } | |
| }, | |
| { | |
| "step": 3250, | |
| "logs": { | |
| "loss": 0.8442, | |
| "epoch": 1.201478743068392, | |
| "learning_rate": 1.872025799347151e-05 | |
| } | |
| }, | |
| { | |
| "step": 3300, | |
| "logs": { | |
| "loss": 0.8397, | |
| "epoch": 1.21996303142329, | |
| "learning_rate": 1.868092972037598e-05 | |
| } | |
| }, | |
| { | |
| "step": 3350, | |
| "logs": { | |
| "loss": 0.8415, | |
| "epoch": 1.2384473197781884, | |
| "learning_rate": 1.864160144728045e-05 | |
| } | |
| }, | |
| { | |
| "step": 3400, | |
| "logs": { | |
| "loss": 0.8397, | |
| "epoch": 1.2569316081330868, | |
| "learning_rate": 1.8602273174184925e-05 | |
| } | |
| }, | |
| { | |
| "step": 3450, | |
| "logs": { | |
| "loss": 0.8396, | |
| "epoch": 1.2754158964879851, | |
| "learning_rate": 1.8562944901089396e-05 | |
| } | |
| }, | |
| { | |
| "step": 3500, | |
| "logs": { | |
| "loss": 0.8452, | |
| "epoch": 1.2939001848428835, | |
| "learning_rate": 1.8523616627993866e-05 | |
| } | |
| }, | |
| { | |
| "step": 3550, | |
| "logs": { | |
| "loss": 0.8362, | |
| "epoch": 1.3123844731977818, | |
| "learning_rate": 1.848428835489834e-05 | |
| } | |
| }, | |
| { | |
| "step": 3600, | |
| "logs": { | |
| "loss": 0.8396, | |
| "epoch": 1.3308687615526802, | |
| "learning_rate": 1.844496008180281e-05 | |
| } | |
| }, | |
| { | |
| "step": 3650, | |
| "logs": { | |
| "loss": 0.8334, | |
| "epoch": 1.3493530499075785, | |
| "learning_rate": 1.840563180870728e-05 | |
| } | |
| }, | |
| { | |
| "step": 3700, | |
| "logs": { | |
| "loss": 0.834, | |
| "epoch": 1.3678373382624769, | |
| "learning_rate": 1.8366303535611752e-05 | |
| } | |
| }, | |
| { | |
| "step": 3750, | |
| "logs": { | |
| "loss": 0.8333, | |
| "epoch": 1.3863216266173752, | |
| "learning_rate": 1.8326975262516223e-05 | |
| } | |
| }, | |
| { | |
| "step": 3800, | |
| "logs": { | |
| "loss": 0.8357, | |
| "epoch": 1.4048059149722736, | |
| "learning_rate": 1.8287646989420697e-05 | |
| } | |
| }, | |
| { | |
| "step": 3850, | |
| "logs": { | |
| "loss": 0.8374, | |
| "epoch": 1.423290203327172, | |
| "learning_rate": 1.8248318716325167e-05 | |
| } | |
| }, | |
| { | |
| "step": 3900, | |
| "logs": { | |
| "loss": 0.837, | |
| "epoch": 1.4417744916820703, | |
| "learning_rate": 1.8208990443229638e-05 | |
| } | |
| }, | |
| { | |
| "step": 3950, | |
| "logs": { | |
| "loss": 0.835, | |
| "epoch": 1.4602587800369686, | |
| "learning_rate": 1.816966217013411e-05 | |
| } | |
| }, | |
| { | |
| "step": 4000, | |
| "logs": { | |
| "loss": 0.8352, | |
| "epoch": 1.478743068391867, | |
| "learning_rate": 1.8130333897038583e-05 | |
| } | |
| }, | |
| { | |
| "step": 4050, | |
| "logs": { | |
| "loss": 0.8475, | |
| "epoch": 1.4972273567467653, | |
| "learning_rate": 1.8091005623943053e-05 | |
| } | |
| }, | |
| { | |
| "step": 4100, | |
| "logs": { | |
| "loss": 0.8339, | |
| "epoch": 1.5157116451016637, | |
| "learning_rate": 1.8051677350847524e-05 | |
| } | |
| }, | |
| { | |
| "step": 4150, | |
| "logs": { | |
| "loss": 0.8382, | |
| "epoch": 1.534195933456562, | |
| "learning_rate": 1.8012349077751998e-05 | |
| } | |
| }, | |
| { | |
| "step": 4200, | |
| "logs": { | |
| "loss": 0.8376, | |
| "epoch": 1.5526802218114601, | |
| "learning_rate": 1.797302080465647e-05 | |
| } | |
| }, | |
| { | |
| "step": 4250, | |
| "logs": { | |
| "loss": 0.8302, | |
| "epoch": 1.5711645101663585, | |
| "learning_rate": 1.793369253156094e-05 | |
| } | |
| }, | |
| { | |
| "step": 4300, | |
| "logs": { | |
| "loss": 0.8312, | |
| "epoch": 1.5896487985212568, | |
| "learning_rate": 1.7894364258465413e-05 | |
| } | |
| }, | |
| { | |
| "step": 4350, | |
| "logs": { | |
| "loss": 0.8361, | |
| "epoch": 1.6081330868761552, | |
| "learning_rate": 1.7855035985369884e-05 | |
| } | |
| }, | |
| { | |
| "step": 4400, | |
| "logs": { | |
| "loss": 0.8321, | |
| "epoch": 1.6266173752310535, | |
| "learning_rate": 1.7815707712274354e-05 | |
| } | |
| }, | |
| { | |
| "step": 4450, | |
| "logs": { | |
| "loss": 0.8374, | |
| "epoch": 1.645101663585952, | |
| "learning_rate": 1.777637943917883e-05 | |
| } | |
| }, | |
| { | |
| "step": 4500, | |
| "logs": { | |
| "loss": 0.8287, | |
| "epoch": 1.6635859519408502, | |
| "learning_rate": 1.77370511660833e-05 | |
| } | |
| }, | |
| { | |
| "step": 4550, | |
| "logs": { | |
| "loss": 0.8367, | |
| "epoch": 1.6820702402957486, | |
| "learning_rate": 1.769772289298777e-05 | |
| } | |
| }, | |
| { | |
| "step": 4600, | |
| "logs": { | |
| "loss": 0.8439, | |
| "epoch": 1.700554528650647, | |
| "learning_rate": 1.7658394619892244e-05 | |
| } | |
| }, | |
| { | |
| "step": 4650, | |
| "logs": { | |
| "loss": 0.829, | |
| "epoch": 1.7190388170055453, | |
| "learning_rate": 1.7619066346796714e-05 | |
| } | |
| }, | |
| { | |
| "step": 4700, | |
| "logs": { | |
| "loss": 0.8325, | |
| "epoch": 1.7375231053604436, | |
| "learning_rate": 1.7579738073701185e-05 | |
| } | |
| }, | |
| { | |
| "step": 4750, | |
| "logs": { | |
| "loss": 0.837, | |
| "epoch": 1.756007393715342, | |
| "learning_rate": 1.754040980060566e-05 | |
| } | |
| }, | |
| { | |
| "step": 4800, | |
| "logs": { | |
| "loss": 0.8371, | |
| "epoch": 1.7744916820702403, | |
| "learning_rate": 1.750108152751013e-05 | |
| } | |
| }, | |
| { | |
| "step": 4850, | |
| "logs": { | |
| "loss": 0.832, | |
| "epoch": 1.7929759704251387, | |
| "learning_rate": 1.74617532544146e-05 | |
| } | |
| }, | |
| { | |
| "step": 4900, | |
| "logs": { | |
| "loss": 0.8342, | |
| "epoch": 1.811460258780037, | |
| "learning_rate": 1.7422424981319074e-05 | |
| } | |
| }, | |
| { | |
| "step": 4950, | |
| "logs": { | |
| "loss": 0.8331, | |
| "epoch": 1.8299445471349354, | |
| "learning_rate": 1.7383096708223545e-05 | |
| } | |
| }, | |
| { | |
| "step": 5000, | |
| "logs": { | |
| "loss": 0.8234, | |
| "epoch": 1.8484288354898337, | |
| "learning_rate": 1.7343768435128015e-05 | |
| } | |
| }, | |
| { | |
| "step": 5050, | |
| "logs": { | |
| "loss": 0.8311, | |
| "epoch": 1.866913123844732, | |
| "learning_rate": 1.7304440162032486e-05 | |
| } | |
| }, | |
| { | |
| "step": 5100, | |
| "logs": { | |
| "loss": 0.8259, | |
| "epoch": 1.8853974121996304, | |
| "learning_rate": 1.726511188893696e-05 | |
| } | |
| }, | |
| { | |
| "step": 5150, | |
| "logs": { | |
| "loss": 0.8253, | |
| "epoch": 1.9038817005545285, | |
| "learning_rate": 1.722578361584143e-05 | |
| } | |
| }, | |
| { | |
| "step": 5200, | |
| "logs": { | |
| "loss": 0.8297, | |
| "epoch": 1.922365988909427, | |
| "learning_rate": 1.71864553427459e-05 | |
| } | |
| }, | |
| { | |
| "step": 5250, | |
| "logs": { | |
| "loss": 0.8264, | |
| "epoch": 1.9408502772643252, | |
| "learning_rate": 1.7147127069650372e-05 | |
| } | |
| }, | |
| { | |
| "step": 5300, | |
| "logs": { | |
| "loss": 0.8283, | |
| "epoch": 1.9593345656192236, | |
| "learning_rate": 1.7107798796554846e-05 | |
| } | |
| }, | |
| { | |
| "step": 5350, | |
| "logs": { | |
| "loss": 0.8262, | |
| "epoch": 1.977818853974122, | |
| "learning_rate": 1.7068470523459316e-05 | |
| } | |
| }, | |
| { | |
| "step": 5400, | |
| "logs": { | |
| "loss": 0.829, | |
| "epoch": 1.9963031423290203, | |
| "learning_rate": 1.7029142250363787e-05 | |
| } | |
| }, | |
| { | |
| "step": 5450, | |
| "logs": { | |
| "loss": 0.6969, | |
| "epoch": 2.014787430683919, | |
| "learning_rate": 1.6989813977268258e-05 | |
| } | |
| }, | |
| { | |
| "step": 5500, | |
| "logs": { | |
| "loss": 0.6715, | |
| "epoch": 2.033271719038817, | |
| "learning_rate": 1.695048570417273e-05 | |
| } | |
| }, | |
| { | |
| "step": 5550, | |
| "logs": { | |
| "loss": 0.6636, | |
| "epoch": 2.0517560073937156, | |
| "learning_rate": 1.6911157431077202e-05 | |
| } | |
| }, | |
| { | |
| "step": 5600, | |
| "logs": { | |
| "loss": 0.6649, | |
| "epoch": 2.0702402957486137, | |
| "learning_rate": 1.6871829157981673e-05 | |
| } | |
| }, | |
| { | |
| "step": 5650, | |
| "logs": { | |
| "loss": 0.665, | |
| "epoch": 2.088724584103512, | |
| "learning_rate": 1.6832500884886147e-05 | |
| } | |
| }, | |
| { | |
| "step": 5700, | |
| "logs": { | |
| "loss": 0.6746, | |
| "epoch": 2.1072088724584104, | |
| "learning_rate": 1.6793172611790617e-05 | |
| } | |
| }, | |
| { | |
| "step": 5750, | |
| "logs": { | |
| "loss": 0.6678, | |
| "epoch": 2.1256931608133085, | |
| "learning_rate": 1.6753844338695088e-05 | |
| } | |
| }, | |
| { | |
| "step": 5800, | |
| "logs": { | |
| "loss": 0.6739, | |
| "epoch": 2.144177449168207, | |
| "learning_rate": 1.6714516065599562e-05 | |
| } | |
| }, | |
| { | |
| "step": 5850, | |
| "logs": { | |
| "loss": 0.6666, | |
| "epoch": 2.162661737523105, | |
| "learning_rate": 1.6675187792504033e-05 | |
| } | |
| }, | |
| { | |
| "step": 5900, | |
| "logs": { | |
| "loss": 0.674, | |
| "epoch": 2.1811460258780038, | |
| "learning_rate": 1.6635859519408503e-05 | |
| } | |
| }, | |
| { | |
| "step": 5950, | |
| "logs": { | |
| "loss": 0.6737, | |
| "epoch": 2.199630314232902, | |
| "learning_rate": 1.6596531246312977e-05 | |
| } | |
| }, | |
| { | |
| "step": 6000, | |
| "logs": { | |
| "loss": 0.675, | |
| "epoch": 2.2181146025878005, | |
| "learning_rate": 1.6557202973217448e-05 | |
| } | |
| }, | |
| { | |
| "step": 6050, | |
| "logs": { | |
| "loss": 0.6743, | |
| "epoch": 2.2365988909426986, | |
| "learning_rate": 1.651787470012192e-05 | |
| } | |
| }, | |
| { | |
| "step": 6100, | |
| "logs": { | |
| "loss": 0.6718, | |
| "epoch": 2.255083179297597, | |
| "learning_rate": 1.647854642702639e-05 | |
| } | |
| }, | |
| { | |
| "step": 6150, | |
| "logs": { | |
| "loss": 0.6735, | |
| "epoch": 2.2735674676524953, | |
| "learning_rate": 1.6439218153930863e-05 | |
| } | |
| }, | |
| { | |
| "step": 6200, | |
| "logs": { | |
| "loss": 0.6798, | |
| "epoch": 2.292051756007394, | |
| "learning_rate": 1.6399889880835334e-05 | |
| } | |
| }, | |
| { | |
| "step": 6250, | |
| "logs": { | |
| "loss": 0.6768, | |
| "epoch": 2.310536044362292, | |
| "learning_rate": 1.6360561607739804e-05 | |
| } | |
| }, | |
| { | |
| "step": 6300, | |
| "logs": { | |
| "loss": 0.6796, | |
| "epoch": 2.3290203327171906, | |
| "learning_rate": 1.632123333464428e-05 | |
| } | |
| }, | |
| { | |
| "step": 6350, | |
| "logs": { | |
| "loss": 0.6813, | |
| "epoch": 2.3475046210720887, | |
| "learning_rate": 1.628190506154875e-05 | |
| } | |
| }, | |
| { | |
| "step": 6400, | |
| "logs": { | |
| "loss": 0.6774, | |
| "epoch": 2.3659889094269873, | |
| "learning_rate": 1.624257678845322e-05 | |
| } | |
| }, | |
| { | |
| "step": 6450, | |
| "logs": { | |
| "loss": 0.6745, | |
| "epoch": 2.3844731977818854, | |
| "learning_rate": 1.6203248515357694e-05 | |
| } | |
| }, | |
| { | |
| "step": 6500, | |
| "logs": { | |
| "loss": 0.6809, | |
| "epoch": 2.402957486136784, | |
| "learning_rate": 1.6163920242262164e-05 | |
| } | |
| }, | |
| { | |
| "step": 6550, | |
| "logs": { | |
| "loss": 0.6831, | |
| "epoch": 2.421441774491682, | |
| "learning_rate": 1.6124591969166635e-05 | |
| } | |
| }, | |
| { | |
| "step": 6600, | |
| "logs": { | |
| "loss": 0.6803, | |
| "epoch": 2.43992606284658, | |
| "learning_rate": 1.608526369607111e-05 | |
| } | |
| }, | |
| { | |
| "step": 6650, | |
| "logs": { | |
| "loss": 0.6791, | |
| "epoch": 2.4584103512014788, | |
| "learning_rate": 1.604593542297558e-05 | |
| } | |
| }, | |
| { | |
| "step": 6700, | |
| "logs": { | |
| "loss": 0.6812, | |
| "epoch": 2.476894639556377, | |
| "learning_rate": 1.600660714988005e-05 | |
| } | |
| }, | |
| { | |
| "step": 6750, | |
| "logs": { | |
| "loss": 0.6866, | |
| "epoch": 2.4953789279112755, | |
| "learning_rate": 1.596727887678452e-05 | |
| } | |
| }, | |
| { | |
| "step": 6800, | |
| "logs": { | |
| "loss": 0.6837, | |
| "epoch": 2.5138632162661736, | |
| "learning_rate": 1.5927950603688995e-05 | |
| } | |
| }, | |
| { | |
| "step": 6850, | |
| "logs": { | |
| "loss": 0.6814, | |
| "epoch": 2.532347504621072, | |
| "learning_rate": 1.5888622330593465e-05 | |
| } | |
| }, | |
| { | |
| "step": 6900, | |
| "logs": { | |
| "loss": 0.6845, | |
| "epoch": 2.5508317929759703, | |
| "learning_rate": 1.5849294057497936e-05 | |
| } | |
| }, | |
| { | |
| "step": 6950, | |
| "logs": { | |
| "loss": 0.6832, | |
| "epoch": 2.569316081330869, | |
| "learning_rate": 1.5809965784402407e-05 | |
| } | |
| }, | |
| { | |
| "step": 7000, | |
| "logs": { | |
| "loss": 0.6795, | |
| "epoch": 2.587800369685767, | |
| "learning_rate": 1.5770637511306877e-05 | |
| } | |
| }, | |
| { | |
| "step": 7050, | |
| "logs": { | |
| "loss": 0.679, | |
| "epoch": 2.6062846580406656, | |
| "learning_rate": 1.573130923821135e-05 | |
| } | |
| }, | |
| { | |
| "step": 7100, | |
| "logs": { | |
| "loss": 0.6851, | |
| "epoch": 2.6247689463955637, | |
| "learning_rate": 1.5691980965115822e-05 | |
| } | |
| }, | |
| { | |
| "step": 7150, | |
| "logs": { | |
| "loss": 0.692, | |
| "epoch": 2.6432532347504623, | |
| "learning_rate": 1.5652652692020292e-05 | |
| } | |
| }, | |
| { | |
| "step": 7200, | |
| "logs": { | |
| "loss": 0.6956, | |
| "epoch": 2.6617375231053604, | |
| "learning_rate": 1.5613324418924766e-05 | |
| } | |
| }, | |
| { | |
| "step": 7250, | |
| "logs": { | |
| "loss": 0.6883, | |
| "epoch": 2.680221811460259, | |
| "learning_rate": 1.5573996145829237e-05 | |
| } | |
| }, | |
| { | |
| "step": 7300, | |
| "logs": { | |
| "loss": 0.6806, | |
| "epoch": 2.698706099815157, | |
| "learning_rate": 1.5534667872733708e-05 | |
| } | |
| }, | |
| { | |
| "step": 7350, | |
| "logs": { | |
| "loss": 0.6832, | |
| "epoch": 2.7171903881700556, | |
| "learning_rate": 1.549533959963818e-05 | |
| } | |
| }, | |
| { | |
| "step": 7400, | |
| "logs": { | |
| "loss": 0.6871, | |
| "epoch": 2.7356746765249538, | |
| "learning_rate": 1.5456011326542652e-05 | |
| } | |
| }, | |
| { | |
| "step": 7450, | |
| "logs": { | |
| "loss": 0.6843, | |
| "epoch": 2.7541589648798523, | |
| "learning_rate": 1.5416683053447123e-05 | |
| } | |
| }, | |
| { | |
| "step": 7500, | |
| "logs": { | |
| "loss": 0.6869, | |
| "epoch": 2.7726432532347505, | |
| "learning_rate": 1.5377354780351597e-05 | |
| } | |
| }, | |
| { | |
| "step": 7550, | |
| "logs": { | |
| "loss": 0.689, | |
| "epoch": 2.7911275415896486, | |
| "learning_rate": 1.5338026507256067e-05 | |
| } | |
| }, | |
| { | |
| "step": 7600, | |
| "logs": { | |
| "loss": 0.6864, | |
| "epoch": 2.809611829944547, | |
| "learning_rate": 1.5298698234160538e-05 | |
| } | |
| }, | |
| { | |
| "step": 7650, | |
| "logs": { | |
| "loss": 0.6875, | |
| "epoch": 2.8280961182994453, | |
| "learning_rate": 1.5259369961065012e-05 | |
| } | |
| }, | |
| { | |
| "step": 7700, | |
| "logs": { | |
| "loss": 0.6844, | |
| "epoch": 2.846580406654344, | |
| "learning_rate": 1.5220041687969483e-05 | |
| } | |
| }, | |
| { | |
| "step": 7750, | |
| "logs": { | |
| "loss": 0.6916, | |
| "epoch": 2.865064695009242, | |
| "learning_rate": 1.5180713414873953e-05 | |
| } | |
| }, | |
| { | |
| "step": 7800, | |
| "logs": { | |
| "loss": 0.6849, | |
| "epoch": 2.8835489833641406, | |
| "learning_rate": 1.5141385141778426e-05 | |
| } | |
| }, | |
| { | |
| "step": 7850, | |
| "logs": { | |
| "loss": 0.6835, | |
| "epoch": 2.9020332717190387, | |
| "learning_rate": 1.5102056868682898e-05 | |
| } | |
| }, | |
| { | |
| "step": 7900, | |
| "logs": { | |
| "loss": 0.6866, | |
| "epoch": 2.9205175600739373, | |
| "learning_rate": 1.5062728595587369e-05 | |
| } | |
| }, | |
| { | |
| "step": 7950, | |
| "logs": { | |
| "loss": 0.6863, | |
| "epoch": 2.9390018484288354, | |
| "learning_rate": 1.502340032249184e-05 | |
| } | |
| }, | |
| { | |
| "step": 8000, | |
| "logs": { | |
| "loss": 0.6903, | |
| "epoch": 2.957486136783734, | |
| "learning_rate": 1.4984072049396311e-05 | |
| } | |
| }, | |
| { | |
| "step": 8050, | |
| "logs": { | |
| "loss": 0.686, | |
| "epoch": 2.975970425138632, | |
| "learning_rate": 1.4944743776300784e-05 | |
| } | |
| }, | |
| { | |
| "step": 8100, | |
| "logs": { | |
| "loss": 0.6909, | |
| "epoch": 2.9944547134935307, | |
| "learning_rate": 1.4905415503205256e-05 | |
| } | |
| }, | |
| { | |
| "step": 8150, | |
| "logs": { | |
| "loss": 0.5832, | |
| "epoch": 3.0129390018484288, | |
| "learning_rate": 1.4866087230109727e-05 | |
| } | |
| }, | |
| { | |
| "step": 8200, | |
| "logs": { | |
| "loss": 0.5314, | |
| "epoch": 3.0314232902033273, | |
| "learning_rate": 1.4826758957014197e-05 | |
| } | |
| }, | |
| { | |
| "step": 8250, | |
| "logs": { | |
| "loss": 0.5332, | |
| "epoch": 3.0499075785582255, | |
| "learning_rate": 1.4787430683918671e-05 | |
| } | |
| }, | |
| { | |
| "step": 8300, | |
| "logs": { | |
| "loss": 0.5359, | |
| "epoch": 3.068391866913124, | |
| "learning_rate": 1.4748102410823142e-05 | |
| } | |
| }, | |
| { | |
| "step": 8350, | |
| "logs": { | |
| "loss": 0.5398, | |
| "epoch": 3.086876155268022, | |
| "learning_rate": 1.4708774137727613e-05 | |
| } | |
| }, | |
| { | |
| "step": 8400, | |
| "logs": { | |
| "loss": 0.5433, | |
| "epoch": 3.1053604436229203, | |
| "learning_rate": 1.4669445864632087e-05 | |
| } | |
| }, | |
| { | |
| "step": 8450, | |
| "logs": { | |
| "loss": 0.5368, | |
| "epoch": 3.123844731977819, | |
| "learning_rate": 1.4630117591536557e-05 | |
| } | |
| }, | |
| { | |
| "step": 8500, | |
| "logs": { | |
| "loss": 0.5419, | |
| "epoch": 3.142329020332717, | |
| "learning_rate": 1.4590789318441028e-05 | |
| } | |
| }, | |
| { | |
| "step": 8550, | |
| "logs": { | |
| "loss": 0.5398, | |
| "epoch": 3.1608133086876156, | |
| "learning_rate": 1.45514610453455e-05 | |
| } | |
| }, | |
| { | |
| "step": 8600, | |
| "logs": { | |
| "loss": 0.5442, | |
| "epoch": 3.1792975970425137, | |
| "learning_rate": 1.4512132772249972e-05 | |
| } | |
| }, | |
| { | |
| "step": 8650, | |
| "logs": { | |
| "loss": 0.544, | |
| "epoch": 3.1977818853974123, | |
| "learning_rate": 1.4472804499154443e-05 | |
| } | |
| }, | |
| { | |
| "step": 8700, | |
| "logs": { | |
| "loss": 0.5455, | |
| "epoch": 3.2162661737523104, | |
| "learning_rate": 1.4433476226058915e-05 | |
| } | |
| }, | |
| { | |
| "step": 8750, | |
| "logs": { | |
| "loss": 0.548, | |
| "epoch": 3.234750462107209, | |
| "learning_rate": 1.4394147952963386e-05 | |
| } | |
| }, | |
| { | |
| "step": 8800, | |
| "logs": { | |
| "loss": 0.5453, | |
| "epoch": 3.253234750462107, | |
| "learning_rate": 1.4354819679867858e-05 | |
| } | |
| }, | |
| { | |
| "step": 8850, | |
| "logs": { | |
| "loss": 0.5416, | |
| "epoch": 3.2717190388170057, | |
| "learning_rate": 1.431549140677233e-05 | |
| } | |
| }, | |
| { | |
| "step": 8900, | |
| "logs": { | |
| "loss": 0.5542, | |
| "epoch": 3.290203327171904, | |
| "learning_rate": 1.4276163133676801e-05 | |
| } | |
| }, | |
| { | |
| "step": 8950, | |
| "logs": { | |
| "loss": 0.5469, | |
| "epoch": 3.3086876155268024, | |
| "learning_rate": 1.4236834860581272e-05 | |
| } | |
| }, | |
| { | |
| "step": 9000, | |
| "logs": { | |
| "loss": 0.5545, | |
| "epoch": 3.3271719038817005, | |
| "learning_rate": 1.4197506587485746e-05 | |
| } | |
| }, | |
| { | |
| "step": 9050, | |
| "logs": { | |
| "loss": 0.5538, | |
| "epoch": 3.345656192236599, | |
| "learning_rate": 1.4158178314390216e-05 | |
| } | |
| }, | |
| { | |
| "step": 9100, | |
| "logs": { | |
| "loss": 0.5504, | |
| "epoch": 3.364140480591497, | |
| "learning_rate": 1.4118850041294687e-05 | |
| } | |
| }, | |
| { | |
| "step": 9150, | |
| "logs": { | |
| "loss": 0.5511, | |
| "epoch": 3.3826247689463957, | |
| "learning_rate": 1.4079521768199161e-05 | |
| } | |
| }, | |
| { | |
| "step": 9200, | |
| "logs": { | |
| "loss": 0.554, | |
| "epoch": 3.401109057301294, | |
| "learning_rate": 1.4040193495103632e-05 | |
| } | |
| }, | |
| { | |
| "step": 9250, | |
| "logs": { | |
| "loss": 0.5541, | |
| "epoch": 3.4195933456561924, | |
| "learning_rate": 1.4000865222008102e-05 | |
| } | |
| }, | |
| { | |
| "step": 9300, | |
| "logs": { | |
| "loss": 0.5502, | |
| "epoch": 3.4380776340110906, | |
| "learning_rate": 1.3961536948912575e-05 | |
| } | |
| }, | |
| { | |
| "step": 9350, | |
| "logs": { | |
| "loss": 0.5513, | |
| "epoch": 3.4565619223659887, | |
| "learning_rate": 1.3922208675817047e-05 | |
| } | |
| }, | |
| { | |
| "step": 9400, | |
| "logs": { | |
| "loss": 0.5579, | |
| "epoch": 3.4750462107208873, | |
| "learning_rate": 1.3882880402721517e-05 | |
| } | |
| }, | |
| { | |
| "step": 9450, | |
| "logs": { | |
| "loss": 0.5636, | |
| "epoch": 3.4935304990757854, | |
| "learning_rate": 1.384355212962599e-05 | |
| } | |
| }, | |
| { | |
| "step": 9500, | |
| "logs": { | |
| "loss": 0.5617, | |
| "epoch": 3.512014787430684, | |
| "learning_rate": 1.380422385653046e-05 | |
| } | |
| }, | |
| { | |
| "step": 9550, | |
| "logs": { | |
| "loss": 0.5549, | |
| "epoch": 3.530499075785582, | |
| "learning_rate": 1.3764895583434933e-05 | |
| } | |
| }, | |
| { | |
| "step": 9600, | |
| "logs": { | |
| "loss": 0.5599, | |
| "epoch": 3.5489833641404807, | |
| "learning_rate": 1.3725567310339405e-05 | |
| } | |
| }, | |
| { | |
| "step": 9650, | |
| "logs": { | |
| "loss": 0.5565, | |
| "epoch": 3.567467652495379, | |
| "learning_rate": 1.3686239037243876e-05 | |
| } | |
| }, | |
| { | |
| "step": 9700, | |
| "logs": { | |
| "loss": 0.5565, | |
| "epoch": 3.5859519408502774, | |
| "learning_rate": 1.3646910764148346e-05 | |
| } | |
| }, | |
| { | |
| "step": 9750, | |
| "logs": { | |
| "loss": 0.5558, | |
| "epoch": 3.6044362292051755, | |
| "learning_rate": 1.360758249105282e-05 | |
| } | |
| }, | |
| { | |
| "step": 9800, | |
| "logs": { | |
| "loss": 0.5599, | |
| "epoch": 3.622920517560074, | |
| "learning_rate": 1.356825421795729e-05 | |
| } | |
| }, | |
| { | |
| "step": 9850, | |
| "logs": { | |
| "loss": 0.561, | |
| "epoch": 3.641404805914972, | |
| "learning_rate": 1.3528925944861761e-05 | |
| } | |
| }, | |
| { | |
| "step": 9900, | |
| "logs": { | |
| "loss": 0.5596, | |
| "epoch": 3.6598890942698707, | |
| "learning_rate": 1.3489597671766235e-05 | |
| } | |
| }, | |
| { | |
| "step": 9950, | |
| "logs": { | |
| "loss": 0.5596, | |
| "epoch": 3.678373382624769, | |
| "learning_rate": 1.3450269398670706e-05 | |
| } | |
| }, | |
| { | |
| "step": 10000, | |
| "logs": { | |
| "loss": 0.5579, | |
| "epoch": 3.6968576709796674, | |
| "learning_rate": 1.3410941125575177e-05 | |
| } | |
| }, | |
| { | |
| "step": 10050, | |
| "logs": { | |
| "loss": 0.5611, | |
| "epoch": 3.7153419593345656, | |
| "learning_rate": 1.3371612852479649e-05 | |
| } | |
| }, | |
| { | |
| "step": 10100, | |
| "logs": { | |
| "loss": 0.5627, | |
| "epoch": 3.733826247689464, | |
| "learning_rate": 1.3332284579384121e-05 | |
| } | |
| }, | |
| { | |
| "step": 10150, | |
| "logs": { | |
| "loss": 0.5613, | |
| "epoch": 3.7523105360443623, | |
| "learning_rate": 1.3292956306288592e-05 | |
| } | |
| }, | |
| { | |
| "step": 10200, | |
| "logs": { | |
| "loss": 0.5607, | |
| "epoch": 3.770794824399261, | |
| "learning_rate": 1.3253628033193064e-05 | |
| } | |
| }, | |
| { | |
| "step": 10250, | |
| "logs": { | |
| "loss": 0.5651, | |
| "epoch": 3.789279112754159, | |
| "learning_rate": 1.3214299760097535e-05 | |
| } | |
| }, | |
| { | |
| "step": 10300, | |
| "logs": { | |
| "loss": 0.5604, | |
| "epoch": 3.807763401109057, | |
| "learning_rate": 1.3174971487002005e-05 | |
| } | |
| }, | |
| { | |
| "step": 10350, | |
| "logs": { | |
| "loss": 0.5676, | |
| "epoch": 3.8262476894639557, | |
| "learning_rate": 1.313564321390648e-05 | |
| } | |
| }, | |
| { | |
| "step": 10400, | |
| "logs": { | |
| "loss": 0.5601, | |
| "epoch": 3.844731977818854, | |
| "learning_rate": 1.309631494081095e-05 | |
| } | |
| }, | |
| { | |
| "step": 10450, | |
| "logs": { | |
| "loss": 0.5645, | |
| "epoch": 3.8632162661737524, | |
| "learning_rate": 1.305698666771542e-05 | |
| } | |
| }, | |
| { | |
| "step": 10500, | |
| "logs": { | |
| "loss": 0.5653, | |
| "epoch": 3.8817005545286505, | |
| "learning_rate": 1.3017658394619895e-05 | |
| } | |
| }, | |
| { | |
| "step": 10550, | |
| "logs": { | |
| "loss": 0.5618, | |
| "epoch": 3.900184842883549, | |
| "learning_rate": 1.2978330121524365e-05 | |
| } | |
| }, | |
| { | |
| "step": 10600, | |
| "logs": { | |
| "loss": 0.5624, | |
| "epoch": 3.918669131238447, | |
| "learning_rate": 1.2939001848428836e-05 | |
| } | |
| }, | |
| { | |
| "step": 10650, | |
| "logs": { | |
| "loss": 0.5621, | |
| "epoch": 3.9371534195933457, | |
| "learning_rate": 1.289967357533331e-05 | |
| } | |
| }, | |
| { | |
| "step": 10700, | |
| "logs": { | |
| "loss": 0.5633, | |
| "epoch": 3.955637707948244, | |
| "learning_rate": 1.286034530223778e-05 | |
| } | |
| }, | |
| { | |
| "step": 10750, | |
| "logs": { | |
| "loss": 0.5645, | |
| "epoch": 3.9741219963031424, | |
| "learning_rate": 1.2821017029142251e-05 | |
| } | |
| }, | |
| { | |
| "step": 10800, | |
| "logs": { | |
| "loss": 0.5675, | |
| "epoch": 3.9926062846580406, | |
| "learning_rate": 1.2781688756046723e-05 | |
| } | |
| }, | |
| { | |
| "step": 10850, | |
| "logs": { | |
| "loss": 0.4943, | |
| "epoch": 4.011090573012939, | |
| "learning_rate": 1.2742360482951194e-05 | |
| } | |
| }, | |
| { | |
| "step": 10900, | |
| "logs": { | |
| "loss": 0.4282, | |
| "epoch": 4.029574861367838, | |
| "learning_rate": 1.2703032209855666e-05 | |
| } | |
| }, | |
| { | |
| "step": 10950, | |
| "logs": { | |
| "loss": 0.4285, | |
| "epoch": 4.048059149722736, | |
| "learning_rate": 1.2663703936760139e-05 | |
| } | |
| }, | |
| { | |
| "step": 11000, | |
| "logs": { | |
| "loss": 0.4307, | |
| "epoch": 4.066543438077634, | |
| "learning_rate": 1.262437566366461e-05 | |
| } | |
| }, | |
| { | |
| "step": 11050, | |
| "logs": { | |
| "loss": 0.4372, | |
| "epoch": 4.085027726432532, | |
| "learning_rate": 1.258504739056908e-05 | |
| } | |
| }, | |
| { | |
| "step": 11100, | |
| "logs": { | |
| "loss": 0.4377, | |
| "epoch": 4.103512014787431, | |
| "learning_rate": 1.2545719117473554e-05 | |
| } | |
| }, | |
| { | |
| "step": 11150, | |
| "logs": { | |
| "loss": 0.4296, | |
| "epoch": 4.121996303142329, | |
| "learning_rate": 1.2506390844378025e-05 | |
| } | |
| }, | |
| { | |
| "step": 11200, | |
| "logs": { | |
| "loss": 0.4358, | |
| "epoch": 4.140480591497227, | |
| "learning_rate": 1.2467062571282495e-05 | |
| } | |
| }, | |
| { | |
| "step": 11250, | |
| "logs": { | |
| "loss": 0.4383, | |
| "epoch": 4.1589648798521255, | |
| "learning_rate": 1.2427734298186969e-05 | |
| } | |
| }, | |
| { | |
| "step": 11300, | |
| "logs": { | |
| "loss": 0.4355, | |
| "epoch": 4.177449168207024, | |
| "learning_rate": 1.238840602509144e-05 | |
| } | |
| }, | |
| { | |
| "step": 11350, | |
| "logs": { | |
| "loss": 0.44, | |
| "epoch": 4.195933456561923, | |
| "learning_rate": 1.234907775199591e-05 | |
| } | |
| }, | |
| { | |
| "step": 11400, | |
| "logs": { | |
| "loss": 0.4393, | |
| "epoch": 4.214417744916821, | |
| "learning_rate": 1.2309749478900384e-05 | |
| } | |
| }, | |
| { | |
| "step": 11450, | |
| "logs": { | |
| "loss": 0.4427, | |
| "epoch": 4.232902033271719, | |
| "learning_rate": 1.2270421205804855e-05 | |
| } | |
| }, | |
| { | |
| "step": 11500, | |
| "logs": { | |
| "loss": 0.4399, | |
| "epoch": 4.251386321626617, | |
| "learning_rate": 1.2231092932709326e-05 | |
| } | |
| }, | |
| { | |
| "step": 11550, | |
| "logs": { | |
| "loss": 0.4401, | |
| "epoch": 4.269870609981516, | |
| "learning_rate": 1.2191764659613798e-05 | |
| } | |
| }, | |
| { | |
| "step": 11600, | |
| "logs": { | |
| "loss": 0.4446, | |
| "epoch": 4.288354898336414, | |
| "learning_rate": 1.2152436386518269e-05 | |
| } | |
| }, | |
| { | |
| "step": 11650, | |
| "logs": { | |
| "loss": 0.4436, | |
| "epoch": 4.306839186691312, | |
| "learning_rate": 1.211310811342274e-05 | |
| } | |
| }, | |
| { | |
| "step": 11700, | |
| "logs": { | |
| "loss": 0.4478, | |
| "epoch": 4.32532347504621, | |
| "learning_rate": 1.2073779840327213e-05 | |
| } | |
| }, | |
| { | |
| "step": 11750, | |
| "logs": { | |
| "loss": 0.447, | |
| "epoch": 4.343807763401109, | |
| "learning_rate": 1.2034451567231684e-05 | |
| } | |
| }, | |
| { | |
| "step": 11800, | |
| "logs": { | |
| "loss": 0.4505, | |
| "epoch": 4.3622920517560075, | |
| "learning_rate": 1.1995123294136154e-05 | |
| } | |
| }, | |
| { | |
| "step": 11850, | |
| "logs": { | |
| "loss": 0.4461, | |
| "epoch": 4.380776340110906, | |
| "learning_rate": 1.1955795021040628e-05 | |
| } | |
| }, | |
| { | |
| "step": 11900, | |
| "logs": { | |
| "loss": 0.4511, | |
| "epoch": 4.399260628465804, | |
| "learning_rate": 1.1916466747945099e-05 | |
| } | |
| }, | |
| { | |
| "step": 11950, | |
| "logs": { | |
| "loss": 0.4481, | |
| "epoch": 4.417744916820703, | |
| "learning_rate": 1.187713847484957e-05 | |
| } | |
| }, | |
| { | |
| "step": 12000, | |
| "logs": { | |
| "loss": 0.4457, | |
| "epoch": 4.436229205175601, | |
| "learning_rate": 1.1837810201754044e-05 | |
| } | |
| }, | |
| { | |
| "step": 12050, | |
| "logs": { | |
| "loss": 0.4491, | |
| "epoch": 4.454713493530499, | |
| "learning_rate": 1.1798481928658514e-05 | |
| } | |
| }, | |
| { | |
| "step": 12100, | |
| "logs": { | |
| "loss": 0.453, | |
| "epoch": 4.473197781885397, | |
| "learning_rate": 1.1759153655562985e-05 | |
| } | |
| }, | |
| { | |
| "step": 12150, | |
| "logs": { | |
| "loss": 0.4557, | |
| "epoch": 4.491682070240295, | |
| "learning_rate": 1.1719825382467455e-05 | |
| } | |
| }, | |
| { | |
| "step": 12200, | |
| "logs": { | |
| "loss": 0.4588, | |
| "epoch": 4.510166358595194, | |
| "learning_rate": 1.168049710937193e-05 | |
| } | |
| }, | |
| { | |
| "step": 12250, | |
| "logs": { | |
| "loss": 0.4478, | |
| "epoch": 4.5286506469500925, | |
| "learning_rate": 1.16411688362764e-05 | |
| } | |
| }, | |
| { | |
| "step": 12300, | |
| "logs": { | |
| "loss": 0.4558, | |
| "epoch": 4.547134935304991, | |
| "learning_rate": 1.160184056318087e-05 | |
| } | |
| }, | |
| { | |
| "step": 12350, | |
| "logs": { | |
| "loss": 0.453, | |
| "epoch": 4.565619223659889, | |
| "learning_rate": 1.1562512290085343e-05 | |
| } | |
| }, | |
| { | |
| "step": 12400, | |
| "logs": { | |
| "loss": 0.4566, | |
| "epoch": 4.584103512014788, | |
| "learning_rate": 1.1523184016989815e-05 | |
| } | |
| }, | |
| { | |
| "step": 12450, | |
| "logs": { | |
| "loss": 0.4512, | |
| "epoch": 4.602587800369686, | |
| "learning_rate": 1.1483855743894286e-05 | |
| } | |
| }, | |
| { | |
| "step": 12500, | |
| "logs": { | |
| "loss": 0.4537, | |
| "epoch": 4.621072088724584, | |
| "learning_rate": 1.1444527470798758e-05 | |
| } | |
| }, | |
| { | |
| "step": 12550, | |
| "logs": { | |
| "loss": 0.4596, | |
| "epoch": 4.639556377079482, | |
| "learning_rate": 1.1405199197703229e-05 | |
| } | |
| }, | |
| { | |
| "step": 12600, | |
| "logs": { | |
| "loss": 0.4544, | |
| "epoch": 4.658040665434381, | |
| "learning_rate": 1.1365870924607701e-05 | |
| } | |
| }, | |
| { | |
| "step": 12650, | |
| "logs": { | |
| "loss": 0.4552, | |
| "epoch": 4.676524953789279, | |
| "learning_rate": 1.1326542651512173e-05 | |
| } | |
| }, | |
| { | |
| "step": 12700, | |
| "logs": { | |
| "loss": 0.4561, | |
| "epoch": 4.695009242144177, | |
| "learning_rate": 1.1287214378416644e-05 | |
| } | |
| }, | |
| { | |
| "step": 12750, | |
| "logs": { | |
| "loss": 0.456, | |
| "epoch": 4.7134935304990755, | |
| "learning_rate": 1.1247886105321115e-05 | |
| } | |
| }, | |
| { | |
| "step": 12800, | |
| "logs": { | |
| "loss": 0.455, | |
| "epoch": 4.7319778188539745, | |
| "learning_rate": 1.1208557832225589e-05 | |
| } | |
| }, | |
| { | |
| "step": 12850, | |
| "logs": { | |
| "loss": 0.4579, | |
| "epoch": 4.750462107208873, | |
| "learning_rate": 1.116922955913006e-05 | |
| } | |
| }, | |
| { | |
| "step": 12900, | |
| "logs": { | |
| "loss": 0.4569, | |
| "epoch": 4.768946395563771, | |
| "learning_rate": 1.112990128603453e-05 | |
| } | |
| }, | |
| { | |
| "step": 12950, | |
| "logs": { | |
| "loss": 0.459, | |
| "epoch": 4.787430683918669, | |
| "learning_rate": 1.1090573012939004e-05 | |
| } | |
| }, | |
| { | |
| "step": 13000, | |
| "logs": { | |
| "loss": 0.456, | |
| "epoch": 4.805914972273568, | |
| "learning_rate": 1.1051244739843475e-05 | |
| } | |
| }, | |
| { | |
| "step": 13050, | |
| "logs": { | |
| "loss": 0.4605, | |
| "epoch": 4.824399260628466, | |
| "learning_rate": 1.1011916466747945e-05 | |
| } | |
| }, | |
| { | |
| "step": 13100, | |
| "logs": { | |
| "loss": 0.4565, | |
| "epoch": 4.842883548983364, | |
| "learning_rate": 1.0972588193652417e-05 | |
| } | |
| }, | |
| { | |
| "step": 13150, | |
| "logs": { | |
| "loss": 0.4606, | |
| "epoch": 4.861367837338262, | |
| "learning_rate": 1.093325992055689e-05 | |
| } | |
| }, | |
| { | |
| "step": 13200, | |
| "logs": { | |
| "loss": 0.4586, | |
| "epoch": 4.87985212569316, | |
| "learning_rate": 1.089393164746136e-05 | |
| } | |
| }, | |
| { | |
| "step": 13250, | |
| "logs": { | |
| "loss": 0.4605, | |
| "epoch": 4.898336414048059, | |
| "learning_rate": 1.0854603374365833e-05 | |
| } | |
| }, | |
| { | |
| "step": 13300, | |
| "logs": { | |
| "loss": 0.4565, | |
| "epoch": 4.9168207024029575, | |
| "learning_rate": 1.0815275101270303e-05 | |
| } | |
| }, | |
| { | |
| "step": 13350, | |
| "logs": { | |
| "loss": 0.4585, | |
| "epoch": 4.935304990757856, | |
| "learning_rate": 1.0775946828174776e-05 | |
| } | |
| }, | |
| { | |
| "step": 13400, | |
| "logs": { | |
| "loss": 0.4588, | |
| "epoch": 4.953789279112754, | |
| "learning_rate": 1.0736618555079248e-05 | |
| } | |
| }, | |
| { | |
| "step": 13450, | |
| "logs": { | |
| "loss": 0.4639, | |
| "epoch": 4.972273567467653, | |
| "learning_rate": 1.0697290281983718e-05 | |
| } | |
| }, | |
| { | |
| "step": 13500, | |
| "logs": { | |
| "loss": 0.4666, | |
| "epoch": 4.990757855822551, | |
| "learning_rate": 1.0657962008888189e-05 | |
| } | |
| }, | |
| { | |
| "step": 13550, | |
| "logs": { | |
| "loss": 0.4109, | |
| "epoch": 5.009242144177449, | |
| "learning_rate": 1.0618633735792663e-05 | |
| } | |
| }, | |
| { | |
| "step": 13600, | |
| "logs": { | |
| "loss": 0.3538, | |
| "epoch": 5.027726432532347, | |
| "learning_rate": 1.0579305462697134e-05 | |
| } | |
| }, | |
| { | |
| "step": 13650, | |
| "logs": { | |
| "loss": 0.346, | |
| "epoch": 5.046210720887246, | |
| "learning_rate": 1.0539977189601604e-05 | |
| } | |
| }, | |
| { | |
| "step": 13700, | |
| "logs": { | |
| "loss": 0.3483, | |
| "epoch": 5.064695009242144, | |
| "learning_rate": 1.0500648916506078e-05 | |
| } | |
| }, | |
| { | |
| "step": 13750, | |
| "logs": { | |
| "loss": 0.3548, | |
| "epoch": 5.0831792975970425, | |
| "learning_rate": 1.0461320643410549e-05 | |
| } | |
| }, | |
| { | |
| "step": 13800, | |
| "logs": { | |
| "loss": 0.3567, | |
| "epoch": 5.101663585951941, | |
| "learning_rate": 1.042199237031502e-05 | |
| } | |
| }, | |
| { | |
| "step": 13850, | |
| "logs": { | |
| "loss": 0.3525, | |
| "epoch": 5.12014787430684, | |
| "learning_rate": 1.0382664097219492e-05 | |
| } | |
| }, | |
| { | |
| "step": 13900, | |
| "logs": { | |
| "loss": 0.3563, | |
| "epoch": 5.138632162661738, | |
| "learning_rate": 1.0343335824123964e-05 | |
| } | |
| }, | |
| { | |
| "step": 13950, | |
| "logs": { | |
| "loss": 0.3606, | |
| "epoch": 5.157116451016636, | |
| "learning_rate": 1.0304007551028435e-05 | |
| } | |
| }, | |
| { | |
| "step": 14000, | |
| "logs": { | |
| "loss": 0.3585, | |
| "epoch": 5.175600739371534, | |
| "learning_rate": 1.0264679277932907e-05 | |
| } | |
| }, | |
| { | |
| "step": 14050, | |
| "logs": { | |
| "loss": 0.3547, | |
| "epoch": 5.194085027726432, | |
| "learning_rate": 1.0225351004837378e-05 | |
| } | |
| }, | |
| { | |
| "step": 14100, | |
| "logs": { | |
| "loss": 0.359, | |
| "epoch": 5.212569316081331, | |
| "learning_rate": 1.018602273174185e-05 | |
| } | |
| }, | |
| { | |
| "step": 14150, | |
| "logs": { | |
| "loss": 0.3616, | |
| "epoch": 5.231053604436229, | |
| "learning_rate": 1.0146694458646322e-05 | |
| } | |
| }, | |
| { | |
| "step": 14200, | |
| "logs": { | |
| "loss": 0.3602, | |
| "epoch": 5.249537892791127, | |
| "learning_rate": 1.0107366185550793e-05 | |
| } | |
| }, | |
| { | |
| "step": 14250, | |
| "logs": { | |
| "loss": 0.3607, | |
| "epoch": 5.2680221811460255, | |
| "learning_rate": 1.0068037912455264e-05 | |
| } | |
| }, | |
| { | |
| "step": 14300, | |
| "logs": { | |
| "loss": 0.3642, | |
| "epoch": 5.2865064695009245, | |
| "learning_rate": 1.0028709639359738e-05 | |
| } | |
| }, | |
| { | |
| "step": 14350, | |
| "logs": { | |
| "loss": 0.3616, | |
| "epoch": 5.304990757855823, | |
| "learning_rate": 9.989381366264208e-06 | |
| } | |
| }, | |
| { | |
| "step": 14400, | |
| "logs": { | |
| "loss": 0.364, | |
| "epoch": 5.323475046210721, | |
| "learning_rate": 9.95005309316868e-06 | |
| } | |
| }, | |
| { | |
| "step": 14450, | |
| "logs": { | |
| "loss": 0.3656, | |
| "epoch": 5.341959334565619, | |
| "learning_rate": 9.910724820073151e-06 | |
| } | |
| }, | |
| { | |
| "step": 14500, | |
| "logs": { | |
| "loss": 0.3613, | |
| "epoch": 5.360443622920518, | |
| "learning_rate": 9.871396546977623e-06 | |
| } | |
| }, | |
| { | |
| "step": 14550, | |
| "logs": { | |
| "loss": 0.3655, | |
| "epoch": 5.378927911275416, | |
| "learning_rate": 9.832068273882096e-06 | |
| } | |
| }, | |
| { | |
| "step": 14600, | |
| "logs": { | |
| "loss": 0.3677, | |
| "epoch": 5.397412199630314, | |
| "learning_rate": 9.792740000786566e-06 | |
| } | |
| }, | |
| { | |
| "step": 14650, | |
| "logs": { | |
| "loss": 0.3678, | |
| "epoch": 5.415896487985212, | |
| "learning_rate": 9.753411727691039e-06 | |
| } | |
| }, | |
| { | |
| "step": 14700, | |
| "logs": { | |
| "loss": 0.364, | |
| "epoch": 5.434380776340111, | |
| "learning_rate": 9.71408345459551e-06 | |
| } | |
| }, | |
| { | |
| "step": 14750, | |
| "logs": { | |
| "loss": 0.3654, | |
| "epoch": 5.452865064695009, | |
| "learning_rate": 9.67475518149998e-06 | |
| } | |
| }, | |
| { | |
| "step": 14800, | |
| "logs": { | |
| "loss": 0.3671, | |
| "epoch": 5.4713493530499075, | |
| "learning_rate": 9.635426908404452e-06 | |
| } | |
| }, | |
| { | |
| "step": 14850, | |
| "logs": { | |
| "loss": 0.3724, | |
| "epoch": 5.489833641404806, | |
| "learning_rate": 9.596098635308924e-06 | |
| } | |
| }, | |
| { | |
| "step": 14900, | |
| "logs": { | |
| "loss": 1.4537, | |
| "epoch": 5.508317929759705, | |
| "learning_rate": 9.556770362213395e-06 | |
| } | |
| }, | |
| { | |
| "step": 14950, | |
| "logs": { | |
| "loss": 0.3685, | |
| "epoch": 5.526802218114603, | |
| "learning_rate": 9.517442089117867e-06 | |
| } | |
| }, | |
| { | |
| "step": 15000, | |
| "logs": { | |
| "loss": 0.3688, | |
| "epoch": 5.545286506469501, | |
| "learning_rate": 9.47811381602234e-06 | |
| } | |
| }, | |
| { | |
| "step": 15050, | |
| "logs": { | |
| "loss": 0.3726, | |
| "epoch": 5.563770794824399, | |
| "learning_rate": 9.43878554292681e-06 | |
| } | |
| }, | |
| { | |
| "step": 15100, | |
| "logs": { | |
| "loss": 0.3718, | |
| "epoch": 5.582255083179297, | |
| "learning_rate": 9.399457269831283e-06 | |
| } | |
| }, | |
| { | |
| "step": 15150, | |
| "logs": { | |
| "loss": 0.3691, | |
| "epoch": 5.600739371534196, | |
| "learning_rate": 9.360128996735755e-06 | |
| } | |
| }, | |
| { | |
| "step": 15200, | |
| "logs": { | |
| "loss": 0.3684, | |
| "epoch": 5.619223659889094, | |
| "learning_rate": 9.320800723640226e-06 | |
| } | |
| }, | |
| { | |
| "step": 15250, | |
| "logs": { | |
| "loss": 0.3747, | |
| "epoch": 5.6377079482439925, | |
| "learning_rate": 9.281472450544698e-06 | |
| } | |
| }, | |
| { | |
| "step": 15300, | |
| "logs": { | |
| "loss": 0.3727, | |
| "epoch": 5.656192236598891, | |
| "learning_rate": 9.24214417744917e-06 | |
| } | |
| }, | |
| { | |
| "step": 15350, | |
| "logs": { | |
| "loss": 0.3736, | |
| "epoch": 5.67467652495379, | |
| "learning_rate": 9.20281590435364e-06 | |
| } | |
| }, | |
| { | |
| "step": 15400, | |
| "logs": { | |
| "loss": 0.3725, | |
| "epoch": 5.693160813308688, | |
| "learning_rate": 9.163487631258111e-06 | |
| } | |
| }, | |
| { | |
| "step": 15450, | |
| "logs": { | |
| "loss": 0.3711, | |
| "epoch": 5.711645101663586, | |
| "learning_rate": 9.124159358162584e-06 | |
| } | |
| }, | |
| { | |
| "step": 15500, | |
| "logs": { | |
| "loss": 0.3705, | |
| "epoch": 5.730129390018484, | |
| "learning_rate": 9.084831085067054e-06 | |
| } | |
| }, | |
| { | |
| "step": 15550, | |
| "logs": { | |
| "loss": 0.3698, | |
| "epoch": 5.748613678373383, | |
| "learning_rate": 9.045502811971527e-06 | |
| } | |
| }, | |
| { | |
| "step": 15600, | |
| "logs": { | |
| "loss": 0.3725, | |
| "epoch": 5.767097966728281, | |
| "learning_rate": 9.006174538875999e-06 | |
| } | |
| }, | |
| { | |
| "step": 15650, | |
| "logs": { | |
| "loss": 0.3767, | |
| "epoch": 5.785582255083179, | |
| "learning_rate": 8.96684626578047e-06 | |
| } | |
| }, | |
| { | |
| "step": 15700, | |
| "logs": { | |
| "loss": 0.3696, | |
| "epoch": 5.804066543438077, | |
| "learning_rate": 8.927517992684942e-06 | |
| } | |
| }, | |
| { | |
| "step": 15750, | |
| "logs": { | |
| "loss": 0.3797, | |
| "epoch": 5.822550831792976, | |
| "learning_rate": 8.888189719589414e-06 | |
| } | |
| }, | |
| { | |
| "step": 15800, | |
| "logs": { | |
| "loss": 0.371, | |
| "epoch": 5.8410351201478745, | |
| "learning_rate": 8.848861446493885e-06 | |
| } | |
| }, | |
| { | |
| "step": 15850, | |
| "logs": { | |
| "loss": 0.3769, | |
| "epoch": 5.859519408502773, | |
| "learning_rate": 8.809533173398357e-06 | |
| } | |
| }, | |
| { | |
| "step": 15900, | |
| "logs": { | |
| "loss": 0.3731, | |
| "epoch": 5.878003696857671, | |
| "learning_rate": 8.77020490030283e-06 | |
| } | |
| }, | |
| { | |
| "step": 15950, | |
| "logs": { | |
| "loss": 0.3769, | |
| "epoch": 5.896487985212569, | |
| "learning_rate": 8.7308766272073e-06 | |
| } | |
| }, | |
| { | |
| "step": 16000, | |
| "logs": { | |
| "loss": 0.3711, | |
| "epoch": 5.914972273567468, | |
| "learning_rate": 8.691548354111772e-06 | |
| } | |
| }, | |
| { | |
| "step": 16050, | |
| "logs": { | |
| "loss": 0.3752, | |
| "epoch": 5.933456561922366, | |
| "learning_rate": 8.652220081016243e-06 | |
| } | |
| }, | |
| { | |
| "step": 16100, | |
| "logs": { | |
| "loss": 0.3697, | |
| "epoch": 5.951940850277264, | |
| "learning_rate": 8.612891807920715e-06 | |
| } | |
| }, | |
| { | |
| "step": 16150, | |
| "logs": { | |
| "loss": 0.3751, | |
| "epoch": 5.970425138632162, | |
| "learning_rate": 8.573563534825186e-06 | |
| } | |
| }, | |
| { | |
| "step": 16200, | |
| "logs": { | |
| "loss": 0.3791, | |
| "epoch": 5.988909426987061, | |
| "learning_rate": 8.534235261729658e-06 | |
| } | |
| }, | |
| { | |
| "step": 16250, | |
| "logs": { | |
| "loss": 0.3443, | |
| "epoch": 6.007393715341959, | |
| "learning_rate": 8.494906988634129e-06 | |
| } | |
| }, | |
| { | |
| "step": 16300, | |
| "logs": { | |
| "loss": 0.2903, | |
| "epoch": 6.0258780036968576, | |
| "learning_rate": 8.455578715538601e-06 | |
| } | |
| }, | |
| { | |
| "step": 16350, | |
| "logs": { | |
| "loss": 0.2906, | |
| "epoch": 6.044362292051756, | |
| "learning_rate": 8.416250442443073e-06 | |
| } | |
| }, | |
| { | |
| "step": 16400, | |
| "logs": { | |
| "loss": 0.2884, | |
| "epoch": 6.062846580406655, | |
| "learning_rate": 8.376922169347544e-06 | |
| } | |
| }, | |
| { | |
| "step": 16450, | |
| "logs": { | |
| "loss": 0.2913, | |
| "epoch": 6.081330868761553, | |
| "learning_rate": 8.337593896252016e-06 | |
| } | |
| }, | |
| { | |
| "step": 16500, | |
| "logs": { | |
| "loss": 0.2964, | |
| "epoch": 6.099815157116451, | |
| "learning_rate": 8.298265623156489e-06 | |
| } | |
| }, | |
| { | |
| "step": 16550, | |
| "logs": { | |
| "loss": 0.2877, | |
| "epoch": 6.118299445471349, | |
| "learning_rate": 8.25893735006096e-06 | |
| } | |
| }, | |
| { | |
| "step": 16600, | |
| "logs": { | |
| "loss": 0.2957, | |
| "epoch": 6.136783733826248, | |
| "learning_rate": 8.219609076965432e-06 | |
| } | |
| }, | |
| { | |
| "step": 16650, | |
| "logs": { | |
| "loss": 0.2974, | |
| "epoch": 6.155268022181146, | |
| "learning_rate": 8.180280803869902e-06 | |
| } | |
| }, | |
| { | |
| "step": 16700, | |
| "logs": { | |
| "loss": 0.295, | |
| "epoch": 6.173752310536044, | |
| "learning_rate": 8.140952530774374e-06 | |
| } | |
| }, | |
| { | |
| "step": 16750, | |
| "logs": { | |
| "loss": 0.2947, | |
| "epoch": 6.1922365988909425, | |
| "learning_rate": 8.101624257678847e-06 | |
| } | |
| }, | |
| { | |
| "step": 16800, | |
| "logs": { | |
| "loss": 0.2957, | |
| "epoch": 6.210720887245841, | |
| "learning_rate": 8.062295984583317e-06 | |
| } | |
| }, | |
| { | |
| "step": 16850, | |
| "logs": { | |
| "loss": 0.3001, | |
| "epoch": 6.22920517560074, | |
| "learning_rate": 8.02296771148779e-06 | |
| } | |
| }, | |
| { | |
| "step": 16900, | |
| "logs": { | |
| "loss": 0.2958, | |
| "epoch": 6.247689463955638, | |
| "learning_rate": 7.98363943839226e-06 | |
| } | |
| }, | |
| { | |
| "step": 16950, | |
| "logs": { | |
| "loss": 0.2956, | |
| "epoch": 6.266173752310536, | |
| "learning_rate": 7.944311165296733e-06 | |
| } | |
| }, | |
| { | |
| "step": 17000, | |
| "logs": { | |
| "loss": 0.3, | |
| "epoch": 6.284658040665434, | |
| "learning_rate": 7.904982892201203e-06 | |
| } | |
| }, | |
| { | |
| "step": 17050, | |
| "logs": { | |
| "loss": 0.3, | |
| "epoch": 6.303142329020333, | |
| "learning_rate": 7.865654619105676e-06 | |
| } | |
| }, | |
| { | |
| "step": 17100, | |
| "logs": { | |
| "loss": 0.3003, | |
| "epoch": 6.321626617375231, | |
| "learning_rate": 7.826326346010146e-06 | |
| } | |
| }, | |
| { | |
| "step": 17150, | |
| "logs": { | |
| "loss": 0.3029, | |
| "epoch": 6.340110905730129, | |
| "learning_rate": 7.786998072914618e-06 | |
| } | |
| }, | |
| { | |
| "step": 17200, | |
| "logs": { | |
| "loss": 0.301, | |
| "epoch": 6.358595194085027, | |
| "learning_rate": 7.74766979981909e-06 | |
| } | |
| }, | |
| { | |
| "step": 17250, | |
| "logs": { | |
| "loss": 0.297, | |
| "epoch": 6.377079482439926, | |
| "learning_rate": 7.708341526723561e-06 | |
| } | |
| }, | |
| { | |
| "step": 17300, | |
| "logs": { | |
| "loss": 0.2993, | |
| "epoch": 6.3955637707948245, | |
| "learning_rate": 7.669013253628034e-06 | |
| } | |
| }, | |
| { | |
| "step": 17350, | |
| "logs": { | |
| "loss": 0.3035, | |
| "epoch": 6.414048059149723, | |
| "learning_rate": 7.629684980532506e-06 | |
| } | |
| }, | |
| { | |
| "step": 17400, | |
| "logs": { | |
| "loss": 0.2988, | |
| "epoch": 6.432532347504621, | |
| "learning_rate": 7.590356707436977e-06 | |
| } | |
| }, | |
| { | |
| "step": 17450, | |
| "logs": { | |
| "loss": 0.3001, | |
| "epoch": 6.45101663585952, | |
| "learning_rate": 7.551028434341449e-06 | |
| } | |
| }, | |
| { | |
| "step": 17500, | |
| "logs": { | |
| "loss": 0.3024, | |
| "epoch": 6.469500924214418, | |
| "learning_rate": 7.51170016124592e-06 | |
| } | |
| }, | |
| { | |
| "step": 17550, | |
| "logs": { | |
| "loss": 0.3053, | |
| "epoch": 6.487985212569316, | |
| "learning_rate": 7.472371888150392e-06 | |
| } | |
| }, | |
| { | |
| "step": 17600, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.506469500924214, | |
| "learning_rate": 7.433043615054863e-06 | |
| } | |
| }, | |
| { | |
| "step": 17650, | |
| "logs": { | |
| "loss": 0.3002, | |
| "epoch": 6.524953789279113, | |
| "learning_rate": 7.393715341959336e-06 | |
| } | |
| }, | |
| { | |
| "step": 17700, | |
| "logs": { | |
| "loss": 0.3044, | |
| "epoch": 6.543438077634011, | |
| "learning_rate": 7.354387068863806e-06 | |
| } | |
| }, | |
| { | |
| "step": 17750, | |
| "logs": { | |
| "loss": 0.3016, | |
| "epoch": 6.561922365988909, | |
| "learning_rate": 7.3150587957682786e-06 | |
| } | |
| }, | |
| { | |
| "step": 17800, | |
| "logs": { | |
| "loss": 0.3071, | |
| "epoch": 6.580406654343808, | |
| "learning_rate": 7.27573052267275e-06 | |
| } | |
| }, | |
| { | |
| "step": 17850, | |
| "logs": { | |
| "loss": 0.3002, | |
| "epoch": 6.598890942698706, | |
| "learning_rate": 7.2364022495772215e-06 | |
| } | |
| }, | |
| { | |
| "step": 17900, | |
| "logs": { | |
| "loss": 0.3042, | |
| "epoch": 6.617375231053605, | |
| "learning_rate": 7.197073976481693e-06 | |
| } | |
| }, | |
| { | |
| "step": 17950, | |
| "logs": { | |
| "loss": 0.3042, | |
| "epoch": 6.635859519408503, | |
| "learning_rate": 7.157745703386165e-06 | |
| } | |
| }, | |
| { | |
| "step": 18000, | |
| "logs": { | |
| "loss": 0.3063, | |
| "epoch": 6.654343807763401, | |
| "learning_rate": 7.118417430290636e-06 | |
| } | |
| }, | |
| { | |
| "step": 18050, | |
| "logs": { | |
| "loss": 0.3031, | |
| "epoch": 6.672828096118299, | |
| "learning_rate": 7.079089157195108e-06 | |
| } | |
| }, | |
| { | |
| "step": 18100, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.691312384473198, | |
| "learning_rate": 7.0397608840995805e-06 | |
| } | |
| }, | |
| { | |
| "step": 18150, | |
| "logs": { | |
| "loss": 0.3041, | |
| "epoch": 6.709796672828096, | |
| "learning_rate": 7.000432611004051e-06 | |
| } | |
| }, | |
| { | |
| "step": 18200, | |
| "logs": { | |
| "loss": 0.3036, | |
| "epoch": 6.728280961182994, | |
| "learning_rate": 6.961104337908523e-06 | |
| } | |
| }, | |
| { | |
| "step": 18250, | |
| "logs": { | |
| "loss": 0.3044, | |
| "epoch": 6.7467652495378925, | |
| "learning_rate": 6.921776064812995e-06 | |
| } | |
| }, | |
| { | |
| "step": 18300, | |
| "logs": { | |
| "loss": 0.3057, | |
| "epoch": 6.7652495378927915, | |
| "learning_rate": 6.882447791717466e-06 | |
| } | |
| }, | |
| { | |
| "step": 18350, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.78373382624769, | |
| "learning_rate": 6.843119518621938e-06 | |
| } | |
| }, | |
| { | |
| "step": 18400, | |
| "logs": { | |
| "loss": 0.3058, | |
| "epoch": 6.802218114602588, | |
| "learning_rate": 6.80379124552641e-06 | |
| } | |
| }, | |
| { | |
| "step": 18450, | |
| "logs": { | |
| "loss": 0.3072, | |
| "epoch": 6.820702402957486, | |
| "learning_rate": 6.764462972430881e-06 | |
| } | |
| }, | |
| { | |
| "step": 18500, | |
| "logs": { | |
| "loss": 0.3042, | |
| "epoch": 6.839186691312385, | |
| "learning_rate": 6.725134699335353e-06 | |
| } | |
| }, | |
| { | |
| "step": 18550, | |
| "logs": { | |
| "loss": 0.3091, | |
| "epoch": 6.857670979667283, | |
| "learning_rate": 6.6858064262398245e-06 | |
| } | |
| }, | |
| { | |
| "step": 18600, | |
| "logs": { | |
| "loss": 0.3036, | |
| "epoch": 6.876155268022181, | |
| "learning_rate": 6.646478153144296e-06 | |
| } | |
| }, | |
| { | |
| "step": 18650, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.894639556377079, | |
| "learning_rate": 6.607149880048767e-06 | |
| } | |
| }, | |
| { | |
| "step": 18700, | |
| "logs": { | |
| "loss": 0.3018, | |
| "epoch": 6.913123844731977, | |
| "learning_rate": 6.56782160695324e-06 | |
| } | |
| }, | |
| { | |
| "step": 18750, | |
| "logs": { | |
| "loss": 0.3055, | |
| "epoch": 6.931608133086876, | |
| "learning_rate": 6.52849333385771e-06 | |
| } | |
| }, | |
| { | |
| "step": 18800, | |
| "logs": { | |
| "loss": 0.3046, | |
| "epoch": 6.9500924214417745, | |
| "learning_rate": 6.489165060762183e-06 | |
| } | |
| }, | |
| { | |
| "step": 18850, | |
| "logs": { | |
| "loss": 0.3083, | |
| "epoch": 6.968576709796673, | |
| "learning_rate": 6.449836787666655e-06 | |
| } | |
| }, | |
| { | |
| "step": 18900, | |
| "logs": { | |
| "loss": 0.3118, | |
| "epoch": 6.987060998151571, | |
| "learning_rate": 6.4105085145711256e-06 | |
| } | |
| }, | |
| { | |
| "step": 18950, | |
| "logs": { | |
| "loss": 0.2902, | |
| "epoch": 7.00554528650647, | |
| "learning_rate": 6.371180241475597e-06 | |
| } | |
| }, | |
| { | |
| "step": 19000, | |
| "logs": { | |
| "loss": 0.241, | |
| "epoch": 7.024029574861368, | |
| "learning_rate": 6.331851968380069e-06 | |
| } | |
| }, | |
| { | |
| "step": 19050, | |
| "logs": { | |
| "loss": 0.2432, | |
| "epoch": 7.042513863216266, | |
| "learning_rate": 6.29252369528454e-06 | |
| } | |
| }, | |
| { | |
| "step": 19100, | |
| "logs": { | |
| "loss": 0.2405, | |
| "epoch": 7.060998151571164, | |
| "learning_rate": 6.253195422189012e-06 | |
| } | |
| }, | |
| { | |
| "step": 19150, | |
| "logs": { | |
| "loss": 0.2447, | |
| "epoch": 7.079482439926063, | |
| "learning_rate": 6.2138671490934846e-06 | |
| } | |
| }, | |
| { | |
| "step": 19200, | |
| "logs": { | |
| "loss": 0.2458, | |
| "epoch": 7.097966728280961, | |
| "learning_rate": 6.174538875997955e-06 | |
| } | |
| }, | |
| { | |
| "step": 19250, | |
| "logs": { | |
| "loss": 0.2414, | |
| "epoch": 7.116451016635859, | |
| "learning_rate": 6.1352106029024275e-06 | |
| } | |
| }, | |
| { | |
| "step": 19300, | |
| "logs": { | |
| "loss": 0.2465, | |
| "epoch": 7.134935304990758, | |
| "learning_rate": 6.095882329806899e-06 | |
| } | |
| }, | |
| { | |
| "step": 19350, | |
| "logs": { | |
| "loss": 0.2474, | |
| "epoch": 7.153419593345657, | |
| "learning_rate": 6.05655405671137e-06 | |
| } | |
| }, | |
| { | |
| "step": 19400, | |
| "logs": { | |
| "loss": 0.2464, | |
| "epoch": 7.171903881700555, | |
| "learning_rate": 6.017225783615842e-06 | |
| } | |
| }, | |
| { | |
| "step": 19450, | |
| "logs": { | |
| "loss": 0.2443, | |
| "epoch": 7.190388170055453, | |
| "learning_rate": 5.977897510520314e-06 | |
| } | |
| }, | |
| { | |
| "step": 19500, | |
| "logs": { | |
| "loss": 0.2466, | |
| "epoch": 7.208872458410351, | |
| "learning_rate": 5.938569237424785e-06 | |
| } | |
| }, | |
| { | |
| "step": 19550, | |
| "logs": { | |
| "loss": 0.2497, | |
| "epoch": 7.22735674676525, | |
| "learning_rate": 5.899240964329257e-06 | |
| } | |
| }, | |
| { | |
| "step": 19600, | |
| "logs": { | |
| "loss": 0.2469, | |
| "epoch": 7.245841035120148, | |
| "learning_rate": 5.859912691233728e-06 | |
| } | |
| }, | |
| { | |
| "step": 19650, | |
| "logs": { | |
| "loss": 0.2468, | |
| "epoch": 7.264325323475046, | |
| "learning_rate": 5.8205844181382e-06 | |
| } | |
| }, | |
| { | |
| "step": 19700, | |
| "logs": { | |
| "loss": 0.2495, | |
| "epoch": 7.282809611829944, | |
| "learning_rate": 5.7812561450426715e-06 | |
| } | |
| }, | |
| { | |
| "step": 19750, | |
| "logs": { | |
| "loss": 0.2496, | |
| "epoch": 7.3012939001848425, | |
| "learning_rate": 5.741927871947143e-06 | |
| } | |
| }, | |
| { | |
| "step": 19800, | |
| "logs": { | |
| "loss": 0.2516, | |
| "epoch": 7.3197781885397415, | |
| "learning_rate": 5.702599598851614e-06 | |
| } | |
| }, | |
| { | |
| "step": 19850, | |
| "logs": { | |
| "loss": 0.2516, | |
| "epoch": 7.33826247689464, | |
| "learning_rate": 5.663271325756087e-06 | |
| } | |
| }, | |
| { | |
| "step": 19900, | |
| "logs": { | |
| "loss": 0.2493, | |
| "epoch": 7.356746765249538, | |
| "learning_rate": 5.623943052660557e-06 | |
| } | |
| }, | |
| { | |
| "step": 19950, | |
| "logs": { | |
| "loss": 0.2458, | |
| "epoch": 7.375231053604436, | |
| "learning_rate": 5.58461477956503e-06 | |
| } | |
| }, | |
| { | |
| "step": 20000, | |
| "logs": { | |
| "loss": 0.2494, | |
| "epoch": 7.393715341959335, | |
| "learning_rate": 5.545286506469502e-06 | |
| } | |
| }, | |
| { | |
| "step": 20050, | |
| "logs": { | |
| "loss": 0.2534, | |
| "epoch": 7.412199630314233, | |
| "learning_rate": 5.5059582333739726e-06 | |
| } | |
| }, | |
| { | |
| "step": 20100, | |
| "logs": { | |
| "loss": 0.2499, | |
| "epoch": 7.430683918669131, | |
| "learning_rate": 5.466629960278445e-06 | |
| } | |
| }, | |
| { | |
| "step": 20150, | |
| "logs": { | |
| "loss": 0.249, | |
| "epoch": 7.449168207024029, | |
| "learning_rate": 5.427301687182916e-06 | |
| } | |
| }, | |
| { | |
| "step": 20200, | |
| "logs": { | |
| "loss": 0.2498, | |
| "epoch": 7.467652495378928, | |
| "learning_rate": 5.387973414087388e-06 | |
| } | |
| }, | |
| { | |
| "step": 20250, | |
| "logs": { | |
| "loss": 0.2541, | |
| "epoch": 7.486136783733826, | |
| "learning_rate": 5.348645140991859e-06 | |
| } | |
| }, | |
| { | |
| "step": 20300, | |
| "logs": { | |
| "loss": 0.2579, | |
| "epoch": 7.5046210720887245, | |
| "learning_rate": 5.3093168678963316e-06 | |
| } | |
| }, | |
| { | |
| "step": 20350, | |
| "logs": { | |
| "loss": 0.2476, | |
| "epoch": 7.523105360443623, | |
| "learning_rate": 5.269988594800802e-06 | |
| } | |
| }, | |
| { | |
| "step": 20400, | |
| "logs": { | |
| "loss": 0.2538, | |
| "epoch": 7.541589648798522, | |
| "learning_rate": 5.2306603217052745e-06 | |
| } | |
| }, | |
| { | |
| "step": 20450, | |
| "logs": { | |
| "loss": 0.2537, | |
| "epoch": 7.56007393715342, | |
| "learning_rate": 5.191332048609746e-06 | |
| } | |
| }, | |
| { | |
| "step": 20500, | |
| "logs": { | |
| "loss": 0.2522, | |
| "epoch": 7.578558225508318, | |
| "learning_rate": 5.152003775514217e-06 | |
| } | |
| }, | |
| { | |
| "step": 20550, | |
| "logs": { | |
| "loss": 0.2491, | |
| "epoch": 7.597042513863216, | |
| "learning_rate": 5.112675502418689e-06 | |
| } | |
| }, | |
| { | |
| "step": 20600, | |
| "logs": { | |
| "loss": 0.2509, | |
| "epoch": 7.615526802218114, | |
| "learning_rate": 5.073347229323161e-06 | |
| } | |
| }, | |
| { | |
| "step": 20650, | |
| "logs": { | |
| "loss": 0.2496, | |
| "epoch": 7.634011090573013, | |
| "learning_rate": 5.034018956227632e-06 | |
| } | |
| }, | |
| { | |
| "step": 20700, | |
| "logs": { | |
| "loss": 0.2542, | |
| "epoch": 7.652495378927911, | |
| "learning_rate": 4.994690683132104e-06 | |
| } | |
| }, | |
| { | |
| "step": 20750, | |
| "logs": { | |
| "loss": 0.2517, | |
| "epoch": 7.6709796672828094, | |
| "learning_rate": 4.9553624100365756e-06 | |
| } | |
| }, | |
| { | |
| "step": 20800, | |
| "logs": { | |
| "loss": 0.2544, | |
| "epoch": 7.689463955637708, | |
| "learning_rate": 4.916034136941048e-06 | |
| } | |
| }, | |
| { | |
| "step": 20850, | |
| "logs": { | |
| "loss": 0.2489, | |
| "epoch": 7.707948243992607, | |
| "learning_rate": 4.876705863845519e-06 | |
| } | |
| }, | |
| { | |
| "step": 20900, | |
| "logs": { | |
| "loss": 0.2506, | |
| "epoch": 7.726432532347505, | |
| "learning_rate": 4.83737759074999e-06 | |
| } | |
| }, | |
| { | |
| "step": 20950, | |
| "logs": { | |
| "loss": 0.2535, | |
| "epoch": 7.744916820702403, | |
| "learning_rate": 4.798049317654462e-06 | |
| } | |
| }, | |
| { | |
| "step": 21000, | |
| "logs": { | |
| "loss": 0.2506, | |
| "epoch": 7.763401109057301, | |
| "learning_rate": 4.758721044558934e-06 | |
| } | |
| }, | |
| { | |
| "step": 21050, | |
| "logs": { | |
| "loss": 0.2547, | |
| "epoch": 7.7818853974122, | |
| "learning_rate": 4.719392771463405e-06 | |
| } | |
| }, | |
| { | |
| "step": 21100, | |
| "logs": { | |
| "loss": 0.2525, | |
| "epoch": 7.800369685767098, | |
| "learning_rate": 4.6800644983678775e-06 | |
| } | |
| }, | |
| { | |
| "step": 21150, | |
| "logs": { | |
| "loss": 0.2535, | |
| "epoch": 7.818853974121996, | |
| "learning_rate": 4.640736225272349e-06 | |
| } | |
| }, | |
| { | |
| "step": 21200, | |
| "logs": { | |
| "loss": 0.2508, | |
| "epoch": 7.837338262476894, | |
| "learning_rate": 4.60140795217682e-06 | |
| } | |
| }, | |
| { | |
| "step": 21250, | |
| "logs": { | |
| "loss": 0.254, | |
| "epoch": 7.855822550831793, | |
| "learning_rate": 4.562079679081292e-06 | |
| } | |
| }, | |
| { | |
| "step": 21300, | |
| "logs": { | |
| "loss": 0.251, | |
| "epoch": 7.8743068391866915, | |
| "learning_rate": 4.522751405985763e-06 | |
| } | |
| }, | |
| { | |
| "step": 21350, | |
| "logs": { | |
| "loss": 0.2545, | |
| "epoch": 7.89279112754159, | |
| "learning_rate": 4.483423132890235e-06 | |
| } | |
| }, | |
| { | |
| "step": 21400, | |
| "logs": { | |
| "loss": 0.2497, | |
| "epoch": 7.911275415896488, | |
| "learning_rate": 4.444094859794707e-06 | |
| } | |
| }, | |
| { | |
| "step": 21450, | |
| "logs": { | |
| "loss": 0.253, | |
| "epoch": 7.929759704251387, | |
| "learning_rate": 4.4047665866991786e-06 | |
| } | |
| }, | |
| { | |
| "step": 21500, | |
| "logs": { | |
| "loss": 0.249, | |
| "epoch": 7.948243992606285, | |
| "learning_rate": 4.36543831360365e-06 | |
| } | |
| }, | |
| { | |
| "step": 21550, | |
| "logs": { | |
| "loss": 0.2534, | |
| "epoch": 7.966728280961183, | |
| "learning_rate": 4.3261100405081215e-06 | |
| } | |
| }, | |
| { | |
| "step": 21600, | |
| "logs": { | |
| "loss": 0.2563, | |
| "epoch": 7.985212569316081, | |
| "learning_rate": 4.286781767412593e-06 | |
| } | |
| }, | |
| { | |
| "step": 21650, | |
| "logs": { | |
| "loss": 0.2489, | |
| "epoch": 8.00369685767098, | |
| "learning_rate": 4.247453494317064e-06 | |
| } | |
| }, | |
| { | |
| "step": 21700, | |
| "logs": { | |
| "loss": 0.2079, | |
| "epoch": 8.022181146025877, | |
| "learning_rate": 4.208125221221537e-06 | |
| } | |
| }, | |
| { | |
| "step": 21750, | |
| "logs": { | |
| "loss": 0.2079, | |
| "epoch": 8.040665434380776, | |
| "learning_rate": 4.168796948126008e-06 | |
| } | |
| }, | |
| { | |
| "step": 21800, | |
| "logs": { | |
| "loss": 0.2055, | |
| "epoch": 8.059149722735675, | |
| "learning_rate": 4.12946867503048e-06 | |
| } | |
| }, | |
| { | |
| "step": 21850, | |
| "logs": { | |
| "loss": 0.2115, | |
| "epoch": 8.077634011090574, | |
| "learning_rate": 4.090140401934951e-06 | |
| } | |
| }, | |
| { | |
| "step": 21900, | |
| "logs": { | |
| "loss": 0.2105, | |
| "epoch": 8.096118299445472, | |
| "learning_rate": 4.050812128839423e-06 | |
| } | |
| }, | |
| { | |
| "step": 21950, | |
| "logs": { | |
| "loss": 0.2055, | |
| "epoch": 8.11460258780037, | |
| "learning_rate": 4.011483855743895e-06 | |
| } | |
| }, | |
| { | |
| "step": 22000, | |
| "logs": { | |
| "loss": 0.2086, | |
| "epoch": 8.133086876155268, | |
| "learning_rate": 3.972155582648366e-06 | |
| } | |
| }, | |
| { | |
| "step": 22050, | |
| "logs": { | |
| "loss": 0.2102, | |
| "epoch": 8.151571164510166, | |
| "learning_rate": 3.932827309552838e-06 | |
| } | |
| }, | |
| { | |
| "step": 22100, | |
| "logs": { | |
| "loss": 0.21, | |
| "epoch": 8.170055452865064, | |
| "learning_rate": 3.893499036457309e-06 | |
| } | |
| }, | |
| { | |
| "step": 22150, | |
| "logs": { | |
| "loss": 0.2081, | |
| "epoch": 8.188539741219962, | |
| "learning_rate": 3.854170763361781e-06 | |
| } | |
| }, | |
| { | |
| "step": 22200, | |
| "logs": { | |
| "loss": 0.213, | |
| "epoch": 8.207024029574862, | |
| "learning_rate": 3.814842490266253e-06 | |
| } | |
| }, | |
| { | |
| "step": 22250, | |
| "logs": { | |
| "loss": 0.2114, | |
| "epoch": 8.22550831792976, | |
| "learning_rate": 3.7755142171707245e-06 | |
| } | |
| }, | |
| { | |
| "step": 22300, | |
| "logs": { | |
| "loss": 0.2116, | |
| "epoch": 8.243992606284658, | |
| "learning_rate": 3.736185944075196e-06 | |
| } | |
| }, | |
| { | |
| "step": 22350, | |
| "logs": { | |
| "loss": 0.2106, | |
| "epoch": 8.262476894639557, | |
| "learning_rate": 3.696857670979668e-06 | |
| } | |
| }, | |
| { | |
| "step": 22400, | |
| "logs": { | |
| "loss": 0.2097, | |
| "epoch": 8.280961182994455, | |
| "learning_rate": 3.6575293978841393e-06 | |
| } | |
| }, | |
| { | |
| "step": 22450, | |
| "logs": { | |
| "loss": 0.2119, | |
| "epoch": 8.299445471349353, | |
| "learning_rate": 3.6182011247886107e-06 | |
| } | |
| }, | |
| { | |
| "step": 22500, | |
| "logs": { | |
| "loss": 0.2144, | |
| "epoch": 8.317929759704251, | |
| "learning_rate": 3.5788728516930826e-06 | |
| } | |
| }, | |
| { | |
| "step": 22550, | |
| "logs": { | |
| "loss": 0.2125, | |
| "epoch": 8.336414048059149, | |
| "learning_rate": 3.539544578597554e-06 | |
| } | |
| }, | |
| { | |
| "step": 22600, | |
| "logs": { | |
| "loss": 0.2134, | |
| "epoch": 8.354898336414047, | |
| "learning_rate": 3.5002163055020256e-06 | |
| } | |
| }, | |
| { | |
| "step": 22650, | |
| "logs": { | |
| "loss": 0.2127, | |
| "epoch": 8.373382624768947, | |
| "learning_rate": 3.4608880324064974e-06 | |
| } | |
| }, | |
| { | |
| "step": 22700, | |
| "logs": { | |
| "loss": 0.2111, | |
| "epoch": 8.391866913123845, | |
| "learning_rate": 3.421559759310969e-06 | |
| } | |
| }, | |
| { | |
| "step": 22750, | |
| "logs": { | |
| "loss": 0.213, | |
| "epoch": 8.410351201478743, | |
| "learning_rate": 3.3822314862154404e-06 | |
| } | |
| }, | |
| { | |
| "step": 22800, | |
| "logs": { | |
| "loss": 0.2109, | |
| "epoch": 8.428835489833642, | |
| "learning_rate": 3.3429032131199122e-06 | |
| } | |
| }, | |
| { | |
| "step": 22850, | |
| "logs": { | |
| "loss": 0.2093, | |
| "epoch": 8.44731977818854, | |
| "learning_rate": 3.3035749400243837e-06 | |
| } | |
| }, | |
| { | |
| "step": 22900, | |
| "logs": { | |
| "loss": 0.2126, | |
| "epoch": 8.465804066543438, | |
| "learning_rate": 3.264246666928855e-06 | |
| } | |
| }, | |
| { | |
| "step": 22950, | |
| "logs": { | |
| "loss": 0.2127, | |
| "epoch": 8.484288354898336, | |
| "learning_rate": 3.2249183938333275e-06 | |
| } | |
| }, | |
| { | |
| "step": 23000, | |
| "logs": { | |
| "loss": 0.2184, | |
| "epoch": 8.502772643253234, | |
| "learning_rate": 3.1855901207377985e-06 | |
| } | |
| }, | |
| { | |
| "step": 23050, | |
| "logs": { | |
| "loss": 0.2108, | |
| "epoch": 8.521256931608134, | |
| "learning_rate": 3.14626184764227e-06 | |
| } | |
| }, | |
| { | |
| "step": 23100, | |
| "logs": { | |
| "loss": 0.2123, | |
| "epoch": 8.539741219963032, | |
| "learning_rate": 3.1069335745467423e-06 | |
| } | |
| }, | |
| { | |
| "step": 23150, | |
| "logs": { | |
| "loss": 0.2125, | |
| "epoch": 8.55822550831793, | |
| "learning_rate": 3.0676053014512137e-06 | |
| } | |
| }, | |
| { | |
| "step": 23200, | |
| "logs": { | |
| "loss": 0.2124, | |
| "epoch": 8.576709796672828, | |
| "learning_rate": 3.028277028355685e-06 | |
| } | |
| }, | |
| { | |
| "step": 23250, | |
| "logs": { | |
| "loss": 0.2112, | |
| "epoch": 8.595194085027726, | |
| "learning_rate": 2.988948755260157e-06 | |
| } | |
| }, | |
| { | |
| "step": 23300, | |
| "logs": { | |
| "loss": 0.2103, | |
| "epoch": 8.613678373382625, | |
| "learning_rate": 2.9496204821646285e-06 | |
| } | |
| }, | |
| { | |
| "step": 23350, | |
| "logs": { | |
| "loss": 0.2128, | |
| "epoch": 8.632162661737523, | |
| "learning_rate": 2.9102922090691e-06 | |
| } | |
| }, | |
| { | |
| "step": 23400, | |
| "logs": { | |
| "loss": 0.2125, | |
| "epoch": 8.65064695009242, | |
| "learning_rate": 2.8709639359735715e-06 | |
| } | |
| }, | |
| { | |
| "step": 23450, | |
| "logs": { | |
| "loss": 0.2109, | |
| "epoch": 8.669131238447319, | |
| "learning_rate": 2.8316356628780434e-06 | |
| } | |
| }, | |
| { | |
| "step": 23500, | |
| "logs": { | |
| "loss": 0.2132, | |
| "epoch": 8.687615526802219, | |
| "learning_rate": 2.792307389782515e-06 | |
| } | |
| }, | |
| { | |
| "step": 23550, | |
| "logs": { | |
| "loss": 0.2113, | |
| "epoch": 8.706099815157117, | |
| "learning_rate": 2.7529791166869863e-06 | |
| } | |
| }, | |
| { | |
| "step": 23600, | |
| "logs": { | |
| "loss": 0.2109, | |
| "epoch": 8.724584103512015, | |
| "learning_rate": 2.713650843591458e-06 | |
| } | |
| }, | |
| { | |
| "step": 23650, | |
| "logs": { | |
| "loss": 0.2138, | |
| "epoch": 8.743068391866913, | |
| "learning_rate": 2.6743225704959296e-06 | |
| } | |
| }, | |
| { | |
| "step": 23700, | |
| "logs": { | |
| "loss": 0.2098, | |
| "epoch": 8.761552680221811, | |
| "learning_rate": 2.634994297400401e-06 | |
| } | |
| }, | |
| { | |
| "step": 23750, | |
| "logs": { | |
| "loss": 0.2128, | |
| "epoch": 8.78003696857671, | |
| "learning_rate": 2.595666024304873e-06 | |
| } | |
| }, | |
| { | |
| "step": 23800, | |
| "logs": { | |
| "loss": 0.2143, | |
| "epoch": 8.798521256931608, | |
| "learning_rate": 2.5563377512093444e-06 | |
| } | |
| }, | |
| { | |
| "step": 23850, | |
| "logs": { | |
| "loss": 0.2132, | |
| "epoch": 8.817005545286506, | |
| "learning_rate": 2.517009478113816e-06 | |
| } | |
| }, | |
| { | |
| "step": 23900, | |
| "logs": { | |
| "loss": 0.2099, | |
| "epoch": 8.835489833641406, | |
| "learning_rate": 2.4776812050182878e-06 | |
| } | |
| }, | |
| { | |
| "step": 23950, | |
| "logs": { | |
| "loss": 0.2124, | |
| "epoch": 8.853974121996304, | |
| "learning_rate": 2.4383529319227597e-06 | |
| } | |
| }, | |
| { | |
| "step": 24000, | |
| "logs": { | |
| "loss": 0.2122, | |
| "epoch": 8.872458410351202, | |
| "learning_rate": 2.399024658827231e-06 | |
| } | |
| }, | |
| { | |
| "step": 24050, | |
| "logs": { | |
| "loss": 0.2136, | |
| "epoch": 8.8909426987061, | |
| "learning_rate": 2.3596963857317026e-06 | |
| } | |
| }, | |
| { | |
| "step": 24100, | |
| "logs": { | |
| "loss": 0.2103, | |
| "epoch": 8.909426987060998, | |
| "learning_rate": 2.3203681126361745e-06 | |
| } | |
| }, | |
| { | |
| "step": 24150, | |
| "logs": { | |
| "loss": 0.2132, | |
| "epoch": 8.927911275415896, | |
| "learning_rate": 2.281039839540646e-06 | |
| } | |
| }, | |
| { | |
| "step": 24200, | |
| "logs": { | |
| "loss": 0.2082, | |
| "epoch": 8.946395563770794, | |
| "learning_rate": 2.2417115664451174e-06 | |
| } | |
| }, | |
| { | |
| "step": 24250, | |
| "logs": { | |
| "loss": 0.213, | |
| "epoch": 8.964879852125692, | |
| "learning_rate": 2.2023832933495893e-06 | |
| } | |
| }, | |
| { | |
| "step": 24300, | |
| "logs": { | |
| "loss": 0.2142, | |
| "epoch": 8.98336414048059, | |
| "learning_rate": 2.1630550202540607e-06 | |
| } | |
| }, | |
| { | |
| "step": 24350, | |
| "logs": { | |
| "loss": 0.2123, | |
| "epoch": 9.00184842883549, | |
| "learning_rate": 2.123726747158532e-06 | |
| } | |
| }, | |
| { | |
| "step": 24400, | |
| "logs": { | |
| "loss": 0.1854, | |
| "epoch": 9.020332717190389, | |
| "learning_rate": 2.084398474063004e-06 | |
| } | |
| }, | |
| { | |
| "step": 24450, | |
| "logs": { | |
| "loss": 0.1848, | |
| "epoch": 9.038817005545287, | |
| "learning_rate": 2.0450702009674755e-06 | |
| } | |
| }, | |
| { | |
| "step": 24500, | |
| "logs": { | |
| "loss": 0.1802, | |
| "epoch": 9.057301293900185, | |
| "learning_rate": 2.0057419278719474e-06 | |
| } | |
| }, | |
| { | |
| "step": 24550, | |
| "logs": { | |
| "loss": 0.1859, | |
| "epoch": 9.075785582255083, | |
| "learning_rate": 1.966413654776419e-06 | |
| } | |
| }, | |
| { | |
| "step": 24600, | |
| "logs": { | |
| "loss": 0.1849, | |
| "epoch": 9.094269870609981, | |
| "learning_rate": 1.9270853816808904e-06 | |
| } | |
| }, | |
| { | |
| "step": 24650, | |
| "logs": { | |
| "loss": 0.1841, | |
| "epoch": 9.11275415896488, | |
| "learning_rate": 1.8877571085853622e-06 | |
| } | |
| }, | |
| { | |
| "step": 24700, | |
| "logs": { | |
| "loss": 0.1854, | |
| "epoch": 9.131238447319777, | |
| "learning_rate": 1.848428835489834e-06 | |
| } | |
| }, | |
| { | |
| "step": 24750, | |
| "logs": { | |
| "loss": 0.1847, | |
| "epoch": 9.149722735674677, | |
| "learning_rate": 1.8091005623943054e-06 | |
| } | |
| }, | |
| { | |
| "step": 24800, | |
| "logs": { | |
| "loss": 0.1852, | |
| "epoch": 9.168207024029575, | |
| "learning_rate": 1.769772289298777e-06 | |
| } | |
| }, | |
| { | |
| "step": 24850, | |
| "logs": { | |
| "loss": 0.1846, | |
| "epoch": 9.186691312384474, | |
| "learning_rate": 1.7304440162032487e-06 | |
| } | |
| }, | |
| { | |
| "step": 24900, | |
| "logs": { | |
| "loss": 0.1848, | |
| "epoch": 9.205175600739372, | |
| "learning_rate": 1.6911157431077202e-06 | |
| } | |
| }, | |
| { | |
| "step": 24950, | |
| "logs": { | |
| "loss": 0.1861, | |
| "epoch": 9.22365988909427, | |
| "learning_rate": 1.6517874700121919e-06 | |
| } | |
| }, | |
| { | |
| "step": 25000, | |
| "logs": { | |
| "loss": 0.185, | |
| "epoch": 9.242144177449168, | |
| "learning_rate": 1.6124591969166637e-06 | |
| } | |
| }, | |
| { | |
| "step": 25050, | |
| "logs": { | |
| "loss": 0.1846, | |
| "epoch": 9.260628465804066, | |
| "learning_rate": 1.573130923821135e-06 | |
| } | |
| }, | |
| { | |
| "step": 25100, | |
| "logs": { | |
| "loss": 0.1827, | |
| "epoch": 9.279112754158964, | |
| "learning_rate": 1.5338026507256069e-06 | |
| } | |
| }, | |
| { | |
| "step": 25150, | |
| "logs": { | |
| "loss": 0.1871, | |
| "epoch": 9.297597042513864, | |
| "learning_rate": 1.4944743776300785e-06 | |
| } | |
| }, | |
| { | |
| "step": 25200, | |
| "logs": { | |
| "loss": 0.1865, | |
| "epoch": 9.316081330868762, | |
| "learning_rate": 1.45514610453455e-06 | |
| } | |
| }, | |
| { | |
| "step": 25250, | |
| "logs": { | |
| "loss": 0.1859, | |
| "epoch": 9.33456561922366, | |
| "learning_rate": 1.4158178314390217e-06 | |
| } | |
| }, | |
| { | |
| "step": 25300, | |
| "logs": { | |
| "loss": 0.1874, | |
| "epoch": 9.353049907578558, | |
| "learning_rate": 1.3764895583434931e-06 | |
| } | |
| }, | |
| { | |
| "step": 25350, | |
| "logs": { | |
| "loss": 0.1847, | |
| "epoch": 9.371534195933457, | |
| "learning_rate": 1.3371612852479648e-06 | |
| } | |
| }, | |
| { | |
| "step": 25400, | |
| "logs": { | |
| "loss": 0.1849, | |
| "epoch": 9.390018484288355, | |
| "learning_rate": 1.2978330121524365e-06 | |
| } | |
| }, | |
| { | |
| "step": 25450, | |
| "logs": { | |
| "loss": 0.1895, | |
| "epoch": 9.408502772643253, | |
| "learning_rate": 1.258504739056908e-06 | |
| } | |
| }, | |
| { | |
| "step": 25500, | |
| "logs": { | |
| "loss": 0.1829, | |
| "epoch": 9.426987060998151, | |
| "learning_rate": 1.2191764659613798e-06 | |
| } | |
| }, | |
| { | |
| "step": 25550, | |
| "logs": { | |
| "loss": 0.1837, | |
| "epoch": 9.445471349353049, | |
| "learning_rate": 1.1798481928658513e-06 | |
| } | |
| }, | |
| { | |
| "step": 25600, | |
| "logs": { | |
| "loss": 0.1864, | |
| "epoch": 9.463955637707949, | |
| "learning_rate": 1.140519919770323e-06 | |
| } | |
| }, | |
| { | |
| "step": 25650, | |
| "logs": { | |
| "loss": 0.1862, | |
| "epoch": 9.482439926062847, | |
| "learning_rate": 1.1011916466747946e-06 | |
| } | |
| }, | |
| { | |
| "step": 25700, | |
| "logs": { | |
| "loss": 0.19, | |
| "epoch": 9.500924214417745, | |
| "learning_rate": 1.061863373579266e-06 | |
| } | |
| }, | |
| { | |
| "step": 25750, | |
| "logs": { | |
| "loss": 0.1834, | |
| "epoch": 9.519408502772643, | |
| "learning_rate": 1.0225351004837378e-06 | |
| } | |
| }, | |
| { | |
| "step": 25800, | |
| "logs": { | |
| "loss": 0.1863, | |
| "epoch": 9.537892791127542, | |
| "learning_rate": 9.832068273882094e-07 | |
| } | |
| }, | |
| { | |
| "step": 25850, | |
| "logs": { | |
| "loss": 0.1859, | |
| "epoch": 9.55637707948244, | |
| "learning_rate": 9.438785542926811e-07 | |
| } | |
| }, | |
| { | |
| "step": 25900, | |
| "logs": { | |
| "loss": 0.1829, | |
| "epoch": 9.574861367837338, | |
| "learning_rate": 9.045502811971527e-07 | |
| } | |
| }, | |
| { | |
| "step": 25950, | |
| "logs": { | |
| "loss": 0.1838, | |
| "epoch": 9.593345656192236, | |
| "learning_rate": 8.652220081016244e-07 | |
| } | |
| }, | |
| { | |
| "step": 26000, | |
| "logs": { | |
| "loss": 0.1817, | |
| "epoch": 9.611829944547136, | |
| "learning_rate": 8.258937350060959e-07 | |
| } | |
| }, | |
| { | |
| "step": 26050, | |
| "logs": { | |
| "loss": 0.1834, | |
| "epoch": 9.630314232902034, | |
| "learning_rate": 7.865654619105675e-07 | |
| } | |
| }, | |
| { | |
| "step": 26100, | |
| "logs": { | |
| "loss": 0.1857, | |
| "epoch": 9.648798521256932, | |
| "learning_rate": 7.472371888150393e-07 | |
| } | |
| }, | |
| { | |
| "step": 26150, | |
| "logs": { | |
| "loss": 0.1858, | |
| "epoch": 9.66728280961183, | |
| "learning_rate": 7.079089157195108e-07 | |
| } | |
| }, | |
| { | |
| "step": 26200, | |
| "logs": { | |
| "loss": 0.1858, | |
| "epoch": 9.685767097966728, | |
| "learning_rate": 6.685806426239824e-07 | |
| } | |
| }, | |
| { | |
| "step": 26250, | |
| "logs": { | |
| "loss": 0.1848, | |
| "epoch": 9.704251386321626, | |
| "learning_rate": 6.29252369528454e-07 | |
| } | |
| }, | |
| { | |
| "step": 26300, | |
| "logs": { | |
| "loss": 0.1832, | |
| "epoch": 9.722735674676525, | |
| "learning_rate": 5.899240964329256e-07 | |
| } | |
| }, | |
| { | |
| "step": 26350, | |
| "logs": { | |
| "loss": 0.1842, | |
| "epoch": 9.741219963031423, | |
| "learning_rate": 5.505958233373973e-07 | |
| } | |
| }, | |
| { | |
| "step": 26400, | |
| "logs": { | |
| "loss": 0.1842, | |
| "epoch": 9.75970425138632, | |
| "learning_rate": 5.112675502418689e-07 | |
| } | |
| }, | |
| { | |
| "step": 26450, | |
| "logs": { | |
| "loss": 0.1847, | |
| "epoch": 9.77818853974122, | |
| "learning_rate": 4.7193927714634056e-07 | |
| } | |
| }, | |
| { | |
| "step": 26500, | |
| "logs": { | |
| "loss": 0.185, | |
| "epoch": 9.796672828096119, | |
| "learning_rate": 4.326110040508122e-07 | |
| } | |
| }, | |
| { | |
| "step": 26550, | |
| "logs": { | |
| "loss": 0.1826, | |
| "epoch": 9.815157116451017, | |
| "learning_rate": 3.9328273095528375e-07 | |
| } | |
| }, | |
| { | |
| "step": 26600, | |
| "logs": { | |
| "loss": 0.1833, | |
| "epoch": 9.833641404805915, | |
| "learning_rate": 3.539544578597554e-07 | |
| } | |
| }, | |
| { | |
| "step": 26650, | |
| "logs": { | |
| "loss": 0.1846, | |
| "epoch": 9.852125693160813, | |
| "learning_rate": 3.14626184764227e-07 | |
| } | |
| }, | |
| { | |
| "step": 26700, | |
| "logs": { | |
| "loss": 0.184, | |
| "epoch": 9.870609981515711, | |
| "learning_rate": 2.7529791166869866e-07 | |
| } | |
| }, | |
| { | |
| "step": 26750, | |
| "logs": { | |
| "loss": 0.1864, | |
| "epoch": 9.88909426987061, | |
| "learning_rate": 2.3596963857317028e-07 | |
| } | |
| }, | |
| { | |
| "step": 26800, | |
| "logs": { | |
| "loss": 0.1841, | |
| "epoch": 9.907578558225508, | |
| "learning_rate": 1.9664136547764187e-07 | |
| } | |
| }, | |
| { | |
| "step": 26850, | |
| "logs": { | |
| "loss": 0.1855, | |
| "epoch": 9.926062846580407, | |
| "learning_rate": 1.573130923821135e-07 | |
| } | |
| }, | |
| { | |
| "step": 26900, | |
| "logs": { | |
| "loss": 0.1794, | |
| "epoch": 9.944547134935306, | |
| "learning_rate": 1.1798481928658514e-07 | |
| } | |
| }, | |
| { | |
| "step": 26950, | |
| "logs": { | |
| "loss": 0.1853, | |
| "epoch": 9.963031423290204, | |
| "learning_rate": 7.865654619105675e-08 | |
| } | |
| }, | |
| { | |
| "step": 27000, | |
| "logs": { | |
| "loss": 0.1855, | |
| "epoch": 9.981515711645102, | |
| "learning_rate": 3.9328273095528373e-08 | |
| } | |
| } | |
| ], | |
| "train_wrt_samples": [ | |
| { | |
| "step": 19200, | |
| "logs": { | |
| "loss": 1.2091, | |
| "epoch": 0.018484288354898338, | |
| "learning_rate": 1.0584432680980562e-05 | |
| } | |
| }, | |
| { | |
| "step": 38400, | |
| "logs": { | |
| "loss": 1.1315, | |
| "epoch": 0.036968576709796676, | |
| "learning_rate": 1.2459822860720352e-05 | |
| } | |
| }, | |
| { | |
| "step": 57600, | |
| "logs": { | |
| "loss": 1.1118, | |
| "epoch": 0.05545286506469501, | |
| "learning_rate": 1.355685579689696e-05 | |
| } | |
| }, | |
| { | |
| "step": 76800, | |
| "logs": { | |
| "loss": 1.1091, | |
| "epoch": 0.07393715341959335, | |
| "learning_rate": 1.4335213053988223e-05 | |
| } | |
| }, | |
| { | |
| "step": 96000, | |
| "logs": { | |
| "loss": 1.1063, | |
| "epoch": 0.09242144177449169, | |
| "learning_rate": 1.4938953847726847e-05 | |
| } | |
| }, | |
| { | |
| "step": 115200, | |
| "logs": { | |
| "loss": 1.1012, | |
| "epoch": 0.11090573012939002, | |
| "learning_rate": 1.5432245994674192e-05 | |
| } | |
| }, | |
| { | |
| "step": 134400, | |
| "logs": { | |
| "loss": 1.0844, | |
| "epoch": 0.12939001848428835, | |
| "learning_rate": 1.5849318562425815e-05 | |
| } | |
| }, | |
| { | |
| "step": 153600, | |
| "logs": { | |
| "loss": 1.0911, | |
| "epoch": 0.1478743068391867, | |
| "learning_rate": 1.6210603254020138e-05 | |
| } | |
| }, | |
| { | |
| "step": 172800, | |
| "logs": { | |
| "loss": 1.0816, | |
| "epoch": 0.16635859519408502, | |
| "learning_rate": 1.652927893686328e-05 | |
| } | |
| }, | |
| { | |
| "step": 192000, | |
| "logs": { | |
| "loss": 1.0819, | |
| "epoch": 0.18484288354898337, | |
| "learning_rate": 1.6814344049111566e-05 | |
| } | |
| }, | |
| { | |
| "step": 211200, | |
| "logs": { | |
| "loss": 1.0757, | |
| "epoch": 0.2033271719038817, | |
| "learning_rate": 1.70722168104602e-05 | |
| } | |
| }, | |
| { | |
| "step": 230400, | |
| "logs": { | |
| "loss": 1.0706, | |
| "epoch": 0.22181146025878004, | |
| "learning_rate": 1.7307636196960783e-05 | |
| } | |
| }, | |
| { | |
| "step": 249600, | |
| "logs": { | |
| "loss": 1.0698, | |
| "epoch": 0.24029574861367836, | |
| "learning_rate": 1.7524201039271304e-05 | |
| } | |
| }, | |
| { | |
| "step": 268800, | |
| "logs": { | |
| "loss": 1.0632, | |
| "epoch": 0.2587800369685767, | |
| "learning_rate": 1.7724708765356604e-05 | |
| } | |
| }, | |
| { | |
| "step": 288000, | |
| "logs": { | |
| "loss": 1.0601, | |
| "epoch": 0.27726432532347506, | |
| "learning_rate": 1.7911376992503148e-05 | |
| } | |
| }, | |
| { | |
| "step": 307200, | |
| "logs": { | |
| "loss": 1.0582, | |
| "epoch": 0.2957486136783734, | |
| "learning_rate": 1.808599345743407e-05 | |
| } | |
| }, | |
| { | |
| "step": 326400, | |
| "logs": { | |
| "loss": 1.0512, | |
| "epoch": 0.3142329020332717, | |
| "learning_rate": 1.825002041317456e-05 | |
| } | |
| }, | |
| { | |
| "step": 345600, | |
| "logs": { | |
| "loss": 1.0544, | |
| "epoch": 0.33271719038817005, | |
| "learning_rate": 1.840466914065299e-05 | |
| } | |
| }, | |
| { | |
| "step": 364800, | |
| "logs": { | |
| "loss": 1.043, | |
| "epoch": 0.3512014787430684, | |
| "learning_rate": 1.855095428760744e-05 | |
| } | |
| }, | |
| { | |
| "step": 384000, | |
| "logs": { | |
| "loss": 1.047, | |
| "epoch": 0.36968576709796674, | |
| "learning_rate": 1.8689734253201903e-05 | |
| } | |
| }, | |
| { | |
| "step": 403200, | |
| "logs": { | |
| "loss": 1.0408, | |
| "epoch": 0.38817005545286504, | |
| "learning_rate": 1.8821741709263542e-05 | |
| } | |
| }, | |
| { | |
| "step": 422400, | |
| "logs": { | |
| "loss": 1.0431, | |
| "epoch": 0.4066543438077634, | |
| "learning_rate": 1.89476070147965e-05 | |
| } | |
| }, | |
| { | |
| "step": 441600, | |
| "logs": { | |
| "loss": 1.0431, | |
| "epoch": 0.42513863216266173, | |
| "learning_rate": 1.9067876421445012e-05 | |
| } | |
| }, | |
| { | |
| "step": 460800, | |
| "logs": { | |
| "loss": 1.034, | |
| "epoch": 0.4436229205175601, | |
| "learning_rate": 1.9183026401502057e-05 | |
| } | |
| }, | |
| { | |
| "step": 480000, | |
| "logs": { | |
| "loss": 1.039, | |
| "epoch": 0.46210720887245843, | |
| "learning_rate": 1.9293475049105016e-05 | |
| } | |
| }, | |
| { | |
| "step": 499200, | |
| "logs": { | |
| "loss": 1.0304, | |
| "epoch": 0.4805914972273567, | |
| "learning_rate": 1.9399591243986016e-05 | |
| } | |
| }, | |
| { | |
| "step": 518400, | |
| "logs": { | |
| "loss": 1.0385, | |
| "epoch": 0.49907578558225507, | |
| "learning_rate": 1.950170208484624e-05 | |
| } | |
| }, | |
| { | |
| "step": 537600, | |
| "logs": { | |
| "loss": 1.027, | |
| "epoch": 0.5175600739371534, | |
| "learning_rate": 1.9600098970219974e-05 | |
| } | |
| }, | |
| { | |
| "step": 556800, | |
| "logs": { | |
| "loss": 1.0281, | |
| "epoch": 0.5360443622920518, | |
| "learning_rate": 1.9695042611797287e-05 | |
| } | |
| }, | |
| { | |
| "step": 576000, | |
| "logs": { | |
| "loss": 1.0282, | |
| "epoch": 0.5545286506469501, | |
| "learning_rate": 1.978676719749536e-05 | |
| } | |
| }, | |
| { | |
| "step": 595200, | |
| "logs": { | |
| "loss": 1.0186, | |
| "epoch": 0.5730129390018485, | |
| "learning_rate": 1.9875483871657987e-05 | |
| } | |
| }, | |
| { | |
| "step": 614400, | |
| "logs": { | |
| "loss": 1.0237, | |
| "epoch": 0.5914972273567468, | |
| "learning_rate": 1.9961383662539012e-05 | |
| } | |
| }, | |
| { | |
| "step": 633600, | |
| "logs": { | |
| "loss": 1.0176, | |
| "epoch": 0.609981515711645, | |
| "learning_rate": 1.9978762732528416e-05 | |
| } | |
| }, | |
| { | |
| "step": 652800, | |
| "logs": { | |
| "loss": 1.4539, | |
| "epoch": 0.6284658040665434, | |
| "learning_rate": 1.9939434459432887e-05 | |
| } | |
| }, | |
| { | |
| "step": 672000, | |
| "logs": { | |
| "loss": 1.2593, | |
| "epoch": 0.6469500924214417, | |
| "learning_rate": 1.990010618633736e-05 | |
| } | |
| }, | |
| { | |
| "step": 691200, | |
| "logs": { | |
| "loss": 1.5937, | |
| "epoch": 0.6654343807763401, | |
| "learning_rate": 1.986077791324183e-05 | |
| } | |
| }, | |
| { | |
| "step": 710400, | |
| "logs": { | |
| "loss": 1.0165, | |
| "epoch": 0.6839186691312384, | |
| "learning_rate": 1.9821449640146302e-05 | |
| } | |
| }, | |
| { | |
| "step": 729600, | |
| "logs": { | |
| "loss": 1.4354, | |
| "epoch": 0.7024029574861368, | |
| "learning_rate": 1.9782121367050776e-05 | |
| } | |
| }, | |
| { | |
| "step": 748800, | |
| "logs": { | |
| "loss": 1.021, | |
| "epoch": 0.7208872458410351, | |
| "learning_rate": 1.9742793093955247e-05 | |
| } | |
| }, | |
| { | |
| "step": 768000, | |
| "logs": { | |
| "loss": 1.0078, | |
| "epoch": 0.7393715341959335, | |
| "learning_rate": 1.9703464820859717e-05 | |
| } | |
| }, | |
| { | |
| "step": 787200, | |
| "logs": { | |
| "loss": 1.0057, | |
| "epoch": 0.7578558225508318, | |
| "learning_rate": 1.966413654776419e-05 | |
| } | |
| }, | |
| { | |
| "step": 806400, | |
| "logs": { | |
| "loss": 1.0001, | |
| "epoch": 0.7763401109057301, | |
| "learning_rate": 1.9624808274668662e-05 | |
| } | |
| }, | |
| { | |
| "step": 825600, | |
| "logs": { | |
| "loss": 1.006, | |
| "epoch": 0.7948243992606284, | |
| "learning_rate": 1.9585480001573133e-05 | |
| } | |
| }, | |
| { | |
| "step": 844800, | |
| "logs": { | |
| "loss": 1.0103, | |
| "epoch": 0.8133086876155268, | |
| "learning_rate": 1.9546151728477603e-05 | |
| } | |
| }, | |
| { | |
| "step": 864000, | |
| "logs": { | |
| "loss": 1.0046, | |
| "epoch": 0.8317929759704251, | |
| "learning_rate": 1.9506823455382077e-05 | |
| } | |
| }, | |
| { | |
| "step": 883200, | |
| "logs": { | |
| "loss": 0.9941, | |
| "epoch": 0.8502772643253235, | |
| "learning_rate": 1.9467495182286548e-05 | |
| } | |
| }, | |
| { | |
| "step": 902400, | |
| "logs": { | |
| "loss": 0.9963, | |
| "epoch": 0.8687615526802218, | |
| "learning_rate": 1.942816690919102e-05 | |
| } | |
| }, | |
| { | |
| "step": 921600, | |
| "logs": { | |
| "loss": 0.9926, | |
| "epoch": 0.8872458410351202, | |
| "learning_rate": 1.938883863609549e-05 | |
| } | |
| }, | |
| { | |
| "step": 940800, | |
| "logs": { | |
| "loss": 0.9918, | |
| "epoch": 0.9057301293900185, | |
| "learning_rate": 1.934951036299996e-05 | |
| } | |
| }, | |
| { | |
| "step": 960000, | |
| "logs": { | |
| "loss": 0.9899, | |
| "epoch": 0.9242144177449169, | |
| "learning_rate": 1.9310182089904434e-05 | |
| } | |
| }, | |
| { | |
| "step": 979200, | |
| "logs": { | |
| "loss": 0.9887, | |
| "epoch": 0.9426987060998152, | |
| "learning_rate": 1.9270853816808904e-05 | |
| } | |
| }, | |
| { | |
| "step": 998400, | |
| "logs": { | |
| "loss": 0.9942, | |
| "epoch": 0.9611829944547134, | |
| "learning_rate": 1.9231525543713375e-05 | |
| } | |
| }, | |
| { | |
| "step": 1017600, | |
| "logs": { | |
| "loss": 0.9817, | |
| "epoch": 0.9796672828096118, | |
| "learning_rate": 1.919219727061785e-05 | |
| } | |
| }, | |
| { | |
| "step": 1036800, | |
| "logs": { | |
| "loss": 0.9811, | |
| "epoch": 0.9981515711645101, | |
| "learning_rate": 1.915286899752232e-05 | |
| } | |
| }, | |
| { | |
| "step": 1055744, | |
| "logs": { | |
| "loss": 0.8466, | |
| "epoch": 1.0166358595194085, | |
| "learning_rate": 1.911354072442679e-05 | |
| } | |
| }, | |
| { | |
| "step": 1074944, | |
| "logs": { | |
| "loss": 0.8316, | |
| "epoch": 1.0351201478743068, | |
| "learning_rate": 1.9074212451331264e-05 | |
| } | |
| }, | |
| { | |
| "step": 1094144, | |
| "logs": { | |
| "loss": 0.8363, | |
| "epoch": 1.0536044362292052, | |
| "learning_rate": 1.9034884178235735e-05 | |
| } | |
| }, | |
| { | |
| "step": 1113344, | |
| "logs": { | |
| "loss": 0.8378, | |
| "epoch": 1.0720887245841035, | |
| "learning_rate": 1.8995555905140205e-05 | |
| } | |
| }, | |
| { | |
| "step": 1132544, | |
| "logs": { | |
| "loss": 0.8386, | |
| "epoch": 1.0905730129390019, | |
| "learning_rate": 1.895622763204468e-05 | |
| } | |
| }, | |
| { | |
| "step": 1151744, | |
| "logs": { | |
| "loss": 0.8465, | |
| "epoch": 1.1090573012939002, | |
| "learning_rate": 1.891689935894915e-05 | |
| } | |
| }, | |
| { | |
| "step": 1170944, | |
| "logs": { | |
| "loss": 0.8375, | |
| "epoch": 1.1275415896487986, | |
| "learning_rate": 1.887757108585362e-05 | |
| } | |
| }, | |
| { | |
| "step": 1190144, | |
| "logs": { | |
| "loss": 0.8379, | |
| "epoch": 1.146025878003697, | |
| "learning_rate": 1.8838242812758095e-05 | |
| } | |
| }, | |
| { | |
| "step": 1209344, | |
| "logs": { | |
| "loss": 0.836, | |
| "epoch": 1.1645101663585953, | |
| "learning_rate": 1.8798914539662565e-05 | |
| } | |
| }, | |
| { | |
| "step": 1228544, | |
| "logs": { | |
| "loss": 0.8411, | |
| "epoch": 1.1829944547134936, | |
| "learning_rate": 1.8759586266567036e-05 | |
| } | |
| }, | |
| { | |
| "step": 1247744, | |
| "logs": { | |
| "loss": 0.8442, | |
| "epoch": 1.201478743068392, | |
| "learning_rate": 1.872025799347151e-05 | |
| } | |
| }, | |
| { | |
| "step": 1266944, | |
| "logs": { | |
| "loss": 0.8397, | |
| "epoch": 1.21996303142329, | |
| "learning_rate": 1.868092972037598e-05 | |
| } | |
| }, | |
| { | |
| "step": 1286144, | |
| "logs": { | |
| "loss": 0.8415, | |
| "epoch": 1.2384473197781884, | |
| "learning_rate": 1.864160144728045e-05 | |
| } | |
| }, | |
| { | |
| "step": 1305344, | |
| "logs": { | |
| "loss": 0.8397, | |
| "epoch": 1.2569316081330868, | |
| "learning_rate": 1.8602273174184925e-05 | |
| } | |
| }, | |
| { | |
| "step": 1324544, | |
| "logs": { | |
| "loss": 0.8396, | |
| "epoch": 1.2754158964879851, | |
| "learning_rate": 1.8562944901089396e-05 | |
| } | |
| }, | |
| { | |
| "step": 1343744, | |
| "logs": { | |
| "loss": 0.8452, | |
| "epoch": 1.2939001848428835, | |
| "learning_rate": 1.8523616627993866e-05 | |
| } | |
| }, | |
| { | |
| "step": 1362944, | |
| "logs": { | |
| "loss": 0.8362, | |
| "epoch": 1.3123844731977818, | |
| "learning_rate": 1.848428835489834e-05 | |
| } | |
| }, | |
| { | |
| "step": 1382144, | |
| "logs": { | |
| "loss": 0.8396, | |
| "epoch": 1.3308687615526802, | |
| "learning_rate": 1.844496008180281e-05 | |
| } | |
| }, | |
| { | |
| "step": 1401344, | |
| "logs": { | |
| "loss": 0.8334, | |
| "epoch": 1.3493530499075785, | |
| "learning_rate": 1.840563180870728e-05 | |
| } | |
| }, | |
| { | |
| "step": 1420544, | |
| "logs": { | |
| "loss": 0.834, | |
| "epoch": 1.3678373382624769, | |
| "learning_rate": 1.8366303535611752e-05 | |
| } | |
| }, | |
| { | |
| "step": 1439744, | |
| "logs": { | |
| "loss": 0.8333, | |
| "epoch": 1.3863216266173752, | |
| "learning_rate": 1.8326975262516223e-05 | |
| } | |
| }, | |
| { | |
| "step": 1458944, | |
| "logs": { | |
| "loss": 0.8357, | |
| "epoch": 1.4048059149722736, | |
| "learning_rate": 1.8287646989420697e-05 | |
| } | |
| }, | |
| { | |
| "step": 1478144, | |
| "logs": { | |
| "loss": 0.8374, | |
| "epoch": 1.423290203327172, | |
| "learning_rate": 1.8248318716325167e-05 | |
| } | |
| }, | |
| { | |
| "step": 1497344, | |
| "logs": { | |
| "loss": 0.837, | |
| "epoch": 1.4417744916820703, | |
| "learning_rate": 1.8208990443229638e-05 | |
| } | |
| }, | |
| { | |
| "step": 1516544, | |
| "logs": { | |
| "loss": 0.835, | |
| "epoch": 1.4602587800369686, | |
| "learning_rate": 1.816966217013411e-05 | |
| } | |
| }, | |
| { | |
| "step": 1535744, | |
| "logs": { | |
| "loss": 0.8352, | |
| "epoch": 1.478743068391867, | |
| "learning_rate": 1.8130333897038583e-05 | |
| } | |
| }, | |
| { | |
| "step": 1554944, | |
| "logs": { | |
| "loss": 0.8475, | |
| "epoch": 1.4972273567467653, | |
| "learning_rate": 1.8091005623943053e-05 | |
| } | |
| }, | |
| { | |
| "step": 1574144, | |
| "logs": { | |
| "loss": 0.8339, | |
| "epoch": 1.5157116451016637, | |
| "learning_rate": 1.8051677350847524e-05 | |
| } | |
| }, | |
| { | |
| "step": 1593344, | |
| "logs": { | |
| "loss": 0.8382, | |
| "epoch": 1.534195933456562, | |
| "learning_rate": 1.8012349077751998e-05 | |
| } | |
| }, | |
| { | |
| "step": 1612544, | |
| "logs": { | |
| "loss": 0.8376, | |
| "epoch": 1.5526802218114601, | |
| "learning_rate": 1.797302080465647e-05 | |
| } | |
| }, | |
| { | |
| "step": 1631744, | |
| "logs": { | |
| "loss": 0.8302, | |
| "epoch": 1.5711645101663585, | |
| "learning_rate": 1.793369253156094e-05 | |
| } | |
| }, | |
| { | |
| "step": 1650944, | |
| "logs": { | |
| "loss": 0.8312, | |
| "epoch": 1.5896487985212568, | |
| "learning_rate": 1.7894364258465413e-05 | |
| } | |
| }, | |
| { | |
| "step": 1670144, | |
| "logs": { | |
| "loss": 0.8361, | |
| "epoch": 1.6081330868761552, | |
| "learning_rate": 1.7855035985369884e-05 | |
| } | |
| }, | |
| { | |
| "step": 1689344, | |
| "logs": { | |
| "loss": 0.8321, | |
| "epoch": 1.6266173752310535, | |
| "learning_rate": 1.7815707712274354e-05 | |
| } | |
| }, | |
| { | |
| "step": 1708544, | |
| "logs": { | |
| "loss": 0.8374, | |
| "epoch": 1.645101663585952, | |
| "learning_rate": 1.777637943917883e-05 | |
| } | |
| }, | |
| { | |
| "step": 1727744, | |
| "logs": { | |
| "loss": 0.8287, | |
| "epoch": 1.6635859519408502, | |
| "learning_rate": 1.77370511660833e-05 | |
| } | |
| }, | |
| { | |
| "step": 1746944, | |
| "logs": { | |
| "loss": 0.8367, | |
| "epoch": 1.6820702402957486, | |
| "learning_rate": 1.769772289298777e-05 | |
| } | |
| }, | |
| { | |
| "step": 1766144, | |
| "logs": { | |
| "loss": 0.8439, | |
| "epoch": 1.700554528650647, | |
| "learning_rate": 1.7658394619892244e-05 | |
| } | |
| }, | |
| { | |
| "step": 1785344, | |
| "logs": { | |
| "loss": 0.829, | |
| "epoch": 1.7190388170055453, | |
| "learning_rate": 1.7619066346796714e-05 | |
| } | |
| }, | |
| { | |
| "step": 1804544, | |
| "logs": { | |
| "loss": 0.8325, | |
| "epoch": 1.7375231053604436, | |
| "learning_rate": 1.7579738073701185e-05 | |
| } | |
| }, | |
| { | |
| "step": 1823744, | |
| "logs": { | |
| "loss": 0.837, | |
| "epoch": 1.756007393715342, | |
| "learning_rate": 1.754040980060566e-05 | |
| } | |
| }, | |
| { | |
| "step": 1842944, | |
| "logs": { | |
| "loss": 0.8371, | |
| "epoch": 1.7744916820702403, | |
| "learning_rate": 1.750108152751013e-05 | |
| } | |
| }, | |
| { | |
| "step": 1862144, | |
| "logs": { | |
| "loss": 0.832, | |
| "epoch": 1.7929759704251387, | |
| "learning_rate": 1.74617532544146e-05 | |
| } | |
| }, | |
| { | |
| "step": 1881344, | |
| "logs": { | |
| "loss": 0.8342, | |
| "epoch": 1.811460258780037, | |
| "learning_rate": 1.7422424981319074e-05 | |
| } | |
| }, | |
| { | |
| "step": 1900544, | |
| "logs": { | |
| "loss": 0.8331, | |
| "epoch": 1.8299445471349354, | |
| "learning_rate": 1.7383096708223545e-05 | |
| } | |
| }, | |
| { | |
| "step": 1919744, | |
| "logs": { | |
| "loss": 0.8234, | |
| "epoch": 1.8484288354898337, | |
| "learning_rate": 1.7343768435128015e-05 | |
| } | |
| }, | |
| { | |
| "step": 1938944, | |
| "logs": { | |
| "loss": 0.8311, | |
| "epoch": 1.866913123844732, | |
| "learning_rate": 1.7304440162032486e-05 | |
| } | |
| }, | |
| { | |
| "step": 1958144, | |
| "logs": { | |
| "loss": 0.8259, | |
| "epoch": 1.8853974121996304, | |
| "learning_rate": 1.726511188893696e-05 | |
| } | |
| }, | |
| { | |
| "step": 1977344, | |
| "logs": { | |
| "loss": 0.8253, | |
| "epoch": 1.9038817005545285, | |
| "learning_rate": 1.722578361584143e-05 | |
| } | |
| }, | |
| { | |
| "step": 1996544, | |
| "logs": { | |
| "loss": 0.8297, | |
| "epoch": 1.922365988909427, | |
| "learning_rate": 1.71864553427459e-05 | |
| } | |
| }, | |
| { | |
| "step": 2015744, | |
| "logs": { | |
| "loss": 0.8264, | |
| "epoch": 1.9408502772643252, | |
| "learning_rate": 1.7147127069650372e-05 | |
| } | |
| }, | |
| { | |
| "step": 2034944, | |
| "logs": { | |
| "loss": 0.8283, | |
| "epoch": 1.9593345656192236, | |
| "learning_rate": 1.7107798796554846e-05 | |
| } | |
| }, | |
| { | |
| "step": 2054144, | |
| "logs": { | |
| "loss": 0.8262, | |
| "epoch": 1.977818853974122, | |
| "learning_rate": 1.7068470523459316e-05 | |
| } | |
| }, | |
| { | |
| "step": 2073344, | |
| "logs": { | |
| "loss": 0.829, | |
| "epoch": 1.9963031423290203, | |
| "learning_rate": 1.7029142250363787e-05 | |
| } | |
| }, | |
| { | |
| "step": 2092288, | |
| "logs": { | |
| "loss": 0.6969, | |
| "epoch": 2.014787430683919, | |
| "learning_rate": 1.6989813977268258e-05 | |
| } | |
| }, | |
| { | |
| "step": 2111488, | |
| "logs": { | |
| "loss": 0.6715, | |
| "epoch": 2.033271719038817, | |
| "learning_rate": 1.695048570417273e-05 | |
| } | |
| }, | |
| { | |
| "step": 2130688, | |
| "logs": { | |
| "loss": 0.6636, | |
| "epoch": 2.0517560073937156, | |
| "learning_rate": 1.6911157431077202e-05 | |
| } | |
| }, | |
| { | |
| "step": 2149888, | |
| "logs": { | |
| "loss": 0.6649, | |
| "epoch": 2.0702402957486137, | |
| "learning_rate": 1.6871829157981673e-05 | |
| } | |
| }, | |
| { | |
| "step": 2169088, | |
| "logs": { | |
| "loss": 0.665, | |
| "epoch": 2.088724584103512, | |
| "learning_rate": 1.6832500884886147e-05 | |
| } | |
| }, | |
| { | |
| "step": 2188288, | |
| "logs": { | |
| "loss": 0.6746, | |
| "epoch": 2.1072088724584104, | |
| "learning_rate": 1.6793172611790617e-05 | |
| } | |
| }, | |
| { | |
| "step": 2207488, | |
| "logs": { | |
| "loss": 0.6678, | |
| "epoch": 2.1256931608133085, | |
| "learning_rate": 1.6753844338695088e-05 | |
| } | |
| }, | |
| { | |
| "step": 2226688, | |
| "logs": { | |
| "loss": 0.6739, | |
| "epoch": 2.144177449168207, | |
| "learning_rate": 1.6714516065599562e-05 | |
| } | |
| }, | |
| { | |
| "step": 2245888, | |
| "logs": { | |
| "loss": 0.6666, | |
| "epoch": 2.162661737523105, | |
| "learning_rate": 1.6675187792504033e-05 | |
| } | |
| }, | |
| { | |
| "step": 2265088, | |
| "logs": { | |
| "loss": 0.674, | |
| "epoch": 2.1811460258780038, | |
| "learning_rate": 1.6635859519408503e-05 | |
| } | |
| }, | |
| { | |
| "step": 2284288, | |
| "logs": { | |
| "loss": 0.6737, | |
| "epoch": 2.199630314232902, | |
| "learning_rate": 1.6596531246312977e-05 | |
| } | |
| }, | |
| { | |
| "step": 2303488, | |
| "logs": { | |
| "loss": 0.675, | |
| "epoch": 2.2181146025878005, | |
| "learning_rate": 1.6557202973217448e-05 | |
| } | |
| }, | |
| { | |
| "step": 2322688, | |
| "logs": { | |
| "loss": 0.6743, | |
| "epoch": 2.2365988909426986, | |
| "learning_rate": 1.651787470012192e-05 | |
| } | |
| }, | |
| { | |
| "step": 2341888, | |
| "logs": { | |
| "loss": 0.6718, | |
| "epoch": 2.255083179297597, | |
| "learning_rate": 1.647854642702639e-05 | |
| } | |
| }, | |
| { | |
| "step": 2361088, | |
| "logs": { | |
| "loss": 0.6735, | |
| "epoch": 2.2735674676524953, | |
| "learning_rate": 1.6439218153930863e-05 | |
| } | |
| }, | |
| { | |
| "step": 2380288, | |
| "logs": { | |
| "loss": 0.6798, | |
| "epoch": 2.292051756007394, | |
| "learning_rate": 1.6399889880835334e-05 | |
| } | |
| }, | |
| { | |
| "step": 2399488, | |
| "logs": { | |
| "loss": 0.6768, | |
| "epoch": 2.310536044362292, | |
| "learning_rate": 1.6360561607739804e-05 | |
| } | |
| }, | |
| { | |
| "step": 2418688, | |
| "logs": { | |
| "loss": 0.6796, | |
| "epoch": 2.3290203327171906, | |
| "learning_rate": 1.632123333464428e-05 | |
| } | |
| }, | |
| { | |
| "step": 2437888, | |
| "logs": { | |
| "loss": 0.6813, | |
| "epoch": 2.3475046210720887, | |
| "learning_rate": 1.628190506154875e-05 | |
| } | |
| }, | |
| { | |
| "step": 2457088, | |
| "logs": { | |
| "loss": 0.6774, | |
| "epoch": 2.3659889094269873, | |
| "learning_rate": 1.624257678845322e-05 | |
| } | |
| }, | |
| { | |
| "step": 2476288, | |
| "logs": { | |
| "loss": 0.6745, | |
| "epoch": 2.3844731977818854, | |
| "learning_rate": 1.6203248515357694e-05 | |
| } | |
| }, | |
| { | |
| "step": 2495488, | |
| "logs": { | |
| "loss": 0.6809, | |
| "epoch": 2.402957486136784, | |
| "learning_rate": 1.6163920242262164e-05 | |
| } | |
| }, | |
| { | |
| "step": 2514688, | |
| "logs": { | |
| "loss": 0.6831, | |
| "epoch": 2.421441774491682, | |
| "learning_rate": 1.6124591969166635e-05 | |
| } | |
| }, | |
| { | |
| "step": 2533888, | |
| "logs": { | |
| "loss": 0.6803, | |
| "epoch": 2.43992606284658, | |
| "learning_rate": 1.608526369607111e-05 | |
| } | |
| }, | |
| { | |
| "step": 2553088, | |
| "logs": { | |
| "loss": 0.6791, | |
| "epoch": 2.4584103512014788, | |
| "learning_rate": 1.604593542297558e-05 | |
| } | |
| }, | |
| { | |
| "step": 2572288, | |
| "logs": { | |
| "loss": 0.6812, | |
| "epoch": 2.476894639556377, | |
| "learning_rate": 1.600660714988005e-05 | |
| } | |
| }, | |
| { | |
| "step": 2591488, | |
| "logs": { | |
| "loss": 0.6866, | |
| "epoch": 2.4953789279112755, | |
| "learning_rate": 1.596727887678452e-05 | |
| } | |
| }, | |
| { | |
| "step": 2610688, | |
| "logs": { | |
| "loss": 0.6837, | |
| "epoch": 2.5138632162661736, | |
| "learning_rate": 1.5927950603688995e-05 | |
| } | |
| }, | |
| { | |
| "step": 2629888, | |
| "logs": { | |
| "loss": 0.6814, | |
| "epoch": 2.532347504621072, | |
| "learning_rate": 1.5888622330593465e-05 | |
| } | |
| }, | |
| { | |
| "step": 2649088, | |
| "logs": { | |
| "loss": 0.6845, | |
| "epoch": 2.5508317929759703, | |
| "learning_rate": 1.5849294057497936e-05 | |
| } | |
| }, | |
| { | |
| "step": 2668288, | |
| "logs": { | |
| "loss": 0.6832, | |
| "epoch": 2.569316081330869, | |
| "learning_rate": 1.5809965784402407e-05 | |
| } | |
| }, | |
| { | |
| "step": 2687488, | |
| "logs": { | |
| "loss": 0.6795, | |
| "epoch": 2.587800369685767, | |
| "learning_rate": 1.5770637511306877e-05 | |
| } | |
| }, | |
| { | |
| "step": 2706688, | |
| "logs": { | |
| "loss": 0.679, | |
| "epoch": 2.6062846580406656, | |
| "learning_rate": 1.573130923821135e-05 | |
| } | |
| }, | |
| { | |
| "step": 2725888, | |
| "logs": { | |
| "loss": 0.6851, | |
| "epoch": 2.6247689463955637, | |
| "learning_rate": 1.5691980965115822e-05 | |
| } | |
| }, | |
| { | |
| "step": 2745088, | |
| "logs": { | |
| "loss": 0.692, | |
| "epoch": 2.6432532347504623, | |
| "learning_rate": 1.5652652692020292e-05 | |
| } | |
| }, | |
| { | |
| "step": 2764288, | |
| "logs": { | |
| "loss": 0.6956, | |
| "epoch": 2.6617375231053604, | |
| "learning_rate": 1.5613324418924766e-05 | |
| } | |
| }, | |
| { | |
| "step": 2783488, | |
| "logs": { | |
| "loss": 0.6883, | |
| "epoch": 2.680221811460259, | |
| "learning_rate": 1.5573996145829237e-05 | |
| } | |
| }, | |
| { | |
| "step": 2802688, | |
| "logs": { | |
| "loss": 0.6806, | |
| "epoch": 2.698706099815157, | |
| "learning_rate": 1.5534667872733708e-05 | |
| } | |
| }, | |
| { | |
| "step": 2821888, | |
| "logs": { | |
| "loss": 0.6832, | |
| "epoch": 2.7171903881700556, | |
| "learning_rate": 1.549533959963818e-05 | |
| } | |
| }, | |
| { | |
| "step": 2841088, | |
| "logs": { | |
| "loss": 0.6871, | |
| "epoch": 2.7356746765249538, | |
| "learning_rate": 1.5456011326542652e-05 | |
| } | |
| }, | |
| { | |
| "step": 2860288, | |
| "logs": { | |
| "loss": 0.6843, | |
| "epoch": 2.7541589648798523, | |
| "learning_rate": 1.5416683053447123e-05 | |
| } | |
| }, | |
| { | |
| "step": 2879488, | |
| "logs": { | |
| "loss": 0.6869, | |
| "epoch": 2.7726432532347505, | |
| "learning_rate": 1.5377354780351597e-05 | |
| } | |
| }, | |
| { | |
| "step": 2898688, | |
| "logs": { | |
| "loss": 0.689, | |
| "epoch": 2.7911275415896486, | |
| "learning_rate": 1.5338026507256067e-05 | |
| } | |
| }, | |
| { | |
| "step": 2917888, | |
| "logs": { | |
| "loss": 0.6864, | |
| "epoch": 2.809611829944547, | |
| "learning_rate": 1.5298698234160538e-05 | |
| } | |
| }, | |
| { | |
| "step": 2937088, | |
| "logs": { | |
| "loss": 0.6875, | |
| "epoch": 2.8280961182994453, | |
| "learning_rate": 1.5259369961065012e-05 | |
| } | |
| }, | |
| { | |
| "step": 2956288, | |
| "logs": { | |
| "loss": 0.6844, | |
| "epoch": 2.846580406654344, | |
| "learning_rate": 1.5220041687969483e-05 | |
| } | |
| }, | |
| { | |
| "step": 2975488, | |
| "logs": { | |
| "loss": 0.6916, | |
| "epoch": 2.865064695009242, | |
| "learning_rate": 1.5180713414873953e-05 | |
| } | |
| }, | |
| { | |
| "step": 2994688, | |
| "logs": { | |
| "loss": 0.6849, | |
| "epoch": 2.8835489833641406, | |
| "learning_rate": 1.5141385141778426e-05 | |
| } | |
| }, | |
| { | |
| "step": 3013888, | |
| "logs": { | |
| "loss": 0.6835, | |
| "epoch": 2.9020332717190387, | |
| "learning_rate": 1.5102056868682898e-05 | |
| } | |
| }, | |
| { | |
| "step": 3033088, | |
| "logs": { | |
| "loss": 0.6866, | |
| "epoch": 2.9205175600739373, | |
| "learning_rate": 1.5062728595587369e-05 | |
| } | |
| }, | |
| { | |
| "step": 3052288, | |
| "logs": { | |
| "loss": 0.6863, | |
| "epoch": 2.9390018484288354, | |
| "learning_rate": 1.502340032249184e-05 | |
| } | |
| }, | |
| { | |
| "step": 3071488, | |
| "logs": { | |
| "loss": 0.6903, | |
| "epoch": 2.957486136783734, | |
| "learning_rate": 1.4984072049396311e-05 | |
| } | |
| }, | |
| { | |
| "step": 3090688, | |
| "logs": { | |
| "loss": 0.686, | |
| "epoch": 2.975970425138632, | |
| "learning_rate": 1.4944743776300784e-05 | |
| } | |
| }, | |
| { | |
| "step": 3109888, | |
| "logs": { | |
| "loss": 0.6909, | |
| "epoch": 2.9944547134935307, | |
| "learning_rate": 1.4905415503205256e-05 | |
| } | |
| }, | |
| { | |
| "step": 3128832, | |
| "logs": { | |
| "loss": 0.5832, | |
| "epoch": 3.0129390018484288, | |
| "learning_rate": 1.4866087230109727e-05 | |
| } | |
| }, | |
| { | |
| "step": 3148032, | |
| "logs": { | |
| "loss": 0.5314, | |
| "epoch": 3.0314232902033273, | |
| "learning_rate": 1.4826758957014197e-05 | |
| } | |
| }, | |
| { | |
| "step": 3167232, | |
| "logs": { | |
| "loss": 0.5332, | |
| "epoch": 3.0499075785582255, | |
| "learning_rate": 1.4787430683918671e-05 | |
| } | |
| }, | |
| { | |
| "step": 3186432, | |
| "logs": { | |
| "loss": 0.5359, | |
| "epoch": 3.068391866913124, | |
| "learning_rate": 1.4748102410823142e-05 | |
| } | |
| }, | |
| { | |
| "step": 3205632, | |
| "logs": { | |
| "loss": 0.5398, | |
| "epoch": 3.086876155268022, | |
| "learning_rate": 1.4708774137727613e-05 | |
| } | |
| }, | |
| { | |
| "step": 3224832, | |
| "logs": { | |
| "loss": 0.5433, | |
| "epoch": 3.1053604436229203, | |
| "learning_rate": 1.4669445864632087e-05 | |
| } | |
| }, | |
| { | |
| "step": 3244032, | |
| "logs": { | |
| "loss": 0.5368, | |
| "epoch": 3.123844731977819, | |
| "learning_rate": 1.4630117591536557e-05 | |
| } | |
| }, | |
| { | |
| "step": 3263232, | |
| "logs": { | |
| "loss": 0.5419, | |
| "epoch": 3.142329020332717, | |
| "learning_rate": 1.4590789318441028e-05 | |
| } | |
| }, | |
| { | |
| "step": 3282432, | |
| "logs": { | |
| "loss": 0.5398, | |
| "epoch": 3.1608133086876156, | |
| "learning_rate": 1.45514610453455e-05 | |
| } | |
| }, | |
| { | |
| "step": 3301632, | |
| "logs": { | |
| "loss": 0.5442, | |
| "epoch": 3.1792975970425137, | |
| "learning_rate": 1.4512132772249972e-05 | |
| } | |
| }, | |
| { | |
| "step": 3320832, | |
| "logs": { | |
| "loss": 0.544, | |
| "epoch": 3.1977818853974123, | |
| "learning_rate": 1.4472804499154443e-05 | |
| } | |
| }, | |
| { | |
| "step": 3340032, | |
| "logs": { | |
| "loss": 0.5455, | |
| "epoch": 3.2162661737523104, | |
| "learning_rate": 1.4433476226058915e-05 | |
| } | |
| }, | |
| { | |
| "step": 3359232, | |
| "logs": { | |
| "loss": 0.548, | |
| "epoch": 3.234750462107209, | |
| "learning_rate": 1.4394147952963386e-05 | |
| } | |
| }, | |
| { | |
| "step": 3378432, | |
| "logs": { | |
| "loss": 0.5453, | |
| "epoch": 3.253234750462107, | |
| "learning_rate": 1.4354819679867858e-05 | |
| } | |
| }, | |
| { | |
| "step": 3397632, | |
| "logs": { | |
| "loss": 0.5416, | |
| "epoch": 3.2717190388170057, | |
| "learning_rate": 1.431549140677233e-05 | |
| } | |
| }, | |
| { | |
| "step": 3416832, | |
| "logs": { | |
| "loss": 0.5542, | |
| "epoch": 3.290203327171904, | |
| "learning_rate": 1.4276163133676801e-05 | |
| } | |
| }, | |
| { | |
| "step": 3436032, | |
| "logs": { | |
| "loss": 0.5469, | |
| "epoch": 3.3086876155268024, | |
| "learning_rate": 1.4236834860581272e-05 | |
| } | |
| }, | |
| { | |
| "step": 3455232, | |
| "logs": { | |
| "loss": 0.5545, | |
| "epoch": 3.3271719038817005, | |
| "learning_rate": 1.4197506587485746e-05 | |
| } | |
| }, | |
| { | |
| "step": 3474432, | |
| "logs": { | |
| "loss": 0.5538, | |
| "epoch": 3.345656192236599, | |
| "learning_rate": 1.4158178314390216e-05 | |
| } | |
| }, | |
| { | |
| "step": 3493632, | |
| "logs": { | |
| "loss": 0.5504, | |
| "epoch": 3.364140480591497, | |
| "learning_rate": 1.4118850041294687e-05 | |
| } | |
| }, | |
| { | |
| "step": 3512832, | |
| "logs": { | |
| "loss": 0.5511, | |
| "epoch": 3.3826247689463957, | |
| "learning_rate": 1.4079521768199161e-05 | |
| } | |
| }, | |
| { | |
| "step": 3532032, | |
| "logs": { | |
| "loss": 0.554, | |
| "epoch": 3.401109057301294, | |
| "learning_rate": 1.4040193495103632e-05 | |
| } | |
| }, | |
| { | |
| "step": 3551232, | |
| "logs": { | |
| "loss": 0.5541, | |
| "epoch": 3.4195933456561924, | |
| "learning_rate": 1.4000865222008102e-05 | |
| } | |
| }, | |
| { | |
| "step": 3570432, | |
| "logs": { | |
| "loss": 0.5502, | |
| "epoch": 3.4380776340110906, | |
| "learning_rate": 1.3961536948912575e-05 | |
| } | |
| }, | |
| { | |
| "step": 3589632, | |
| "logs": { | |
| "loss": 0.5513, | |
| "epoch": 3.4565619223659887, | |
| "learning_rate": 1.3922208675817047e-05 | |
| } | |
| }, | |
| { | |
| "step": 3608832, | |
| "logs": { | |
| "loss": 0.5579, | |
| "epoch": 3.4750462107208873, | |
| "learning_rate": 1.3882880402721517e-05 | |
| } | |
| }, | |
| { | |
| "step": 3628032, | |
| "logs": { | |
| "loss": 0.5636, | |
| "epoch": 3.4935304990757854, | |
| "learning_rate": 1.384355212962599e-05 | |
| } | |
| }, | |
| { | |
| "step": 3647232, | |
| "logs": { | |
| "loss": 0.5617, | |
| "epoch": 3.512014787430684, | |
| "learning_rate": 1.380422385653046e-05 | |
| } | |
| }, | |
| { | |
| "step": 3666432, | |
| "logs": { | |
| "loss": 0.5549, | |
| "epoch": 3.530499075785582, | |
| "learning_rate": 1.3764895583434933e-05 | |
| } | |
| }, | |
| { | |
| "step": 3685632, | |
| "logs": { | |
| "loss": 0.5599, | |
| "epoch": 3.5489833641404807, | |
| "learning_rate": 1.3725567310339405e-05 | |
| } | |
| }, | |
| { | |
| "step": 3704832, | |
| "logs": { | |
| "loss": 0.5565, | |
| "epoch": 3.567467652495379, | |
| "learning_rate": 1.3686239037243876e-05 | |
| } | |
| }, | |
| { | |
| "step": 3724032, | |
| "logs": { | |
| "loss": 0.5565, | |
| "epoch": 3.5859519408502774, | |
| "learning_rate": 1.3646910764148346e-05 | |
| } | |
| }, | |
| { | |
| "step": 3743232, | |
| "logs": { | |
| "loss": 0.5558, | |
| "epoch": 3.6044362292051755, | |
| "learning_rate": 1.360758249105282e-05 | |
| } | |
| }, | |
| { | |
| "step": 3762432, | |
| "logs": { | |
| "loss": 0.5599, | |
| "epoch": 3.622920517560074, | |
| "learning_rate": 1.356825421795729e-05 | |
| } | |
| }, | |
| { | |
| "step": 3781632, | |
| "logs": { | |
| "loss": 0.561, | |
| "epoch": 3.641404805914972, | |
| "learning_rate": 1.3528925944861761e-05 | |
| } | |
| }, | |
| { | |
| "step": 3800832, | |
| "logs": { | |
| "loss": 0.5596, | |
| "epoch": 3.6598890942698707, | |
| "learning_rate": 1.3489597671766235e-05 | |
| } | |
| }, | |
| { | |
| "step": 3820032, | |
| "logs": { | |
| "loss": 0.5596, | |
| "epoch": 3.678373382624769, | |
| "learning_rate": 1.3450269398670706e-05 | |
| } | |
| }, | |
| { | |
| "step": 3839232, | |
| "logs": { | |
| "loss": 0.5579, | |
| "epoch": 3.6968576709796674, | |
| "learning_rate": 1.3410941125575177e-05 | |
| } | |
| }, | |
| { | |
| "step": 3858432, | |
| "logs": { | |
| "loss": 0.5611, | |
| "epoch": 3.7153419593345656, | |
| "learning_rate": 1.3371612852479649e-05 | |
| } | |
| }, | |
| { | |
| "step": 3877632, | |
| "logs": { | |
| "loss": 0.5627, | |
| "epoch": 3.733826247689464, | |
| "learning_rate": 1.3332284579384121e-05 | |
| } | |
| }, | |
| { | |
| "step": 3896832, | |
| "logs": { | |
| "loss": 0.5613, | |
| "epoch": 3.7523105360443623, | |
| "learning_rate": 1.3292956306288592e-05 | |
| } | |
| }, | |
| { | |
| "step": 3916032, | |
| "logs": { | |
| "loss": 0.5607, | |
| "epoch": 3.770794824399261, | |
| "learning_rate": 1.3253628033193064e-05 | |
| } | |
| }, | |
| { | |
| "step": 3935232, | |
| "logs": { | |
| "loss": 0.5651, | |
| "epoch": 3.789279112754159, | |
| "learning_rate": 1.3214299760097535e-05 | |
| } | |
| }, | |
| { | |
| "step": 3954432, | |
| "logs": { | |
| "loss": 0.5604, | |
| "epoch": 3.807763401109057, | |
| "learning_rate": 1.3174971487002005e-05 | |
| } | |
| }, | |
| { | |
| "step": 3973632, | |
| "logs": { | |
| "loss": 0.5676, | |
| "epoch": 3.8262476894639557, | |
| "learning_rate": 1.313564321390648e-05 | |
| } | |
| }, | |
| { | |
| "step": 3992832, | |
| "logs": { | |
| "loss": 0.5601, | |
| "epoch": 3.844731977818854, | |
| "learning_rate": 1.309631494081095e-05 | |
| } | |
| }, | |
| { | |
| "step": 4012032, | |
| "logs": { | |
| "loss": 0.5645, | |
| "epoch": 3.8632162661737524, | |
| "learning_rate": 1.305698666771542e-05 | |
| } | |
| }, | |
| { | |
| "step": 4031232, | |
| "logs": { | |
| "loss": 0.5653, | |
| "epoch": 3.8817005545286505, | |
| "learning_rate": 1.3017658394619895e-05 | |
| } | |
| }, | |
| { | |
| "step": 4050432, | |
| "logs": { | |
| "loss": 0.5618, | |
| "epoch": 3.900184842883549, | |
| "learning_rate": 1.2978330121524365e-05 | |
| } | |
| }, | |
| { | |
| "step": 4069632, | |
| "logs": { | |
| "loss": 0.5624, | |
| "epoch": 3.918669131238447, | |
| "learning_rate": 1.2939001848428836e-05 | |
| } | |
| }, | |
| { | |
| "step": 4088832, | |
| "logs": { | |
| "loss": 0.5621, | |
| "epoch": 3.9371534195933457, | |
| "learning_rate": 1.289967357533331e-05 | |
| } | |
| }, | |
| { | |
| "step": 4108032, | |
| "logs": { | |
| "loss": 0.5633, | |
| "epoch": 3.955637707948244, | |
| "learning_rate": 1.286034530223778e-05 | |
| } | |
| }, | |
| { | |
| "step": 4127232, | |
| "logs": { | |
| "loss": 0.5645, | |
| "epoch": 3.9741219963031424, | |
| "learning_rate": 1.2821017029142251e-05 | |
| } | |
| }, | |
| { | |
| "step": 4146432, | |
| "logs": { | |
| "loss": 0.5675, | |
| "epoch": 3.9926062846580406, | |
| "learning_rate": 1.2781688756046723e-05 | |
| } | |
| }, | |
| { | |
| "step": 4165376, | |
| "logs": { | |
| "loss": 0.4943, | |
| "epoch": 4.011090573012939, | |
| "learning_rate": 1.2742360482951194e-05 | |
| } | |
| }, | |
| { | |
| "step": 4184576, | |
| "logs": { | |
| "loss": 0.4282, | |
| "epoch": 4.029574861367838, | |
| "learning_rate": 1.2703032209855666e-05 | |
| } | |
| }, | |
| { | |
| "step": 4203776, | |
| "logs": { | |
| "loss": 0.4285, | |
| "epoch": 4.048059149722736, | |
| "learning_rate": 1.2663703936760139e-05 | |
| } | |
| }, | |
| { | |
| "step": 4222976, | |
| "logs": { | |
| "loss": 0.4307, | |
| "epoch": 4.066543438077634, | |
| "learning_rate": 1.262437566366461e-05 | |
| } | |
| }, | |
| { | |
| "step": 4242176, | |
| "logs": { | |
| "loss": 0.4372, | |
| "epoch": 4.085027726432532, | |
| "learning_rate": 1.258504739056908e-05 | |
| } | |
| }, | |
| { | |
| "step": 4261376, | |
| "logs": { | |
| "loss": 0.4377, | |
| "epoch": 4.103512014787431, | |
| "learning_rate": 1.2545719117473554e-05 | |
| } | |
| }, | |
| { | |
| "step": 4280576, | |
| "logs": { | |
| "loss": 0.4296, | |
| "epoch": 4.121996303142329, | |
| "learning_rate": 1.2506390844378025e-05 | |
| } | |
| }, | |
| { | |
| "step": 4299776, | |
| "logs": { | |
| "loss": 0.4358, | |
| "epoch": 4.140480591497227, | |
| "learning_rate": 1.2467062571282495e-05 | |
| } | |
| }, | |
| { | |
| "step": 4318976, | |
| "logs": { | |
| "loss": 0.4383, | |
| "epoch": 4.1589648798521255, | |
| "learning_rate": 1.2427734298186969e-05 | |
| } | |
| }, | |
| { | |
| "step": 4338176, | |
| "logs": { | |
| "loss": 0.4355, | |
| "epoch": 4.177449168207024, | |
| "learning_rate": 1.238840602509144e-05 | |
| } | |
| }, | |
| { | |
| "step": 4357376, | |
| "logs": { | |
| "loss": 0.44, | |
| "epoch": 4.195933456561923, | |
| "learning_rate": 1.234907775199591e-05 | |
| } | |
| }, | |
| { | |
| "step": 4376576, | |
| "logs": { | |
| "loss": 0.4393, | |
| "epoch": 4.214417744916821, | |
| "learning_rate": 1.2309749478900384e-05 | |
| } | |
| }, | |
| { | |
| "step": 4395776, | |
| "logs": { | |
| "loss": 0.4427, | |
| "epoch": 4.232902033271719, | |
| "learning_rate": 1.2270421205804855e-05 | |
| } | |
| }, | |
| { | |
| "step": 4414976, | |
| "logs": { | |
| "loss": 0.4399, | |
| "epoch": 4.251386321626617, | |
| "learning_rate": 1.2231092932709326e-05 | |
| } | |
| }, | |
| { | |
| "step": 4434176, | |
| "logs": { | |
| "loss": 0.4401, | |
| "epoch": 4.269870609981516, | |
| "learning_rate": 1.2191764659613798e-05 | |
| } | |
| }, | |
| { | |
| "step": 4453376, | |
| "logs": { | |
| "loss": 0.4446, | |
| "epoch": 4.288354898336414, | |
| "learning_rate": 1.2152436386518269e-05 | |
| } | |
| }, | |
| { | |
| "step": 4472576, | |
| "logs": { | |
| "loss": 0.4436, | |
| "epoch": 4.306839186691312, | |
| "learning_rate": 1.211310811342274e-05 | |
| } | |
| }, | |
| { | |
| "step": 4491776, | |
| "logs": { | |
| "loss": 0.4478, | |
| "epoch": 4.32532347504621, | |
| "learning_rate": 1.2073779840327213e-05 | |
| } | |
| }, | |
| { | |
| "step": 4510976, | |
| "logs": { | |
| "loss": 0.447, | |
| "epoch": 4.343807763401109, | |
| "learning_rate": 1.2034451567231684e-05 | |
| } | |
| }, | |
| { | |
| "step": 4530176, | |
| "logs": { | |
| "loss": 0.4505, | |
| "epoch": 4.3622920517560075, | |
| "learning_rate": 1.1995123294136154e-05 | |
| } | |
| }, | |
| { | |
| "step": 4549376, | |
| "logs": { | |
| "loss": 0.4461, | |
| "epoch": 4.380776340110906, | |
| "learning_rate": 1.1955795021040628e-05 | |
| } | |
| }, | |
| { | |
| "step": 4568576, | |
| "logs": { | |
| "loss": 0.4511, | |
| "epoch": 4.399260628465804, | |
| "learning_rate": 1.1916466747945099e-05 | |
| } | |
| }, | |
| { | |
| "step": 4587776, | |
| "logs": { | |
| "loss": 0.4481, | |
| "epoch": 4.417744916820703, | |
| "learning_rate": 1.187713847484957e-05 | |
| } | |
| }, | |
| { | |
| "step": 4606976, | |
| "logs": { | |
| "loss": 0.4457, | |
| "epoch": 4.436229205175601, | |
| "learning_rate": 1.1837810201754044e-05 | |
| } | |
| }, | |
| { | |
| "step": 4626176, | |
| "logs": { | |
| "loss": 0.4491, | |
| "epoch": 4.454713493530499, | |
| "learning_rate": 1.1798481928658514e-05 | |
| } | |
| }, | |
| { | |
| "step": 4645376, | |
| "logs": { | |
| "loss": 0.453, | |
| "epoch": 4.473197781885397, | |
| "learning_rate": 1.1759153655562985e-05 | |
| } | |
| }, | |
| { | |
| "step": 4664576, | |
| "logs": { | |
| "loss": 0.4557, | |
| "epoch": 4.491682070240295, | |
| "learning_rate": 1.1719825382467455e-05 | |
| } | |
| }, | |
| { | |
| "step": 4683776, | |
| "logs": { | |
| "loss": 0.4588, | |
| "epoch": 4.510166358595194, | |
| "learning_rate": 1.168049710937193e-05 | |
| } | |
| }, | |
| { | |
| "step": 4702976, | |
| "logs": { | |
| "loss": 0.4478, | |
| "epoch": 4.5286506469500925, | |
| "learning_rate": 1.16411688362764e-05 | |
| } | |
| }, | |
| { | |
| "step": 4722176, | |
| "logs": { | |
| "loss": 0.4558, | |
| "epoch": 4.547134935304991, | |
| "learning_rate": 1.160184056318087e-05 | |
| } | |
| }, | |
| { | |
| "step": 4741376, | |
| "logs": { | |
| "loss": 0.453, | |
| "epoch": 4.565619223659889, | |
| "learning_rate": 1.1562512290085343e-05 | |
| } | |
| }, | |
| { | |
| "step": 4760576, | |
| "logs": { | |
| "loss": 0.4566, | |
| "epoch": 4.584103512014788, | |
| "learning_rate": 1.1523184016989815e-05 | |
| } | |
| }, | |
| { | |
| "step": 4779776, | |
| "logs": { | |
| "loss": 0.4512, | |
| "epoch": 4.602587800369686, | |
| "learning_rate": 1.1483855743894286e-05 | |
| } | |
| }, | |
| { | |
| "step": 4798976, | |
| "logs": { | |
| "loss": 0.4537, | |
| "epoch": 4.621072088724584, | |
| "learning_rate": 1.1444527470798758e-05 | |
| } | |
| }, | |
| { | |
| "step": 4818176, | |
| "logs": { | |
| "loss": 0.4596, | |
| "epoch": 4.639556377079482, | |
| "learning_rate": 1.1405199197703229e-05 | |
| } | |
| }, | |
| { | |
| "step": 4837376, | |
| "logs": { | |
| "loss": 0.4544, | |
| "epoch": 4.658040665434381, | |
| "learning_rate": 1.1365870924607701e-05 | |
| } | |
| }, | |
| { | |
| "step": 4856576, | |
| "logs": { | |
| "loss": 0.4552, | |
| "epoch": 4.676524953789279, | |
| "learning_rate": 1.1326542651512173e-05 | |
| } | |
| }, | |
| { | |
| "step": 4875776, | |
| "logs": { | |
| "loss": 0.4561, | |
| "epoch": 4.695009242144177, | |
| "learning_rate": 1.1287214378416644e-05 | |
| } | |
| }, | |
| { | |
| "step": 4894976, | |
| "logs": { | |
| "loss": 0.456, | |
| "epoch": 4.7134935304990755, | |
| "learning_rate": 1.1247886105321115e-05 | |
| } | |
| }, | |
| { | |
| "step": 4914176, | |
| "logs": { | |
| "loss": 0.455, | |
| "epoch": 4.7319778188539745, | |
| "learning_rate": 1.1208557832225589e-05 | |
| } | |
| }, | |
| { | |
| "step": 4933376, | |
| "logs": { | |
| "loss": 0.4579, | |
| "epoch": 4.750462107208873, | |
| "learning_rate": 1.116922955913006e-05 | |
| } | |
| }, | |
| { | |
| "step": 4952576, | |
| "logs": { | |
| "loss": 0.4569, | |
| "epoch": 4.768946395563771, | |
| "learning_rate": 1.112990128603453e-05 | |
| } | |
| }, | |
| { | |
| "step": 4971776, | |
| "logs": { | |
| "loss": 0.459, | |
| "epoch": 4.787430683918669, | |
| "learning_rate": 1.1090573012939004e-05 | |
| } | |
| }, | |
| { | |
| "step": 4990976, | |
| "logs": { | |
| "loss": 0.456, | |
| "epoch": 4.805914972273568, | |
| "learning_rate": 1.1051244739843475e-05 | |
| } | |
| }, | |
| { | |
| "step": 5010176, | |
| "logs": { | |
| "loss": 0.4605, | |
| "epoch": 4.824399260628466, | |
| "learning_rate": 1.1011916466747945e-05 | |
| } | |
| }, | |
| { | |
| "step": 5029376, | |
| "logs": { | |
| "loss": 0.4565, | |
| "epoch": 4.842883548983364, | |
| "learning_rate": 1.0972588193652417e-05 | |
| } | |
| }, | |
| { | |
| "step": 5048576, | |
| "logs": { | |
| "loss": 0.4606, | |
| "epoch": 4.861367837338262, | |
| "learning_rate": 1.093325992055689e-05 | |
| } | |
| }, | |
| { | |
| "step": 5067776, | |
| "logs": { | |
| "loss": 0.4586, | |
| "epoch": 4.87985212569316, | |
| "learning_rate": 1.089393164746136e-05 | |
| } | |
| }, | |
| { | |
| "step": 5086976, | |
| "logs": { | |
| "loss": 0.4605, | |
| "epoch": 4.898336414048059, | |
| "learning_rate": 1.0854603374365833e-05 | |
| } | |
| }, | |
| { | |
| "step": 5106176, | |
| "logs": { | |
| "loss": 0.4565, | |
| "epoch": 4.9168207024029575, | |
| "learning_rate": 1.0815275101270303e-05 | |
| } | |
| }, | |
| { | |
| "step": 5125376, | |
| "logs": { | |
| "loss": 0.4585, | |
| "epoch": 4.935304990757856, | |
| "learning_rate": 1.0775946828174776e-05 | |
| } | |
| }, | |
| { | |
| "step": 5144576, | |
| "logs": { | |
| "loss": 0.4588, | |
| "epoch": 4.953789279112754, | |
| "learning_rate": 1.0736618555079248e-05 | |
| } | |
| }, | |
| { | |
| "step": 5163776, | |
| "logs": { | |
| "loss": 0.4639, | |
| "epoch": 4.972273567467653, | |
| "learning_rate": 1.0697290281983718e-05 | |
| } | |
| }, | |
| { | |
| "step": 5182976, | |
| "logs": { | |
| "loss": 0.4666, | |
| "epoch": 4.990757855822551, | |
| "learning_rate": 1.0657962008888189e-05 | |
| } | |
| }, | |
| { | |
| "step": 5201920, | |
| "logs": { | |
| "loss": 0.4109, | |
| "epoch": 5.009242144177449, | |
| "learning_rate": 1.0618633735792663e-05 | |
| } | |
| }, | |
| { | |
| "step": 5221120, | |
| "logs": { | |
| "loss": 0.3538, | |
| "epoch": 5.027726432532347, | |
| "learning_rate": 1.0579305462697134e-05 | |
| } | |
| }, | |
| { | |
| "step": 5240320, | |
| "logs": { | |
| "loss": 0.346, | |
| "epoch": 5.046210720887246, | |
| "learning_rate": 1.0539977189601604e-05 | |
| } | |
| }, | |
| { | |
| "step": 5259520, | |
| "logs": { | |
| "loss": 0.3483, | |
| "epoch": 5.064695009242144, | |
| "learning_rate": 1.0500648916506078e-05 | |
| } | |
| }, | |
| { | |
| "step": 5278720, | |
| "logs": { | |
| "loss": 0.3548, | |
| "epoch": 5.0831792975970425, | |
| "learning_rate": 1.0461320643410549e-05 | |
| } | |
| }, | |
| { | |
| "step": 5297920, | |
| "logs": { | |
| "loss": 0.3567, | |
| "epoch": 5.101663585951941, | |
| "learning_rate": 1.042199237031502e-05 | |
| } | |
| }, | |
| { | |
| "step": 5317120, | |
| "logs": { | |
| "loss": 0.3525, | |
| "epoch": 5.12014787430684, | |
| "learning_rate": 1.0382664097219492e-05 | |
| } | |
| }, | |
| { | |
| "step": 5336320, | |
| "logs": { | |
| "loss": 0.3563, | |
| "epoch": 5.138632162661738, | |
| "learning_rate": 1.0343335824123964e-05 | |
| } | |
| }, | |
| { | |
| "step": 5355520, | |
| "logs": { | |
| "loss": 0.3606, | |
| "epoch": 5.157116451016636, | |
| "learning_rate": 1.0304007551028435e-05 | |
| } | |
| }, | |
| { | |
| "step": 5374720, | |
| "logs": { | |
| "loss": 0.3585, | |
| "epoch": 5.175600739371534, | |
| "learning_rate": 1.0264679277932907e-05 | |
| } | |
| }, | |
| { | |
| "step": 5393920, | |
| "logs": { | |
| "loss": 0.3547, | |
| "epoch": 5.194085027726432, | |
| "learning_rate": 1.0225351004837378e-05 | |
| } | |
| }, | |
| { | |
| "step": 5413120, | |
| "logs": { | |
| "loss": 0.359, | |
| "epoch": 5.212569316081331, | |
| "learning_rate": 1.018602273174185e-05 | |
| } | |
| }, | |
| { | |
| "step": 5432320, | |
| "logs": { | |
| "loss": 0.3616, | |
| "epoch": 5.231053604436229, | |
| "learning_rate": 1.0146694458646322e-05 | |
| } | |
| }, | |
| { | |
| "step": 5451520, | |
| "logs": { | |
| "loss": 0.3602, | |
| "epoch": 5.249537892791127, | |
| "learning_rate": 1.0107366185550793e-05 | |
| } | |
| }, | |
| { | |
| "step": 5470720, | |
| "logs": { | |
| "loss": 0.3607, | |
| "epoch": 5.2680221811460255, | |
| "learning_rate": 1.0068037912455264e-05 | |
| } | |
| }, | |
| { | |
| "step": 5489920, | |
| "logs": { | |
| "loss": 0.3642, | |
| "epoch": 5.2865064695009245, | |
| "learning_rate": 1.0028709639359738e-05 | |
| } | |
| }, | |
| { | |
| "step": 5509120, | |
| "logs": { | |
| "loss": 0.3616, | |
| "epoch": 5.304990757855823, | |
| "learning_rate": 9.989381366264208e-06 | |
| } | |
| }, | |
| { | |
| "step": 5528320, | |
| "logs": { | |
| "loss": 0.364, | |
| "epoch": 5.323475046210721, | |
| "learning_rate": 9.95005309316868e-06 | |
| } | |
| }, | |
| { | |
| "step": 5547520, | |
| "logs": { | |
| "loss": 0.3656, | |
| "epoch": 5.341959334565619, | |
| "learning_rate": 9.910724820073151e-06 | |
| } | |
| }, | |
| { | |
| "step": 5566720, | |
| "logs": { | |
| "loss": 0.3613, | |
| "epoch": 5.360443622920518, | |
| "learning_rate": 9.871396546977623e-06 | |
| } | |
| }, | |
| { | |
| "step": 5585920, | |
| "logs": { | |
| "loss": 0.3655, | |
| "epoch": 5.378927911275416, | |
| "learning_rate": 9.832068273882096e-06 | |
| } | |
| }, | |
| { | |
| "step": 5605120, | |
| "logs": { | |
| "loss": 0.3677, | |
| "epoch": 5.397412199630314, | |
| "learning_rate": 9.792740000786566e-06 | |
| } | |
| }, | |
| { | |
| "step": 5624320, | |
| "logs": { | |
| "loss": 0.3678, | |
| "epoch": 5.415896487985212, | |
| "learning_rate": 9.753411727691039e-06 | |
| } | |
| }, | |
| { | |
| "step": 5643520, | |
| "logs": { | |
| "loss": 0.364, | |
| "epoch": 5.434380776340111, | |
| "learning_rate": 9.71408345459551e-06 | |
| } | |
| }, | |
| { | |
| "step": 5662720, | |
| "logs": { | |
| "loss": 0.3654, | |
| "epoch": 5.452865064695009, | |
| "learning_rate": 9.67475518149998e-06 | |
| } | |
| }, | |
| { | |
| "step": 5681920, | |
| "logs": { | |
| "loss": 0.3671, | |
| "epoch": 5.4713493530499075, | |
| "learning_rate": 9.635426908404452e-06 | |
| } | |
| }, | |
| { | |
| "step": 5701120, | |
| "logs": { | |
| "loss": 0.3724, | |
| "epoch": 5.489833641404806, | |
| "learning_rate": 9.596098635308924e-06 | |
| } | |
| }, | |
| { | |
| "step": 5720320, | |
| "logs": { | |
| "loss": 1.4537, | |
| "epoch": 5.508317929759705, | |
| "learning_rate": 9.556770362213395e-06 | |
| } | |
| }, | |
| { | |
| "step": 5739520, | |
| "logs": { | |
| "loss": 0.3685, | |
| "epoch": 5.526802218114603, | |
| "learning_rate": 9.517442089117867e-06 | |
| } | |
| }, | |
| { | |
| "step": 5758720, | |
| "logs": { | |
| "loss": 0.3688, | |
| "epoch": 5.545286506469501, | |
| "learning_rate": 9.47811381602234e-06 | |
| } | |
| }, | |
| { | |
| "step": 5777920, | |
| "logs": { | |
| "loss": 0.3726, | |
| "epoch": 5.563770794824399, | |
| "learning_rate": 9.43878554292681e-06 | |
| } | |
| }, | |
| { | |
| "step": 5797120, | |
| "logs": { | |
| "loss": 0.3718, | |
| "epoch": 5.582255083179297, | |
| "learning_rate": 9.399457269831283e-06 | |
| } | |
| }, | |
| { | |
| "step": 5816320, | |
| "logs": { | |
| "loss": 0.3691, | |
| "epoch": 5.600739371534196, | |
| "learning_rate": 9.360128996735755e-06 | |
| } | |
| }, | |
| { | |
| "step": 5835520, | |
| "logs": { | |
| "loss": 0.3684, | |
| "epoch": 5.619223659889094, | |
| "learning_rate": 9.320800723640226e-06 | |
| } | |
| }, | |
| { | |
| "step": 5854720, | |
| "logs": { | |
| "loss": 0.3747, | |
| "epoch": 5.6377079482439925, | |
| "learning_rate": 9.281472450544698e-06 | |
| } | |
| }, | |
| { | |
| "step": 5873920, | |
| "logs": { | |
| "loss": 0.3727, | |
| "epoch": 5.656192236598891, | |
| "learning_rate": 9.24214417744917e-06 | |
| } | |
| }, | |
| { | |
| "step": 5893120, | |
| "logs": { | |
| "loss": 0.3736, | |
| "epoch": 5.67467652495379, | |
| "learning_rate": 9.20281590435364e-06 | |
| } | |
| }, | |
| { | |
| "step": 5912320, | |
| "logs": { | |
| "loss": 0.3725, | |
| "epoch": 5.693160813308688, | |
| "learning_rate": 9.163487631258111e-06 | |
| } | |
| }, | |
| { | |
| "step": 5931520, | |
| "logs": { | |
| "loss": 0.3711, | |
| "epoch": 5.711645101663586, | |
| "learning_rate": 9.124159358162584e-06 | |
| } | |
| }, | |
| { | |
| "step": 5950720, | |
| "logs": { | |
| "loss": 0.3705, | |
| "epoch": 5.730129390018484, | |
| "learning_rate": 9.084831085067054e-06 | |
| } | |
| }, | |
| { | |
| "step": 5969920, | |
| "logs": { | |
| "loss": 0.3698, | |
| "epoch": 5.748613678373383, | |
| "learning_rate": 9.045502811971527e-06 | |
| } | |
| }, | |
| { | |
| "step": 5989120, | |
| "logs": { | |
| "loss": 0.3725, | |
| "epoch": 5.767097966728281, | |
| "learning_rate": 9.006174538875999e-06 | |
| } | |
| }, | |
| { | |
| "step": 6008320, | |
| "logs": { | |
| "loss": 0.3767, | |
| "epoch": 5.785582255083179, | |
| "learning_rate": 8.96684626578047e-06 | |
| } | |
| }, | |
| { | |
| "step": 6027520, | |
| "logs": { | |
| "loss": 0.3696, | |
| "epoch": 5.804066543438077, | |
| "learning_rate": 8.927517992684942e-06 | |
| } | |
| }, | |
| { | |
| "step": 6046720, | |
| "logs": { | |
| "loss": 0.3797, | |
| "epoch": 5.822550831792976, | |
| "learning_rate": 8.888189719589414e-06 | |
| } | |
| }, | |
| { | |
| "step": 6065920, | |
| "logs": { | |
| "loss": 0.371, | |
| "epoch": 5.8410351201478745, | |
| "learning_rate": 8.848861446493885e-06 | |
| } | |
| }, | |
| { | |
| "step": 6085120, | |
| "logs": { | |
| "loss": 0.3769, | |
| "epoch": 5.859519408502773, | |
| "learning_rate": 8.809533173398357e-06 | |
| } | |
| }, | |
| { | |
| "step": 6104320, | |
| "logs": { | |
| "loss": 0.3731, | |
| "epoch": 5.878003696857671, | |
| "learning_rate": 8.77020490030283e-06 | |
| } | |
| }, | |
| { | |
| "step": 6123520, | |
| "logs": { | |
| "loss": 0.3769, | |
| "epoch": 5.896487985212569, | |
| "learning_rate": 8.7308766272073e-06 | |
| } | |
| }, | |
| { | |
| "step": 6142720, | |
| "logs": { | |
| "loss": 0.3711, | |
| "epoch": 5.914972273567468, | |
| "learning_rate": 8.691548354111772e-06 | |
| } | |
| }, | |
| { | |
| "step": 6161920, | |
| "logs": { | |
| "loss": 0.3752, | |
| "epoch": 5.933456561922366, | |
| "learning_rate": 8.652220081016243e-06 | |
| } | |
| }, | |
| { | |
| "step": 6181120, | |
| "logs": { | |
| "loss": 0.3697, | |
| "epoch": 5.951940850277264, | |
| "learning_rate": 8.612891807920715e-06 | |
| } | |
| }, | |
| { | |
| "step": 6200320, | |
| "logs": { | |
| "loss": 0.3751, | |
| "epoch": 5.970425138632162, | |
| "learning_rate": 8.573563534825186e-06 | |
| } | |
| }, | |
| { | |
| "step": 6219520, | |
| "logs": { | |
| "loss": 0.3791, | |
| "epoch": 5.988909426987061, | |
| "learning_rate": 8.534235261729658e-06 | |
| } | |
| }, | |
| { | |
| "step": 6238464, | |
| "logs": { | |
| "loss": 0.3443, | |
| "epoch": 6.007393715341959, | |
| "learning_rate": 8.494906988634129e-06 | |
| } | |
| }, | |
| { | |
| "step": 6257664, | |
| "logs": { | |
| "loss": 0.2903, | |
| "epoch": 6.0258780036968576, | |
| "learning_rate": 8.455578715538601e-06 | |
| } | |
| }, | |
| { | |
| "step": 6276864, | |
| "logs": { | |
| "loss": 0.2906, | |
| "epoch": 6.044362292051756, | |
| "learning_rate": 8.416250442443073e-06 | |
| } | |
| }, | |
| { | |
| "step": 6296064, | |
| "logs": { | |
| "loss": 0.2884, | |
| "epoch": 6.062846580406655, | |
| "learning_rate": 8.376922169347544e-06 | |
| } | |
| }, | |
| { | |
| "step": 6315264, | |
| "logs": { | |
| "loss": 0.2913, | |
| "epoch": 6.081330868761553, | |
| "learning_rate": 8.337593896252016e-06 | |
| } | |
| }, | |
| { | |
| "step": 6334464, | |
| "logs": { | |
| "loss": 0.2964, | |
| "epoch": 6.099815157116451, | |
| "learning_rate": 8.298265623156489e-06 | |
| } | |
| }, | |
| { | |
| "step": 6353664, | |
| "logs": { | |
| "loss": 0.2877, | |
| "epoch": 6.118299445471349, | |
| "learning_rate": 8.25893735006096e-06 | |
| } | |
| }, | |
| { | |
| "step": 6372864, | |
| "logs": { | |
| "loss": 0.2957, | |
| "epoch": 6.136783733826248, | |
| "learning_rate": 8.219609076965432e-06 | |
| } | |
| }, | |
| { | |
| "step": 6392064, | |
| "logs": { | |
| "loss": 0.2974, | |
| "epoch": 6.155268022181146, | |
| "learning_rate": 8.180280803869902e-06 | |
| } | |
| }, | |
| { | |
| "step": 6411264, | |
| "logs": { | |
| "loss": 0.295, | |
| "epoch": 6.173752310536044, | |
| "learning_rate": 8.140952530774374e-06 | |
| } | |
| }, | |
| { | |
| "step": 6430464, | |
| "logs": { | |
| "loss": 0.2947, | |
| "epoch": 6.1922365988909425, | |
| "learning_rate": 8.101624257678847e-06 | |
| } | |
| }, | |
| { | |
| "step": 6449664, | |
| "logs": { | |
| "loss": 0.2957, | |
| "epoch": 6.210720887245841, | |
| "learning_rate": 8.062295984583317e-06 | |
| } | |
| }, | |
| { | |
| "step": 6468864, | |
| "logs": { | |
| "loss": 0.3001, | |
| "epoch": 6.22920517560074, | |
| "learning_rate": 8.02296771148779e-06 | |
| } | |
| }, | |
| { | |
| "step": 6488064, | |
| "logs": { | |
| "loss": 0.2958, | |
| "epoch": 6.247689463955638, | |
| "learning_rate": 7.98363943839226e-06 | |
| } | |
| }, | |
| { | |
| "step": 6507264, | |
| "logs": { | |
| "loss": 0.2956, | |
| "epoch": 6.266173752310536, | |
| "learning_rate": 7.944311165296733e-06 | |
| } | |
| }, | |
| { | |
| "step": 6526464, | |
| "logs": { | |
| "loss": 0.3, | |
| "epoch": 6.284658040665434, | |
| "learning_rate": 7.904982892201203e-06 | |
| } | |
| }, | |
| { | |
| "step": 6545664, | |
| "logs": { | |
| "loss": 0.3, | |
| "epoch": 6.303142329020333, | |
| "learning_rate": 7.865654619105676e-06 | |
| } | |
| }, | |
| { | |
| "step": 6564864, | |
| "logs": { | |
| "loss": 0.3003, | |
| "epoch": 6.321626617375231, | |
| "learning_rate": 7.826326346010146e-06 | |
| } | |
| }, | |
| { | |
| "step": 6584064, | |
| "logs": { | |
| "loss": 0.3029, | |
| "epoch": 6.340110905730129, | |
| "learning_rate": 7.786998072914618e-06 | |
| } | |
| }, | |
| { | |
| "step": 6603264, | |
| "logs": { | |
| "loss": 0.301, | |
| "epoch": 6.358595194085027, | |
| "learning_rate": 7.74766979981909e-06 | |
| } | |
| }, | |
| { | |
| "step": 6622464, | |
| "logs": { | |
| "loss": 0.297, | |
| "epoch": 6.377079482439926, | |
| "learning_rate": 7.708341526723561e-06 | |
| } | |
| }, | |
| { | |
| "step": 6641664, | |
| "logs": { | |
| "loss": 0.2993, | |
| "epoch": 6.3955637707948245, | |
| "learning_rate": 7.669013253628034e-06 | |
| } | |
| }, | |
| { | |
| "step": 6660864, | |
| "logs": { | |
| "loss": 0.3035, | |
| "epoch": 6.414048059149723, | |
| "learning_rate": 7.629684980532506e-06 | |
| } | |
| }, | |
| { | |
| "step": 6680064, | |
| "logs": { | |
| "loss": 0.2988, | |
| "epoch": 6.432532347504621, | |
| "learning_rate": 7.590356707436977e-06 | |
| } | |
| }, | |
| { | |
| "step": 6699264, | |
| "logs": { | |
| "loss": 0.3001, | |
| "epoch": 6.45101663585952, | |
| "learning_rate": 7.551028434341449e-06 | |
| } | |
| }, | |
| { | |
| "step": 6718464, | |
| "logs": { | |
| "loss": 0.3024, | |
| "epoch": 6.469500924214418, | |
| "learning_rate": 7.51170016124592e-06 | |
| } | |
| }, | |
| { | |
| "step": 6737664, | |
| "logs": { | |
| "loss": 0.3053, | |
| "epoch": 6.487985212569316, | |
| "learning_rate": 7.472371888150392e-06 | |
| } | |
| }, | |
| { | |
| "step": 6756864, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.506469500924214, | |
| "learning_rate": 7.433043615054863e-06 | |
| } | |
| }, | |
| { | |
| "step": 6776064, | |
| "logs": { | |
| "loss": 0.3002, | |
| "epoch": 6.524953789279113, | |
| "learning_rate": 7.393715341959336e-06 | |
| } | |
| }, | |
| { | |
| "step": 6795264, | |
| "logs": { | |
| "loss": 0.3044, | |
| "epoch": 6.543438077634011, | |
| "learning_rate": 7.354387068863806e-06 | |
| } | |
| }, | |
| { | |
| "step": 6814464, | |
| "logs": { | |
| "loss": 0.3016, | |
| "epoch": 6.561922365988909, | |
| "learning_rate": 7.3150587957682786e-06 | |
| } | |
| }, | |
| { | |
| "step": 6833664, | |
| "logs": { | |
| "loss": 0.3071, | |
| "epoch": 6.580406654343808, | |
| "learning_rate": 7.27573052267275e-06 | |
| } | |
| }, | |
| { | |
| "step": 6852864, | |
| "logs": { | |
| "loss": 0.3002, | |
| "epoch": 6.598890942698706, | |
| "learning_rate": 7.2364022495772215e-06 | |
| } | |
| }, | |
| { | |
| "step": 6872064, | |
| "logs": { | |
| "loss": 0.3042, | |
| "epoch": 6.617375231053605, | |
| "learning_rate": 7.197073976481693e-06 | |
| } | |
| }, | |
| { | |
| "step": 6891264, | |
| "logs": { | |
| "loss": 0.3042, | |
| "epoch": 6.635859519408503, | |
| "learning_rate": 7.157745703386165e-06 | |
| } | |
| }, | |
| { | |
| "step": 6910464, | |
| "logs": { | |
| "loss": 0.3063, | |
| "epoch": 6.654343807763401, | |
| "learning_rate": 7.118417430290636e-06 | |
| } | |
| }, | |
| { | |
| "step": 6929664, | |
| "logs": { | |
| "loss": 0.3031, | |
| "epoch": 6.672828096118299, | |
| "learning_rate": 7.079089157195108e-06 | |
| } | |
| }, | |
| { | |
| "step": 6948864, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.691312384473198, | |
| "learning_rate": 7.0397608840995805e-06 | |
| } | |
| }, | |
| { | |
| "step": 6968064, | |
| "logs": { | |
| "loss": 0.3041, | |
| "epoch": 6.709796672828096, | |
| "learning_rate": 7.000432611004051e-06 | |
| } | |
| }, | |
| { | |
| "step": 6987264, | |
| "logs": { | |
| "loss": 0.3036, | |
| "epoch": 6.728280961182994, | |
| "learning_rate": 6.961104337908523e-06 | |
| } | |
| }, | |
| { | |
| "step": 7006464, | |
| "logs": { | |
| "loss": 0.3044, | |
| "epoch": 6.7467652495378925, | |
| "learning_rate": 6.921776064812995e-06 | |
| } | |
| }, | |
| { | |
| "step": 7025664, | |
| "logs": { | |
| "loss": 0.3057, | |
| "epoch": 6.7652495378927915, | |
| "learning_rate": 6.882447791717466e-06 | |
| } | |
| }, | |
| { | |
| "step": 7044864, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.78373382624769, | |
| "learning_rate": 6.843119518621938e-06 | |
| } | |
| }, | |
| { | |
| "step": 7064064, | |
| "logs": { | |
| "loss": 0.3058, | |
| "epoch": 6.802218114602588, | |
| "learning_rate": 6.80379124552641e-06 | |
| } | |
| }, | |
| { | |
| "step": 7083264, | |
| "logs": { | |
| "loss": 0.3072, | |
| "epoch": 6.820702402957486, | |
| "learning_rate": 6.764462972430881e-06 | |
| } | |
| }, | |
| { | |
| "step": 7102464, | |
| "logs": { | |
| "loss": 0.3042, | |
| "epoch": 6.839186691312385, | |
| "learning_rate": 6.725134699335353e-06 | |
| } | |
| }, | |
| { | |
| "step": 7121664, | |
| "logs": { | |
| "loss": 0.3091, | |
| "epoch": 6.857670979667283, | |
| "learning_rate": 6.6858064262398245e-06 | |
| } | |
| }, | |
| { | |
| "step": 7140864, | |
| "logs": { | |
| "loss": 0.3036, | |
| "epoch": 6.876155268022181, | |
| "learning_rate": 6.646478153144296e-06 | |
| } | |
| }, | |
| { | |
| "step": 7160064, | |
| "logs": { | |
| "loss": 0.3081, | |
| "epoch": 6.894639556377079, | |
| "learning_rate": 6.607149880048767e-06 | |
| } | |
| }, | |
| { | |
| "step": 7179264, | |
| "logs": { | |
| "loss": 0.3018, | |
| "epoch": 6.913123844731977, | |
| "learning_rate": 6.56782160695324e-06 | |
| } | |
| }, | |
| { | |
| "step": 7198464, | |
| "logs": { | |
| "loss": 0.3055, | |
| "epoch": 6.931608133086876, | |
| "learning_rate": 6.52849333385771e-06 | |
| } | |
| }, | |
| { | |
| "step": 7217664, | |
| "logs": { | |
| "loss": 0.3046, | |
| "epoch": 6.9500924214417745, | |
| "learning_rate": 6.489165060762183e-06 | |
| } | |
| }, | |
| { | |
| "step": 7236864, | |
| "logs": { | |
| "loss": 0.3083, | |
| "epoch": 6.968576709796673, | |
| "learning_rate": 6.449836787666655e-06 | |
| } | |
| }, | |
| { | |
| "step": 7256064, | |
| "logs": { | |
| "loss": 0.3118, | |
| "epoch": 6.987060998151571, | |
| "learning_rate": 6.4105085145711256e-06 | |
| } | |
| }, | |
| { | |
| "step": 7275008, | |
| "logs": { | |
| "loss": 0.2902, | |
| "epoch": 7.00554528650647, | |
| "learning_rate": 6.371180241475597e-06 | |
| } | |
| }, | |
| { | |
| "step": 7294208, | |
| "logs": { | |
| "loss": 0.241, | |
| "epoch": 7.024029574861368, | |
| "learning_rate": 6.331851968380069e-06 | |
| } | |
| }, | |
| { | |
| "step": 7313408, | |
| "logs": { | |
| "loss": 0.2432, | |
| "epoch": 7.042513863216266, | |
| "learning_rate": 6.29252369528454e-06 | |
| } | |
| }, | |
| { | |
| "step": 7332608, | |
| "logs": { | |
| "loss": 0.2405, | |
| "epoch": 7.060998151571164, | |
| "learning_rate": 6.253195422189012e-06 | |
| } | |
| }, | |
| { | |
| "step": 7351808, | |
| "logs": { | |
| "loss": 0.2447, | |
| "epoch": 7.079482439926063, | |
| "learning_rate": 6.2138671490934846e-06 | |
| } | |
| }, | |
| { | |
| "step": 7371008, | |
| "logs": { | |
| "loss": 0.2458, | |
| "epoch": 7.097966728280961, | |
| "learning_rate": 6.174538875997955e-06 | |
| } | |
| }, | |
| { | |
| "step": 7390208, | |
| "logs": { | |
| "loss": 0.2414, | |
| "epoch": 7.116451016635859, | |
| "learning_rate": 6.1352106029024275e-06 | |
| } | |
| }, | |
| { | |
| "step": 7409408, | |
| "logs": { | |
| "loss": 0.2465, | |
| "epoch": 7.134935304990758, | |
| "learning_rate": 6.095882329806899e-06 | |
| } | |
| }, | |
| { | |
| "step": 7428608, | |
| "logs": { | |
| "loss": 0.2474, | |
| "epoch": 7.153419593345657, | |
| "learning_rate": 6.05655405671137e-06 | |
| } | |
| }, | |
| { | |
| "step": 7447808, | |
| "logs": { | |
| "loss": 0.2464, | |
| "epoch": 7.171903881700555, | |
| "learning_rate": 6.017225783615842e-06 | |
| } | |
| }, | |
| { | |
| "step": 7467008, | |
| "logs": { | |
| "loss": 0.2443, | |
| "epoch": 7.190388170055453, | |
| "learning_rate": 5.977897510520314e-06 | |
| } | |
| }, | |
| { | |
| "step": 7486208, | |
| "logs": { | |
| "loss": 0.2466, | |
| "epoch": 7.208872458410351, | |
| "learning_rate": 5.938569237424785e-06 | |
| } | |
| }, | |
| { | |
| "step": 7505408, | |
| "logs": { | |
| "loss": 0.2497, | |
| "epoch": 7.22735674676525, | |
| "learning_rate": 5.899240964329257e-06 | |
| } | |
| }, | |
| { | |
| "step": 7524608, | |
| "logs": { | |
| "loss": 0.2469, | |
| "epoch": 7.245841035120148, | |
| "learning_rate": 5.859912691233728e-06 | |
| } | |
| }, | |
| { | |
| "step": 7543808, | |
| "logs": { | |
| "loss": 0.2468, | |
| "epoch": 7.264325323475046, | |
| "learning_rate": 5.8205844181382e-06 | |
| } | |
| }, | |
| { | |
| "step": 7563008, | |
| "logs": { | |
| "loss": 0.2495, | |
| "epoch": 7.282809611829944, | |
| "learning_rate": 5.7812561450426715e-06 | |
| } | |
| }, | |
| { | |
| "step": 7582208, | |
| "logs": { | |
| "loss": 0.2496, | |
| "epoch": 7.3012939001848425, | |
| "learning_rate": 5.741927871947143e-06 | |
| } | |
| }, | |
| { | |
| "step": 7601408, | |
| "logs": { | |
| "loss": 0.2516, | |
| "epoch": 7.3197781885397415, | |
| "learning_rate": 5.702599598851614e-06 | |
| } | |
| }, | |
| { | |
| "step": 7620608, | |
| "logs": { | |
| "loss": 0.2516, | |
| "epoch": 7.33826247689464, | |
| "learning_rate": 5.663271325756087e-06 | |
| } | |
| }, | |
| { | |
| "step": 7639808, | |
| "logs": { | |
| "loss": 0.2493, | |
| "epoch": 7.356746765249538, | |
| "learning_rate": 5.623943052660557e-06 | |
| } | |
| }, | |
| { | |
| "step": 7659008, | |
| "logs": { | |
| "loss": 0.2458, | |
| "epoch": 7.375231053604436, | |
| "learning_rate": 5.58461477956503e-06 | |
| } | |
| }, | |
| { | |
| "step": 7678208, | |
| "logs": { | |
| "loss": 0.2494, | |
| "epoch": 7.393715341959335, | |
| "learning_rate": 5.545286506469502e-06 | |
| } | |
| }, | |
| { | |
| "step": 7697408, | |
| "logs": { | |
| "loss": 0.2534, | |
| "epoch": 7.412199630314233, | |
| "learning_rate": 5.5059582333739726e-06 | |
| } | |
| }, | |
| { | |
| "step": 7716608, | |
| "logs": { | |
| "loss": 0.2499, | |
| "epoch": 7.430683918669131, | |
| "learning_rate": 5.466629960278445e-06 | |
| } | |
| }, | |
| { | |
| "step": 7735808, | |
| "logs": { | |
| "loss": 0.249, | |
| "epoch": 7.449168207024029, | |
| "learning_rate": 5.427301687182916e-06 | |
| } | |
| }, | |
| { | |
| "step": 7755008, | |
| "logs": { | |
| "loss": 0.2498, | |
| "epoch": 7.467652495378928, | |
| "learning_rate": 5.387973414087388e-06 | |
| } | |
| }, | |
| { | |
| "step": 7774208, | |
| "logs": { | |
| "loss": 0.2541, | |
| "epoch": 7.486136783733826, | |
| "learning_rate": 5.348645140991859e-06 | |
| } | |
| }, | |
| { | |
| "step": 7793408, | |
| "logs": { | |
| "loss": 0.2579, | |
| "epoch": 7.5046210720887245, | |
| "learning_rate": 5.3093168678963316e-06 | |
| } | |
| }, | |
| { | |
| "step": 7812608, | |
| "logs": { | |
| "loss": 0.2476, | |
| "epoch": 7.523105360443623, | |
| "learning_rate": 5.269988594800802e-06 | |
| } | |
| }, | |
| { | |
| "step": 7831808, | |
| "logs": { | |
| "loss": 0.2538, | |
| "epoch": 7.541589648798522, | |
| "learning_rate": 5.2306603217052745e-06 | |
| } | |
| }, | |
| { | |
| "step": 7851008, | |
| "logs": { | |
| "loss": 0.2537, | |
| "epoch": 7.56007393715342, | |
| "learning_rate": 5.191332048609746e-06 | |
| } | |
| }, | |
| { | |
| "step": 7870208, | |
| "logs": { | |
| "loss": 0.2522, | |
| "epoch": 7.578558225508318, | |
| "learning_rate": 5.152003775514217e-06 | |
| } | |
| }, | |
| { | |
| "step": 7889408, | |
| "logs": { | |
| "loss": 0.2491, | |
| "epoch": 7.597042513863216, | |
| "learning_rate": 5.112675502418689e-06 | |
| } | |
| }, | |
| { | |
| "step": 7908608, | |
| "logs": { | |
| "loss": 0.2509, | |
| "epoch": 7.615526802218114, | |
| "learning_rate": 5.073347229323161e-06 | |
| } | |
| }, | |
| { | |
| "step": 7927808, | |
| "logs": { | |
| "loss": 0.2496, | |
| "epoch": 7.634011090573013, | |
| "learning_rate": 5.034018956227632e-06 | |
| } | |
| }, | |
| { | |
| "step": 7947008, | |
| "logs": { | |
| "loss": 0.2542, | |
| "epoch": 7.652495378927911, | |
| "learning_rate": 4.994690683132104e-06 | |
| } | |
| }, | |
| { | |
| "step": 7966208, | |
| "logs": { | |
| "loss": 0.2517, | |
| "epoch": 7.6709796672828094, | |
| "learning_rate": 4.9553624100365756e-06 | |
| } | |
| }, | |
| { | |
| "step": 7985408, | |
| "logs": { | |
| "loss": 0.2544, | |
| "epoch": 7.689463955637708, | |
| "learning_rate": 4.916034136941048e-06 | |
| } | |
| }, | |
| { | |
| "step": 8004608, | |
| "logs": { | |
| "loss": 0.2489, | |
| "epoch": 7.707948243992607, | |
| "learning_rate": 4.876705863845519e-06 | |
| } | |
| }, | |
| { | |
| "step": 8023808, | |
| "logs": { | |
| "loss": 0.2506, | |
| "epoch": 7.726432532347505, | |
| "learning_rate": 4.83737759074999e-06 | |
| } | |
| }, | |
| { | |
| "step": 8043008, | |
| "logs": { | |
| "loss": 0.2535, | |
| "epoch": 7.744916820702403, | |
| "learning_rate": 4.798049317654462e-06 | |
| } | |
| }, | |
| { | |
| "step": 8062208, | |
| "logs": { | |
| "loss": 0.2506, | |
| "epoch": 7.763401109057301, | |
| "learning_rate": 4.758721044558934e-06 | |
| } | |
| }, | |
| { | |
| "step": 8081408, | |
| "logs": { | |
| "loss": 0.2547, | |
| "epoch": 7.7818853974122, | |
| "learning_rate": 4.719392771463405e-06 | |
| } | |
| }, | |
| { | |
| "step": 8100608, | |
| "logs": { | |
| "loss": 0.2525, | |
| "epoch": 7.800369685767098, | |
| "learning_rate": 4.6800644983678775e-06 | |
| } | |
| }, | |
| { | |
| "step": 8119808, | |
| "logs": { | |
| "loss": 0.2535, | |
| "epoch": 7.818853974121996, | |
| "learning_rate": 4.640736225272349e-06 | |
| } | |
| }, | |
| { | |
| "step": 8139008, | |
| "logs": { | |
| "loss": 0.2508, | |
| "epoch": 7.837338262476894, | |
| "learning_rate": 4.60140795217682e-06 | |
| } | |
| }, | |
| { | |
| "step": 8158208, | |
| "logs": { | |
| "loss": 0.254, | |
| "epoch": 7.855822550831793, | |
| "learning_rate": 4.562079679081292e-06 | |
| } | |
| }, | |
| { | |
| "step": 8177408, | |
| "logs": { | |
| "loss": 0.251, | |
| "epoch": 7.8743068391866915, | |
| "learning_rate": 4.522751405985763e-06 | |
| } | |
| }, | |
| { | |
| "step": 8196608, | |
| "logs": { | |
| "loss": 0.2545, | |
| "epoch": 7.89279112754159, | |
| "learning_rate": 4.483423132890235e-06 | |
| } | |
| }, | |
| { | |
| "step": 8215808, | |
| "logs": { | |
| "loss": 0.2497, | |
| "epoch": 7.911275415896488, | |
| "learning_rate": 4.444094859794707e-06 | |
| } | |
| }, | |
| { | |
| "step": 8235008, | |
| "logs": { | |
| "loss": 0.253, | |
| "epoch": 7.929759704251387, | |
| "learning_rate": 4.4047665866991786e-06 | |
| } | |
| }, | |
| { | |
| "step": 8254208, | |
| "logs": { | |
| "loss": 0.249, | |
| "epoch": 7.948243992606285, | |
| "learning_rate": 4.36543831360365e-06 | |
| } | |
| }, | |
| { | |
| "step": 8273408, | |
| "logs": { | |
| "loss": 0.2534, | |
| "epoch": 7.966728280961183, | |
| "learning_rate": 4.3261100405081215e-06 | |
| } | |
| }, | |
| { | |
| "step": 8292608, | |
| "logs": { | |
| "loss": 0.2563, | |
| "epoch": 7.985212569316081, | |
| "learning_rate": 4.286781767412593e-06 | |
| } | |
| }, | |
| { | |
| "step": 8311552, | |
| "logs": { | |
| "loss": 0.2489, | |
| "epoch": 8.00369685767098, | |
| "learning_rate": 4.247453494317064e-06 | |
| } | |
| }, | |
| { | |
| "step": 8330752, | |
| "logs": { | |
| "loss": 0.2079, | |
| "epoch": 8.022181146025877, | |
| "learning_rate": 4.208125221221537e-06 | |
| } | |
| }, | |
| { | |
| "step": 8349952, | |
| "logs": { | |
| "loss": 0.2079, | |
| "epoch": 8.040665434380776, | |
| "learning_rate": 4.168796948126008e-06 | |
| } | |
| }, | |
| { | |
| "step": 8369152, | |
| "logs": { | |
| "loss": 0.2055, | |
| "epoch": 8.059149722735675, | |
| "learning_rate": 4.12946867503048e-06 | |
| } | |
| }, | |
| { | |
| "step": 8388352, | |
| "logs": { | |
| "loss": 0.2115, | |
| "epoch": 8.077634011090574, | |
| "learning_rate": 4.090140401934951e-06 | |
| } | |
| }, | |
| { | |
| "step": 8407552, | |
| "logs": { | |
| "loss": 0.2105, | |
| "epoch": 8.096118299445472, | |
| "learning_rate": 4.050812128839423e-06 | |
| } | |
| }, | |
| { | |
| "step": 8426752, | |
| "logs": { | |
| "loss": 0.2055, | |
| "epoch": 8.11460258780037, | |
| "learning_rate": 4.011483855743895e-06 | |
| } | |
| }, | |
| { | |
| "step": 8445952, | |
| "logs": { | |
| "loss": 0.2086, | |
| "epoch": 8.133086876155268, | |
| "learning_rate": 3.972155582648366e-06 | |
| } | |
| }, | |
| { | |
| "step": 8465152, | |
| "logs": { | |
| "loss": 0.2102, | |
| "epoch": 8.151571164510166, | |
| "learning_rate": 3.932827309552838e-06 | |
| } | |
| }, | |
| { | |
| "step": 8484352, | |
| "logs": { | |
| "loss": 0.21, | |
| "epoch": 8.170055452865064, | |
| "learning_rate": 3.893499036457309e-06 | |
| } | |
| }, | |
| { | |
| "step": 8503552, | |
| "logs": { | |
| "loss": 0.2081, | |
| "epoch": 8.188539741219962, | |
| "learning_rate": 3.854170763361781e-06 | |
| } | |
| }, | |
| { | |
| "step": 8522752, | |
| "logs": { | |
| "loss": 0.213, | |
| "epoch": 8.207024029574862, | |
| "learning_rate": 3.814842490266253e-06 | |
| } | |
| }, | |
| { | |
| "step": 8541952, | |
| "logs": { | |
| "loss": 0.2114, | |
| "epoch": 8.22550831792976, | |
| "learning_rate": 3.7755142171707245e-06 | |
| } | |
| }, | |
| { | |
| "step": 8561152, | |
| "logs": { | |
| "loss": 0.2116, | |
| "epoch": 8.243992606284658, | |
| "learning_rate": 3.736185944075196e-06 | |
| } | |
| }, | |
| { | |
| "step": 8580352, | |
| "logs": { | |
| "loss": 0.2106, | |
| "epoch": 8.262476894639557, | |
| "learning_rate": 3.696857670979668e-06 | |
| } | |
| }, | |
| { | |
| "step": 8599552, | |
| "logs": { | |
| "loss": 0.2097, | |
| "epoch": 8.280961182994455, | |
| "learning_rate": 3.6575293978841393e-06 | |
| } | |
| }, | |
| { | |
| "step": 8618752, | |
| "logs": { | |
| "loss": 0.2119, | |
| "epoch": 8.299445471349353, | |
| "learning_rate": 3.6182011247886107e-06 | |
| } | |
| }, | |
| { | |
| "step": 8637952, | |
| "logs": { | |
| "loss": 0.2144, | |
| "epoch": 8.317929759704251, | |
| "learning_rate": 3.5788728516930826e-06 | |
| } | |
| }, | |
| { | |
| "step": 8657152, | |
| "logs": { | |
| "loss": 0.2125, | |
| "epoch": 8.336414048059149, | |
| "learning_rate": 3.539544578597554e-06 | |
| } | |
| }, | |
| { | |
| "step": 8676352, | |
| "logs": { | |
| "loss": 0.2134, | |
| "epoch": 8.354898336414047, | |
| "learning_rate": 3.5002163055020256e-06 | |
| } | |
| }, | |
| { | |
| "step": 8695552, | |
| "logs": { | |
| "loss": 0.2127, | |
| "epoch": 8.373382624768947, | |
| "learning_rate": 3.4608880324064974e-06 | |
| } | |
| }, | |
| { | |
| "step": 8714752, | |
| "logs": { | |
| "loss": 0.2111, | |
| "epoch": 8.391866913123845, | |
| "learning_rate": 3.421559759310969e-06 | |
| } | |
| }, | |
| { | |
| "step": 8733952, | |
| "logs": { | |
| "loss": 0.213, | |
| "epoch": 8.410351201478743, | |
| "learning_rate": 3.3822314862154404e-06 | |
| } | |
| }, | |
| { | |
| "step": 8753152, | |
| "logs": { | |
| "loss": 0.2109, | |
| "epoch": 8.428835489833642, | |
| "learning_rate": 3.3429032131199122e-06 | |
| } | |
| }, | |
| { | |
| "step": 8772352, | |
| "logs": { | |
| "loss": 0.2093, | |
| "epoch": 8.44731977818854, | |
| "learning_rate": 3.3035749400243837e-06 | |
| } | |
| }, | |
| { | |
| "step": 8791552, | |
| "logs": { | |
| "loss": 0.2126, | |
| "epoch": 8.465804066543438, | |
| "learning_rate": 3.264246666928855e-06 | |
| } | |
| }, | |
| { | |
| "step": 8810752, | |
| "logs": { | |
| "loss": 0.2127, | |
| "epoch": 8.484288354898336, | |
| "learning_rate": 3.2249183938333275e-06 | |
| } | |
| }, | |
| { | |
| "step": 8829952, | |
| "logs": { | |
| "loss": 0.2184, | |
| "epoch": 8.502772643253234, | |
| "learning_rate": 3.1855901207377985e-06 | |
| } | |
| }, | |
| { | |
| "step": 8849152, | |
| "logs": { | |
| "loss": 0.2108, | |
| "epoch": 8.521256931608134, | |
| "learning_rate": 3.14626184764227e-06 | |
| } | |
| }, | |
| { | |
| "step": 8868352, | |
| "logs": { | |
| "loss": 0.2123, | |
| "epoch": 8.539741219963032, | |
| "learning_rate": 3.1069335745467423e-06 | |
| } | |
| }, | |
| { | |
| "step": 8887552, | |
| "logs": { | |
| "loss": 0.2125, | |
| "epoch": 8.55822550831793, | |
| "learning_rate": 3.0676053014512137e-06 | |
| } | |
| }, | |
| { | |
| "step": 8906752, | |
| "logs": { | |
| "loss": 0.2124, | |
| "epoch": 8.576709796672828, | |
| "learning_rate": 3.028277028355685e-06 | |
| } | |
| }, | |
| { | |
| "step": 8925952, | |
| "logs": { | |
| "loss": 0.2112, | |
| "epoch": 8.595194085027726, | |
| "learning_rate": 2.988948755260157e-06 | |
| } | |
| }, | |
| { | |
| "step": 8945152, | |
| "logs": { | |
| "loss": 0.2103, | |
| "epoch": 8.613678373382625, | |
| "learning_rate": 2.9496204821646285e-06 | |
| } | |
| }, | |
| { | |
| "step": 8964352, | |
| "logs": { | |
| "loss": 0.2128, | |
| "epoch": 8.632162661737523, | |
| "learning_rate": 2.9102922090691e-06 | |
| } | |
| }, | |
| { | |
| "step": 8983552, | |
| "logs": { | |
| "loss": 0.2125, | |
| "epoch": 8.65064695009242, | |
| "learning_rate": 2.8709639359735715e-06 | |
| } | |
| }, | |
| { | |
| "step": 9002752, | |
| "logs": { | |
| "loss": 0.2109, | |
| "epoch": 8.669131238447319, | |
| "learning_rate": 2.8316356628780434e-06 | |
| } | |
| }, | |
| { | |
| "step": 9021952, | |
| "logs": { | |
| "loss": 0.2132, | |
| "epoch": 8.687615526802219, | |
| "learning_rate": 2.792307389782515e-06 | |
| } | |
| }, | |
| { | |
| "step": 9041152, | |
| "logs": { | |
| "loss": 0.2113, | |
| "epoch": 8.706099815157117, | |
| "learning_rate": 2.7529791166869863e-06 | |
| } | |
| }, | |
| { | |
| "step": 9060352, | |
| "logs": { | |
| "loss": 0.2109, | |
| "epoch": 8.724584103512015, | |
| "learning_rate": 2.713650843591458e-06 | |
| } | |
| }, | |
| { | |
| "step": 9079552, | |
| "logs": { | |
| "loss": 0.2138, | |
| "epoch": 8.743068391866913, | |
| "learning_rate": 2.6743225704959296e-06 | |
| } | |
| }, | |
| { | |
| "step": 9098752, | |
| "logs": { | |
| "loss": 0.2098, | |
| "epoch": 8.761552680221811, | |
| "learning_rate": 2.634994297400401e-06 | |
| } | |
| }, | |
| { | |
| "step": 9117952, | |
| "logs": { | |
| "loss": 0.2128, | |
| "epoch": 8.78003696857671, | |
| "learning_rate": 2.595666024304873e-06 | |
| } | |
| }, | |
| { | |
| "step": 9137152, | |
| "logs": { | |
| "loss": 0.2143, | |
| "epoch": 8.798521256931608, | |
| "learning_rate": 2.5563377512093444e-06 | |
| } | |
| }, | |
| { | |
| "step": 9156352, | |
| "logs": { | |
| "loss": 0.2132, | |
| "epoch": 8.817005545286506, | |
| "learning_rate": 2.517009478113816e-06 | |
| } | |
| }, | |
| { | |
| "step": 9175552, | |
| "logs": { | |
| "loss": 0.2099, | |
| "epoch": 8.835489833641406, | |
| "learning_rate": 2.4776812050182878e-06 | |
| } | |
| }, | |
| { | |
| "step": 9194752, | |
| "logs": { | |
| "loss": 0.2124, | |
| "epoch": 8.853974121996304, | |
| "learning_rate": 2.4383529319227597e-06 | |
| } | |
| }, | |
| { | |
| "step": 9213952, | |
| "logs": { | |
| "loss": 0.2122, | |
| "epoch": 8.872458410351202, | |
| "learning_rate": 2.399024658827231e-06 | |
| } | |
| }, | |
| { | |
| "step": 9233152, | |
| "logs": { | |
| "loss": 0.2136, | |
| "epoch": 8.8909426987061, | |
| "learning_rate": 2.3596963857317026e-06 | |
| } | |
| }, | |
| { | |
| "step": 9252352, | |
| "logs": { | |
| "loss": 0.2103, | |
| "epoch": 8.909426987060998, | |
| "learning_rate": 2.3203681126361745e-06 | |
| } | |
| }, | |
| { | |
| "step": 9271552, | |
| "logs": { | |
| "loss": 0.2132, | |
| "epoch": 8.927911275415896, | |
| "learning_rate": 2.281039839540646e-06 | |
| } | |
| }, | |
| { | |
| "step": 9290752, | |
| "logs": { | |
| "loss": 0.2082, | |
| "epoch": 8.946395563770794, | |
| "learning_rate": 2.2417115664451174e-06 | |
| } | |
| }, | |
| { | |
| "step": 9309952, | |
| "logs": { | |
| "loss": 0.213, | |
| "epoch": 8.964879852125692, | |
| "learning_rate": 2.2023832933495893e-06 | |
| } | |
| }, | |
| { | |
| "step": 9329152, | |
| "logs": { | |
| "loss": 0.2142, | |
| "epoch": 8.98336414048059, | |
| "learning_rate": 2.1630550202540607e-06 | |
| } | |
| }, | |
| { | |
| "step": 9348096, | |
| "logs": { | |
| "loss": 0.2123, | |
| "epoch": 9.00184842883549, | |
| "learning_rate": 2.123726747158532e-06 | |
| } | |
| }, | |
| { | |
| "step": 9367296, | |
| "logs": { | |
| "loss": 0.1854, | |
| "epoch": 9.020332717190389, | |
| "learning_rate": 2.084398474063004e-06 | |
| } | |
| }, | |
| { | |
| "step": 9386496, | |
| "logs": { | |
| "loss": 0.1848, | |
| "epoch": 9.038817005545287, | |
| "learning_rate": 2.0450702009674755e-06 | |
| } | |
| }, | |
| { | |
| "step": 9405696, | |
| "logs": { | |
| "loss": 0.1802, | |
| "epoch": 9.057301293900185, | |
| "learning_rate": 2.0057419278719474e-06 | |
| } | |
| }, | |
| { | |
| "step": 9424896, | |
| "logs": { | |
| "loss": 0.1859, | |
| "epoch": 9.075785582255083, | |
| "learning_rate": 1.966413654776419e-06 | |
| } | |
| }, | |
| { | |
| "step": 9444096, | |
| "logs": { | |
| "loss": 0.1849, | |
| "epoch": 9.094269870609981, | |
| "learning_rate": 1.9270853816808904e-06 | |
| } | |
| }, | |
| { | |
| "step": 9463296, | |
| "logs": { | |
| "loss": 0.1841, | |
| "epoch": 9.11275415896488, | |
| "learning_rate": 1.8877571085853622e-06 | |
| } | |
| }, | |
| { | |
| "step": 9482496, | |
| "logs": { | |
| "loss": 0.1854, | |
| "epoch": 9.131238447319777, | |
| "learning_rate": 1.848428835489834e-06 | |
| } | |
| }, | |
| { | |
| "step": 9501696, | |
| "logs": { | |
| "loss": 0.1847, | |
| "epoch": 9.149722735674677, | |
| "learning_rate": 1.8091005623943054e-06 | |
| } | |
| }, | |
| { | |
| "step": 9520896, | |
| "logs": { | |
| "loss": 0.1852, | |
| "epoch": 9.168207024029575, | |
| "learning_rate": 1.769772289298777e-06 | |
| } | |
| }, | |
| { | |
| "step": 9540096, | |
| "logs": { | |
| "loss": 0.1846, | |
| "epoch": 9.186691312384474, | |
| "learning_rate": 1.7304440162032487e-06 | |
| } | |
| }, | |
| { | |
| "step": 9559296, | |
| "logs": { | |
| "loss": 0.1848, | |
| "epoch": 9.205175600739372, | |
| "learning_rate": 1.6911157431077202e-06 | |
| } | |
| }, | |
| { | |
| "step": 9578496, | |
| "logs": { | |
| "loss": 0.1861, | |
| "epoch": 9.22365988909427, | |
| "learning_rate": 1.6517874700121919e-06 | |
| } | |
| }, | |
| { | |
| "step": 9597696, | |
| "logs": { | |
| "loss": 0.185, | |
| "epoch": 9.242144177449168, | |
| "learning_rate": 1.6124591969166637e-06 | |
| } | |
| }, | |
| { | |
| "step": 9616896, | |
| "logs": { | |
| "loss": 0.1846, | |
| "epoch": 9.260628465804066, | |
| "learning_rate": 1.573130923821135e-06 | |
| } | |
| }, | |
| { | |
| "step": 9636096, | |
| "logs": { | |
| "loss": 0.1827, | |
| "epoch": 9.279112754158964, | |
| "learning_rate": 1.5338026507256069e-06 | |
| } | |
| }, | |
| { | |
| "step": 9655296, | |
| "logs": { | |
| "loss": 0.1871, | |
| "epoch": 9.297597042513864, | |
| "learning_rate": 1.4944743776300785e-06 | |
| } | |
| }, | |
| { | |
| "step": 9674496, | |
| "logs": { | |
| "loss": 0.1865, | |
| "epoch": 9.316081330868762, | |
| "learning_rate": 1.45514610453455e-06 | |
| } | |
| }, | |
| { | |
| "step": 9693696, | |
| "logs": { | |
| "loss": 0.1859, | |
| "epoch": 9.33456561922366, | |
| "learning_rate": 1.4158178314390217e-06 | |
| } | |
| }, | |
| { | |
| "step": 9712896, | |
| "logs": { | |
| "loss": 0.1874, | |
| "epoch": 9.353049907578558, | |
| "learning_rate": 1.3764895583434931e-06 | |
| } | |
| }, | |
| { | |
| "step": 9732096, | |
| "logs": { | |
| "loss": 0.1847, | |
| "epoch": 9.371534195933457, | |
| "learning_rate": 1.3371612852479648e-06 | |
| } | |
| }, | |
| { | |
| "step": 9751296, | |
| "logs": { | |
| "loss": 0.1849, | |
| "epoch": 9.390018484288355, | |
| "learning_rate": 1.2978330121524365e-06 | |
| } | |
| }, | |
| { | |
| "step": 9770496, | |
| "logs": { | |
| "loss": 0.1895, | |
| "epoch": 9.408502772643253, | |
| "learning_rate": 1.258504739056908e-06 | |
| } | |
| }, | |
| { | |
| "step": 9789696, | |
| "logs": { | |
| "loss": 0.1829, | |
| "epoch": 9.426987060998151, | |
| "learning_rate": 1.2191764659613798e-06 | |
| } | |
| }, | |
| { | |
| "step": 9808896, | |
| "logs": { | |
| "loss": 0.1837, | |
| "epoch": 9.445471349353049, | |
| "learning_rate": 1.1798481928658513e-06 | |
| } | |
| }, | |
| { | |
| "step": 9828096, | |
| "logs": { | |
| "loss": 0.1864, | |
| "epoch": 9.463955637707949, | |
| "learning_rate": 1.140519919770323e-06 | |
| } | |
| }, | |
| { | |
| "step": 9847296, | |
| "logs": { | |
| "loss": 0.1862, | |
| "epoch": 9.482439926062847, | |
| "learning_rate": 1.1011916466747946e-06 | |
| } | |
| }, | |
| { | |
| "step": 9866496, | |
| "logs": { | |
| "loss": 0.19, | |
| "epoch": 9.500924214417745, | |
| "learning_rate": 1.061863373579266e-06 | |
| } | |
| }, | |
| { | |
| "step": 9885696, | |
| "logs": { | |
| "loss": 0.1834, | |
| "epoch": 9.519408502772643, | |
| "learning_rate": 1.0225351004837378e-06 | |
| } | |
| }, | |
| { | |
| "step": 9904896, | |
| "logs": { | |
| "loss": 0.1863, | |
| "epoch": 9.537892791127542, | |
| "learning_rate": 9.832068273882094e-07 | |
| } | |
| }, | |
| { | |
| "step": 9924096, | |
| "logs": { | |
| "loss": 0.1859, | |
| "epoch": 9.55637707948244, | |
| "learning_rate": 9.438785542926811e-07 | |
| } | |
| }, | |
| { | |
| "step": 9943296, | |
| "logs": { | |
| "loss": 0.1829, | |
| "epoch": 9.574861367837338, | |
| "learning_rate": 9.045502811971527e-07 | |
| } | |
| }, | |
| { | |
| "step": 9962496, | |
| "logs": { | |
| "loss": 0.1838, | |
| "epoch": 9.593345656192236, | |
| "learning_rate": 8.652220081016244e-07 | |
| } | |
| }, | |
| { | |
| "step": 9981696, | |
| "logs": { | |
| "loss": 0.1817, | |
| "epoch": 9.611829944547136, | |
| "learning_rate": 8.258937350060959e-07 | |
| } | |
| }, | |
| { | |
| "step": 10000896, | |
| "logs": { | |
| "loss": 0.1834, | |
| "epoch": 9.630314232902034, | |
| "learning_rate": 7.865654619105675e-07 | |
| } | |
| }, | |
| { | |
| "step": 10020096, | |
| "logs": { | |
| "loss": 0.1857, | |
| "epoch": 9.648798521256932, | |
| "learning_rate": 7.472371888150393e-07 | |
| } | |
| }, | |
| { | |
| "step": 10039296, | |
| "logs": { | |
| "loss": 0.1858, | |
| "epoch": 9.66728280961183, | |
| "learning_rate": 7.079089157195108e-07 | |
| } | |
| }, | |
| { | |
| "step": 10058496, | |
| "logs": { | |
| "loss": 0.1858, | |
| "epoch": 9.685767097966728, | |
| "learning_rate": 6.685806426239824e-07 | |
| } | |
| }, | |
| { | |
| "step": 10077696, | |
| "logs": { | |
| "loss": 0.1848, | |
| "epoch": 9.704251386321626, | |
| "learning_rate": 6.29252369528454e-07 | |
| } | |
| }, | |
| { | |
| "step": 10096896, | |
| "logs": { | |
| "loss": 0.1832, | |
| "epoch": 9.722735674676525, | |
| "learning_rate": 5.899240964329256e-07 | |
| } | |
| }, | |
| { | |
| "step": 10116096, | |
| "logs": { | |
| "loss": 0.1842, | |
| "epoch": 9.741219963031423, | |
| "learning_rate": 5.505958233373973e-07 | |
| } | |
| }, | |
| { | |
| "step": 10135296, | |
| "logs": { | |
| "loss": 0.1842, | |
| "epoch": 9.75970425138632, | |
| "learning_rate": 5.112675502418689e-07 | |
| } | |
| }, | |
| { | |
| "step": 10154496, | |
| "logs": { | |
| "loss": 0.1847, | |
| "epoch": 9.77818853974122, | |
| "learning_rate": 4.7193927714634056e-07 | |
| } | |
| }, | |
| { | |
| "step": 10173696, | |
| "logs": { | |
| "loss": 0.185, | |
| "epoch": 9.796672828096119, | |
| "learning_rate": 4.326110040508122e-07 | |
| } | |
| }, | |
| { | |
| "step": 10192896, | |
| "logs": { | |
| "loss": 0.1826, | |
| "epoch": 9.815157116451017, | |
| "learning_rate": 3.9328273095528375e-07 | |
| } | |
| }, | |
| { | |
| "step": 10212096, | |
| "logs": { | |
| "loss": 0.1833, | |
| "epoch": 9.833641404805915, | |
| "learning_rate": 3.539544578597554e-07 | |
| } | |
| }, | |
| { | |
| "step": 10231296, | |
| "logs": { | |
| "loss": 0.1846, | |
| "epoch": 9.852125693160813, | |
| "learning_rate": 3.14626184764227e-07 | |
| } | |
| }, | |
| { | |
| "step": 10250496, | |
| "logs": { | |
| "loss": 0.184, | |
| "epoch": 9.870609981515711, | |
| "learning_rate": 2.7529791166869866e-07 | |
| } | |
| }, | |
| { | |
| "step": 10269696, | |
| "logs": { | |
| "loss": 0.1864, | |
| "epoch": 9.88909426987061, | |
| "learning_rate": 2.3596963857317028e-07 | |
| } | |
| }, | |
| { | |
| "step": 10288896, | |
| "logs": { | |
| "loss": 0.1841, | |
| "epoch": 9.907578558225508, | |
| "learning_rate": 1.9664136547764187e-07 | |
| } | |
| }, | |
| { | |
| "step": 10308096, | |
| "logs": { | |
| "loss": 0.1855, | |
| "epoch": 9.926062846580407, | |
| "learning_rate": 1.573130923821135e-07 | |
| } | |
| }, | |
| { | |
| "step": 10327296, | |
| "logs": { | |
| "loss": 0.1794, | |
| "epoch": 9.944547134935306, | |
| "learning_rate": 1.1798481928658514e-07 | |
| } | |
| }, | |
| { | |
| "step": 10346496, | |
| "logs": { | |
| "loss": 0.1853, | |
| "epoch": 9.963031423290204, | |
| "learning_rate": 7.865654619105675e-08 | |
| } | |
| }, | |
| { | |
| "step": 10365696, | |
| "logs": { | |
| "loss": 0.1855, | |
| "epoch": 9.981515711645102, | |
| "learning_rate": 3.9328273095528373e-08 | |
| } | |
| } | |
| ], | |
| "Evaluation": [ | |
| { | |
| "step": 2705, | |
| "logs": { | |
| "eval_loss": 0.9760558605194092 | |
| } | |
| }, | |
| { | |
| "step": 5410, | |
| "logs": { | |
| "eval_loss": 0.9268760681152344 | |
| } | |
| }, | |
| { | |
| "step": 8115, | |
| "logs": { | |
| "eval_loss": 0.9153628945350647 | |
| } | |
| }, | |
| { | |
| "step": 10820, | |
| "logs": { | |
| "eval_loss": 0.9207033514976501 | |
| } | |
| }, | |
| { | |
| "step": 13525, | |
| "logs": { | |
| "eval_loss": 0.9357024431228638 | |
| } | |
| }, | |
| { | |
| "step": 16230, | |
| "logs": { | |
| "eval_loss": 0.948551595211029 | |
| } | |
| }, | |
| { | |
| "step": 18935, | |
| "logs": { | |
| "eval_loss": 0.992328941822052 | |
| } | |
| }, | |
| { | |
| "step": 21640, | |
| "logs": { | |
| "eval_loss": 1.0297634601593018 | |
| } | |
| }, | |
| { | |
| "step": 24345, | |
| "logs": { | |
| "eval_loss": 1.0606719255447388 | |
| } | |
| }, | |
| { | |
| "step": 27050, | |
| "logs": { | |
| "eval_loss": 1.0935026407241821 | |
| } | |
| } | |
| ] | |
| } | |
| } |