|
{ |
|
"batch_size": 128, |
|
"best_eval_metric_checkpoint_number": 18, |
|
"best_eval_metric_epoch": 10, |
|
"best_eval_metric_steps": 470, |
|
"best_eval_metric_value": 0.6166250705718994, |
|
"best_eval_test_metrics": { |
|
"combined": { |
|
"loss": 3.0807435512542725 |
|
}, |
|
"intent": { |
|
"accuracy": 0.5496426820755005, |
|
"accuracy_micro": 0.5959885120391846, |
|
"hits_at_k": 0.6660665273666382, |
|
"loss": 3.0807435512542725, |
|
"roc_auc": 0.9340102672576904 |
|
} |
|
}, |
|
"best_eval_train_metrics": { |
|
"combined": { |
|
"loss": 0.15086334943771362 |
|
}, |
|
"intent": { |
|
"accuracy": 0.9410130977630615, |
|
"accuracy_micro": 0.9574396014213562, |
|
"hits_at_k": 0.9925163984298706, |
|
"loss": 0.15086334943771362, |
|
"roc_auc": 0.9996311664581299 |
|
} |
|
}, |
|
"best_eval_validation_metrics": { |
|
"combined": { |
|
"loss": 2.5151546001434326 |
|
}, |
|
"intent": { |
|
"accuracy": 0.6166250705718994, |
|
"accuracy_micro": 0.63271164894104, |
|
"hits_at_k": 0.7617202997207642, |
|
"loss": 2.5151546001434326, |
|
"roc_auc": 0.9704092144966125 |
|
} |
|
}, |
|
"best_increase_batch_size_eval_metric": Infinity, |
|
"checkpoint_number": 20, |
|
"checkpoint_to_epoch": { |
|
"1": 1, |
|
"10": 5, |
|
"11": 6, |
|
"12": 6, |
|
"13": 7, |
|
"14": 7, |
|
"15": 8, |
|
"16": 8, |
|
"17": 9, |
|
"18": 9, |
|
"19": 10, |
|
"2": 1, |
|
"20": 10, |
|
"3": 2, |
|
"4": 2, |
|
"5": 3, |
|
"6": 3, |
|
"7": 4, |
|
"8": 4, |
|
"9": 5 |
|
}, |
|
"checkpoint_to_step": { |
|
"1": 47, |
|
"10": 235, |
|
"11": 282, |
|
"12": 282, |
|
"13": 329, |
|
"14": 329, |
|
"15": 376, |
|
"16": 376, |
|
"17": 423, |
|
"18": 423, |
|
"19": 470, |
|
"2": 47, |
|
"20": 470, |
|
"3": 94, |
|
"4": 94, |
|
"5": 141, |
|
"6": 141, |
|
"7": 188, |
|
"8": 188, |
|
"9": 235 |
|
}, |
|
"cumulative_checkpoint_token_usage": { |
|
"1": 1521697, |
|
"10": 7608485, |
|
"11": 9130182, |
|
"12": 9130182, |
|
"13": 10651879, |
|
"14": 10651879, |
|
"15": 12173576, |
|
"16": 12173576, |
|
"17": 13695273, |
|
"18": 13695273, |
|
"19": 15216970, |
|
"2": 1521697, |
|
"20": 15216970, |
|
"3": 3043394, |
|
"4": 3043394, |
|
"5": 4565091, |
|
"6": 4565091, |
|
"7": 6086788, |
|
"8": 6086788, |
|
"9": 7608485 |
|
}, |
|
"cumulative_step_token_usage": { |
|
"0": 32896, |
|
"1": 65792, |
|
"10": 361856, |
|
"100": 3273666, |
|
"101": 3306562, |
|
"102": 3339458, |
|
"103": 3372354, |
|
"104": 3405250, |
|
"105": 3438146, |
|
"106": 3471042, |
|
"107": 3503938, |
|
"108": 3536834, |
|
"109": 3569730, |
|
"11": 394752, |
|
"110": 3602626, |
|
"111": 3635522, |
|
"112": 3668418, |
|
"113": 3701314, |
|
"114": 3734210, |
|
"115": 3767106, |
|
"116": 3800002, |
|
"117": 3832898, |
|
"118": 3865794, |
|
"119": 3898690, |
|
"12": 427648, |
|
"120": 3931586, |
|
"121": 3964482, |
|
"122": 3997378, |
|
"123": 4030274, |
|
"124": 4063170, |
|
"125": 4096066, |
|
"126": 4128962, |
|
"127": 4161858, |
|
"128": 4194754, |
|
"129": 4227650, |
|
"13": 460544, |
|
"130": 4260546, |
|
"131": 4293442, |
|
"132": 4326338, |
|
"133": 4359234, |
|
"134": 4392130, |
|
"135": 4425026, |
|
"136": 4457922, |
|
"137": 4490818, |
|
"138": 4523714, |
|
"139": 4556610, |
|
"14": 493440, |
|
"140": 4565091, |
|
"141": 4597987, |
|
"142": 4630883, |
|
"143": 4663779, |
|
"144": 4696675, |
|
"145": 4729571, |
|
"146": 4762467, |
|
"147": 4795363, |
|
"148": 4828259, |
|
"149": 4861155, |
|
"15": 526336, |
|
"150": 4894051, |
|
"151": 4926947, |
|
"152": 4959843, |
|
"153": 4992739, |
|
"154": 5025635, |
|
"155": 5058531, |
|
"156": 5091427, |
|
"157": 5124323, |
|
"158": 5157219, |
|
"159": 5190115, |
|
"16": 559232, |
|
"160": 5223011, |
|
"161": 5255907, |
|
"162": 5288803, |
|
"163": 5321699, |
|
"164": 5354595, |
|
"165": 5387491, |
|
"166": 5420387, |
|
"167": 5453283, |
|
"168": 5486179, |
|
"169": 5519075, |
|
"17": 592128, |
|
"170": 5551971, |
|
"171": 5584867, |
|
"172": 5617763, |
|
"173": 5650659, |
|
"174": 5683555, |
|
"175": 5716451, |
|
"176": 5749347, |
|
"177": 5782243, |
|
"178": 5815139, |
|
"179": 5848035, |
|
"18": 625024, |
|
"180": 5880931, |
|
"181": 5913827, |
|
"182": 5946723, |
|
"183": 5979619, |
|
"184": 6012515, |
|
"185": 6045411, |
|
"186": 6078307, |
|
"187": 6086788, |
|
"188": 6119684, |
|
"189": 6152580, |
|
"19": 657920, |
|
"190": 6185476, |
|
"191": 6218372, |
|
"192": 6251268, |
|
"193": 6284164, |
|
"194": 6317060, |
|
"195": 6349956, |
|
"196": 6382852, |
|
"197": 6415748, |
|
"198": 6448644, |
|
"199": 6481540, |
|
"2": 98688, |
|
"20": 690816, |
|
"200": 6514436, |
|
"201": 6547332, |
|
"202": 6580228, |
|
"203": 6613124, |
|
"204": 6646020, |
|
"205": 6678916, |
|
"206": 6711812, |
|
"207": 6744708, |
|
"208": 6777604, |
|
"209": 6810500, |
|
"21": 723712, |
|
"210": 6843396, |
|
"211": 6876292, |
|
"212": 6909188, |
|
"213": 6942084, |
|
"214": 6974980, |
|
"215": 7007876, |
|
"216": 7040772, |
|
"217": 7073668, |
|
"218": 7106564, |
|
"219": 7139460, |
|
"22": 756608, |
|
"220": 7172356, |
|
"221": 7205252, |
|
"222": 7238148, |
|
"223": 7271044, |
|
"224": 7303940, |
|
"225": 7336836, |
|
"226": 7369732, |
|
"227": 7402628, |
|
"228": 7435524, |
|
"229": 7468420, |
|
"23": 789504, |
|
"230": 7501316, |
|
"231": 7534212, |
|
"232": 7567108, |
|
"233": 7600004, |
|
"234": 7608485, |
|
"235": 7641381, |
|
"236": 7674277, |
|
"237": 7707173, |
|
"238": 7740069, |
|
"239": 7772965, |
|
"24": 822400, |
|
"240": 7805861, |
|
"241": 7838757, |
|
"242": 7871653, |
|
"243": 7904549, |
|
"244": 7937445, |
|
"245": 7970341, |
|
"246": 8003237, |
|
"247": 8036133, |
|
"248": 8069029, |
|
"249": 8101925, |
|
"25": 855296, |
|
"250": 8134821, |
|
"251": 8167717, |
|
"252": 8200613, |
|
"253": 8233509, |
|
"254": 8266405, |
|
"255": 8299301, |
|
"256": 8332197, |
|
"257": 8365093, |
|
"258": 8397989, |
|
"259": 8430885, |
|
"26": 888192, |
|
"260": 8463781, |
|
"261": 8496677, |
|
"262": 8529573, |
|
"263": 8562469, |
|
"264": 8595365, |
|
"265": 8628261, |
|
"266": 8661157, |
|
"267": 8694053, |
|
"268": 8726949, |
|
"269": 8759845, |
|
"27": 921088, |
|
"270": 8792741, |
|
"271": 8825637, |
|
"272": 8858533, |
|
"273": 8891429, |
|
"274": 8924325, |
|
"275": 8957221, |
|
"276": 8990117, |
|
"277": 9023013, |
|
"278": 9055909, |
|
"279": 9088805, |
|
"28": 953984, |
|
"280": 9121701, |
|
"281": 9130182, |
|
"282": 9163078, |
|
"283": 9195974, |
|
"284": 9228870, |
|
"285": 9261766, |
|
"286": 9294662, |
|
"287": 9327558, |
|
"288": 9360454, |
|
"289": 9393350, |
|
"29": 986880, |
|
"290": 9426246, |
|
"291": 9459142, |
|
"292": 9492038, |
|
"293": 9524934, |
|
"294": 9557830, |
|
"295": 9590726, |
|
"296": 9623622, |
|
"297": 9656518, |
|
"298": 9689414, |
|
"299": 9722310, |
|
"3": 131584, |
|
"30": 1019776, |
|
"300": 9755206, |
|
"301": 9788102, |
|
"302": 9820998, |
|
"303": 9853894, |
|
"304": 9886790, |
|
"305": 9919686, |
|
"306": 9952582, |
|
"307": 9985478, |
|
"308": 10018374, |
|
"309": 10051270, |
|
"31": 1052672, |
|
"310": 10084166, |
|
"311": 10117062, |
|
"312": 10149958, |
|
"313": 10182854, |
|
"314": 10215750, |
|
"315": 10248646, |
|
"316": 10281542, |
|
"317": 10314438, |
|
"318": 10347334, |
|
"319": 10380230, |
|
"32": 1085568, |
|
"320": 10413126, |
|
"321": 10446022, |
|
"322": 10478918, |
|
"323": 10511814, |
|
"324": 10544710, |
|
"325": 10577606, |
|
"326": 10610502, |
|
"327": 10643398, |
|
"328": 10651879, |
|
"329": 10684775, |
|
"33": 1118464, |
|
"330": 10717671, |
|
"331": 10750567, |
|
"332": 10783463, |
|
"333": 10816359, |
|
"334": 10849255, |
|
"335": 10882151, |
|
"336": 10915047, |
|
"337": 10947943, |
|
"338": 10980839, |
|
"339": 11013735, |
|
"34": 1151360, |
|
"340": 11046631, |
|
"341": 11079527, |
|
"342": 11112423, |
|
"343": 11145319, |
|
"344": 11178215, |
|
"345": 11211111, |
|
"346": 11244007, |
|
"347": 11276903, |
|
"348": 11309799, |
|
"349": 11342695, |
|
"35": 1184256, |
|
"350": 11375591, |
|
"351": 11408487, |
|
"352": 11441383, |
|
"353": 11474279, |
|
"354": 11507175, |
|
"355": 11540071, |
|
"356": 11572967, |
|
"357": 11605863, |
|
"358": 11638759, |
|
"359": 11671655, |
|
"36": 1217152, |
|
"360": 11704551, |
|
"361": 11737447, |
|
"362": 11770343, |
|
"363": 11803239, |
|
"364": 11836135, |
|
"365": 11869031, |
|
"366": 11901927, |
|
"367": 11934823, |
|
"368": 11967719, |
|
"369": 12000615, |
|
"37": 1250048, |
|
"370": 12033511, |
|
"371": 12066407, |
|
"372": 12099303, |
|
"373": 12132199, |
|
"374": 12165095, |
|
"375": 12173576, |
|
"376": 12206472, |
|
"377": 12239368, |
|
"378": 12272264, |
|
"379": 12305160, |
|
"38": 1282944, |
|
"380": 12338056, |
|
"381": 12370952, |
|
"382": 12403848, |
|
"383": 12436744, |
|
"384": 12469640, |
|
"385": 12502536, |
|
"386": 12535432, |
|
"387": 12568328, |
|
"388": 12601224, |
|
"389": 12634120, |
|
"39": 1315840, |
|
"390": 12667016, |
|
"391": 12699912, |
|
"392": 12732808, |
|
"393": 12765704, |
|
"394": 12798600, |
|
"395": 12831496, |
|
"396": 12864392, |
|
"397": 12897288, |
|
"398": 12930184, |
|
"399": 12963080, |
|
"4": 164480, |
|
"40": 1348736, |
|
"400": 12995976, |
|
"401": 13028872, |
|
"402": 13061768, |
|
"403": 13094664, |
|
"404": 13127560, |
|
"405": 13160456, |
|
"406": 13193352, |
|
"407": 13226248, |
|
"408": 13259144, |
|
"409": 13292040, |
|
"41": 1381632, |
|
"410": 13324936, |
|
"411": 13357832, |
|
"412": 13390728, |
|
"413": 13423624, |
|
"414": 13456520, |
|
"415": 13489416, |
|
"416": 13522312, |
|
"417": 13555208, |
|
"418": 13588104, |
|
"419": 13621000, |
|
"42": 1414528, |
|
"420": 13653896, |
|
"421": 13686792, |
|
"422": 13695273, |
|
"423": 13728169, |
|
"424": 13761065, |
|
"425": 13793961, |
|
"426": 13826857, |
|
"427": 13859753, |
|
"428": 13892649, |
|
"429": 13925545, |
|
"43": 1447424, |
|
"430": 13958441, |
|
"431": 13991337, |
|
"432": 14024233, |
|
"433": 14057129, |
|
"434": 14090025, |
|
"435": 14122921, |
|
"436": 14155817, |
|
"437": 14188713, |
|
"438": 14221609, |
|
"439": 14254505, |
|
"44": 1480320, |
|
"440": 14287401, |
|
"441": 14320297, |
|
"442": 14353193, |
|
"443": 14386089, |
|
"444": 14418985, |
|
"445": 14451881, |
|
"446": 14484777, |
|
"447": 14517673, |
|
"448": 14550569, |
|
"449": 14583465, |
|
"45": 1513216, |
|
"450": 14616361, |
|
"451": 14649257, |
|
"452": 14682153, |
|
"453": 14715049, |
|
"454": 14747945, |
|
"455": 14780841, |
|
"456": 14813737, |
|
"457": 14846633, |
|
"458": 14879529, |
|
"459": 14912425, |
|
"46": 1521697, |
|
"460": 14945321, |
|
"461": 14978217, |
|
"462": 15011113, |
|
"463": 15044009, |
|
"464": 15076905, |
|
"465": 15109801, |
|
"466": 15142697, |
|
"467": 15175593, |
|
"468": 15208489, |
|
"469": 15216970, |
|
"47": 1554593, |
|
"48": 1587489, |
|
"49": 1620385, |
|
"5": 197376, |
|
"50": 1653281, |
|
"51": 1686177, |
|
"52": 1719073, |
|
"53": 1751969, |
|
"54": 1784865, |
|
"55": 1817761, |
|
"56": 1850657, |
|
"57": 1883553, |
|
"58": 1916449, |
|
"59": 1949345, |
|
"6": 230272, |
|
"60": 1982241, |
|
"61": 2015137, |
|
"62": 2048033, |
|
"63": 2080929, |
|
"64": 2113825, |
|
"65": 2146721, |
|
"66": 2179617, |
|
"67": 2212513, |
|
"68": 2245409, |
|
"69": 2278305, |
|
"7": 263168, |
|
"70": 2311201, |
|
"71": 2344097, |
|
"72": 2376993, |
|
"73": 2409889, |
|
"74": 2442785, |
|
"75": 2475681, |
|
"76": 2508577, |
|
"77": 2541473, |
|
"78": 2574369, |
|
"79": 2607265, |
|
"8": 296064, |
|
"80": 2640161, |
|
"81": 2673057, |
|
"82": 2705953, |
|
"83": 2738849, |
|
"84": 2771745, |
|
"85": 2804641, |
|
"86": 2837537, |
|
"87": 2870433, |
|
"88": 2903329, |
|
"89": 2936225, |
|
"9": 328960, |
|
"90": 2969121, |
|
"91": 3002017, |
|
"92": 3034913, |
|
"93": 3043394, |
|
"94": 3076290, |
|
"95": 3109186, |
|
"96": 3142082, |
|
"97": 3174978, |
|
"98": 3207874, |
|
"99": 3240770 |
|
}, |
|
"epoch": 10, |
|
"incremental_checkpoint_token_usage": { |
|
"1": 1521697, |
|
"10": 0, |
|
"11": 1521697, |
|
"12": 0, |
|
"13": 1521697, |
|
"14": 0, |
|
"15": 1521697, |
|
"16": 0, |
|
"17": 1521697, |
|
"18": 0, |
|
"19": 1521697, |
|
"2": 0, |
|
"20": 0, |
|
"3": 1521697, |
|
"4": 0, |
|
"5": 1521697, |
|
"6": 0, |
|
"7": 1521697, |
|
"8": 0, |
|
"9": 1521697 |
|
}, |
|
"incremental_step_token_usage": { |
|
"0": 32896, |
|
"1": 32896, |
|
"10": 32896, |
|
"100": 32896, |
|
"101": 32896, |
|
"102": 32896, |
|
"103": 32896, |
|
"104": 32896, |
|
"105": 32896, |
|
"106": 32896, |
|
"107": 32896, |
|
"108": 32896, |
|
"109": 32896, |
|
"11": 32896, |
|
"110": 32896, |
|
"111": 32896, |
|
"112": 32896, |
|
"113": 32896, |
|
"114": 32896, |
|
"115": 32896, |
|
"116": 32896, |
|
"117": 32896, |
|
"118": 32896, |
|
"119": 32896, |
|
"12": 32896, |
|
"120": 32896, |
|
"121": 32896, |
|
"122": 32896, |
|
"123": 32896, |
|
"124": 32896, |
|
"125": 32896, |
|
"126": 32896, |
|
"127": 32896, |
|
"128": 32896, |
|
"129": 32896, |
|
"13": 32896, |
|
"130": 32896, |
|
"131": 32896, |
|
"132": 32896, |
|
"133": 32896, |
|
"134": 32896, |
|
"135": 32896, |
|
"136": 32896, |
|
"137": 32896, |
|
"138": 32896, |
|
"139": 32896, |
|
"14": 32896, |
|
"140": 8481, |
|
"141": 32896, |
|
"142": 32896, |
|
"143": 32896, |
|
"144": 32896, |
|
"145": 32896, |
|
"146": 32896, |
|
"147": 32896, |
|
"148": 32896, |
|
"149": 32896, |
|
"15": 32896, |
|
"150": 32896, |
|
"151": 32896, |
|
"152": 32896, |
|
"153": 32896, |
|
"154": 32896, |
|
"155": 32896, |
|
"156": 32896, |
|
"157": 32896, |
|
"158": 32896, |
|
"159": 32896, |
|
"16": 32896, |
|
"160": 32896, |
|
"161": 32896, |
|
"162": 32896, |
|
"163": 32896, |
|
"164": 32896, |
|
"165": 32896, |
|
"166": 32896, |
|
"167": 32896, |
|
"168": 32896, |
|
"169": 32896, |
|
"17": 32896, |
|
"170": 32896, |
|
"171": 32896, |
|
"172": 32896, |
|
"173": 32896, |
|
"174": 32896, |
|
"175": 32896, |
|
"176": 32896, |
|
"177": 32896, |
|
"178": 32896, |
|
"179": 32896, |
|
"18": 32896, |
|
"180": 32896, |
|
"181": 32896, |
|
"182": 32896, |
|
"183": 32896, |
|
"184": 32896, |
|
"185": 32896, |
|
"186": 32896, |
|
"187": 8481, |
|
"188": 32896, |
|
"189": 32896, |
|
"19": 32896, |
|
"190": 32896, |
|
"191": 32896, |
|
"192": 32896, |
|
"193": 32896, |
|
"194": 32896, |
|
"195": 32896, |
|
"196": 32896, |
|
"197": 32896, |
|
"198": 32896, |
|
"199": 32896, |
|
"2": 32896, |
|
"20": 32896, |
|
"200": 32896, |
|
"201": 32896, |
|
"202": 32896, |
|
"203": 32896, |
|
"204": 32896, |
|
"205": 32896, |
|
"206": 32896, |
|
"207": 32896, |
|
"208": 32896, |
|
"209": 32896, |
|
"21": 32896, |
|
"210": 32896, |
|
"211": 32896, |
|
"212": 32896, |
|
"213": 32896, |
|
"214": 32896, |
|
"215": 32896, |
|
"216": 32896, |
|
"217": 32896, |
|
"218": 32896, |
|
"219": 32896, |
|
"22": 32896, |
|
"220": 32896, |
|
"221": 32896, |
|
"222": 32896, |
|
"223": 32896, |
|
"224": 32896, |
|
"225": 32896, |
|
"226": 32896, |
|
"227": 32896, |
|
"228": 32896, |
|
"229": 32896, |
|
"23": 32896, |
|
"230": 32896, |
|
"231": 32896, |
|
"232": 32896, |
|
"233": 32896, |
|
"234": 8481, |
|
"235": 32896, |
|
"236": 32896, |
|
"237": 32896, |
|
"238": 32896, |
|
"239": 32896, |
|
"24": 32896, |
|
"240": 32896, |
|
"241": 32896, |
|
"242": 32896, |
|
"243": 32896, |
|
"244": 32896, |
|
"245": 32896, |
|
"246": 32896, |
|
"247": 32896, |
|
"248": 32896, |
|
"249": 32896, |
|
"25": 32896, |
|
"250": 32896, |
|
"251": 32896, |
|
"252": 32896, |
|
"253": 32896, |
|
"254": 32896, |
|
"255": 32896, |
|
"256": 32896, |
|
"257": 32896, |
|
"258": 32896, |
|
"259": 32896, |
|
"26": 32896, |
|
"260": 32896, |
|
"261": 32896, |
|
"262": 32896, |
|
"263": 32896, |
|
"264": 32896, |
|
"265": 32896, |
|
"266": 32896, |
|
"267": 32896, |
|
"268": 32896, |
|
"269": 32896, |
|
"27": 32896, |
|
"270": 32896, |
|
"271": 32896, |
|
"272": 32896, |
|
"273": 32896, |
|
"274": 32896, |
|
"275": 32896, |
|
"276": 32896, |
|
"277": 32896, |
|
"278": 32896, |
|
"279": 32896, |
|
"28": 32896, |
|
"280": 32896, |
|
"281": 8481, |
|
"282": 32896, |
|
"283": 32896, |
|
"284": 32896, |
|
"285": 32896, |
|
"286": 32896, |
|
"287": 32896, |
|
"288": 32896, |
|
"289": 32896, |
|
"29": 32896, |
|
"290": 32896, |
|
"291": 32896, |
|
"292": 32896, |
|
"293": 32896, |
|
"294": 32896, |
|
"295": 32896, |
|
"296": 32896, |
|
"297": 32896, |
|
"298": 32896, |
|
"299": 32896, |
|
"3": 32896, |
|
"30": 32896, |
|
"300": 32896, |
|
"301": 32896, |
|
"302": 32896, |
|
"303": 32896, |
|
"304": 32896, |
|
"305": 32896, |
|
"306": 32896, |
|
"307": 32896, |
|
"308": 32896, |
|
"309": 32896, |
|
"31": 32896, |
|
"310": 32896, |
|
"311": 32896, |
|
"312": 32896, |
|
"313": 32896, |
|
"314": 32896, |
|
"315": 32896, |
|
"316": 32896, |
|
"317": 32896, |
|
"318": 32896, |
|
"319": 32896, |
|
"32": 32896, |
|
"320": 32896, |
|
"321": 32896, |
|
"322": 32896, |
|
"323": 32896, |
|
"324": 32896, |
|
"325": 32896, |
|
"326": 32896, |
|
"327": 32896, |
|
"328": 8481, |
|
"329": 32896, |
|
"33": 32896, |
|
"330": 32896, |
|
"331": 32896, |
|
"332": 32896, |
|
"333": 32896, |
|
"334": 32896, |
|
"335": 32896, |
|
"336": 32896, |
|
"337": 32896, |
|
"338": 32896, |
|
"339": 32896, |
|
"34": 32896, |
|
"340": 32896, |
|
"341": 32896, |
|
"342": 32896, |
|
"343": 32896, |
|
"344": 32896, |
|
"345": 32896, |
|
"346": 32896, |
|
"347": 32896, |
|
"348": 32896, |
|
"349": 32896, |
|
"35": 32896, |
|
"350": 32896, |
|
"351": 32896, |
|
"352": 32896, |
|
"353": 32896, |
|
"354": 32896, |
|
"355": 32896, |
|
"356": 32896, |
|
"357": 32896, |
|
"358": 32896, |
|
"359": 32896, |
|
"36": 32896, |
|
"360": 32896, |
|
"361": 32896, |
|
"362": 32896, |
|
"363": 32896, |
|
"364": 32896, |
|
"365": 32896, |
|
"366": 32896, |
|
"367": 32896, |
|
"368": 32896, |
|
"369": 32896, |
|
"37": 32896, |
|
"370": 32896, |
|
"371": 32896, |
|
"372": 32896, |
|
"373": 32896, |
|
"374": 32896, |
|
"375": 8481, |
|
"376": 32896, |
|
"377": 32896, |
|
"378": 32896, |
|
"379": 32896, |
|
"38": 32896, |
|
"380": 32896, |
|
"381": 32896, |
|
"382": 32896, |
|
"383": 32896, |
|
"384": 32896, |
|
"385": 32896, |
|
"386": 32896, |
|
"387": 32896, |
|
"388": 32896, |
|
"389": 32896, |
|
"39": 32896, |
|
"390": 32896, |
|
"391": 32896, |
|
"392": 32896, |
|
"393": 32896, |
|
"394": 32896, |
|
"395": 32896, |
|
"396": 32896, |
|
"397": 32896, |
|
"398": 32896, |
|
"399": 32896, |
|
"4": 32896, |
|
"40": 32896, |
|
"400": 32896, |
|
"401": 32896, |
|
"402": 32896, |
|
"403": 32896, |
|
"404": 32896, |
|
"405": 32896, |
|
"406": 32896, |
|
"407": 32896, |
|
"408": 32896, |
|
"409": 32896, |
|
"41": 32896, |
|
"410": 32896, |
|
"411": 32896, |
|
"412": 32896, |
|
"413": 32896, |
|
"414": 32896, |
|
"415": 32896, |
|
"416": 32896, |
|
"417": 32896, |
|
"418": 32896, |
|
"419": 32896, |
|
"42": 32896, |
|
"420": 32896, |
|
"421": 32896, |
|
"422": 8481, |
|
"423": 32896, |
|
"424": 32896, |
|
"425": 32896, |
|
"426": 32896, |
|
"427": 32896, |
|
"428": 32896, |
|
"429": 32896, |
|
"43": 32896, |
|
"430": 32896, |
|
"431": 32896, |
|
"432": 32896, |
|
"433": 32896, |
|
"434": 32896, |
|
"435": 32896, |
|
"436": 32896, |
|
"437": 32896, |
|
"438": 32896, |
|
"439": 32896, |
|
"44": 32896, |
|
"440": 32896, |
|
"441": 32896, |
|
"442": 32896, |
|
"443": 32896, |
|
"444": 32896, |
|
"445": 32896, |
|
"446": 32896, |
|
"447": 32896, |
|
"448": 32896, |
|
"449": 32896, |
|
"45": 32896, |
|
"450": 32896, |
|
"451": 32896, |
|
"452": 32896, |
|
"453": 32896, |
|
"454": 32896, |
|
"455": 32896, |
|
"456": 32896, |
|
"457": 32896, |
|
"458": 32896, |
|
"459": 32896, |
|
"46": 8481, |
|
"460": 32896, |
|
"461": 32896, |
|
"462": 32896, |
|
"463": 32896, |
|
"464": 32896, |
|
"465": 32896, |
|
"466": 32896, |
|
"467": 32896, |
|
"468": 32896, |
|
"469": 8481, |
|
"47": 32896, |
|
"48": 32896, |
|
"49": 32896, |
|
"5": 32896, |
|
"50": 32896, |
|
"51": 32896, |
|
"52": 32896, |
|
"53": 32896, |
|
"54": 32896, |
|
"55": 32896, |
|
"56": 32896, |
|
"57": 32896, |
|
"58": 32896, |
|
"59": 32896, |
|
"6": 32896, |
|
"60": 32896, |
|
"61": 32896, |
|
"62": 32896, |
|
"63": 32896, |
|
"64": 32896, |
|
"65": 32896, |
|
"66": 32896, |
|
"67": 32896, |
|
"68": 32896, |
|
"69": 32896, |
|
"7": 32896, |
|
"70": 32896, |
|
"71": 32896, |
|
"72": 32896, |
|
"73": 32896, |
|
"74": 32896, |
|
"75": 32896, |
|
"76": 32896, |
|
"77": 32896, |
|
"78": 32896, |
|
"79": 32896, |
|
"8": 32896, |
|
"80": 32896, |
|
"81": 32896, |
|
"82": 32896, |
|
"83": 32896, |
|
"84": 32896, |
|
"85": 32896, |
|
"86": 32896, |
|
"87": 32896, |
|
"88": 32896, |
|
"89": 32896, |
|
"9": 32896, |
|
"90": 32896, |
|
"91": 32896, |
|
"92": 32896, |
|
"93": 8481, |
|
"94": 32896, |
|
"95": 32896, |
|
"96": 32896, |
|
"97": 32896, |
|
"98": 32896, |
|
"99": 32896 |
|
}, |
|
"last_improvement_steps": 0, |
|
"last_increase_batch_size": 0, |
|
"last_increase_batch_size_eval_metric_improvement": 0, |
|
"last_increase_batch_size_steps": 0, |
|
"last_learning_rate_reduction": 0, |
|
"last_learning_rate_reduction_steps": 0, |
|
"learning_rate": 0.0009581637888400619, |
|
"llm_eval_examples": {}, |
|
"num_increases_batch_size": 0, |
|
"num_reductions_learning_rate": 0, |
|
"steps": 470, |
|
"test_metrics": { |
|
"combined": { |
|
"loss": [ |
|
[ |
|
1, |
|
47, |
|
4.140954494476318 |
|
], |
|
[ |
|
2, |
|
94, |
|
3.6341311931610107 |
|
], |
|
[ |
|
3, |
|
141, |
|
2.973945379257202 |
|
], |
|
[ |
|
4, |
|
188, |
|
2.604846239089966 |
|
], |
|
[ |
|
5, |
|
235, |
|
2.477090835571289 |
|
], |
|
[ |
|
6, |
|
282, |
|
2.765279769897461 |
|
], |
|
[ |
|
7, |
|
329, |
|
2.932941436767578 |
|
], |
|
[ |
|
8, |
|
376, |
|
2.916217565536499 |
|
], |
|
[ |
|
9, |
|
423, |
|
3.01550555229187 |
|
], |
|
[ |
|
10, |
|
470, |
|
3.0807435512542725 |
|
] |
|
] |
|
}, |
|
"intent": { |
|
"accuracy": [ |
|
[ |
|
1, |
|
47, |
|
0.02062796801328659 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.03668239712715149 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.12673470377922058 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.2651279866695404 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.3786191940307617 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.41484618186950684 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.48310428857803345 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.49936506152153015 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.5275611281394958 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.5496426820755005 |
|
] |
|
], |
|
"accuracy_micro": [ |
|
[ |
|
1, |
|
47, |
|
0.05730659142136574 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.10028653591871262 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.266475647687912 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.3982807993888855 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.4871060252189636 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.4871060252189636 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.5587392449378967 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.5415472984313965 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.5759312510490417 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.5959885120391846 |
|
] |
|
], |
|
"hits_at_k": [ |
|
[ |
|
1, |
|
47, |
|
0.052861444652080536 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.11137306690216064 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.25743797421455383 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.4437764883041382 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.5734579563140869 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.6254034638404846 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.6468311548233032 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.6431319713592529 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.6786106824874878 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.6660665273666382 |
|
] |
|
], |
|
"loss": [ |
|
[ |
|
1, |
|
47, |
|
4.140954494476318 |
|
], |
|
[ |
|
2, |
|
94, |
|
3.6341311931610107 |
|
], |
|
[ |
|
3, |
|
141, |
|
2.973945379257202 |
|
], |
|
[ |
|
4, |
|
188, |
|
2.604846239089966 |
|
], |
|
[ |
|
5, |
|
235, |
|
2.477090835571289 |
|
], |
|
[ |
|
6, |
|
282, |
|
2.765279769897461 |
|
], |
|
[ |
|
7, |
|
329, |
|
2.932941436767578 |
|
], |
|
[ |
|
8, |
|
376, |
|
2.916217565536499 |
|
], |
|
[ |
|
9, |
|
423, |
|
3.01550555229187 |
|
], |
|
[ |
|
10, |
|
470, |
|
3.0807435512542725 |
|
] |
|
], |
|
"roc_auc": [ |
|
[ |
|
1, |
|
47, |
|
0.6999472975730896 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.8169810771942139 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.8789530992507935 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.9105718731880188 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.9285396337509155 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.932953953742981 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.9334519505500793 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.9398418664932251 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.9440649747848511 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.9340102672576904 |
|
] |
|
] |
|
} |
|
}, |
|
"total_tokens_used": 15216970, |
|
"train_metrics": { |
|
"combined": { |
|
"loss": [ |
|
[ |
|
1, |
|
47, |
|
4.941826820373535 |
|
], |
|
[ |
|
2, |
|
94, |
|
3.8220131397247314 |
|
], |
|
[ |
|
3, |
|
141, |
|
2.966855049133301 |
|
], |
|
[ |
|
4, |
|
188, |
|
1.9691708087921143 |
|
], |
|
[ |
|
5, |
|
235, |
|
1.1989307403564453 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.7208091020584106 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.41259047389030457 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.2844356894493103 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.20260311663150787 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.15086334943771362 |
|
] |
|
] |
|
}, |
|
"intent": { |
|
"accuracy": [ |
|
[ |
|
1, |
|
47, |
|
0.014659089967608452 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.03883907198905945 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.10787460207939148 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.25457778573036194 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.4590109586715698 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.653484046459198 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.8075626492500305 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.8613330721855164 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.9029062986373901 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.9410130977630615 |
|
] |
|
], |
|
"accuracy_micro": [ |
|
[ |
|
1, |
|
47, |
|
0.035635873675346375 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.09812531620264053 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.23492653667926788 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.4457017481327057 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.6433035135269165 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.7851714491844177 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.8792433738708496 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.9142037034034729 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.9376794695854187 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.9574396014213562 |
|
] |
|
], |
|
"hits_at_k": [ |
|
[ |
|
1, |
|
47, |
|
0.03866136819124222 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.09584441781044006 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.2281757891178131 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.46207964420318604 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.700287401676178 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.876828670501709 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.9502895474433899 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.9748519659042358 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.985029935836792 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.9925163984298706 |
|
] |
|
], |
|
"loss": [ |
|
[ |
|
1, |
|
47, |
|
4.941826820373535 |
|
], |
|
[ |
|
2, |
|
94, |
|
3.8220131397247314 |
|
], |
|
[ |
|
3, |
|
141, |
|
2.966855049133301 |
|
], |
|
[ |
|
4, |
|
188, |
|
1.9691708087921143 |
|
], |
|
[ |
|
5, |
|
235, |
|
1.1989307403564453 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.7208091020584106 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.41259047389030457 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.2844356894493103 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.20260311663150787 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.15086334943771362 |
|
] |
|
], |
|
"roc_auc": [ |
|
[ |
|
1, |
|
47, |
|
0.5121718645095825 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.7023259997367859 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.8708662986755371 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.9513766765594482 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.98272705078125 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.9933627843856812 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.997870147228241 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.9987038969993591 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.999286949634552 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.9996311664581299 |
|
] |
|
] |
|
} |
|
}, |
|
"tune_checkpoint_num": 0, |
|
"validation_metrics": { |
|
"combined": { |
|
"loss": [ |
|
[ |
|
1, |
|
47, |
|
4.075289249420166 |
|
], |
|
[ |
|
2, |
|
94, |
|
3.5391108989715576 |
|
], |
|
[ |
|
3, |
|
141, |
|
2.817091703414917 |
|
], |
|
[ |
|
4, |
|
188, |
|
2.289855718612671 |
|
], |
|
[ |
|
5, |
|
235, |
|
2.167616605758667 |
|
], |
|
[ |
|
6, |
|
282, |
|
2.3362152576446533 |
|
], |
|
[ |
|
7, |
|
329, |
|
2.3229939937591553 |
|
], |
|
[ |
|
8, |
|
376, |
|
2.545104742050171 |
|
], |
|
[ |
|
9, |
|
423, |
|
2.641582489013672 |
|
], |
|
[ |
|
10, |
|
470, |
|
2.5151546001434326 |
|
] |
|
] |
|
}, |
|
"intent": { |
|
"accuracy": [ |
|
[ |
|
1, |
|
47, |
|
0.02408008836209774 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.039156392216682434 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.13850188255310059 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.262044221162796 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.4144769310951233 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.4744482636451721 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.5366732478141785 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.546140730381012 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.5821728706359863 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.6166250705718994 |
|
] |
|
], |
|
"accuracy_micro": [ |
|
[ |
|
1, |
|
47, |
|
0.06743185222148895 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.09899569302797318 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.28263989090919495 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.4189383089542389 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.515064537525177 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.5451936721801758 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.6011477708816528 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.5810617208480835 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.5968436002731323 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.63271164894104 |
|
] |
|
], |
|
"hits_at_k": [ |
|
[ |
|
1, |
|
47, |
|
0.0595182403922081 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.12082408368587494 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.28157058358192444 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.4951961934566498 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.60570228099823 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.6759977340698242 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.7160040140151978 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.7496565580368042 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.7678131461143494 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.7617202997207642 |
|
] |
|
], |
|
"loss": [ |
|
[ |
|
1, |
|
47, |
|
4.075289249420166 |
|
], |
|
[ |
|
2, |
|
94, |
|
3.5391108989715576 |
|
], |
|
[ |
|
3, |
|
141, |
|
2.817091703414917 |
|
], |
|
[ |
|
4, |
|
188, |
|
2.289855718612671 |
|
], |
|
[ |
|
5, |
|
235, |
|
2.167616605758667 |
|
], |
|
[ |
|
6, |
|
282, |
|
2.3362152576446533 |
|
], |
|
[ |
|
7, |
|
329, |
|
2.3229939937591553 |
|
], |
|
[ |
|
8, |
|
376, |
|
2.545104742050171 |
|
], |
|
[ |
|
9, |
|
423, |
|
2.641582489013672 |
|
], |
|
[ |
|
10, |
|
470, |
|
2.5151546001434326 |
|
] |
|
], |
|
"roc_auc": [ |
|
[ |
|
1, |
|
47, |
|
0.7134010791778564 |
|
], |
|
[ |
|
2, |
|
94, |
|
0.8469101190567017 |
|
], |
|
[ |
|
3, |
|
141, |
|
0.9105364680290222 |
|
], |
|
[ |
|
4, |
|
188, |
|
0.9462321400642395 |
|
], |
|
[ |
|
5, |
|
235, |
|
0.955407440662384 |
|
], |
|
[ |
|
6, |
|
282, |
|
0.9614531993865967 |
|
], |
|
[ |
|
7, |
|
329, |
|
0.9639908075332642 |
|
], |
|
[ |
|
8, |
|
376, |
|
0.9642417430877686 |
|
], |
|
[ |
|
9, |
|
423, |
|
0.9641472697257996 |
|
], |
|
[ |
|
10, |
|
470, |
|
0.9704092144966125 |
|
] |
|
] |
|
} |
|
} |
|
} |