a
step,train_loss,train_accuracy,valid_loss,valid_mean_token_accuracy 1,2.92067,0.75,, 2,2.62473,0.6087,, 3,1.34436,0.78378,, 4,2.91867,0.47059,, 5,2.40155,0.58333,, 6,2.94846,0.5,, 7,3.22334,0.57576,, 8,1.62783,0.76271,, 9,2.76755,0.71429,, 10,2.34966,0.58333,, 11,1.92754,0.71875,, 12,2.21972,0.71429,, 13,2.29487,0.58621,, 14,0.55413,0.85185,, 15,2.22656,0.57407,, 16,2.0954,0.67647,, 17,1.14929,0.73333,, 18,1.3771,0.71154,, 19,1.18295,0.66667,, 20,1.32835,0.8,, 21,1.85532,0.66667,, 22,2.1101,0.71429,, 23,1.42592,0.71429,, 24,2.09209,0.625,, 25,1.23408,0.7,, 26,1.0532,0.7037,, 27,1.65112,0.65789,, 28,1.54421,0.84,, 29,1.89176,0.67647,, 30,0.70141,0.78261,, 31,0.7678,0.77273,, 32,1.29999,0.68182,, 33,1.14227,0.64,, 34,1.1596,0.64516,, 35,1.18784,0.66667,, 36,1.80449,0.53846,, 37,1.65341,0.52941,, 38,1.42946,0.56667,, 39,0.90729,0.74359,, 40,1.23791,0.70833,, 41,0.96462,0.76471,, 42,0.99814,0.78571,, 43,0.67773,0.71154,, 44,1.97177,0.45455,, 45,1.27929,0.7,, 46,0.99474,0.70909,, 47,1.56512,0.52174,, 48,0.7506,0.76471,, 49,1.03906,0.74074,, 50,0.92305,0.7027,, 51,7.49904,0.5,, 52,0.70145,0.75556,, 53,3.24906,0.72727,, 54,0.59138,0.83333,, 55,0.84415,0.81818,, 56,1.32725,0.52941,, 57,0.50658,0.82609,, 58,0.92382,0.81081,, 59,1.77482,0.5,, 60,1.44891,0.52174,, 61,0.77302,0.81818,, 62,0.80979,0.78846,, 63,0.70493,0.82143,, 64,1.07066,0.66667,, 65,7.28292,0.5,, 66,1.63486,0.63636,, 67,0.83739,0.7037,, 68,0.7805,0.77778,, 69,0.70532,0.75,, 70,1.14863,0.73077,, 71,0.83883,0.70833,, 72,0.89378,0.75,, 73,0.90999,0.77778,, 74,0.61602,0.73077,, 75,0.90497,0.72727,, 76,0.86941,0.76923,, 77,1.50792,0.65217,, 78,0.69242,0.77778,, 79,0.89294,0.74194,, 80,0.57168,0.83333,, 81,1.01522,0.73333,, 82,0.67394,0.82353,, 83,0.31818,0.88889,, 84,0.90707,0.71429,, 85,1.27592,0.59259,, 86,0.99031,0.70833,, 87,0.56038,0.86667,, 88,1.28131,0.76316,, 89,1.88523,0.55882,, 90,0.84125,0.72973,, 91,1.30219,0.6875,, 92,0.89603,0.76,, 93,1.47441,0.70588,, 94,0.53711,0.78571,, 95,0.81778,0.66667,, 96,1.33487,0.625,, 97,3.03943,0.81818,, 98,0.75701,0.77966,, 99,0.72118,0.70588,, 100,0.4524,0.8125,, 101,1.02615,0.80952,, 102,1.11188,0.68182,, 103,0.95316,0.75,, 104,0.65282,0.84,, 105,0.83847,0.8,, 106,0.64666,0.77778,, 107,1.07833,0.66667,, 108,0.94822,0.74074,, 109,0.87235,0.76471,, 110,1.28774,0.68966,, 111,1.14233,0.78947,, 112,0.5275,0.78846,, 113,0.26218,0.88889,, 114,1.65365,0.55882,, 115,0.78461,0.8,, 116,0.57701,0.85714,, 117,0.97936,0.68182,, 118,0.57317,0.75,, 119,0.67419,0.80769,, 120,0.46602,0.92,, 121,1.20842,0.68966,, 122,0.38407,0.90625,, 123,0.66467,0.81481,, 124,0.96144,0.83333,, 125,1.64121,0.59091,, 126,0.46505,0.86667,, 127,0.52876,0.82353,, 128,0.93434,0.73077,, 129,0.85138,0.76667,, 130,0.68216,0.66667,, 131,0.68104,0.79167,, 132,0.49697,0.93333,, 133,1.42817,0.6087,, 134,1.24223,0.625,, 135,1.38707,0.65217,, 136,0.82668,0.72727,, 137,0.63099,0.90909,, 138,0.67471,0.82222,, 139,0.86222,0.8,, 140,0.87854,0.75,, 141,0.95747,0.72222,, 142,0.58041,0.82222,, 143,0.75429,0.80645,, 144,0.60305,0.73529,, 145,0.77937,0.75676,, 146,1.44416,0.63636,, 147,1.33034,0.73529,, 148,0.87322,0.75926,, 149,1.19613,0.71875,, 150,7.15896,0.75,, 151,0.56755,0.81481,, 152,0.48109,0.82143,, 153,0.80779,0.75,, 154,0.76726,0.80556,, 155,1.1833,0.61111,, 156,0.76193,0.79167,, 157,0.72659,0.82051,, 158,0.75307,0.66667,, 159,0.77806,0.83784,, 160,0.77584,0.78431,, 161,0.94356,0.73333,, 162,0.7152,0.81356,, 163,2.88606,0.81818,, 164,0.40264,0.82609,, 165,1.10442,0.64706,,