| { |
| "MSE": 0.0, |
| "MSE/layer0": 0.0, |
| "MSE/layer1": 0.0, |
| "MSE/layer2": 0.0, |
| "MSE/layer3": 0.0, |
| "dead_code_fraction": 1.0, |
| "dead_code_fraction/layer0": 1.0, |
| "dead_code_fraction/layer1": 1.0, |
| "dead_code_fraction/layer2": 1.0, |
| "dead_code_fraction/layer3": 1.0, |
| "epoch": 1.0, |
| "eval_MSE/layer0": 220380.4595384912, |
| "eval_MSE/layer1": 132.78432877894963, |
| "eval_MSE/layer2": 365.9396393365076, |
| "eval_MSE/layer3": 415.98040078389045, |
| "eval_accuracy": 0.4525254617525837, |
| "eval_dead_code_fraction/layer0": 0.99694, |
| "eval_dead_code_fraction/layer1": 0.9535, |
| "eval_dead_code_fraction/layer2": 0.93486, |
| "eval_dead_code_fraction/layer3": 0.98186, |
| "eval_first_transition_accuracy": 0.88, |
| "eval_input_norm/layer0": 333.77172351868165, |
| "eval_input_norm/layer1": 6.54500140022604, |
| "eval_input_norm/layer2": 6.137018968109251, |
| "eval_input_norm/layer3": 7.40972196774554, |
| "eval_loss": 1.2691402435302734, |
| "eval_multicode_k": 1, |
| "eval_output_norm/layer0": 12.936006403074337, |
| "eval_output_norm/layer1": 13.144865618203756, |
| "eval_output_norm/layer2": 18.324818944643734, |
| "eval_output_norm/layer3": 18.466466705456643, |
| "eval_runtime": 40.0743, |
| "eval_samples_per_second": 817.682, |
| "eval_steps_per_second": 1.597, |
| "eval_transition_accuracy": 0.5633870967741935, |
| "input_norm": 0.0, |
| "input_norm/layer0": 0.0, |
| "input_norm/layer1": 0.0, |
| "input_norm/layer2": 0.0, |
| "input_norm/layer3": 0.0, |
| "loss": 1.313426919734478, |
| "max_norm": 46.33829879760742, |
| "max_norm/layer0": 17.856664657592773, |
| "max_norm/layer1": 20.084186553955078, |
| "max_norm/layer2": 33.940242767333984, |
| "max_norm/layer3": 46.33829879760742, |
| "mean_norm": 8.291451185941696, |
| "mean_norm/layer0": 8.462452054023743, |
| "mean_norm/layer1": 8.18280303478241, |
| "mean_norm/layer2": 8.143204748630524, |
| "mean_norm/layer3": 8.377344906330109, |
| "multicode_k": 1, |
| "output_norm": 0.0, |
| "output_norm/layer0": 0.0, |
| "output_norm/layer1": 0.0, |
| "output_norm/layer2": 0.0, |
| "output_norm/layer3": 0.0, |
| "perplexity": 3.5577924120078235, |
| "runtime": 19944.2896, |
| "samples_per_second": 1026.86, |
| "steps_per_second": 1.003 |
| } |