OpenDeltaMirror/examples/examples_prompt/collect_result.jsonl

60 lines
1.8 KiB
JSON

# the final results will be populated here.
{
"evaluate": {
"epoch": 20.0,
"eval_accuracy": 89.2156862745098,
"eval_average_metrics": 90.76168929110105,
"eval_f1": 92.3076923076923,
"eval_loss": 0.16493959724903107,
"eval_runtime": 1.6391,
"eval_samples_per_second": 124.455
},
"repo_name": "DeltaHub/bitfit_t5-base_mrpc",
"test": {
"epoch": 20.0,
"test_accuracy": 88.23529411764706,
"test_average_metrics": 89.97971602434077,
"test_f1": 91.72413793103448,
"test_loss": 0.14968213438987732,
"test_runtime": 1.6344,
"test_samples_per_second": 124.82
}
}
{
"evaluate": {
"epoch": 20.0,
"eval_average_metrics": 52.10265668831534,
"eval_loss": 0.3603779077529907,
"eval_matthews_correlation": 52.10265668831534,
"eval_runtime": 1.0808,
"eval_samples_per_second": 482.046
},
"repo_name": "DeltaHub/bitfit_t5-base_cola",
"test": {
"epoch": 20.0,
"test_average_metrics": 54.209563471221934,
"test_loss": 0.2853100299835205,
"test_matthews_correlation": 54.209563471221934,
"test_runtime": 1.056,
"test_samples_per_second": 494.304
}
}
{
"evaluate": {
"epoch": 20.0,
"eval_average_metrics": 53.80613287067274,
"eval_loss": 0.25723716616630554,
"eval_matthews_correlation": 53.80613287067274,
"eval_runtime": 1.0583,
"eval_samples_per_second": 492.299
},
"repo_name": "DeltaHub/bitfit_t5-base_cola",
"test": {
"epoch": 20.0,
"test_average_metrics": 54.32497579543861,
"test_loss": 0.22327613830566406,
"test_matthews_correlation": 54.32497579543861,
"test_runtime": 1.0556,
"test_samples_per_second": 494.507
}
}