Files
CGA-bench/saves/0406~0412/Paper_Experiments/PAPER_20260412_152529/Chatbench_RunInfo.json
2026-05-22 10:02:42 +08:00

93 lines
2.2 KiB
JSON

[
{
"task_id": "fsm_ps2",
"task_number": 94,
"time": 740.58,
"prompt_tokens": 9501,
"completion_tokens": 7054,
"token_cost": 0.6132599999999999,
"ERROR(incomplete)": false,
"op_record": [
"gen",
"syncheck",
"funccheck",
"cga",
"eval"
],
"reboot_times": 0,
"max_iter": 10,
"coverage": 77.77777777777779,
"circuit_type": "SEQ",
"checklist_worked": false,
"scenario_num": 10,
"Eval0_pass": true,
"Eval0_iv_pass": true,
"debug_iter_iv": 0,
"iv_runing_time": 0.03,
"Eval0_py_pass": true,
"debug_iter_py": 0,
"py_runing_time": 0.03,
"TB_corrected": false,
"TBcheck_oprecord": [
[
"discrim"
]
],
"rtl_num_newly_gen": 0,
"Eval1_pass": true,
"Eval2_pass": false,
"Eval2_ratio": "3/10",
"Eval2_failed_mutant_idxes": [
2,
4,
6,
7,
8,
9,
10
],
"full_pass": false
},
{
"task_id": "lemmings4",
"task_number": 150,
"time": 13147.0,
"prompt_tokens": 48382,
"completion_tokens": 34711,
"token_cost": 3.0503,
"ERROR(incomplete)": false,
"op_record": [
"gen",
"syncheck",
"gen",
"syncheck",
"gen",
"syncheck",
"funccheck",
"cga",
"eval"
],
"reboot_times": 2,
"max_iter": 10,
"coverage": 91.66666666666666,
"circuit_type": "SEQ",
"checklist_worked": false,
"scenario_num": 10,
"Eval0_pass": true,
"Eval0_iv_pass": true,
"debug_iter_iv": 1,
"iv_runing_time": 0.02,
"Eval0_py_pass": true,
"debug_iter_py": 0,
"py_runing_time": 0.02,
"TB_corrected": false,
"TBcheck_oprecord": [
[
"discrim"
]
],
"rtl_num_newly_gen": 0,
"Eval1_pass": false,
"full_pass": false
}
]