上传所有文件

This commit is contained in:
zice6688
2026-03-30 16:46:48 +08:00
parent 8c2008c738
commit 35c99bac58
110 changed files with 23243 additions and 0 deletions

8
config/__init__.py Normal file
View File

@@ -0,0 +1,8 @@
"""
Description : description
Author : Ruidi Qiu (r.qiu@tum.de)
Time : 2024/7/3 18:17:10
LastEdited : 2024/7/3 23:25:11
"""
from .config import *

Binary file not shown.

Binary file not shown.

330
config/config.py Normal file
View File

@@ -0,0 +1,330 @@
"""
Description : This is the config module of the project. This file is copied and modified from OplixNet project.
Author : Ruidi Qiu (ruidi.qiu@tum.de)
Time : 2023/11/28 11:20:33
LastEdited : 2024/9/16 09:39:02
"""
from datetime import datetime
import yaml
import json
import os
import socket
import sys
import utils.utils as utils
sys.path.append("..")
# config file format used project-wide; switches both default and custom paths
CONFIG_FORMAT = "yaml" # "yaml" or "json"
# path:
DIR_PATH = 'config' # to ONN
CFG_DEF_NAME = 'default' + "." + CONFIG_FORMAT  # e.g. "default.yaml"
CFG_DEF_PATH = '%s/%s' % (DIR_PATH, CFG_DEF_NAME)
CFG_CUS_NAME = 'custom' + "." + CONFIG_FORMAT   # e.g. "custom.yaml"
CFG_CUS_PATH = '%s/%s' % (DIR_PATH, CFG_CUS_NAME)
# discarded on 2024/2/1 23:16:25
# GPT_MODELS = {
#     "3.5" : "gpt-3.5-turbo-1106",
#     "4" : "gpt-4-1106-preview"
# }
# short alias -> full OpenAI model name
GPT_MODELS = {
    "4o" : "gpt-4o-2024-08-06",
    "4omini" : "gpt-4o-mini-2024-07-18",
    "4t" : "gpt-4-turbo-2024-04-09",
    "3.5" : "gpt-3.5-turbo-0125",
    "4" : "gpt-4-0125-preview",
    "3.5old" : "gpt-3.5-turbo-1106",
    "4old" : "gpt-4-1106-preview",
    "o1": "o1-preview-2024-09-12",
    "o1mini": "o1-mini-2024-09-12"
}
# short alias -> full Anthropic model name (several aliases per model on purpose)
CLAUDE_MODELS = {
    "sonnet3.5": "claude-3-5-sonnet-20240620",
    "3.5sonnet": "claude-3-5-sonnet-20240620",
    "claude3.5sonnet": "claude-3-5-sonnet-20240620",
    "claude3.5": "claude-3-5-sonnet-20240620",
    "opus":"claude-3-opus-20240229",
    "sonnet": "claude-3-sonnet-20240229",
    "haiku": "claude-3-haiku-20240307",
    "claude3_opus":"claude-3-opus-20240229",
    "claude3_sonnet": "claude-3-sonnet-20240229",
    "claude3_haiku": "claude-3-haiku-20240307",
    "claude2.1": "claude-2.1",
    "claude2.0": "claude-2.0",
    "claude2": "claude-2.0"
}
# alias -> full model name used when redirecting config.gpt.model.
# NOTE: the bare 3.5 / 4 keys are a float and an int — presumably to cover
# unquoted numeric aliases coming from YAML; verify against the loader.
LLM_MODEL_REDIRECTION = {
    '4omini' : GPT_MODELS["4omini"],
    '4o' : GPT_MODELS["4o"],
    '4t' : GPT_MODELS["4t"],
    '3.5' : GPT_MODELS["3.5"],
    3.5 : GPT_MODELS["3.5"],
    '4' : GPT_MODELS["4"],
    '4.0' : GPT_MODELS["4"],
    4 : GPT_MODELS["4"],
    "3.5old" : GPT_MODELS["3.5old"],
    "4old" : GPT_MODELS["4old"],
    "o1": GPT_MODELS["o1"],
    "o1mini": GPT_MODELS["o1mini"]
}
# Claude aliases already map to full names, so they merge in directly
LLM_MODEL_REDIRECTION = {**LLM_MODEL_REDIRECTION, **CLAUDE_MODELS}
# placeholder in save.pub.dir that load_config replaces with the current week range
WEEKRANGEMARK = "$weekrange$"
######################################## utils ###########################################
def str2bool(v):
    """Coerce a bool or a yes/no style string into a bool.

    Accepted true values: yes/true/t/y/1; false values: no/false/f/n/0
    (case-insensitive). Anything else raises TypeError (kept as TypeError
    for backward compatibility with existing callers).
    """
    if isinstance(v, bool):
        return v
    lowered = v.lower()
    if lowered in ('yes', 'true', 't', 'y', '1'):
        return True
    if lowered in ('no', 'false', 'f', 'n', '0'):
        return False
    raise TypeError('Boolean value expected.')
def get_time():
    """Return the current local time formatted as YYYYMMDD_HHMMSS."""
    return datetime.now().strftime("%Y%m%d_%H%M%S")
def get_runinfo():
    """Return (hostname, pid) of the current process for run bookkeeping.

    The original version had accidental trailing commas that wrapped each
    value in a 1-tuple and then indexed ``[0]`` to unwrap it again; this
    returns the values directly with identical results.
    """
    hostname = socket.gethostname()
    pid = os.getpid()
    return hostname, pid
################################ agparser (for future) ###################################
################################## load .yaml/.json config #####################################
def load_yaml_dict(path: str):
    """Parse the YAML file at *path* (safe_load) and return its content."""
    with open(path, 'rb') as stream:
        return yaml.safe_load(stream)
def load_json_dict(path: str):
    """Parse the JSON file at *path* and return the resulting object."""
    with open(path, 'r') as stream:
        return json.load(stream)
def merge_config_dict(old_dict: dict, new_dict):
    """Recursively overlay *new_dict* (custom) onto *old_dict* (default).

    Keys only in old_dict are kept; a None value in new_dict keeps the old
    value; a key present in new_dict but unknown to old_dict is rejected,
    as is a dict/non-dict mismatch between the two trees.
    """
    if new_dict is None:
        return old_dict
    # a custom key the default tree does not know is a config mistake
    for key in new_dict:
        if key not in old_dict:
            raise Exception("%s is in custom_config but not in default_config, which is forbidden. Please modify related tree structure or add it to %s"%(key, CFG_DEF_PATH))
    merged = {}
    for key, old_val in old_dict.items():
        if key not in new_dict:
            merged[key] = old_val
            continue
        new_val = new_dict[key]
        if isinstance(old_val, dict):
            if not isinstance(new_val, dict):
                raise TypeError("value of %s isn't a dict in custom_config but is a dict in default_config"%(key))
            # both sides are subtrees: merge them recursively
            merged[key] = merge_config_dict(old_val, new_val)
        else:
            if isinstance(new_val, dict):
                raise TypeError("value of %s is a dict in custom_config but isn't a dict in default_config"%(key))
            # None in the custom config means "keep the default"
            merged[key] = old_val if new_val is None else new_val
    return merged
def load_config_dict(mode='merge', config_old_path = CFG_DEF_PATH, config_new_path = CFG_CUS_PATH, config_format = CONFIG_FORMAT):
    """Load the default and custom config files.

    mode='merge' returns the recursive merge; mode='split' returns the pair
    (custom_dict, default_dict) unmerged. config_format selects the parser.
    """
    loaders = {"yaml": load_yaml_dict, "json": load_json_dict}
    if config_format not in loaders:
        raise Exception("wrong config format input: %s (can only be yaml or json)"%(config_format))
    load = loaders[config_format]
    old_cfg = load(config_old_path)
    new_cfg = load(config_new_path)
    if mode == "merge":
        return merge_config_dict(old_cfg, new_cfg)
    if mode == "split":
        return new_cfg, old_cfg
    raise Exception("wrong mode input: %s"%(mode))
################################### dict to object ######################################
class Dict(dict):
    """dict subclass whose items are also reachable as attributes.

    Attribute access is routed straight to the mapping protocol, so a
    missing attribute raises KeyError (not AttributeError).
    """
    __setattr__ = dict.__setitem__
    __getattr__ = dict.__getitem__
    def get_copy(self):
        """Return an independent recursive Dict copy of this object."""
        return dictToObj(DictTodict(self))
    def get_item(self, *key_iters, default=None):
        """Walk nested keys in order; return the value or *default* if any key is absent."""
        node = DictTodict(self)
        for key in key_iters:
            if key not in node:
                return default
            node = node[key]
        return node
def dictToObj(dictObj):
    """Convert a plain dict (recursively) into a Dict; reject non-dicts."""
    if not isinstance(dictObj, dict):
        raise TypeError("this variable is not a instance of 'dict' type")
    return Dict((key, recur_dictToObj(value)) for key, value in dictObj.items())
def recur_dictToObj(dictObj):
    """Recursively convert nested dicts to Dict; pass non-dict values through."""
    if isinstance(dictObj, dict):
        converted = Dict()
        for key, value in dictObj.items():
            converted[key] = recur_dictToObj(value)
        return converted
    return dictObj
def DictTodict(Dict_obj):
    """Convert a Dict (recursively) back into a plain dict; reject non-Dicts."""
    if not isinstance(Dict_obj, Dict):
        raise TypeError("this variable is not a instance of 'Dict' type")
    return {key: recur_DictTodict(value) for key, value in Dict_obj.items()}
def recur_DictTodict(Dict_obj):
    """Recursively convert nested Dict values to plain dicts; pass others through."""
    if isinstance(Dict_obj, Dict):
        return {key: recur_DictTodict(value) for key, value in Dict_obj.items()}
    return Dict_obj
def load_config_obj(custom_config_path):
    """Load the merged default+custom config and wrap it as a Dict object."""
    merged = load_config_dict(config_new_path=custom_config_path)
    return dictToObj(merged)
################################# config validation #####################################
def config_val(config_obj):
    """Validate a config object; currently a no-op that always returns True.

    The original validation rules are commented out; this is kept as a hook
    for future checks.
    """
    # run_mode_val = ['normal', 'postproc', 'para', 'sensprune', 'custom']
    # cvnn_dinmode_val = [] # has val func in ComplexNN
    # assert config_obj.run.mode in run_mode_val, "There is no run mode named %s, only names in %s are valid"%(config_obj.run.mode, str_list(run_mode_val))
    return True
####################################### get config ######################################
class Config(Dict):
    """Singleton configuration object loaded from a custom config file.

    The first instantiation creates and (optionally) loads the instance;
    later calls return the same object without re-initializing it.
    """
    # singleton pattern
    _instance = None
    _initialized = False
    def __new__(cls, *args, **kwargs):
        # BUGFIX: the original used `if not cls._instance`, but Config is a
        # dict subclass, so an empty (not-yet-loaded) instance is falsy and
        # would be re-created on every call, breaking the singleton.
        if cls._instance is None:
            cls._instance = super(Config, cls).__new__(cls)
        return cls._instance
    def __init__(self, custom_config_path=None, *args, **kwargs):
        if not self._initialized:
            super(Config, self).__init__(*args, **kwargs)
            if custom_config_path is not None:
                self.load_config(custom_config_path)
            self._initialized = True
    def load_config(self, custom_config_path):
        """Load, post-process and store the merged config.

        Fills in run metadata (time, hostname, pid, python version), expands
        the $weekrange$ placeholder in save.pub.dir, disables every
        save.*.en switch when save.en is False, and redirects LLM model
        aliases to full model names.
        """
        time = get_time()
        hostname, pid = get_runinfo()
        config = load_config_obj(custom_config_path)
        config.run.custom_path = custom_config_path
        config.run.time = time
        config.run.hostname = hostname
        config.run.pid = pid
        config.run.pyversion = sys.version
        current_week = utils.get_week_range()
        config.save.pub.dir = config.save.pub.dir.replace(WEEKRANGEMARK, current_week)
        if not config.save.en:
            # saving is globally disabled: switch off every sub-section that
            # has an "en" flag. (The original wrapped hasattr() in a bare
            # try/except because Dict raises KeyError instead of
            # AttributeError for missing keys; a plain membership test is
            # equivalent and clearer.)
            for attr in DictTodict(config.save).keys():
                sub_config = getattr(config.save, attr)
                if isinstance(sub_config, Dict) and "en" in sub_config:
                    sub_config["en"] = False
        # translate short model aliases (e.g. "4o") to full API model names
        if config.gpt.model in LLM_MODEL_REDIRECTION:
            config.gpt.model = LLM_MODEL_REDIRECTION[config.gpt.model]
        if config.gpt.rtlgen_model is None:
            # fall back to the main model for the RTL-generation stage
            config.gpt.rtlgen_model = config.gpt.model
        elif config.gpt.rtlgen_model in LLM_MODEL_REDIRECTION:
            config.gpt.rtlgen_model = LLM_MODEL_REDIRECTION[config.gpt.rtlgen_model]
        # config_val(config)
        self.update(config)
# def load_config(custom_config_path)->Dict: #str = CFG_CUS_PATH):
# time = get_time()
# hostname, pid = get_runinfo()
# config = load_config_obj(custom_config_path)
# config.run.custom_path = custom_config_path
# config.run.time = time
# config.run.hostname = hostname
# config.run.pid = pid
# if not config.save.en:
# # config.save.log.en = False
# # config.save.message.en = False
# # iterate the attr of config.save, if they have en attr, set it to False
# for attr in DictTodict(config.save).keys():
# sub_config = getattr(config.save, attr)
# if isinstance(sub_config, Dict):
# try: # will raise keyerror if sub_config doesn't have en attr (it will only return false when come across AttributeError, but Dict doesn't have en attr, so it will raise KeyError)
# hasattr(sub_config, "en")
# except:
# continue
# setattr(sub_config, "en", False)
# if config.gpt.model in LLM_MODEL_REDIRECTION.keys():
# config.gpt.model = LLM_MODEL_REDIRECTION[config.gpt.model]
# # config_val(config)
# return config
def load_split_config(custom_config_path = CFG_CUS_PATH, default_config_path = CFG_DEF_PATH):
    """Return (custom_cfg, default_cfg) as Dict objects without merging.

    No validation is performed; this is only for printing (used in
    loader_saver.py). An empty custom config yields None for custom_cfg.
    """
    custom_cfg_dict, default_cfg_dict = load_config_dict('split', default_config_path, custom_config_path)
    custom_cfg = None if custom_cfg_dict is None else dictToObj(custom_cfg_dict)
    return custom_cfg, dictToObj(default_cfg_dict)
def get_cfg_path_from_alias(custom_cfg_alias: str|int) -> str:
if isinstance(custom_cfg_alias, str):
if custom_cfg_alias.isdigit():
custom_cfg_filename = "custom" + str(custom_cfg_alias) + "." + "yaml"
config_path = os.path.join("config/configs", custom_cfg_filename)
elif "/" in custom_cfg_alias and ".yaml" in custom_cfg_alias:
config_path = custom_cfg_alias
else:
config_path = os.path.join("config/configs", custom_cfg_alias + "." + "yaml")
elif isinstance(custom_cfg_alias, int):
custom_cfg_filename = "custom" + str(custom_cfg_alias) + "." + "yaml"
config_path = os.path.join("config/configs", custom_cfg_filename)
else:
raise ValueError("Invalid custom config alias: '--config %s'"%(custom_cfg_alias))
if not os.path.exists(config_path):
raise FileNotFoundError("alias [%s]: The custom config file %s doesn't exist"%(custom_cfg_alias, config_path))
return config_path
### test ###
if __name__ == "__main__":
    # smoke test: load the custom config and print run.mode two equivalent
    # ways (safe get_item lookup vs. direct attribute access), then the
    # whole "run" subtree
    my_config = Config(CFG_CUS_PATH)
    print(my_config.get_item("run", "mode"))
    print(my_config.run.mode)
    print(my_config.get_item("run"))

15
config/custom.yaml Normal file
View File

@@ -0,0 +1,15 @@
run:
mode: 'autoline'
gpt:
model: "qwen-max"
key_path: "config/key_API.json"
save:
en: True
root: "/home/zhang/CorrectBench/TBgen_App/output/example_mul/"
autoline:
cga:
enabled: True
max_iter: 10
promptscript: "pychecker"
onlyrun: "TBgensimeval"

96
config/default.yaml Normal file
View File

@@ -0,0 +1,96 @@
################# running #################
run:
version: '2.0' # last stable version of the code
time: ~ # preserved, will be set in program
custom_path: ~ #preserved, will be set in program
mode: 'qwen-max' # 'chatgpt': like a chatgpt but can load prompt or previous messages. 'autoline': run pipeline of Chatbench automatically. 'iverilog': run iverilog. 'test': test mode.
################# saving ##################
save:
en: True # True -> save according to settings below; False -> do not save anything.
root: ~ # the root saving dir ends with '/'; will be set in program.
pub:
prefix: # the real name of one experiment, fill it in custom_path;
dir: 'saves/$weekrange$/' # Ended with '/'; if not empty, log/tb/data will share one dir, recommended.
subdir: '' # the final dir of one experiment would be dir + subdir;
log:
en: True
dir: 'logs/'
notes: ~
cfg_pmode: iwantall # available: ['split', 'merge', 'iwantall'] # config print mode; see loader_saver.py;
debug_en: False
level: "TRACE"
message:
en: True
dir: 'messages/'
format: 'json' # 'json' or 'txt'
iverilog:
en: True
subdir: 'ivcode_nodebug' # for pub mode
################# loading #################
load:
prompt:
path: "config/initial_prompts/prompt1.txt" # Only valid when gpt.start_form = "prompt"; path to the prompt file
pick_idx: [] # TODO: valid only when path is ended with '.json', else ignored
stage_template:
path: "config/templates/stage_template0301.txt"
############### GPT related ###############
gpt:
model: "4o" # model name. Now we only use "gpt-4-1106-preview" or "gpt-3.5-turbo-1106" (20231128). "3.5" or "4" will be redirected to the above two models. see https://platform.openai.com/docs/models.
key_path: "config/key_API.json" # path to the key file
temperature: ~ # currently only in mode "chatgpt". not valid in mode "autoline" because it is too complicated. For chatgpt, it is default to 1.0. see https://platform.openai.com/docs/api-reference/chat/create.
json_mode: False # if True, the output of GPT will be in json format. Don't forget to ask GPT to return the json format.
chatgpt: # settings below are valid only at mode "chatgpt";
start_form: "chat" # "chat": input messages by hand; "prompt": input messages from file; only valid for the first message. In the future there will be a new start_form "competion".
# follow_form: "chat" #
one_time_talk: False # will not continue to talk after the first message.
rtlgen_model: ~ # model used in autoline-3-TBcheck-discriminator, if None, use the same model as gpt.model.
################# iverilog ################
iverilog:
dir: "" # valid at mode "iverilog"; path to the dir of the iverilog files
task_id: "" # valid at mode "iverilog"; the task id of the iverilog task
################# autoline ################
autoline:
result_path: "results"
cga:
enabled: True
max_iter: 10
target_coverage: 100.0
probset: # integrates probset/mutantset/prob_except; 20240304
path: ~ # default:"data/HDLBits/HDLBits_data.jsonl", you must enter this path in custom.yaml to avoid unconscious use.
mutant_path: ~ # used in TB_eval2; you must enter this path in custom.yaml to avoid unconscious use.
gptgenRTL_path: ~ # used in TB_eval2b; you must enter this path in custom.yaml to avoid unconscious use.
more_info_paths: [] # more info added to the probset;
only: ['lemmings3','lemmings4','ece241_2013_q8','2014_q3fsm','m2014_q6','review2015_fsm','rule110','fsm_ps2'] # only import data in the list by task_id;
exclude: [] # excludes data in the list by task_id;
exclude_json: ~ # excludes data in the json file by task_id;
filter: [{}] # only imports data containing key-value pairs; example: {"circuit_type": "CMB"} means only import data with "circuit_type" = "CMB"; x
checklist:
max: 3
debug:
max: 5 # max iterations of debug; if 0, no debug.
reboot: 1 # rerun stage 4 after every x iterations of debug. if 0, not debug but only reboot
py_rollback: 2 # reboot both after every x iterations of py_debug; if 0, no py debug; if 1, only debug 1 time and then reboot;
onlyrun: ~ # valid: [~, "TBgen", "TBgensim", "TBgensimeval"] ; if none, run all tasks; if not none, run only the tasks in the list.
promptscript: ~
timeout: 300 # timeout for run a python or iverilog code; unit: second.
TBcheck:
rtl_num: 20 # the number of rtls used in the TB_check; will be ignored if the llmgen_rtls are provided in probset.
correct_max: 3
discrim_mode: "col_full_wrong"
correct_mode: "naive"
rtl_compens_en: True # if True, when the half of the rtls contain syntax error, will generate more rtls to compensate.
rtl_compens_max_iter: 3 # the max iteration of generating rtls to compensate.
itermax: 10 # the max reboot times of the whole program; this reboot is triggered by TBcheck's next action
update_desc: False # if True, when reboot the program, will use the updated description of the task (from TBcheck)
save_compile: True # if True, save the compiling codes and files (codes in TBeval and TBcheck.discriminator); if False, not save.
save_finalcodes: True # if True, save the eventually generated Testbench codes (Verilog + Python); if False, not save.
error_interruption: False # if True, the program will stop when error occurs; Usually used in debugging.

5
config/key_API.json Normal file
View File

@@ -0,0 +1,5 @@
{
"OPENAI_API_KEY" : "",
"ANTHROPIC_API_KEY" : "",
"dashscope" : ""
}