MCPcopy
hub / github.com/hkust-nlp/ceval / main

Function main

code/evaluator_series/eval_llama.py:83–134  ·  view source on GitHub ↗
(
        ckpt_dir: str,
        param_size: int = 13,
        ntrain: int = 5,
        few_shot: bool = False,
        cot: bool = False,
        subject: str = "operating_system",
        max_seq_len: int = 2048,
)

Source from the content-addressed store, hash-verified

81
82
83def main(
84 ckpt_dir: str,
85 param_size: int = 13,
86 ntrain: int = 5,
87 few_shot: bool = False,
88 cot: bool = False,
89 subject: str = "operating_system",
90 max_seq_len: int = 2048,
91):
92 evaluator = load(
93 ckpt_dir,
94 param_size=param_size,
95 ntrain=ntrain,
96 max_seq_len=max_seq_len
97 )
98
99 subject_name = subject
100 run_date = time.strftime('%Y-%m-%d_%H-%M-%S', time.localtime(time.time()))
101 save_result_dir = os.path.join(
102 r"logs", f"LLaMA_{param_size}{'_CoT' if cot else ''}_{run_date}")
103 os.makedirs(save_result_dir, exist_ok=True)
104
105 local_rank, _ = setup_model_parallel()
106 if local_rank == 0:
107 print(f"Start evaluating {subject_name}")
108
109 val_file_path = os.path.join('data/val', f'{subject_name}_val.csv')
110 val_df = pd.read_csv(val_file_path)
111
112 if few_shot:
113 dev_file_path = os.path.join('data/dev', f'{subject_name}_dev.csv')
114 dev_df = pd.read_csv(dev_file_path)
115 correct_ratio = evaluator.eval_subject(
116 subject_name,
117 val_df,
118 dev_df,
119 few_shot=few_shot,
120 save_result_dir=save_result_dir,
121 cot=cot,
122 **generate_args
123 )
124 else:
125 correct_ratio = evaluator.eval_subject(
126 subject_name,
127 val_df,
128 save_result_dir=save_result_dir,
129 cot=cot,
130 **generate_args
131 )
132
133 if local_rank == 0:
134 print("Acc:", correct_ratio)
135
136
137if __name__ == "__main__":

Callers

nothing calls this directly

Calls 3

loadFunction · 0.85
setup_model_parallelFunction · 0.85
eval_subjectMethod · 0.45

Tested by

no test coverage detected