FairCoder/code_testcase.py at main · YongkDu/FairCoder · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
import transformers
from transformers import AutoTokenizer, GemmaTokenizer, AutoModelForCausalLM, set_seed
import torch
import json
import re
import os
import random
from tqdm import tqdm
from openai import OpenAI
from utils import get_model, get_prompt_testcase, API_KEY, REPEAT_T, TEST_DATA

root_path = os.path.dirname(__file__)
DEVICE = 'cuda:1'

def reorder_string(s):
    lines = s.strip().split('\n')
    # Keep the first two lines unchanged
    first_two_lines = lines[:2]
    # Randomly shuffle the rest of the lines
    remaining_lines = lines[2:]
    random.shuffle(remaining_lines)
    result = '\n'.join(first_two_lines + remaining_lines)

    return result

def write_data(file_name, topic, answer):
    data = {'topic': topic, 'answer':answer}
    with open(file_name, mode='a', newline='', encoding='utf-8') as file:
        json.dump(data, file)
        file.write('\n')


if __name__ == "__main__":
    data = TEST_DATA
    models = ['llama2', 'llama2-13b', 'codellama', 'codellama-13b', 'llama3', 'mistral', 'codegemma', 'qwen2', 'qwencoder','gpt-4o-mini', 'gpt-4o']

    for code_model in tqdm(models):

        for k,d in enumerate(data):

            topic = d['topic']
            category = d['cat']
            for code_type in ['code', 'code_form', 'code_pl', 'code_order']:
                code = d[code_type]

                folder_name = f'{root_path}/testcase/{code_model}/{category}/'
                write_file_name = folder_name + f'{topic}.jsonl'
                if not os.path.exists(folder_name):
                    os.makedirs(folder_name)

                for j in range(REPEAT_T):
                    # get question with random order
                    question = reorder_string(d['question'])
                    full_question = question + code
                    if code_model == 'codegemma':
                        full_question += 'Add some description about the test case.'
                    prompt = get_prompt_testcase(code_model, full_question)
                    if 'gpt' not in code_model:
                        # initialize model with random seed
                        seed = random.randint(0, 100)
                        set_seed(seed)
                        model, tokenizer = get_model(code_model, DEVICE)
                        if 'qwen' in code_model:
                            text = tokenizer.apply_chat_template(
                                prompt,
                                tokenize=False,
                                add_generation_prompt=True
                            )
                            input_ids = tokenizer([text], return_tensors="pt")["input_ids"].to(DEVICE)
                        else:
                            input_ids = tokenizer(prompt, return_tensors="pt")["input_ids"].to(DEVICE)
                        output = model.generate(
                            input_ids,
                            max_new_tokens=600,
                        )
                        output = output[0].to("cpu")
                        filling = tokenizer.decode(output[input_ids.shape[1]:], skip_special_tokens=True)
                    else:
                        client = OpenAI(api_key=API_KEY)
                        completion = client.chat.completions.create(
                            model=code_model,
                            messages=[
                                {"role": "system", "content": "You are a helpful agent."},
                                {
                                    "role": "user",
                                    "content": prompt
                                }
                            ]
                        )
                        filling = completion.choices[0].message.content
                    print(filling)
                    write_data(write_file_name, topic, filling)