# AutoSafeCoder/main.py (SecureAIAutonomyLab/AutoSafeCoder)

from executor_agent_safe import FResult, execute_fuzz
from programmer_agent import ProgrammerAgent
from tester_fuzz_agent import TesterFuzzAgent
from fuzz_agent import InputMutatorAgent
from executor_static import ExecutorStaticAgent
from datasets import load_dataset
import json
import os
import gzip

class MultiAgentSystem:
    """Drive one dataset entry through code generation, static review and fuzzing.

    The pipeline implemented by :meth:`run` is:

    1. the programmer agent writes code for the entry;
    2. the static-analysis agent reviews it, with a bounded number of repair
       rounds when the result is not ``FResult.SAFE``;
    3. the fuzzing agent produces initial inputs, which are executed and then
       mutated for a number of iterations;
    4. inputs that made the code fail are fed back to the programmer agent,
       again for a bounded number of repair rounds;
    5. one JSON object describing the outcome is appended to the results file.
    """

    # File that receives one JSON object per line for every processed entry.
    RESULTS_FILE = "results.json"
    # Upper bound on repair rounds, used for both static and fuzzing feedback.
    MAX_REPAIR_ATTEMPTS = 4

    def __init__(self, entry):
        """Create the agents for ``entry``.

        Args:
            entry: Dataset record. ``run`` reads ``entry['ID']``; the record is
                also passed unchanged to each agent constructor.
        """
        # Keep the entry on the instance so ``run`` does not depend on a
        # module-level variable named ``entry`` existing in the caller.
        self.entry = entry
        self.programmer_agent = ProgrammerAgent(entry)
        self.tester_fuzz_agent = TesterFuzzAgent(entry)
        self.executor_static = ExecutorStaticAgent(entry)
        self.code = None
        self.test_inputs = None

    def run(self, iterations=120):
        """Run the full pipeline for this entry and append its result record.

        Args:
            iterations: Maximum number of execute-and-mutate fuzzing rounds.

        Returns:
            None. The outcome is written as one JSON line to ``RESULTS_FILE``.
        """
        # Step 1: Programmer writes code
        self.code = self.programmer_agent.write_code()
        print(f"Programmer's Code:\n{self.code}")

        # Fields accumulated here are written first in the result record.
        record = {'ID': self.entry['ID']}

        # Step 2: Static analyzer agent reviews code
        static_analysis_status = self._review_statically()
        print(f"Programmer's Code after static analysis changes:\n{self.code}")

        # Step 3: Fuzzing agent generates initial test inputs
        test_inputs_list = []
        self.test_inputs = self.tester_fuzz_agent.generate_test_inputs()
        if not self.test_inputs:
            # Without inputs there is nothing to execute, so dynamic testing
            # is skipped and the record is written immediately.
            self._append_result({
                **record,
                "code": self.code,
                "fuzzing_inputs": test_inputs_list,
                "unit_test_status": "no unit tests",
                "static_analysis_status": static_analysis_status,
                "fuzzing_test_status": "No inputs created",
            })
            return
        test_inputs_list.append(self.test_inputs)
        print(f"Initial Test Inputs:\n{self.test_inputs}")

        # Step 4: Execute and mutate in a loop for the given number of iterations
        failed_inputs_fuzz, fuzzing_test_status = self._fuzz(iterations, test_inputs_list)

        # Step 5: If errors were found in fuzzing, give feedback to coder to fix
        if failed_inputs_fuzz:
            record['initial_failed_inputs'] = failed_inputs_fuzz[:5]
            record['code_before_fuzz_fix'] = self.code
            fuzzing_test_status = self._repair_fuzz_failures(failed_inputs_fuzz)
        elif fuzzing_test_status is None:
            fuzzing_test_status = 'success'
            print(f"No errors encountered in {iterations} iterations.")

        # Step 6: Save the results (code, fuzzing inputs used, static and
        # fuzzing testing status) in the results file
        self._append_result({
            **record,
            "code": self.code,
            "fuzzing_inputs": test_inputs_list,
            "unit_test_status": "no unit tests",
            "static_analysis_status": static_analysis_status,
            "fuzzing_test_status": fuzzing_test_status,
        })
        print("Tasks saved to results.json")

    def _append_result(self, task):
        """Append ``task`` as one JSON line to ``RESULTS_FILE``."""
        # Append mode creates the file when it is missing, so no separate
        # existence check is needed.
        with open(self.RESULTS_FILE, 'a') as f:
            json.dump(task, f)
            f.write("\n")  # one JSON object per line

    def _review_statically(self):
        """Run static analysis on ``self.code``, asking for repairs if needed.

        Returns:
            ``'success'`` when the first analysis is safe, ``'fixed N'`` when
            repair round ``N`` made it safe, otherwise ``'fail: <description>'``
            with the last error description.
        """
        result, error_description = self.executor_static.execute_static_analysis_gpt(self.code)

        print('result')
        print(result)
        if result.name == FResult.SAFE.name:
            return 'success'

        for attempt in range(1, self.MAX_REPAIR_ATTEMPTS + 1):
            self.code = self.programmer_agent.write_code_feedback_static(self.code, error_description, "")
            result, error_description = self.executor_static.execute_static_analysis_gpt(self.code)
            if result.name == FResult.SAFE.name:
                return f'fixed {attempt}'
            print(f'error feedback:{error_description}')
        return f'fail: {error_description}'

    def _fuzz(self, iterations, test_inputs_list):
        """Execute ``self.code`` on the current inputs, mutating them each round.

        Every mutated input set is appended to ``test_inputs_list`` in place.

        Returns:
            A ``(failures, status)`` pair. ``failures`` is a list of
            ``{'inputs': ..., 'result': ...}`` dicts for runs that did not
            pass; ``status`` is ``None`` unless the loop stopped early for an
            execution error, a missing module, or the reliability guard.
        """
        failures = []
        status = None
        for iteration in range(iterations):
            print(f"\nIteration {iteration + 1}")

            # Step 4a: Executor runs the code with current inputs
            try:
                result, passed, inputs, functionname = execute_fuzz(self.code, self.test_inputs, 3)
            except Exception as e:
                print("exception code", self.code)
                print(e)
                status = "error running function"
                break
            print(f"Execution Feedback:\n{result}")

            if not passed:
                # Environment problems are not defects in the generated code,
                # so they end fuzzing instead of being recorded as failures.
                if "No module named" in result:
                    status = f"module missing: {result}"
                    break
                if "No root path can be found for the provided module 'builtins'" in result:
                    status = "prevent run by reliability_guard"
                    break
                failures.append({'inputs': inputs, 'result': result})
                if len(failures) > 10:
                    break

            mutator_agent = InputMutatorAgent(inputs, self.code, functionname)
            self.test_inputs = mutator_agent.mutate_inputs()
            test_inputs_list.append(self.test_inputs)
            print(f"Mutated Inputs:\n{self.test_inputs}")
        return failures, status

    def _repair_fuzz_failures(self, failed_inputs_fuzz):
        """Ask the programmer agent to fix failures and re-test the failing inputs.

        Args:
            failed_inputs_fuzz: Non-empty list of ``{'inputs', 'result'}`` dicts
                collected during fuzzing.

        Returns:
            ``'fixed N'`` when every recorded input passes after round ``N``,
            ``'error running function'`` when re-execution raises, otherwise
            ``'fail'``.
        """
        for attempt in range(1, self.MAX_REPAIR_ATTEMPTS + 1):
            print(f"will try to fix code from fuzz try {attempt}")
            self.code = self.programmer_agent.write_code_feedback_fuzz(self.code, failed_inputs_fuzz[:5])
            print(f"code changed in fuzz {attempt}")
            print(self.code)

            still_failing = []
            for failure in failed_inputs_fuzz:
                try:
                    # Re-run the code with the recorded failing inputs (not the
                    # latest mutated inputs) to see if the problem is fixed.
                    # NOTE(review): assumes the inputs returned by execute_fuzz
                    # are accepted back as its second argument - confirm.
                    result, passed, _, _ = execute_fuzz(self.code, failure['inputs'], 3)
                except Exception as e:
                    print("exception code", self.code)
                    print(e)
                    # Stop here so the error is not later reported as "fixed".
                    return "error running function"
                if not passed:
                    # Keep the record shape flat across repair rounds.
                    still_failing.append({'inputs': failure['inputs'], 'result': result})

            if not still_failing:
                return f'fixed {attempt}'
            failed_inputs_fuzz = still_failing
        return 'fail'

def read_dataset_jsonl(file_path):
    """Read a JSON Lines file into a list of parsed objects.

    Args:
        file_path: Path of a UTF-8 text file holding one JSON document per line.

    Returns:
        A list with one parsed object per non-blank line, in file order.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If a non-blank line is not valid JSON.
    """
    with open(file_path, 'r', encoding='utf-8') as f:
        # Blank lines (for example a trailing newline at end of file) are
        # skipped rather than handed to json.loads, which would reject them.
        return [json.loads(line) for line in f if line.strip()]


if __name__ == "__main__":

    #Human eval dataset
    #dataset = load_dataset("openai_humaneval",split="test")
    #dataset = [entry for entry in dataset]

    #Path to your local humaneval.jsonl.gz file
    #local_file = "./local_humaneval.gz"

    #Function to read the dataset from the compressed jsonl.gz file
    # def read_humaneval_dataset(file_path):
    #    dataset = []
    #    with gzip.open(file_path, 'rt', encoding='utf-8') as f:
    #        for line in f:
    #            dataset.append(json.loads(line))
    #    return dataset

    # Load the dataset
    #dataset = read_humaneval_dataset(local_file)

    #Security Eval dataset
    local_file_jsonl = "./dataset copy.jsonl"

    # Load the dataset
    dataset = read_dataset_jsonl(local_file_jsonl)

    # The loop stays at module level with the variable named ``entry`` in case
    # other code in this module looks that name up as a global.
    for entry in dataset:
        system = MultiAgentSystem(entry)
        system.run()