oss-fuzz-gen/pipeline.py at main · google/oss-fuzz-gen · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
# Copyright 2025 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""The fuzzing main pipeline."""
import argparse
from typing import Optional

import logger
from agent.base_agent import BaseAgent
from results import AnalysisResult, BuildResult, Result, RunResult, TrialResult
from stage.analysis_stage import AnalysisStage
from stage.execution_stage import ExecutionStage
from stage.writing_stage import WritingStage


class Pipeline:
  """The fuzzing main pipeline, consisting of three iterative stages:
    1. Writing stage generates or refines the fuzz target and its associated
       build script to improve code coverage and enhance bug-finding
       capabilities for the function under test.
    2. Execution stage assesses the fuzz target's performance by measuring
       code coverage and detecting runtime crashes.
    3. Analysis stage examines the results from the execution stage, extracting
       insights from the coverage and crash data to suggest improvements for the
       writing stage in the next iteration.

  Attributes:
    args: The parsed command-line arguments shared with every stage.
    trial: The trial number, used for the trial logger and the stages.
    logger: The trial-specific logger.
    writing_stage: The stage executed first in every cycle.
    execution_stage: The stage executed second in every cycle.
    analysis_stage: The stage executed last in every cycle.
    max_cycle_count: The maximum number of cycles executed by `execute`.
  """

  def __init__(self,
               args: argparse.Namespace,
               trial: int,
               writing_stage_agents: Optional[list[BaseAgent]] = None,
               execution_stage_agents: Optional[list[BaseAgent]] = None,
               analysis_stage_agents: Optional[list[BaseAgent]] = None):
    """Creates the three stages and the trial logger.

    Args:
      args: The parsed command-line arguments, forwarded to each stage.
      trial: The trial number, forwarded to the logger and each stage.
      writing_stage_agents: Agents forwarded to the writing stage.
      execution_stage_agents: Agents forwarded to the execution stage.
      analysis_stage_agents: Agents forwarded to the analysis stage.
    """
    self.args = args
    self.trial = trial
    self.logger = logger.get_trial_logger(trial=trial)
    self.logger.debug('Pipeline Initialized')
    self.writing_stage: WritingStage = WritingStage(args, trial,
                                                    writing_stage_agents)
    self.execution_stage: ExecutionStage = ExecutionStage(
        args, trial, execution_stage_agents)
    self.analysis_stage: AnalysisStage = AnalysisStage(args, trial,
                                                       analysis_stage_agents)
    self.max_cycle_count = 5

  def _terminate(self, result_history: list[Result], cycle_count: int) -> bool:
    """Validates if the termination conditions have been satisfied.

    Args:
      result_history: The results produced so far; only the last entry is
        inspected (the whole list is logged).
      cycle_count: The number of cycles completed so far; 0 before the first
        cycle.

    Returns:
      True if no further cycle should be executed, False otherwise.
    """
    # Always execute at least one cycle.
    if not cycle_count:
      return False

    # `cycle_count` cycles have already completed at this point, so stop as
    # soon as it reaches the cap. A strict `>` would let one extra cycle run.
    if cycle_count >= self.max_cycle_count:
      self.logger.info('[Cycle %d] Terminate after %d cycles: %s', cycle_count,
                       self.max_cycle_count, result_history)
      return True

    last_result = result_history[-1]

    # If this is a result from the build stage that shows it failed, then
    # we should terminate as we don't know how to progress.
    if isinstance(last_result, BuildResult) and not last_result.success:
      self.logger.debug('[Cycle %d] Last result is failed BuildResult: %s',
                        cycle_count, last_result)
      return True

    # If the latest result is not from the analysis stage, then we should
    # terminate, as it indicates an error from the execution stage.
    if not isinstance(last_result, AnalysisResult):
      self.logger.warning('[Cycle %d] Last result is not AnalysisResult: %s',
                          cycle_count, result_history)
      return True

    # If the analysis stage succeeded, our work is done and we terminate.
    if last_result.success:
      self.logger.info('[Cycle %d] Generation succeeds: %s', cycle_count,
                       result_history)
      return True

    # If the analysis stage failed then we should not terminate but rather
    # continue trying to generate a new fuzz harness/build set up.
    self.logger.info('[Cycle %d] Generation continues: %s', cycle_count,
                     result_history)
    return False

  def _update_status(self,
                     result_history: list[Result],
                     finished: bool = False) -> None:
    """Writes the current trial status through the trial logger.

    Wraps the history in a `TrialResult` (benchmark and work dirs are taken
    from the last result) and writes it to the status directory of the trial's
    best result.

    Args:
      result_history: The results produced so far; must not be empty.
      finished: Forwarded to the logger's `write_result`.
    """
    trial_result = TrialResult(benchmark=result_history[-1].benchmark,
                               trial=self.trial,
                               work_dirs=result_history[-1].work_dirs,
                               result_history=result_history)
    self.logger.write_result(
        result_status_dir=trial_result.best_result.work_dirs.status,
        result=trial_result,
        finished=finished)

  def _execute_one_cycle(self, result_history: list[Result],
                         cycle_count: int) -> None:
    """Executes the stages once.

    Each stage's result is appended to `result_history` in place. The cycle
    returns early when a stage does not yield the expected kind of result.

    Args:
      result_history: The results produced so far; extended in place.
      cycle_count: The 1-based number of the current cycle.
    """
    self.logger.info('[Cycle %d] Initial result is %s', cycle_count,
                     result_history[-1])
    # Writing stage: We expect a build result that succeeds from this stage,
    # and if it fails then we will return from this cycle and terminate
    # the pipeline.
    result_history.append(
        self.writing_stage.execute(result_history=result_history,
                                   cycle_count=cycle_count))
    self._update_status(result_history=result_history)
    if (not isinstance(result_history[-1], BuildResult) or
        not result_history[-1].success):
      self.logger.warning('[Cycle %d] Build failure, skipping the rest steps',
                          cycle_count)
      return

    # Execution stage: We expect a run result that has a log path from this
    # stage, and if it fails then we will return from this cycle and terminate
    # the pipeline.
    result_history.append(
        self.execution_stage.execute(result_history=result_history,
                                     cycle_count=cycle_count))
    self._update_status(result_history=result_history)
    if (not isinstance(result_history[-1], RunResult) or
        not result_history[-1].log_path):
      self.logger.warning('[Cycle %d] Run failure, skipping the rest steps',
                          cycle_count)
      return

    # Analysis stage: We expect an analysis result from this stage. If the
    # analysis result from this stage fails, then we will continue the
    # pipeline and retry making a harness. If the analysis stage is successful,
    # then we will terminate the pipeline.
    result_history.append(
        self.analysis_stage.execute(result_history=result_history,
                                    cycle_count=cycle_count))
    # TODO(maoyi): add the indicator for the success of analysis stage
    # Note: unlike the two stages above, the status is only written once the
    # result is known to be an AnalysisResult.
    if not isinstance(result_history[-1], AnalysisResult):
      self.logger.warning(
          '[Cycle %d] Analysis failure, skipping the rest steps', cycle_count)
      return
    self._update_status(result_history=result_history)
    self.logger.info('[Cycle %d] Analysis result %s: %s', cycle_count,
                     result_history[-1].success, result_history[-1])

  def execute(self, result_history: list[Result]) -> list[Result]:
    """
    Runs the fuzzing pipeline iteratively to assess and refine the fuzz target.
    1. Writing Stage refines the fuzz target and its build script using insights
    from the previous cycle.
    2. Execution Stage measures the performance of the revised fuzz target.
    3. Analysis Stage examines the execution results to guide the next cycle's
    improvements.
    The process repeats until the termination conditions are met.

    Args:
      result_history: The initial results; must not be empty. The list is
        extended in place with every stage result.

    Returns:
      The same `result_history` list, including all results appended by the
      executed cycles.
    """
    self.logger.debug('Pipeline starts')
    cycle_count = 0
    self._update_status(result_history=result_history)
    while not self._terminate(result_history=result_history,
                              cycle_count=cycle_count):
      cycle_count += 1
      self._execute_one_cycle(result_history=result_history,
                              cycle_count=cycle_count)
    return result_history