google · maoyixie · Nov 7, 2024 · Nov 7, 2024 · Nov 7, 2024 · Nov 7, 2024
diff --git a/agent/crash_analyzer.py b/agent/crash_analyzer.py
@@ -14,8 +14,199 @@
 """An LLM agent to analyze and provide insight of a fuzz target's runtime crash.
 Use it as a usual module locally, or as script in cloud builds.
 """
+import os
+import shutil
+import subprocess as sp
+from typing import Optional
+
+import logger
 from agent.base_agent import BaseAgent
+from experiment import evaluator as evaluator_lib
+from experiment.workdir import WorkDirs
+from llm_toolkit import prompt_builder
+from llm_toolkit.prompts import Prompt
+from results import CrashResult, Result, RunResult
+from tool.container_tool import ProjectContainerTool
+from tool.lldb_tool import LLDBTool
+
+MAX_ROUND = 100  # execute() ends its chat loop once cur_round reaches this.
 
 
 class CrashAnalyzer(BaseAgent):
-  pass
+  """The Agent to analyze a runtime crash and provide insight to fuzz target."""
+
+  def _initial_prompt(self, results: list[Result]) -> Prompt:
+    """Builds the first prompt from the most recent entry of |results|."""
+    latest = results[-1]
+
+    # Anything other than a RunResult is logged and answered with the
+    # builder's build([]) output instead of a crash analyzer prompt.
+    if not isinstance(latest, RunResult):
+      logger.error("Expected a RunResult object in results list",
+                   trial=self.trial)
+      return prompt_builder.CrashAnalyzerTemplateBuilder(self.llm).build([])
+
+    builder = prompt_builder.CrashAnalyzerTemplateBuilder(
+        model=self.llm, benchmark=latest.benchmark)
+    return builder.build_crash_analyzer_prompt(latest.benchmark,
+                                               latest.fuzz_target_source,
+                                               latest.run_error,
+                                               latest.crash_func)
+
+  def _format_lldb_execution_result(
+      self,
+      process: sp.CompletedProcess,
+      previous_prompt: Optional[Prompt] = None) -> str:
+    """Renders the outcome of an lldb command as tagged prompt text."""
+    # The existing prompt text is handed to truncate_prompt with each stream.
+    history = previous_prompt.get() if previous_prompt else ''
+    stdout = self.llm.truncate_prompt(process.stdout, history).strip()
+    stderr = self.llm.truncate_prompt(process.stderr,
+                                      stdout + history).strip()
+    sections = (
+        f'<lldb>\n{process.args}\n</lldb>\n',
+        f'<return code>\n{process.returncode}\n</return code>\n',
+        f'<stdout>\n{stdout}\n</stdout>\n',
+        f'<stderr>\n{stderr}\n</stderr>\n',
+    )
+    return ''.join(sections)
+
+  def _container_handle_lldb_command(self, response: str, tool: LLDBTool,
+                                     prompt: Prompt) -> Prompt:
+    """Runs each lldb command in |response|; appends outputs to |prompt|."""
+    for command in self._parse_tags(response, 'lldb'):
+      # Append only this command's output; accumulating would duplicate it.
+      process = tool.execute_in_screen(command)
+      prompt.append(
+          self._format_lldb_execution_result(process, prompt) + '\n')
+    return prompt
+
+  def _container_handle_conclusion(self, cur_round: int, response: str,
+                                   crash_result: CrashResult) -> None:
+    """Stores the LLM's verdict and its insight on |crash_result|."""
+    logger.info('----- ROUND %02d Received conclusion -----', cur_round,
+                trial=self.trial)
+
+    conclusion = self._parse_tag(response, 'conclusion')
+    blames_driver = conclusion == 'Crash is caused by bug in fuzz driver.'
+    blames_project = conclusion == 'Crash is caused by bug in project.'
+    # Any other wording leaves |true_bug| untouched and is reported.
+    if blames_driver or blames_project:
+      crash_result.true_bug = blames_project
+    else:
+      logger.error('***** Failed to match conclusion in %02d rounds *****',
+                   cur_round,
+                   trial=self.trial)
+
+    crash_result.insight = self._parse_tag(response, 'analysis and suggestion')
+    if not crash_result.insight:
+      logger.error('Round %02d No analysis and suggestion in conclusion: %s',
+                   cur_round,
+                   response,
+                   trial=self.trial)
+
+  def _container_tool_reaction(self, cur_round: int, response: str,
+                               crash_result: CrashResult) -> Optional[Prompt]:
+    """Records a conclusion, or runs requested commands for the next prompt."""
+    if self._parse_tag(response, 'conclusion'):
+      self._container_handle_conclusion(cur_round, response, crash_result)
+      return None
+    next_prompt = prompt_builder.CrashAnalyzerTemplateBuilder(
+        self.llm, None).build([])
+    if self._parse_tag(response, 'lldb'):
+      return self._container_handle_lldb_command(response, self.analyze_tool,
+                                                 next_prompt)
+    if self._parse_tag(response, 'bash'):
+      return self._container_handle_bash_command(response, self.check_tool,
+                                                 next_prompt)
+    return None
+
+  def _copy_cloud_artifact(self, artifact_path: str) -> None:
+    """Copies the same-named file in /workspace to |artifact_path|."""
+    source_path = f'/workspace/{os.path.basename(artifact_path)}'
+    if not os.path.exists(source_path):
+      logger.warning('Unable to find artifact_path in cloud build: %s',
+                     source_path, trial=self.trial)
+      return
+
+    # Create the destination directory first; it may not exist yet.
+    os.makedirs(os.path.dirname(artifact_path), exist_ok=True)
+    shutil.copyfile(source_path, artifact_path)
+    logger.info('Copied artifact from %s to %s',
+                source_path,
+                artifact_path,
+                trial=self.trial)
+
+  def execute(self, result_history: list[Result]) -> CrashResult:
+    """Runs the lldb-assisted crash analysis for the last result in history."""
+    WorkDirs(self.args.work_dirs.base)
+    last_result = result_history[-1]
+    benchmark = last_result.benchmark
+    logger.info('Executing Crash Analyzer', trial=self.trial)
+    assert isinstance(last_result, RunResult)
+
+    if self.args.cloud_experiment_name:
+      self._copy_cloud_artifact(last_result.artifact_path)
+
+    # TODO(dongge): Move these to oss_fuzz_checkout.
+    generated_target_name = os.path.basename(benchmark.target_path)
+    sample_id = os.path.splitext(generated_target_name)[0]
+    generated_oss_fuzz_project = evaluator_lib.rectify_docker_tag(
+        f'{benchmark.id}-{sample_id}-lldb-{self.trial:02d}')
+
+    # TODO(dongge): Write to OSS-Fuzz project dir files directly.
+    fuzz_target_path = os.path.join(last_result.work_dirs.fuzz_targets,
+                                    f'{self.trial:02d}.fuzz_target')
+    with open(fuzz_target_path, 'w') as ft_file:
+      ft_file.write(last_result.fuzz_target_source)
+    if last_result.build_script_source:
+      build_script_path = os.path.join(last_result.work_dirs.fuzz_targets,
+                                       f'{self.trial:02d}.build_script')
+      with open(build_script_path, 'w') as bs_file:
+        bs_file.write(last_result.build_script_source)
+    else:
+      build_script_path = ''
+
+    evaluator_lib.Evaluator.create_ossfuzz_project_with_lldb(
+        benchmark, generated_oss_fuzz_project, fuzz_target_path, last_result,
+        build_script_path, last_result.artifact_path)
+
+    self.analyze_tool = LLDBTool(benchmark,
+                                 result=last_result,
+                                 name='lldb',
+                                 project_name=generated_oss_fuzz_project)
+    self.analyze_tool.execute('compile > /dev/null')
+    # Start lldb in a detached screen session (quotes must be balanced).
+    self.analyze_tool.execute("screen -dmS lldb_session bash -c 'lldb'")
+    self.check_tool = ProjectContainerTool(
+        benchmark, name='check', project_name=generated_oss_fuzz_project)
+    self.check_tool.compile(extra_commands=' && rm -rf /out/* > /dev/null')
+    prompt = self._initial_prompt(result_history)
+    prompt.add_problem(self.analyze_tool.tutorial())
+    prompt.add_problem(self.check_tool.tutorial())
+    crash_result = CrashResult(benchmark=benchmark,
+                               trial=last_result.trial,
+                               work_dirs=last_result.work_dirs,
+                               author=self,
+                               chat_history={self.name: ''})
+    cur_round = 1
+    try:
+      client = self.llm.get_chat_client(model=self.llm.get_model())
+      # Chat until no follow-up prompt is produced or the rounds run out.
+      while prompt and cur_round < MAX_ROUND:
+        response = self.chat_llm(cur_round=cur_round,
+                                 client=client,
+                                 prompt=prompt,
+                                 trial=self.trial)
+        prompt = self._container_tool_reaction(cur_round, response,
+                                               crash_result)
+        cur_round += 1
+        self._sleep_random_duration(trial=self.trial)
+    finally:
+      # Cleanup: terminate both tools so neither is left running.
+      logger.debug('Stopping the crash analyze container %s',
+                   self.analyze_tool.container_id, trial=self.trial)
+      self.analyze_tool.terminate()
+      self.check_tool.terminate()
+
+    return crash_result
diff --git a/common/cloud_builder.py b/common/cloud_builder.py
@@ -32,7 +32,7 @@
 
 import utils
 from agent.base_agent import BaseAgent
-from results import Result
+from results import Result, RunResult
 
 OF_REPO = 'https://github.com/google/oss-fuzz.git'
 OFG_ROOT_DIR = os.path.abspath(os.path.dirname(os.path.dirname(__file__)))
@@ -107,12 +107,12 @@ def _prepare_and_upload_archive(self) -> str:
       return self._upload_to_gcs(archive_path)
 
   def _request_cloud_build(self, ofg_repo_url: str, agent_dill_url: str,
-                           results_dill_url: str,
+                           results_dill_url: str, artifact_url: str,
                            new_result_filename: str) -> str:
     """Requests Cloud Build to execute the operation."""
     cloud_build_config = {
         'steps': [
-            # Step 1: Download the dill files from GCS bucket.
+            # Step 1: Download the dill and artifact files from GCS bucket.
             {
                 'name': 'bash',
                 'dir': '/workspace',
@@ -128,6 +128,16 @@ def _request_cloud_build(self, ofg_repo_url: str, agent_dill_url: str,
                 'dir': '/workspace',
                 'args': ['cp', results_dill_url, 'dills/result_history.pkl']
             },
+            {
+                'name': 'gcr.io/cloud-builders/gsutil',
+                'dir': '/workspace',
+                'args': [
+                    'cp', artifact_url,
+                    f'/workspace/{os.path.basename(artifact_url)}'
+                ],
+                # artifact_url only exists in crash analyzer.
+                'allowFailure': True,
+            },
             # Step 2: Prepare OFG and OF repos.
             {
                 'name':
@@ -196,7 +206,7 @@ def _request_cloud_build(self, ofg_repo_url: str, agent_dill_url: str,
                     '/workspace/dills/new_result.pkl'
                 ],
             },
-            # Step 4: Upload the result to GCS bucket
+            # Step 6: Upload the result to GCS bucket
             {
                 'name': 'bash',
                 'dir': '/workspace',
@@ -309,11 +319,15 @@ def run(self, agent: BaseAgent, result_history: list[Result],
     ofg_url = self._prepare_and_upload_archive()
     agent_url = self._upload_to_gcs(agent_dill)
     results_url = self._upload_to_gcs(results_dill)
+    last_result = result_history[-1]
+    artifact_url = 'ARTIFACT_URL DOES NOT EXISTS'
+    if isinstance(last_result, RunResult) and last_result.artifact_path:
+      artifact_url = self._upload_to_gcs(last_result.artifact_path)
 
     # Step 3: Request Cloud Build.
     new_result_filename = f'{uuid.uuid4().hex}.pkl'
     build_id = self._request_cloud_build(ofg_url, agent_url, results_url,
-                                         new_result_filename)
+                                         artifact_url, new_result_filename)
 
     # Step 4: Download new result dill.
     cloud_build_log = ''
@@ -334,7 +348,7 @@ def run(self, agent: BaseAgent, result_history: list[Result],
 
     cloud_build_log += self._get_build_log(build_id)
 
-    # Step 4: Deserialize dilld file.
+    # Step 5: Deserialize the dill file.
     result = utils.deserialize_from_dill(new_result_dill)
     if not result:
       cloud_build_log += f'Failed to deserialize from dill {new_result_dill}.\n'