File: parse_fuzzer.cc

package info (click to toggle)
chromium 139.0.7258.127-1
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 6,122,068 kB
  • sloc: cpp: 35,100,771; ansic: 7,163,530; javascript: 4,103,002; python: 1,436,920; asm: 946,517; xml: 746,709; pascal: 187,653; perl: 88,691; sh: 88,436; objc: 79,953; sql: 51,488; cs: 44,583; fortran: 24,137; makefile: 22,147; tcl: 15,277; php: 13,980; yacc: 8,984; ruby: 7,485; awk: 3,720; lisp: 3,096; lex: 1,327; ada: 727; jsp: 228; sed: 36
file content (83 lines) | stat: -rw-r--r-- 2,818 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
// Copyright 2021 The Chromium Authors
// Use of this source code is governed by an MIT-style license that can be
// found in the LICENSE file.

#include "third_party/liburlpattern/parse.h"

#include <stddef.h>
#include <stdint.h>

#include <optional>
#include <string>
#include <string_view>

#include "base/check.h"
#include "base/check_op.h"
#include "base/containers/span.h"
#include "base/logging.h"
#include "base/strings/strcat.h"
#include "base/strings/string_util.h"
#include "base/types/expected.h"
#include "third_party/abseil-cpp/absl/status/status.h"
#include "third_party/abseil-cpp/absl/strings/str_format.h"
#include "third_party/liburlpattern/pattern.h"

namespace liburlpattern {
namespace {
// Returns an owned copy of `input`, unchanged. Used as the callback handed to
// `Parse()` in `ParseAndCanonicalize()`; it never produces an error.
base::expected<std::string, absl::Status> PassThrough(std::string_view input) {
  return std::string(input.begin(), input.end());
}

std::optional<std::string> ParseAndCanonicalize(std::string_view s) {
  base::expected<Pattern, absl::Status> pattern = Parse(s, &PassThrough);
  if (!pattern.has_value()) {
    LOG(INFO) << "Parse failed with status: " << pattern.error();
    return std::nullopt;
  }
  return pattern->GeneratePatternString();
}

// Builds a three-line dump of `data` for diagnostic messages:
//   line 1: `label`
//   line 2: each byte as a character, right-aligned in a 4-column cell
//           (" [?]" is used for bytes that are not printable ASCII)
//   line 3: each byte as two hex digits, also in a 4-column cell
// so that the character and hex rows line up column by column.
std::string FancyHexDump(std::string_view label, std::string_view data) {
  std::string glyph_row;
  std::string hex_row;
  for (const char byte : data) {
    if (base::IsAsciiPrintable(byte)) {
      glyph_row += absl::StrFormat("%4c", byte);
    } else {
      glyph_row += " [?]";
    }
    hex_row += absl::StrFormat("  %02x", byte);
  }
  return base::StrCat({label, "\n", glyph_row, "\n", hex_row});
}

// Process-wide fuzzer setup; all work happens in the constructor.
struct Environment {
  Environment() {
    // Set the minimum log level to INFO (presumably so the LOG(INFO) parse
    // failure messages in this file are emitted).
    logging::SetMinLogLevel(logging::LOGGING_INFO);
  }
};
}  // namespace

// libFuzzer entry point. Treats the `size` bytes at `data` as a pattern
// string, canonicalizes it, and checks that canonicalizing the result a second
// time yields the same string. Always returns 0; violations of the property
// are reported through CHECK failures.
extern "C" int LLVMFuzzerTestOneInput(const uint8_t* data, size_t size) {
  // Constructed once, on the first invocation.
  static Environment env;

  // Copy `data` into a string of our own so that ASAN can catch OOB accesses.
  const std::string input(reinterpret_cast<const char*>(data), size);

  const std::optional<std::string> first_pass = ParseAndCanonicalize(input);
  if (!first_pass.has_value()) {
    // Inputs that do not parse have nothing further to verify.
    return 0;
  }

  // `Pattern::GeneratePatternString()` is supposed to emit canonical strings,
  // so feeding one of its outputs back through `ParseAndCanonicalize()` must
  // succeed and must reproduce it exactly. In other words, `first_pass` has to
  // be a fixed point of `ParseAndCanonicalize()`.
  const std::optional<std::string> second_pass =
      ParseAndCanonicalize(*first_pass);
  CHECK(second_pass.has_value())
      << "Failed to parse canonical pattern from original input.\n"
      << FancyHexDump("original : ", input) << "\n"
      << FancyHexDump("canonical: ", *first_pass);

  CHECK_EQ(*first_pass, *second_pass)
      << "Canonical pattern and its recanonicalization are not equal.\n"
      << FancyHexDump("canonical : ", *first_pass) << "\n"
      << FancyHexDump("canonical2: ", *second_pass);
  return 0;
}
}  // namespace liburlpattern