File: clean_json_attrs.py

package info (click to toggle)
chromium 120.0.6099.224-1~deb11u1
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 6,112,112 kB
  • sloc: cpp: 32,907,025; ansic: 8,148,123; javascript: 3,679,536; python: 2,031,248; asm: 959,718; java: 804,675; xml: 617,256; sh: 111,417; objc: 100,835; perl: 88,443; cs: 53,032; makefile: 29,579; fortran: 24,137; php: 21,162; tcl: 21,147; sql: 20,809; ruby: 17,735; pascal: 12,864; yacc: 8,045; lisp: 3,388; lex: 1,323; ada: 727; awk: 329; jsp: 267; csh: 117; exp: 43; sed: 37
file content (56 lines) | stat: -rwxr-xr-x 1,515 bytes parent folder | download | duplicates (11)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#!/usr/bin/env python

import json
import os
import re


def Clean(start_dir, attr_pattern, file_pattern):
  """Removes matching attributes from JSON files under a directory tree.

  Walks |start_dir| recursively. Each file whose name matches |file_pattern|
  is parsed as JSON (the top-level value must be an object), attributes whose
  key matches |attr_pattern| are deleted, and the file is rewritten with
  json.dumps() output only if something was actually removed.

  Notes on matching, as implemented:
    * Patterns are applied with re.search, so they match anywhere in the
      key / file name unless anchored.
    * A key whose value is a dict is never removed itself; its contents are
      cleaned recursively instead.
    * Dicts nested inside lists are not visited.

  Args:
    start_dir: Directory to start scanning from.
    attr_pattern: Regex of attribute keys to remove.
    file_pattern: Regex of file names to clean.

  Returns:
    True if at least one file was rewritten, False otherwise.
  """
  cleaned = False

  def _remove_attrs(json_dict, attr_pattern):
    """Deletes matching keys from |json_dict| in place.

    Returns True if any key was removed at this level or below.
    """
    assert isinstance(json_dict, dict)

    removed = False

    # Iterate over a snapshot of the items: deleting from a dict while
    # iterating its live items() view raises RuntimeError on Python 3.
    for key, val in list(json_dict.items()):
      if isinstance(val, dict):
        # Dict values are recursed into; the key itself is kept even when it
        # matches the pattern.
        if _remove_attrs(val, attr_pattern):
          removed = True
      elif re.search(attr_pattern, key):
        del json_dict[key]
        removed = True

    return removed

  for root, _dirs, files in os.walk(start_dir):
    for name in files:
      if not re.search(file_pattern, name):
        continue

      path = os.path.join(root, name)
      # Close the read handle before the file is reopened for writing.
      with open(path) as old_contents:
        json_dict = json.loads(old_contents.read())
      if not _remove_attrs(json_dict, attr_pattern):
        # Nothing removed: leave the file untouched.
        continue

      with open(path, 'w') as new_contents:
        new_contents.write(json.dumps(json_dict))
      cleaned = True

  return cleaned


if __name__ == '__main__':
  import argparse
  import sys

  # Command-line entry point: two required regex options plus the directory
  # to scan, all forwarded unchanged to Clean().
  arg_parser = argparse.ArgumentParser(
      description='Recursively removes attributes from JSON files')
  arg_parser.add_argument(
      '--attr_pattern',
      type=str,
      required=True,
      help='A regex of attributes to remove')
  arg_parser.add_argument(
      '--file_pattern',
      type=str,
      required=True,
      help='A regex of files to clean')
  arg_parser.add_argument(
      'start_dir',
      type=str,
      help='A directory to start scanning')

  cli_argv = sys.argv[1:]
  options = arg_parser.parse_args(cli_argv)

  # The return value of Clean() is intentionally ignored here.
  Clean(
      start_dir=options.start_dir,
      attr_pattern=options.attr_pattern,
      file_pattern=options.file_pattern)