File: validate.py

package info (click to toggle)
dacco 2021.01.01-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, bullseye, forky, sid, trixie
  • size: 11,000 kB
  • sloc: python: 56; makefile: 2
file content (81 lines) | stat: -rwxr-xr-x 2,215 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
#!/usr/bin/env python3

import argparse
import glob
import os
import subprocess
import sys


def print_buffered_reader(buffered_reader):
    """Print every line of a binary stream and return how many were printed.

    Each line is decoded as UTF-8 and stripped of trailing whitespace
    (including the line terminator) before being written to stdout.
    """
    raw_lines = buffered_reader.readlines()
    for raw_line in raw_lines:
        text = raw_line.decode('utf-8')
        print(text.rstrip())

    return len(raw_lines)


def validate_file(dtd_path, file_path, *, verbose):
    """Validate one file against a DTD by running ``xmllint``.

    Runs ``xmllint --noout --dtdvalid <dtd_path> <file_path>`` and reports
    whether it exited with status 0.

    Args:
        dtd_path: Path of the DTD handed to ``--dtdvalid``.
        file_path: Path of the file to validate.
        verbose: When true, everything xmllint wrote to its stdout and then
            to its stderr is echoed on this process's stdout.

    Returns:
        True if xmllint exited with return code 0, False otherwise.

    Raises:
        SystemExit: With code 2 when the ``xmllint`` executable cannot be
            found; an explanatory message is written to stderr first.
    """
    # Local import: only needed to replay the captured output below.
    import io

    xmllint_bin = 'xmllint'
    try:
        # subprocess.run() drains stdout and stderr concurrently. Reading one
        # pipe to EOF before the other can deadlock once the child fills the
        # unread pipe's buffer.
        result = subprocess.run(
            [xmllint_bin, '--noout', '--dtdvalid', dtd_path, file_path],
            stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    except FileNotFoundError:
        # `file=` is required; a bare positional sys.stderr would just be
        # printed as a second value on stdout.
        print(
            f'{xmllint_bin} needs to be available in the path. In Debian based systems is available in the package "libxml2-utils"',
            file=sys.stderr)
        sys.exit(2)

    if verbose:
        print_buffered_reader(io.BytesIO(result.stdout))
        print_buffered_reader(io.BytesIO(result.stderr))

    return result.returncode == 0


def validate_directory(dtd_path, directory_path):
    """Validate every entry matched by ``<directory_path>/*`` against the DTD.

    Entries are processed in sorted order. One status line is printed per
    entry, followed by the total number of entries checked and the number
    that failed validation. Nothing is returned.
    """
    pattern = os.path.join(directory_path, '*')

    checked = 0
    failures = 0
    for entry in sorted(glob.glob(pattern)):
        is_valid = validate_file(dtd_path, entry, verbose=False)
        print(f'{entry} valid {is_valid}')

        checked += 1
        if not is_valid:
            failures += 1

    print('Total files:', checked)
    print('Invalid files:', failures)


def validate(dtd_path, path):
    """Validate ``path`` (a file or a directory) against the DTD at ``dtd_path``.

    Exits with status 1 when ``dtd_path`` is not an existing file, and with
    status 2 when ``path`` is neither a file nor a directory. A single file
    is validated verbosely and its result printed; a directory is handed to
    ``validate_directory``.
    """
    dtd_exists = os.path.isfile(dtd_path)
    if not dtd_exists:
        print(f'Make sure that {dtd_path} is a DTD file')
        sys.exit(1)

    if os.path.isfile(path):
        outcome = validate_file(dtd_path, path, verbose=True)
        print('File is valid:', outcome)
        return

    if os.path.isdir(path):
        validate_directory(dtd_path, path)
        return

    print(f'Make sure that {path} is a file or directory')
    sys.exit(2)


if __name__ == '__main__':
    # Command-line entry point: takes the DTD and the file or directory to check.
    cli = argparse.ArgumentParser(
        description='Validates a file or a directory using the DTD',
    )
    cli.add_argument('dtd_file', help='DTD file to validate against it')
    cli.add_argument('path', help='File or directory to validate')

    options = cli.parse_args()
    validate(options.dtd_file, options.path)