File: extract-doc-tarball-from-upstream

package info (click to toggle)
gcc-12-doc 12.2.0-1
  • links: PTS, VCS
  • area: non-free
  • in suites: bookworm, forky, sid, trixie
  • size: 26,004 kB
  • sloc: perl: 479; python: 301; makefile: 239; cpp: 17
file content (82 lines) | stat: -rw-r--r-- 2,420 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
#!/usr/bin/env python3

# Copyright (c) 2012 Samuel Bronson
# Copyright (c) 2012, 2014, 2015, 2017 GUO Yixuan
#
# Made available under the "expat" license, which follows:
#
# Permission is hereby granted, free of charge, to any person obtaining
# a copy of this software and associated documentation files (the
# "Software"), to deal in the Software without restriction, including
# without limitation the rights to use, copy, modify, merge, publish,
# distribute, sublicense, and/or sell copies of the Software, and to
# permit persons to whom the Software is furnished to do so, subject to
# the following conditions:
#
# The above copyright notice and this permission notice shall be included
# in all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.

import sys
import tarfile
import re
import posixpath
from pprint import pprint


# Compression of the output tarball: "xz" or "gz".
outtype = "xz"

# Paths, relative to the top-level directory of the upstream tarball,
# that are copied into the documentation tarball.
pat_s = r"""
  ^.*\.(7|texi|rst|texinfo)$
| ^gcc/ada/(xgnatugn\.adb|ug_words)$
| ^gcc/ada/doc/
| ^contrib/texi2pod\.pl$
"""
pat = re.compile(pat_s, re.VERBOSE)


def extract_docs(infn, pkg, ver, compression=outtype):
    """Copy the documentation files of an upstream tarball into a new one.

    Every regular file in *infn* whose path (with the leading top-level
    directory removed) matches ``pat`` is written to
    ``<pkg>_<ver>.orig.tar.<compression>`` in the current directory,
    re-rooted under ``<pkg>-<ver>.orig/``.  The new path of each copied
    member is printed to stdout.

    Args:
        infn: path of the input tarball (any compression tarfile can
            read as a stream).
        pkg: package name used in the output file and directory names.
        ver: version string used in the output file and directory names.
        compression: compression suffix handed to tarfile's ``w:`` mode.

    Returns:
        The name of the tarball that was written.
    """
    # output filename
    outfn = '%s_%s.orig.tar.%s' % (pkg, ver, compression)

    # directory that the output tarball would extract to
    # (the prefix in the tarball)
    outdir = '%s-%s.orig' % (pkg, ver)

    # 'r|*' reads the input as a forward-only stream, so each member's
    # data has to be consumed before moving on to the next member.
    with tarfile.open(infn, 'r|*') as intar, \
            tarfile.open(name=outfn, mode='w:' + compression) as outtar:
        for member in intar:
            if not member.isreg():
                continue

            # Strip the top-level directory; a regular file that is not
            # inside any directory has nothing to strip and is skipped.
            _, sep, path = member.name.partition('/')
            if not sep:
                continue

            if not pat.search(path):
                continue

            outpath = posixpath.join(outdir, path)
            print(outpath)

            mf = intar.extractfile(member)
            member.name = outpath
            # A "path" pax header read from the input would take priority
            # over the new name when the member is written in pax format.
            member.pax_headers.pop('path', None)
            outtar.addfile(member, mf)

    return outfn


def main(argv=None):
    """Command-line entry point; returns the process exit status.

    Expects exactly three arguments after the program name: the input
    tarball, the package name and the version.  Anything else prints the
    usage message to stderr and returns 1.
    """
    if argv is None:
        argv = sys.argv

    try:
        infn, pkg, ver = argv[1:]
    except ValueError:
        print("usage: %s gcc-X.Y.Z.tar.(gz|bz2) gcc-X.Y-doc X.Y.Z[.mumble]" % argv[0],
              file=sys.stderr)
        return 1

    extract_docs(infn, pkg, ver)
    return 0


if __name__ == '__main__':
    sys.exit(main())