File: extract-doc-tarball-from-upstream

package info (click to toggle)
gcc-6-doc 6.3.0-1
  • links: PTS, VCS
  • area: non-free
  • in suites: stretch
  • size: 26,640 kB
  • ctags: 102
  • sloc: perl: 473; python: 291; makefile: 269; cpp: 17
file content (89 lines) | stat: -rw-r--r-- 2,561 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
#!/usr/bin/env python

# Copyright (c) 2012 Samuel Bronson
#
# Made available under the "expat" license, which follows:
#
# Permission is hereby granted, free of charge, to any person obtaining
# a copy of this software and associated documentation files (the
# "Software"), to deal in the Software without restriction, including
# without limitation the rights to use, copy, modify, merge, publish,
# distribute, sublicense, and/or sell copies of the Software, and to
# permit persons to whom the Software is furnished to do so, subject to
# the following conditions:
#
# The above copyright notice and this permission notice shall be included
# in all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.

import sys
import tarfile
import gzip
# Requires python-lzma for xz support.
import lzma
import re
import posixpath
from pprint import pprint


# Exactly three positional arguments are required: the upstream tarball to
# read, the package name (e.g. gcc-X.Y-doc) and the version string.
try:
    infn, pkg, ver = sys.argv[1:]
except ValueError:
    # Unpacking fails when the argument count is not three.  The usage
    # text is a diagnostic, so it goes to stderr rather than stdout, and
    # sys.exit() is used because the bare exit() helper is installed by
    # the site module and is not guaranteed to exist (e.g. `python -S`).
    sys.stderr.write(
        "usage: %s gcc-X.Y.Z.tar.(gz|bz2) gcc-X.Y-doc X.Y.Z[.mumble]\n"
        % sys.argv[0])
    sys.exit(1)

# Compression applied to the generated tarball: "xz" or "gz".
outtype = "xz"

# Name of the generated file: <pkg>_<ver>.orig.tar.<outtype>
outfn = '%s_%s.orig.tar.' % (pkg, ver) + outtype

# Top-level directory inside the generated tarball, i.e. the prefix
# placed in front of every member path that gets copied.
outdir = '%s-%s.orig' % (pkg, ver)

# Input side: read the upstream tarball as a forward-only stream ('r|*'),
# letting tarfile work out the compression by itself.
intar = tarfile.open(name=infn, mode='r|*', format=tarfile.PAX_FORMAT)

# Output side: first the compressed file object selected by outtype ...
if outtype != "gz":
    outtarball = lzma.LZMAFile(outfn, mode='wb', options={'format':'xz'})
else:
    # mtime=0 stores a zero timestamp in the gzip header -- presumably so
    # that repeated runs produce identical output.
    outtarball = gzip.GzipFile(filename=outfn, mode='wb', mtime=0)

# ... then an uncompressed tar writer layered on top of it.
outtar = tarfile.open(mode='w:tar', fileobj=outtarball)

# Selects the member paths (relative to the tarball's top-level directory)
# that are copied into the documentation tarball:
#   - any file ending in .7, .texi, .rst or .texinfo
#   - gcc/ada/xgnatugn.adb and gcc/ada/ug_words
#   - everything below gcc/ada/doc/
#   - contrib/texi2pod.pl
# The pattern is compiled with re.VERBOSE, so the whitespace and line
# breaks inside the string are layout only.  Literal dots in file names
# are escaped so that they do not match arbitrary characters.
pat_s = r"""
  ^.*\.(7|texi|rst|texinfo)$
| ^gcc/ada/(xgnatugn\.adb|ug_words)$
| ^gcc/ada/doc/
| ^contrib/texi2pod\.pl$
"""
pat = re.compile(pat_s, re.VERBOSE)

# Walk the input archive once, copying every wanted regular file into the
# output archive under the new top-level directory.
for member in intar:
    # Directories, links and other special entries are not copied.
    if not member.isreg():
        continue

    # Drop the first path component (the upstream top-level directory).
    _, sep, path = member.name.partition('/')
    if not sep:
        # A file sitting at the archive root has no top-level directory
        # to strip; skip it with a note instead of crashing on unpacking.
        sys.stderr.write(
            "skipping %s: not inside a top-level directory\n" % member.name)
        continue

    if not pat.search(path):
        continue

    outpath = posixpath.join(outdir, path)
    print(outpath)

    # Fetch the data handle before renaming; the member header is reused
    # for the output entry with only its name changed.
    mf = intar.extractfile(member)
    member.name = outpath
    outtar.addfile(member, mf)

# Shut everything down in order.  The tar writer has to be closed before
# the compressed file it writes into: closing it emits the end-of-archive
# blocks but leaves the underlying file object open.
for handle in (intar, outtar, outtarball):
    handle.close()