File: pdfmetadata

package info (click to toggle)
origami-pdf 2.1.0-1~exp2
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 1,444 kB
  • sloc: ruby: 17,883; makefile: 8
file content (124 lines) | stat: -rwxr-xr-x 3,115 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
#!/usr/bin/env ruby

=begin

= Info
    Prints out the metadata contained in a PDF document.

= License
    Copyright (C) 2016  Guillaume Delugré.

    Origami is free software: you can redistribute it and/or modify
    it under the terms of the GNU Lesser General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    Origami is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU Lesser General Public License for more details.

    You should have received a copy of the GNU Lesser General Public License
    along with Origami.  If not, see <http://www.gnu.org/licenses/>.

=end

begin
    require 'origami'
rescue LoadError
    $: << File.join(__dir__, '../lib')
    require 'origami'
end
include Origami

require 'colorize'
require 'optparse'

#
# Command-line option handling for the pdfmetadata tool.
#
# Thin wrapper around Ruby's OptionParser: +parser+ builds a parser that
# records the selected switches into a caller-supplied Hash, and +parse+
# runs that parser over an argument list and returns the resulting Hash.
#
class OptParser
    # Text printed at the top of the help message. OptionParser appends the
    # generated option summary after the "Options:" line. The synopsis lists
    # every switch the parser accepts (except -h).
    BANNER = <<USAGE
Usage: #{$0} [<PDF-file>] [-i] [-x] [-n]
Prints out the metadata contained in a PDF document.
Bug reports or feature requests at: http://github.com/gdelugre/origami

Options:
USAGE

    #
    # Builds the OptionParser for this tool.
    #
    # _options_:: Hash that the switch handlers write into:
    #             -i/--info     sets options[:doc_info] to true,
    #             -x/--xmp      sets options[:doc_stream] to true,
    #             -n/--no-color sets options[:disable_colors] to true.
    #
    # -h/--help prints the help text and exits the process.
    # Returns the configured OptionParser instance.
    #
    def self.parser(options)
        OptionParser.new do |opts|
            opts.banner = BANNER

            opts.on("-i", "--info", "Extracts document info metadata") do
                options[:doc_info] = true
            end

            opts.on("-x", "--xmp", "Extracts XMP document metadata stream") do
                options[:doc_stream] = true
            end

            opts.on("-n", "--no-color", "Turn off colorized output.") do
                options[:disable_colors] = true
            end

            opts.on_tail("-h", "--help", "Show this message") do
                puts opts
                exit
            end
        end
    end

    #
    # Parses _args_ and returns the options Hash.
    #
    # _args_:: Array of command-line arguments. It is modified in place:
    #          recognized switches are removed, so only the non-option
    #          arguments (e.g. the PDF file name) remain afterwards.
    #
    # The returned Hash always contains :disable_colors (false by default);
    # :doc_info and :doc_stream are present only when their switch was given.
    # Unknown switches make OptionParser raise an OptionParser::ParseError.
    #
    def self.parse(args)
        options =
        {
            disable_colors: false
        }

        # parse! (not parse) so the caller can pick the file name out of args.
        self.parser(options).parse!(args)

        options
    end
end

#
# Script body: parses the command line, reads the PDF (from the first
# remaining argument, or from standard input when there is none) and prints
# the requested metadata sections. Any StandardError raised along the way
# aborts the program with "<ExceptionClass>: <message>".
#
begin
    @options = OptParser.parse(ARGV)

    # Neither -i nor -x requested: show both kinds of metadata.
    if !@options[:doc_info] && !@options[:doc_stream]
        @options[:doc_info] = true
        @options[:doc_stream] = true
    end

    String.disable_colorization(@options[:disable_colors])

    # OptParser.parse has already stripped the switches from ARGV.
    source = ARGV.empty? ? STDIN : ARGV.shift
    read_options = { verbosity: Parser::VERBOSE_QUIET, lazy: true }

    pdf = PDF.read(source, read_options)

    if @options[:doc_info] && pdf.document_info?
        puts "[*] Document information dictionary:".magenta

        pdf.document_info.each_pair do |key, entry|
            resolved = entry.solve

            label = key.value.to_s.ljust(20).green
            print label

            # Prefer the UTF-8 rendering when the object offers one.
            text = resolved.respond_to?(:to_utf8) ? resolved.to_utf8 : resolved.value
            puts ": #{text}"
        end
        puts
    end

    if @options[:doc_stream] && pdf.metadata?
        puts "[*] Metadata stream:".magenta

        pdf.metadata.each_pair do |key, text|
            label = key.ljust(20).green
            print label
            puts ": #{text}"
        end
    end

rescue => error
    abort "#{error.class}: #{error.message}"
end