-
Notifications
You must be signed in to change notification settings - Fork 110
/
pdfdecompress
executable file
·97 lines (74 loc) · 2.35 KB
/
pdfdecompress
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
#!/usr/bin/env ruby
=begin
= Info
Uncompresses all binary streams of a PDF document.
= License
Copyright (C) 2016 Guillaume Delugré.
Origami is free software: you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
Origami is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public License
along with Origami. If not, see <http://www.gnu.org/licenses/>.
=end
begin
require 'origami'
rescue LoadError
$: << File.join(__dir__, '../lib')
require 'origami'
end
include Origami
require 'optparse'
#
# Command-line option handling for the pdfdecompress tool.
#
class OptParser
  # Usage text shown at the top of the help message. It lists only the
  # switches that are actually registered in OptParser.parser, so that the
  # help output never advertises an option that parse! would reject.
  BANNER = <<USAGE
Usage: #{$0} [<PDF-file>] [-o <output-file>]
Uncompresses all binary streams of a PDF document.
Bug reports or feature requests at: http://github.com/gdelugre/origami
Options:
USAGE

  # Builds the OptionParser for this tool.
  #
  # options:: Hash that receives parsed values; -o/--output stores its
  #           argument under the :output key.
  #
  # Returns the configured OptionParser. The -h/--help switch prints the
  # usage text and terminates the process.
  def self.parser(options)
    OptionParser.new do |opts|
      opts.banner = BANNER

      opts.on("-o", "--output FILE", "Output PDF file (stdout by default)") do |o|
        options[:output] = o
      end

      opts.on_tail("-h", "--help", "Show this message") do
        puts opts
        exit
      end
    end
  end

  # Parses +args+ in place: recognized switches are removed from +args+ and
  # any positional arguments are left behind for the caller.
  #
  # Returns the options Hash; :output defaults to STDOUT when -o is absent.
  # Raises the OptionParser errors produced by parse! on unknown switches.
  def self.parse(args)
    options = { output: STDOUT }
    parser(options).parse!(args)
    options
  end
end
# Script entry point: read a PDF from the first positional argument (or from
# stdin when none is given), replace the encoded payload of its streams with
# their decoded data, and save the document to the selected output.
begin
  options = OptParser.parse(ARGV)

  # After option parsing only positional arguments remain in ARGV.
  source = ARGV.shift || STDIN

  document = PDF.read(source, verbosity: Parser::VERBOSE_QUIET)

  # Streams using any of these filters are left untouched.
  # NOTE(review): these are the PDF image codecs (JPEG 2000, JPEG, JBIG2);
  # presumably skipped so image data stays in a usable form - confirm.
  skipped_filters = %i[JPXDecode DCTDecode JBIG2Decode]

  # Collect the streams first so the document is not modified while it is
  # still being enumerated.
  streams = document.each_object.select { |object| object.is_a?(Stream) }

  streams.each do |stream|
    next if stream.filters.any? { |filter| skipped_filters.include?(filter.value) }

    # Store the decoded data as the stream body and drop the filter entry
    # that no longer applies to it.
    stream.encoded_data = stream.data
    stream.dictionary.delete(:Filter)
  end

  document.save(options[:output], noindent: true)
rescue => error
  # Print the backtrace first, then exit with the error summary.
  STDERR.puts error.backtrace.join($/)
  abort "#{error.class}: #{error.message}"
end