-
Notifications
You must be signed in to change notification settings - Fork 25
Expand file tree
/
Copy pathpdf2random_text-example.py
More file actions
62 lines (51 loc) · 1.82 KB
/
pdf2random_text-example.py
File metadata and controls
62 lines (51 loc) · 1.82 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
from PyPDF2 import PdfFileWriter, PdfFileReader
import sys
# globals
if len(sys.argv) < 2:
pdffile = 'assets/fw9.pdf'
else:
pdffile = sys.argv[1]
output = PdfFileWriter()
input1 = PdfFileReader(open(pdffile, "rb"))
# print how many pages input1 has:
print("pdf has %d pages." % input1.getNumPages())
print(input1.getDocumentInfo())
print(input1.getXmpMetadata())
if input1.isEncrypted:
print('encrypted')
else:
print('not encrypted')
i = 4
content = ""
while i < 6:
texter = input1.getPage(i).extractText()
# print(texter)
i = i + 1
content += texter + "\n"
content = " ".join(content.replace("\xa0", " ").strip().split())
# add page 1 from input1 to output document, unchanged
output.addPage(input1.getPage(0))
# add page 2 from input1, but rotated clockwise 90 degrees
output.addPage(input1.getPage(1).rotateClockwise(90))
# add page 3 from input1, rotated the other way:
output.addPage(input1.getPage(2).rotateCounterClockwise(90))
# alt: output.addPage(input1.getPage(2).rotateClockwise(270))
# add page 4 from input1, but first add a watermark from another PDF:
page4 = input1.getPage(3)
watermark = PdfFileReader(open(pdffile, "rb"))
page4.mergePage(watermark.getPage(0))
output.addPage(page4)
# add page 5 from input1, but crop it to half size:
page5 = input1.getPage(4)
page5.mediaBox.upperRight = (
page5.mediaBox.getUpperRight_x() / 2,
page5.mediaBox.getUpperRight_y() / 2
)
output.addPage(page5)
# add some Javascript to launch the print window on opening this PDF.
# the password dialog may prevent the print dialog from being shown,
# comment the the encription lines, if that's the case, to try this out
output.addJS("this.print({bUI:true,bSilent:false,bShrinkToFit:true});")
# finally, write "output" to document-output.pdf
outputStream = open("PyPDF2-output.pdf", "wb")
output.write(outputStream)