import
fitz
import
sys
import
os
# Path to the SimSun font collection file inside the Windows fonts directory.
# NOTE(review): nothing visible in this file reads this value; process_pdf
# passes fontname="china-ss" to insert_text instead. Confirm whether this
# constant is still needed before relying on it.
font_path = "C:/Windows/Fonts/simsun.ttc"
def _insert_beside(page, rects, value):
    """Write *value* next to each rectangle in *rects* on *page*.

    The text is anchored at the right edge of each rectangle (``x1``) and
    8 units above its bottom edge (``y1 - 8``), using the "china-ss" font
    at size 12.
    """
    for rect in rects:
        page.insert_text(
            (rect.x1, rect.y1 - 8),
            value,
            fontname="china-ss",
            fontsize=12,
        )


def process_pdf(input_pdf_path, output_pdf_path, name, class_info):
    """Strip specific images from a PDF and fill in the name/class fields.

    For every page of the input document:

    * every image whose entries at index 2 and 3 of the ``get_images``
      record (width and height per the PyMuPDF docs) equal 558x120 or
      215x219 is deleted;
    * ``name`` is written after each occurrence of the label "姓名:";
    * ``class_info`` is written after each occurrence of the label "班级:".

    The result is saved to ``output_pdf_path``.

    Args:
        input_pdf_path: Path of the PDF to read.
        output_pdf_path: Path the modified PDF is written to.
        name: Text inserted after each "姓名:" label.
        class_info: Text inserted after each "班级:" label.

    Raises:
        Whatever ``fitz`` raises when opening, editing or saving fails. The
        document is closed in every case.
    """
    # (width, height) pairs identifying the images to remove.
    removable_sizes = ((558, 120), (215, 219))

    # The context manager guarantees the document is closed even when a page
    # operation or the save itself raises.
    with fitz.open(input_pdf_path) as doc:
        for page in doc:
            for image in page.get_images(full=True):
                xref = image[0]
                if (image[2], image[3]) in removable_sizes:
                    page.delete_image(xref)

            name_rects = page.search_for("姓名:")
            # Diagnostic output: where the name label was found on this page.
            print(name_rects)
            _insert_beside(page, name_rects, name)

            # Searched only after the name has been inserted, matching the
            # original statement order.
            _insert_beside(page, page.search_for("班级:"), class_info)

        doc.save(output_pdf_path)
# Script entry point: takes exactly one command-line argument, the input PDF,
# and writes the processed copy next to it as "<input without ext>_output.pdf".
if __name__ == "__main__":
    if len(sys.argv) == 2:
        # Fixed values written after the name and class labels.
        name = "XXX"
        class_info = "一(3)班"

        input_pdf = sys.argv[1]
        # Drop the extension so the suffix is appended to the bare stem.
        file_name, _ = os.path.splitext(input_pdf)
        output_pdf = f"{file_name}_output.pdf"

        process_pdf(input_pdf, output_pdf, name, class_info)
    else:
        # Wrong argument count: show usage and exit with a failure status.
        print("Usage: python script.py <input_pdf>")
        sys.exit(1)