More languages
Some test text!
More languages
Sample Python code for using Apryse SDK to copy pages from one document to another, delete and rearrange pages, and use ImportPages() method for very efficient copy and merge operations. Learn more about our Python PDF Library and PDF Editing & Manipulation Library.
Get Started Samples DownloadTo run this sample, get started with a free trial of Apryse SDK.
#---------------------------------------------------------------------------------------
# Copyright (c) 2001-2023 by Apryse Software Inc. All Rights Reserved.
# Consult LICENSE.txt regarding license information.
#---------------------------------------------------------------------------------------
import site
site.addsitedir("../../../PDFNetC/Lib")
import sys
from PDFNetPython import *
sys.path.append("../../LicenseKey/PYTHON")
from LicenseKey import *
def main():
PDFNet.Initialize(LicenseKey)
# Relative path to the folder containing the test files.
input_path = "../../TestFiles/"
output_path = "../../TestFiles/Output/"
# Sample 1 - Split a PDF document into multiple pages
print("_______________________________________________")
print("Sample 1 - Split a PDF document into multiple pages...")
print("Opening the input pdf...")
in_doc=PDFDoc(input_path + "newsletter.pdf")
in_doc.InitSecurityHandler()
page_num = in_doc.GetPageCount()
i = 1
while i<=page_num:
new_doc=PDFDoc()
new_doc.InsertPages(0, in_doc, i, i, PDFDoc.e_none)
new_doc.Save(output_path + "newsletter_split_page_" + str(i) + ".pdf", SDFDoc.e_remove_unused)
print("Done. Result saved in newsletter_split_page_" + str(i) + ".pdf")
new_doc.Close()
i = i + 1
# Close the open document to free up document memory sooner than waiting for the
# garbage collector
in_doc.Close()
# Sample 2 - Merge several PDF documents into one
print("_______________________________________________")
print("Sample 2 - Merge several PDF documents into one...")
new_doc=PDFDoc()
new_doc.InitSecurityHandler()
page_num = 15
i = 1
while i <= page_num:
print("Opening newsletter_split_page_" + str(i) + ".pdf")
in_doc=PDFDoc(output_path + "newsletter_split_page_" + str(i) + ".pdf")
new_doc.InsertPages(i, in_doc, 1, in_doc.GetPageCount(), PDFDoc.e_none)
in_doc.Close()
i = i + 1
new_doc.Save(output_path + "newsletter_merge_pages.pdf", SDFDoc.e_remove_unused)
print("Done. Result saved in newsletter_merge_pages.pdf");
# Close the open document to free up document memory sooner than waiting for the
# garbage collector
in_doc.Close()
# Sample 3 - Delete every second page
print("_______________________________________________")
print("Sample 3 - Delete every second page...")
print("Opening the input pdf...")
in_doc = PDFDoc(input_path + "newsletter.pdf")
in_doc.InitSecurityHandler();
page_num = in_doc.GetPageCount()
while page_num >= 1:
itr = in_doc.GetPageIterator(page_num)
in_doc.PageRemove(itr)
page_num = page_num - 2
in_doc.Save(output_path + "newsletter_page_remove.pdf", 0)
print("Done. Result saved in newsletter_page_remove.pdf...")
# Close the open document to free up document memory sooner than waiting for the
# garbage collector
in_doc.Close()
# Sample 4 - Inserts a page from one document at different
# locations within another document
print("_______________________________________________")
print("Sample 4 - Insert a page at different locations...")
print("Opening the input pdf...")
in1_doc = PDFDoc(input_path + "newsletter.pdf")
in1_doc.InitSecurityHandler()
in2_doc = PDFDoc(input_path + "fish.pdf")
in2_doc.InitSecurityHandler()
src_page = in2_doc.GetPageIterator()
dst_page = in1_doc.GetPageIterator()
page_num = 1
while dst_page.HasNext():
if page_num % 3 == 0:
in1_doc.PageInsert(dst_page, src_page.Current())
page_num = page_num + 1
dst_page.Next()
in1_doc.Save(output_path + "newsletter_page_insert.pdf", 0)
print("Done. Result saved in newsletter_page_insert.pdf...")
# Close the open document to free up document memory sooner than waiting for the
# garbage collector
in1_doc.Close()
in2_doc.Close()
# Sample 5 - Replicate pages within a single document
print("_______________________________________________")
print("Sample 5 - Replicate pages within a single document...")
print("Opening the input pdf...")
doc = PDFDoc(input_path + "newsletter.pdf")
doc.InitSecurityHandler()
# Replicate the cover page three times (copy page #1 and place it before the
# seventh page in the document page sequence)
cover = doc.GetPage(1)
p7 = doc.GetPageIterator(7)
doc.PageInsert(p7, cover)
doc.PageInsert(p7, cover)
doc.PageInsert(p7, cover)
# Replicate the cover page two more times by placing it before and after
# existing pages.
doc.PagePushFront(cover);
doc.PagePushBack(cover)
doc.Save(output_path + "newsletter_page_clone.pdf", 0)
print("Done. Result saved in newsletter_page_clone.pdf...")
doc.Close()
# Sample 6 - Use ImportPages() in order to copy multiple pages at once
# in order to preserve shared resources between pages (e.g. images, fonts,
# colorspaces, etc.)
print("_______________________________________________")
print("Sample 6 - Preserving shared resources using ImportPages...")
print("Opening the input pdf...")
in_doc = PDFDoc(input_path + "newsletter.pdf")
in_doc.InitSecurityHandler()
new_doc = PDFDoc()
copy_pages = VectorPage()
itr = in_doc.GetPageIterator()
while itr.HasNext():
copy_pages.push_back(itr.Current())
itr.Next()
imported_pages = new_doc.ImportPages(copy_pages)
i = iter(imported_pages)
for x in i:
new_doc.PagePushFront(x) # Order pages in reverse order.
# Use PagePushBack() if you would like to preserve the same order.
new_doc.Save(output_path + "newsletter_import_pages.pdf", 0)
# Close the open document to free up document memory sooner than waiting for the
# garbage collector
in_doc.Close()
new_doc.Close()
PDFNet.Terminate()
print("Done. Result saved in newsletter_import_pages.pdf...\n")
print("Note that the output file size is less than half the size")
print("of the file produced using individual page copy operations")
print("between two documents")
if __name__ == '__main__':
main()