• 使用python对PDF文件进行等页数分割


    用到了pyPDF库,很简单的脚步,废话不多说了。直接上代码

     1 # coding:utf8
     2 import os
     3 from pyPdf import PdfFileWriter, PdfFileReader
     4 def split(pdf_file, delta, output_dir):
     5     if not os.path.exists(output_dir):
     6         os.makedirs(output_dir)
     7     if not os.path.exists(pdf_file):
     8         return
     9     input_stream = file(pdf_file, 'rb')
    10     pdf_input = PdfFileReader(input_stream)
    11     page_count = pdf_input.getNumPages()
    12     sum_page_count = int(page_count / (delta * 1.0))
    13     remind_page = page_count % delta
    14     for i in range(0, sum_page_count + 1):
    15         start = i * delta
    16         end = (i + 1) * delta 
    17         pdf_out = PdfFileWriter()
    18         file_path = os.path.join(output_dir, os.path.split(pdf_file)[1]) #
    19         if i < sum_page_count:
    20             file_path = os.path.join(output_dir, str(start + 1) + '-' + str(end) + ".pdf")
    21             for j in range(start, end):
    22                 page = pdf_input.getPage(j)
    23                 pdf_out.addPage(page)
    24         else:
    25             file_path = os.path.join(output_dir, str(delta * sum_page_count + 1) + '-' + str(page_count) + ".pdf")
    26             for j in range(delta * (sum_page_count), page_count):
    27                 page = pdf_input.getPage(j)
    28                 pdf_out.addPage(page)
    29         out_stream = file(file_path, 'wb')
    30         pdf_out.write(out_stream)
    31         out_stream.close()
    32     input_stream.close()
    33 
    34 if __name__ == '__main__':
    35     import sys
    36     #split(u'C:/Users/sky/Desktop/17.pdf', 50, u'C:/Users/sky/Desktop/RES')
    37     try:
    38         pdf_path = sys.argv[1]
    39         page_count = int(sys.argv[2])
    40         out_dir = sys.argv[3]
    41         split(pdf_path, page_count, out_dir)
    42     except:
    43         pass
    44         
    45         
  • 相关阅读:
    pycharm的集成vim
    几款在线脑图制作工具
    编辑器vim简介
    常用服务器ftp、ssh
    56. Merge Intervals
    58. Length of Last Word
    55. Jump Game
    53. Maximum Subarray
    52. N-Queens II
    51. N-Queens
  • 原文地址:https://www.cnblogs.com/AllStarGIS/p/5397370.html
Copyright © 2020-2023  润新知