kokoro-aya/pdf_extract.py

## 0 main.py → pdf_extract.py

    
            0
            
          
  main.py → pdf_extract.py

  
              Show comments
            

   View file


            File renamed without changes.
          

## 47 changes: 47 additions & 0 deletions main.py
@@ -0,0 +1,47 @@

    from argparse import ArgumentParser
from argparse import ArgumentParser

    from PyPDF2 import PdfFileReader, PdfWriter
from PyPDF2 import PdfFileReader, PdfWriter


    def main():
def main():
    """Extract a range of pages from a PDF file into a new PDF file.

    Command-line arguments (all positional):
        input:  path of the PDF file to read.
        output: path of the PDF file to write.
        start:  integer index of the first page to copy.
        to:     integer index at which copying stops; this page itself is
                not copied, because the pages are selected with
                ``range(start, to)``.

    The indices are handed unchanged to ``pdf.getPage``.

    Raises:
        ValueError: If ``start`` or ``to`` is negative, if ``start`` is
            greater than ``to``, or if either one is greater than the number
            of pages in the input file.
    """
    parser = ArgumentParser(
        prog="A simple PDF page extractor",
        description="A simple PDF page extractor",
        epilog="Text at the bottom for help",
    )
    parser.add_argument("input")
    parser.add_argument("output")
    # Let argparse do the integer conversion so that a non-numeric value is
    # reported as a usage error instead of an uncaught traceback.
    parser.add_argument("start", type=int)
    parser.add_argument("to", type=int)
    args = parser.parse_args()

    start = args.start
    to = args.to

    # Validate the requested range before touching any file. A bare string
    # cannot be raised in Python 3, so a real exception type is used.
    if start < 0 or to < 0:
        raise ValueError("Starting and ending page must be a natural number.")
    if start > to:
        raise ValueError("Starting page must be smaller than ending page.")

    with open(args.input, 'rb') as reader:
        pdf = PdfFileReader(reader)
        page_num = pdf.getNumPages()

        if start > page_num or to > page_num:
            raise ValueError(
                f"Either the starting page or ending page is out of range of the file pages. "
                f"The file has {page_num} pages."
            )

        pdf_out = PdfWriter()
        for i in range(start, to):
            pdf_out.addPage(pdf.getPage(i))

        # Write while the input file is still open, and pass an explicit
        # binary stream rather than a path string.
        with open(args.output, 'wb') as writer:
            pdf_out.write(writer)

    print("Extraction finished.")


    if __name__ == '__main__':
if __name__ == '__main__':
    # Run the command-line tool only when this file is executed as a script,
    # not when it is imported as a module.
    main()