Python convert примеры, docx2pdf.convert Python примеры использования

Пример #1

0

Показать файл

def main(event, context):
    for record in event['Records']:
        # get uploaded file name
        bucket = record['s3']['bucket']['name']
        key = unquote_plus(record['s3']['object']['key'])
        print(bucket)
        print(key)

        # create upload and download paths
        tmpkey = key.replace('/', '')
        tmp_download_path = '/tmp/{}{}'.format(uuid.uuid4(), tmpkey)
        tmp_converted_path = '/tmp/converted-{}'.format(tmpkey)
        tmp_split_path = '/tmp/split'
        os.mkdir(tmp_split_path)

        # Download file
        s3.download_file(bucket, key, tmp_download_path)

        # Convert file to pdf
        convert(tmp_download_path, tmp_converted_path)

        # Split PDF and upload new docs to staging area
        document = PdfFileReader(open(tmp_converted_path, "rb"))
        for i in range(document.numPages):
            output = PdfFileWriter()
            output.addPage(document.getPage(i))
            tmp_page_path = '{}/pdf-{}-{}'.format(tmp_split_path, i, tmpkey)
            with open(tmp_page_path, "wb") as outputStream:
                output.write(outputStream)
            new_key = key.replace('.docx', '/{}.pdf'.format(i))
            s3.upload_file(tmp_page_path, bucket,
                           new_key.replace('raw', 'staging'))

Пример #2

0

Показать файл

Файл: PrintQR.py Проект: androidRollin/QR-Code-Attendance-Registry-System

def QRstoPDF(path):
    doc = docx.Document()
    p = doc.add_paragraph()
    r = p.add_run()
    try:
        with open(path, "r") as csv_file:
            csv_reader = csv.reader(csv_file)
            next(csv_reader)
            count = 0
            for line in csv_reader:
                count += 1
                FileNameQR = "QRimages/" + line[0] + "QR.jpg"
                Section = line[2]
                r.add_picture(FileNameQR,
                              width=docx.shared.Inches(3),
                              height=docx.shared.Inches(3))
                if (count == 6):
                    p = doc.add_paragraph()
                    r = p.add_run()
                    count = 0
    except FileNotFoundError:
        print("FileNOtFound")

    pdfname = "C:/Users/ROLINE JOHN AGUILAR/Downloads/" + line[
        2] + "QRs" + ".pdf"
    wordname = "QRGenerated.docx"
    doc.save(wordname)

    convert(wordname, pdfname)
    os.remove(wordname)
    os.startfile(pdfname)
    os.remove("QRData.csv")

Пример #3

0

Показать файл

Файл: glopan.py Проект: mortenengen/glowing-pancake

def docx_to_pdf(docxfile: str):
    """Convert a DOCX file to PDF.

    Args:
        docxfile (str): The name of the DOCX file to convert.
    """
    docx2pdf.convert(docxfile)

Пример #4

0

Показать файл

 def slicing_original_documents_docx(self):
     # Convert the docx to a pdf
     self.docx_filepath = os.path.basename(self.filename)
     convert(self.docx_filepath)
     self.raw_filename = os.path.basename(self.filename)
     originaldoc_data12 = self.slicing_original_documents_pdf()
     return originaldoc_data12

Пример #5

0

Показать файл

Файл: pdf_miner.py Проект: nikitaschultz2i/pdf_comparison

def process_docx(path):
    convert(path)
    new_path = path.replace("docx", "pdf")
    print(new_path)
    output_string = process_pdf(new_path)
    os.remove(new_path)
    return output_string

Пример #6

0

Показать файл

Файл: bilago.py Проект: aklauritzen/bilago

def convert_docx_to_pdf(docx_file):
    convert(docx_file)

    # Delay to resolve a problem when converting small .docxfiles.
    time.sleep(1)

    temporary_docx_pdf_files.append(docx_file)

Пример #7

0

Показать файл

    def main(self):
        print(self.document_1.get_merge_fields())
        self.read_files()

        for n_idx, n_row in self.df_data.iterrows():
            dict = {
                "姓名": str(n_row['姓名']),
                "年龄": str(n_row['年龄']),
                "生日": str(n_row['生日']),
                "folder": 'folder1'
            }
            self.document_1.merge(**dict)

            file_path = self.path + 'xlsx/'
            if not os.path.exists(file_path):
                os.makedirs(file_path)

            file_docx = self.path + 'xlsx/' + n_row['姓名'] + '.docx'
            self.document_1.write(file_docx)
            # time.sleep(1)

            file_path = self.path + n_row['性别'] + '/'
            if not os.path.exists(file_path):
                os.makedirs(file_path)

            file_pdf = file_path + n_row['姓名'] + '.pdf'
            # file_pdf = self.path + 'pdfs/' + n_row['姓名'] + '.pdf'
            # self.generate_pdf(file_docx,file_pdf)
            convert(file_docx, file_pdf, keep_active=True)
        self.document_1.close()

Пример #8

0

Показать файл

def download_file(filename, pi_no):

    print(pi_no)
    x = requests.get(
        'http://151.80.237.86:1251/ords/zkt/pi_doc/doc?pi_no={}'.format(str(pi_no)))
    data = x.json()
    doc = DocxTemplate(
        "./{}".format(
            filename))

    pythoncom.CoInitialize()
    for x in data['items']:
        if x['pi_no'].strip() == '{}'.format(pi_no):  # 17865
            # pprint(x)
            doc.render(x)

# # time.sleep(1)

            file_stream = StringIO()
            doc.save('./static/file.docx')
            convert('./static/file.docx',
                    './static/file.pdf')
    flash("Your file has been created, Now you can download!!")

    return render_template('upload_file.html')

Пример #9

0

Показать файл

Файл: main2.py Проект: naazneen/Test

    def saveaspdf(self, parent, fname):

        from docx2pdf import convert

        #convert("input.docx")
        print(tx)
        convert(tx, tx + ".pdf")

Пример #10

0

Показать файл

Файл: convert.py Проект: OWASP/cornucopia

def convert_docx_to_pdf(docx_filename: str, output_pdf_filename: str) -> str:
    logging.debug(
        f" --- docx_file = {docx_filename}\n--- starting pdf conversion now.")
    fail: bool = False
    msg: str = ""
    if convert_vars.can_convert_to_pdf:
        # Use docx2pdf for windows and mac with MS Word installed
        try:
            docx2pdf.convert(docx_filename, output_pdf_filename)
        except Exception as e:
            msg = f"\nConvert error: {e}"
            fail = True
    else:
        fail = True
    if fail:
        msg = (
            "Error. A temporary docx file was created in the output folder but cannot be converted "
            f"to pdf (yet) on operating system: {sys.platform}\n"
            "This does work on Windows and Mac with MS Word installed.") + msg
        logging.warning(msg)
        return docx_filename

    # If not debugging then delete the temp file
    if not convert_vars.args.debug:
        os.remove(docx_filename)
    return output_pdf_filename

Пример #11

0

Показать файл

def openFile():
    global filez
    filez = askopenfilenames(title='Choose a file')
    if len(filez) != 0:
        for i in range(len(filez)):
            convert(filez[i])
    print('done')

Пример #12

0

Показать файл

Файл: doc_to_pdf.py Проект: hduzn/python_tools

def doc_to_pdf():
    # 文件位置
    path = r'C:\小现代化(1)'

    file_list = get_filelist(path)
    # print(file_list)

    # 定义空list,存放文件列表
    docx_files = []
    for file in file_list:
        if (file.endswith(".docx")):
            docx_files.append(file)
        elif (file.endswith(".doc")):
            docx_file = doc2docx(file)
            docx_files.append(docx_file)
    # print(docx_files)
    for docx in docx_files:
        print(docx)
    print('docx文件数：', len(docx_files))

    # 转换文件
    print('-----------------开始转换 docx 文件-----------------')
    for file in docx_files:
        print(file)
        #print(file.split('.docx')[0]+'.pdf')
        convert(file, file.split('.docx')[0] + '.pdf')

Пример #13

0

Показать файл

Файл: daily_pdf.py Проект: CleHou/COVID-19-Data-Analysis-Project

    def fill_template(self):
        context = self.var_template()

        path_to_template = os.path.normpath(
            f'{self.root}/src/pdf_creation/template.docx')
        template = DocxTemplate(path_to_template)

        template.render(context)

        date_str = self.date.strftime("%Y-%m-%d")
        year = self.date.strftime("%Y")
        month = self.date.strftime("%m - %B")

        #file_dir = f"{self.root}/reports/Daily_PDF/{year}/{month}"
        #file_name = f"First_page_{date_str}"
        file_dir = f"{self.root}/reports/Daily_PDF"
        file_name = "First_page"

        file_fct.creation_folder('', [file_dir])
        full_path = os.path.normcase(f'{file_dir}/{file_name}.docx')

        template.save(full_path)
        convert(full_path)
        os.remove(full_path)

        return os.path.normcase(f'{file_dir}/{file_name}.pdf')

Пример #14

0

Показать файл

Файл: views.py Проект: apotipak/hrms

def generate_contract_list(request, *args, **kwargs):

    base_url = MEDIA_ROOT + '/contract/template/'
    contract_number_from = kwargs['contract_number_from']
    contract_number_to = kwargs['contract_number_to']
    contract_status = kwargs['contract_status']
    contract_zone = kwargs['contract_zone']

    # now = datetime.datetime.now()
    # html = "<html><body>It is now %s.</body></html>" % now
    # return HttpResponse(html)

    template_name = base_url + 'CNT_ContractStatus.docx'
    file_name = "contract_list_report"

    context = {
        'customer': "TEST",
    }

    tpl = DocxTemplate(template_name)
    tpl.render(context)
    tpl.save(MEDIA_ROOT + '/contract/download/' + file_name + ".docx")

    # docx2pdf
    docx_file = path.abspath("media\\contract\\download\\" + file_name +
                             ".docx")
    pdf_file = path.abspath("media\\contract\\download\\" + file_name + ".pdf")
    convert(docx_file, pdf_file)

    return FileResponse(open(pdf_file, 'rb'), content_type='application/pdf')

Пример #15

0

Показать файл

def proses():

    rasma = asma.get()
    rref = ref.get()
    rttl = ttl.get()
    rttt= ttt.get()
    rprau = prau.get()
    rdowo = dowo.get()
    recdis=str(selhas())

    tpl = DocxTemplate('Python.docx')
    context = {1:{  "nama":"%s" %str(rasma),
                    "TTL":"%s" %str(rttl),
                    "ref":"Ref: CPA-2021-FTR-%s"%str(rref),
                    "TTT": "%s" %str(rttt),
                    "ecdis": "ECDIS Model %s" % str(recdis),
                    "ship":"Onboard %s" %str(rprau),
                    "dura": "%s" % str(rdowo)}
                }

    sref= str(rref)
    sasma = str(rasma)
    sprau = str(rprau)
    jenber = " "+ sref + " "+ sasma + " " + sprau

    tpl.render(context[1])
    tpl.save("CPA2021FTR%s.docx" %jenber)

    convert("CPA2021FTR%s.docx" %jenber, "C:/Users/QylaMeisya/Documents/Sertifikat Training Familiarrisasi ECDIS Photosop/sertfampy" )

    label = teka.Label(cen_ut, text="Sert. %s Selesai ! Input Entry lagi / Tutup Program !" %str(rasma))
    label.pack()

Пример #16

0

Показать файл

Файл: doc2pdf_variable_text.py Проект: diganthdr/python_bootcamp

def make_custom_report(input_map, template):

    #fill the template:
    replace_words_in_document(input_map, template)

    #convert to pdf.
    convert(TEMP_REPLACED_DOC, PDF_FILE_NAME)

Пример #17

0

Показать файл

def certificate(name, fio, date1, date2, choose):
    f = fio.split("\r\n")
    print(f)
    zipObj = ZipFile('sample.zip', 'w')
    if choose == "Base":
        for person in f:
            doc = DocxTemplate("Sertifikat_ryzhiiy2.docx")
            context = {
                'Program': name,
                'Name': person.rstrip(),
                'Date1': date1,
                'Date2': date2,
                'Choose': choose
            }
            doc.render(context)
            doc.save("{}_base.docx".format(person.rstrip()))
            convert("{}_base.docx".format(person.rstrip()))
            zipObj.write('{}_base.pdf'.format(person.rstrip()))

    else:
        for person in f:
            doc = DocxTemplate("Sertifikat_ryzhiiy2.docx")
            context = {
                'Program': name,
                'Name': person.rstrip(),
                'Date1': date1,
                'Date2': date2,
                'Choose': choose
            }
            doc.render(context)
            doc.save("{}_project.docx".format(person.rstrip()))
            convert("{}_project.docx".format(person.rstrip()))
            zipObj.write('{}_project.pdf'.format(person.rstrip()))

    zipObj.close()

Пример #18

0

Показать файл

def docxToPdf(inDir,file):
    convertDir = inDir+"/converted"
    if not os.path.exists(convertDir):
        os.makedirs(convertDir)
    opFileName = file.split(".")[0]+".pdf"
    convert(os.path.join(inDir, file), os.path.join(convertDir, opFileName))
    return os.path.join(convertDir, opFileName)

Пример #19

0

Показать файл

def word2pdf(files_path):
    """对于给定的文件夹，转换文件夹内所有docx文件为同名的pdf文件"""
    files = os.listdir(files_path)
    for f in files:
        if f.endswith('docx') and '转让登记表' in f:
            f_new = os.path.splitext(f)[0] + ".pdf"
            convert(os.path.join(files_path, f),
                    os.path.join(files_path, f_new))

Пример #20

0

Показать файл

Файл: 5.word文件批量转pdf.py Проект: hong96206/python

def convert_single(src_file, dst_file):
    """
    单个文件实现 word->pdf 转换
    :param src_file: 源文件 xxx.docx
    :param dst_file: 目标文件 xxx.pdf
    :return:
    """
    docx2pdf.convert(src_file, dst_file)

Пример #21

0

Показать файл

def convert_doc_to_pdf(doc_file):
    # Use a breakpoint in the code line below to debug your script.
    # Press Ctrl+F8 to toggle the breakpoint.
    filename, _ = os.path.splitext(doc_file)
    pdf_file = filename + '.pdf'
    docx2pdf.convert(doc_file, pdf_file)

    return pdf_file

Пример #22

0

Показать файл

Файл: MysticsCardFiller.py Проект: Jet170/MysticsCardFiller

def wordToPdf(requireDocPause):
    print("Converting from Word doc to pdf...")
    if (requireDocPause):
        input(
            "Please open " + outputDocName +
            ", save over the original output file, then close it and press enter"
        )
    convert(outputDocName, outputPDFName)

Пример #23

0

Показать файл

 def doc_pdf(self):
     """
     :return: converts document to pdf
     """
     if self.dst == "":
         convert(self.src)
     else:
         convert(self.src, self.dst)

Пример #24

0

Показать файл

def convert_pdf(input_dir="output/", output_dir="output_pdf/"):
    """
    docxファイルの保存されたフォルダを指定して、フォルダ格納データを全てpdfにして、指定フォルダに保存する
    :param input_dir: dir_name, default:output/,  outputフォルダを利用
    :param output_dir: dir_name, default:output_pdf/, output_pdfフォルダを利用
    :return: output_pdfフォルダにoutputフォルダのpdfが全て保存される
    """
    convert(input_dir, output_dir)

Пример #25

0

Показать файл

Файл: main.py Проект: lrbeauty/pdfgenerator

def making_a_doc_function(request):
    #plot from uploaded data now need to make chart from live data that has been uploaded to the site. this will be done by either doing pandas crunching all over again to get the numbers that you want or by reading numbers tht have already been put in one of the tables. most ikley a combination of both

    doc = docx.Document()
    pk = 3
    if not saf_defect_table.objects.filter(
            pk=pk).exists():  #this accesses the saf_defect_table
        doc.add_heading("no text")
        doc.save('thisisdoc.docx')
    else:
        saf_defect_table_variable = saf_defect_table.objects.get(pk=pk)

        doc.add_heading(str(saf_defect_table_variable.saf_number_in_table))
        doc.add_heading(str(saf_defect_table_variable.defect_number_in_table))

        #making a plot from a csv file that was uploaded to DB table
        if FileUpload.objects.filter(
                attribution_file_upload='pftest4.csv').exists():
            life3 = pd.read_csv(
                FileUpload.objects.get(attribution_file_upload='pftest4.csv').
                attribution_file_upload)
            life3.plot(kind='bar', x='status', y='item')
            plt.title('my plot title')
            plt.xlabel('years')
            plt.ylabel('Age')
            memfile = io.BytesIO(
            )  #this is needed in order to save the file to a temporary memory section
            plt.savefig(memfile)
            doc.add_picture(memfile, width=Inches(4))
            memfile.close()
            plt.clf()  #this shuts down the plot so then you can make a new.

        #making a plot out of numbers that are already stored in saf defect table DB table
        y1 = saf_defect_table_variable.saf_number_in_table
        y2 = saf_defect_table_variable.defect_number_in_table
        korea_scores = (y1, y2)
        col_count = 2
        bar_width = .2
        index = np.arange(col_count)
        plt.barh(index, korea_scores, bar_width, alpha=.4, label="Korea")
        memfile2 = io.BytesIO()
        plt.savefig(memfile2)
        doc.add_picture(memfile2, width=Inches(4))
        memfile2.close()

    doc.save('thisisdoc.docx')

    #converting the generated docx into a pdf file
    convert("thisisdoc.docx", "output.pdf")
    pdf = open('output.pdf', 'rb')
    response = FileResponse(pdf)

    # Report_File_Upload_Table.objects.create(generated_report_file_upload=output.pdf)
    return response
    #return render(request, 'doc.html', response)


#----------------end of section 2--------------------------------------------

Пример #26

0

Показать файл

Файл: AufgabenK.py Проект: niha1020/AufgabenK

    def get_path_value(self):
        #print(self.path_value.get())
        self.path = self.path_value.get()
        self.folder_name = self.path.rsplit("\\",1)[1]
        #print(self.folder_name) 

        #self.directory = self.path
        for folder_entry in os.scandir(self.path): #directory):
            self.folder_name = Path(folder_entry).stem
            #print(folder_entry.path)
            mergedObject = PdfFileMerger()

            for file_entry in os.scandir(folder_entry):
                self.file_name = Path(file_entry).stem
                print("Filenname", self.file_name)


                if not (file_entry.path.endswith(".jpg")
                        or  file_entry.path.endswith(".jpeg")
                        or file_entry.path.endswith(".png")
                        #or file_entry.path.endswith(".doc")
                        or file_entry.path.endswith(".docx")
                        or file_entry.path.endswith(".pdf")
                        )and file_entry.is_file():
                        print("Was ist das? Konvertier ich nicht  " + file_entry.path)
                        
                #if (file_entry.path.endswith("") and file_entry.is_file()):
                #        print("nothing")

                

                        

                if (file_entry.path.endswith(".jpg") or  file_entry.path.endswith(".jpeg") or file_entry.path.endswith(".png")) and file_entry.is_file():
                        #print(file_entry.path) 

                        image = Image.open(file_entry.path)
                        i = image.convert('RGB')
                        i.save(os.path.splitext(file_entry.path)[0] + ".pdf")

               # if (file_entry.path.endswith(".doc") ) and file_entry.is_file():
               #         convert(file_entry)
	                        

                if (file_entry.path.endswith(".docx")) and file_entry.is_file():
                        convert(file_entry)

            for file_entry in os.scandir(folder_entry):    
                if (file_entry.path.endswith(".pdf") and file_entry.is_file()):
                    #print(file_entry.path + ".pdf")
                    
                    new_pdf = Pdf.new()
                    with Pdf.open(file_entry.path, allow_overwriting_input=True) as pdf:
                        pdf.save(file_entry.path)
                        
                    mergedObject.append(PdfFileReader(file_entry.path, "rb"))

            mergedObject.write(self.path + "\\" + Path(folder_entry).stem + " - " +Path(self.path).stem  + ".pdf")

Пример #27

0

Показать файл

Файл: doc_functions.py Проект: HeenaBajaj/documentum

def ConvertToPdfFromFile(file_path, output_path):
    img_type = file_path.split(".")[1]
    if img_type == "jpg" or img_type == "jpeg" or img_type == "png":
        from PIL import Image
        image = Image.open(file_path)
        pdf_bytes = img2pdf.convert(image.filename)
        file = open(output_path, "wb")
        file.write(pdf_bytes)
        image.close()
        file.close()
    elif img_type == "doc" or img_type == "docx":
        from docx2pdf import convert
        convert(file_path, output_path)
    elif img_type == "txt":
        pdf = FPDF()
        # Add a page
        pdf.add_page()
        # set style and size of font
        # that you want in the pdf
        pdf.set_font("Arial", size=15)
        # open the text file in read mode
        f = open(file_path, "r")
        # insert the texts in pdf
        for x in f:
            pdf.cell(200, 10, txt=x, ln=1, align='C')
        # save the pdf with name .pdf
        pdf.output(output_path)

    elif img_type == "csv":
        config = pdfkit.configuration(
            wkhtmltopdf=
            r'C:\Users\A118090\AppData\Local\Programs\Python\Python36\Lib\site-packages\wkhtmltopdf'
        )
        pdfkit.from_file(file_path, output_path, configuration=config)

    elif img_type == "xlsx" or img_type == "xlsm" or img_type == "xls":
        from win32com import client
        xlApp = client.Dispatch("Excel.Application")
        books = xlApp.Workbooks.Open(file_path)
        # ws = books.Worksheets[0]
        # ws.Visible = 1
        # ws.ExportAsFixedFormat(0, output_path)
        ws_index_list = []
        r1 = 1
        while (r1 <= books.Worksheets.Count):

            ws_index_list.append(r1)
            r1 += 1
        # print(ws_index_list)
        books.WorkSheets(ws_index_list).Select()
        # # Save
        books.ActiveSheet.ExportAsFixedFormat(0, output_path)
        books.Close(True, file_path)
        print("file_path closed..")
    else:
        text = "file format does not match"

    print("Converted file: " + file_path + "\n\tto: " + output_path)

Пример #28

0

Показать файл

def docx2pdf():
	resultlab.configure(text= 'Please Wait... Converting Docx to PDF')
	print('Converting Docx to PDF')
	sleep(1)
	destvar = sourcevar.replace('.docx','.pdf')
	convert(sourcevar , destvar)
	print('\nConverted Successfully!!\n')
	print(f'File Sucessfully Saved as {destvar}')
	resultlab.configure(text= f'File Sucessfully Saved as {destvar}')

Пример #29

0

Показать файл

    def convertToPdf(self, path=None):
        """Convert word document to pdf"""

        if path:
            path.replace('.docx', '.pdf')
            convert(path)
        else:
            self.path.replace('.docx', '.pdf')
            convert(self.path)

Пример #30

0

Показать файл

def convertAndDelete():
    directory = os.getcwd()
    convert(str(directory), str(directory) + "/dataPDF")
    files_in_directory = os.listdir(directory)
    docxFiles = [file for file in files_in_directory if file.endswith(".docx")]

    for file in docxFiles:
        path_to_file = os.path.join(directory, file)
        os.remove(path_to_file)

Python convert примеры использования