Esempi in Python per convert, esempi in Python per docx2pdf.convert

Esempio n. 1

0

Mostra file

def main(event, context):
    for record in event['Records']:
        # get uploaded file name
        bucket = record['s3']['bucket']['name']
        key = unquote_plus(record['s3']['object']['key'])
        print(bucket)
        print(key)

        # create upload and download paths
        tmpkey = key.replace('/', '')
        tmp_download_path = '/tmp/{}{}'.format(uuid.uuid4(), tmpkey)
        tmp_converted_path = '/tmp/converted-{}'.format(tmpkey)
        tmp_split_path = '/tmp/split'
        os.mkdir(tmp_split_path)

        # Download file
        s3.download_file(bucket, key, tmp_download_path)

        # Convert file to pdf
        convert(tmp_download_path, tmp_converted_path)

        # Split PDF and upload new docs to staging area
        document = PdfFileReader(open(tmp_converted_path, "rb"))
        for i in range(document.numPages):
            output = PdfFileWriter()
            output.addPage(document.getPage(i))
            tmp_page_path = '{}/pdf-{}-{}'.format(tmp_split_path, i, tmpkey)
            with open(tmp_page_path, "wb") as outputStream:
                output.write(outputStream)
            new_key = key.replace('.docx', '/{}.pdf'.format(i))
            s3.upload_file(tmp_page_path, bucket,
                           new_key.replace('raw', 'staging'))

Esempio n. 2

0

Mostra file

File: PrintQR.py Progetto: androidRollin/QR-Code-Attendance-Registry-System

def QRstoPDF(path):
    doc = docx.Document()
    p = doc.add_paragraph()
    r = p.add_run()
    try:
        with open(path, "r") as csv_file:
            csv_reader = csv.reader(csv_file)
            next(csv_reader)
            count = 0
            for line in csv_reader:
                count += 1
                FileNameQR = "QRimages/" + line[0] + "QR.jpg"
                Section = line[2]
                r.add_picture(FileNameQR,
                              width=docx.shared.Inches(3),
                              height=docx.shared.Inches(3))
                if (count == 6):
                    p = doc.add_paragraph()
                    r = p.add_run()
                    count = 0
    except FileNotFoundError:
        print("FileNOtFound")

    pdfname = "C:/Users/ROLINE JOHN AGUILAR/Downloads/" + line[
        2] + "QRs" + ".pdf"
    wordname = "QRGenerated.docx"
    doc.save(wordname)

    convert(wordname, pdfname)
    os.remove(wordname)
    os.startfile(pdfname)
    os.remove("QRData.csv")

Esempio n. 3

0

Mostra file

File: glopan.py Progetto: mortenengen/glowing-pancake

def docx_to_pdf(docxfile: str):
    """Convert a DOCX file to PDF.

    Args:
        docxfile (str): The name of the DOCX file to convert.
    """
    docx2pdf.convert(docxfile)

Esempio n. 4

0

Mostra file

 def slicing_original_documents_docx(self):
     # Convert the docx to a pdf
     self.docx_filepath = os.path.basename(self.filename)
     convert(self.docx_filepath)
     self.raw_filename = os.path.basename(self.filename)
     originaldoc_data12 = self.slicing_original_documents_pdf()
     return originaldoc_data12

Esempio n. 5

0

Mostra file

File: pdf_miner.py Progetto: nikitaschultz2i/pdf_comparison

def process_docx(path):
    convert(path)
    new_path = path.replace("docx", "pdf")
    print(new_path)
    output_string = process_pdf(new_path)
    os.remove(new_path)
    return output_string

Esempio n. 6

0

Mostra file

File: bilago.py Progetto: aklauritzen/bilago

def convert_docx_to_pdf(docx_file):
    convert(docx_file)

    # Delay to resolve a problem when converting small .docxfiles.
    time.sleep(1)

    temporary_docx_pdf_files.append(docx_file)

Esempio n. 7

0

Mostra file

    def main(self):
        print(self.document_1.get_merge_fields())
        self.read_files()

        for n_idx, n_row in self.df_data.iterrows():
            dict = {
                "姓名": str(n_row['姓名']),
                "年龄": str(n_row['年龄']),
                "生日": str(n_row['生日']),
                "folder": 'folder1'
            }
            self.document_1.merge(**dict)

            file_path = self.path + 'xlsx/'
            if not os.path.exists(file_path):
                os.makedirs(file_path)

            file_docx = self.path + 'xlsx/' + n_row['姓名'] + '.docx'
            self.document_1.write(file_docx)
            # time.sleep(1)

            file_path = self.path + n_row['性别'] + '/'
            if not os.path.exists(file_path):
                os.makedirs(file_path)

            file_pdf = file_path + n_row['姓名'] + '.pdf'
            # file_pdf = self.path + 'pdfs/' + n_row['姓名'] + '.pdf'
            # self.generate_pdf(file_docx,file_pdf)
            convert(file_docx, file_pdf, keep_active=True)
        self.document_1.close()

Esempio n. 8

0

Mostra file

def download_file(filename, pi_no):

    print(pi_no)
    x = requests.get(
        'http://151.80.237.86:1251/ords/zkt/pi_doc/doc?pi_no={}'.format(str(pi_no)))
    data = x.json()
    doc = DocxTemplate(
        "./{}".format(
            filename))

    pythoncom.CoInitialize()
    for x in data['items']:
        if x['pi_no'].strip() == '{}'.format(pi_no):  # 17865
            # pprint(x)
            doc.render(x)

# # time.sleep(1)

            file_stream = StringIO()
            doc.save('./static/file.docx')
            convert('./static/file.docx',
                    './static/file.pdf')
    flash("Your file has been created, Now you can download!!")

    return render_template('upload_file.html')

Esempio n. 9

0

Mostra file

File: main2.py Progetto: naazneen/Test

    def saveaspdf(self, parent, fname):

        from docx2pdf import convert

        #convert("input.docx")
        print(tx)
        convert(tx, tx + ".pdf")

Esempio n. 10

0

Mostra file

File: convert.py Progetto: OWASP/cornucopia

def convert_docx_to_pdf(docx_filename: str, output_pdf_filename: str) -> str:
    logging.debug(
        f" --- docx_file = {docx_filename}\n--- starting pdf conversion now.")
    fail: bool = False
    msg: str = ""
    if convert_vars.can_convert_to_pdf:
        # Use docx2pdf for windows and mac with MS Word installed
        try:
            docx2pdf.convert(docx_filename, output_pdf_filename)
        except Exception as e:
            msg = f"\nConvert error: {e}"
            fail = True
    else:
        fail = True
    if fail:
        msg = (
            "Error. A temporary docx file was created in the output folder but cannot be converted "
            f"to pdf (yet) on operating system: {sys.platform}\n"
            "This does work on Windows and Mac with MS Word installed.") + msg
        logging.warning(msg)
        return docx_filename

    # If not debugging then delete the temp file
    if not convert_vars.args.debug:
        os.remove(docx_filename)
    return output_pdf_filename

Esempio n. 11

0

Mostra file

def openFile():
    global filez
    filez = askopenfilenames(title='Choose a file')
    if len(filez) != 0:
        for i in range(len(filez)):
            convert(filez[i])
    print('done')

Esempio n. 12

0

Mostra file

File: doc_to_pdf.py Progetto: hduzn/python_tools

def doc_to_pdf():
    # 文件位置
    path = r'C:\小现代化(1)'

    file_list = get_filelist(path)
    # print(file_list)

    # 定义空list,存放文件列表
    docx_files = []
    for file in file_list:
        if (file.endswith(".docx")):
            docx_files.append(file)
        elif (file.endswith(".doc")):
            docx_file = doc2docx(file)
            docx_files.append(docx_file)
    # print(docx_files)
    for docx in docx_files:
        print(docx)
    print('docx文件数：', len(docx_files))

    # 转换文件
    print('-----------------开始转换 docx 文件-----------------')
    for file in docx_files:
        print(file)
        #print(file.split('.docx')[0]+'.pdf')
        convert(file, file.split('.docx')[0] + '.pdf')

Esempio n. 13

0

Mostra file

File: daily_pdf.py Progetto: CleHou/COVID-19-Data-Analysis-Project

    def fill_template(self):
        context = self.var_template()

        path_to_template = os.path.normpath(
            f'{self.root}/src/pdf_creation/template.docx')
        template = DocxTemplate(path_to_template)

        template.render(context)

        date_str = self.date.strftime("%Y-%m-%d")
        year = self.date.strftime("%Y")
        month = self.date.strftime("%m - %B")

        #file_dir = f"{self.root}/reports/Daily_PDF/{year}/{month}"
        #file_name = f"First_page_{date_str}"
        file_dir = f"{self.root}/reports/Daily_PDF"
        file_name = "First_page"

        file_fct.creation_folder('', [file_dir])
        full_path = os.path.normcase(f'{file_dir}/{file_name}.docx')

        template.save(full_path)
        convert(full_path)
        os.remove(full_path)

        return os.path.normcase(f'{file_dir}/{file_name}.pdf')

Esempio n. 14

0

Mostra file

File: views.py Progetto: apotipak/hrms

def generate_contract_list(request, *args, **kwargs):

    base_url = MEDIA_ROOT + '/contract/template/'
    contract_number_from = kwargs['contract_number_from']
    contract_number_to = kwargs['contract_number_to']
    contract_status = kwargs['contract_status']
    contract_zone = kwargs['contract_zone']

    # now = datetime.datetime.now()
    # html = "<html><body>It is now %s.</body></html>" % now
    # return HttpResponse(html)

    template_name = base_url + 'CNT_ContractStatus.docx'
    file_name = "contract_list_report"

    context = {
        'customer': "TEST",
    }

    tpl = DocxTemplate(template_name)
    tpl.render(context)
    tpl.save(MEDIA_ROOT + '/contract/download/' + file_name + ".docx")

    # docx2pdf
    docx_file = path.abspath("media\\contract\\download\\" + file_name +
                             ".docx")
    pdf_file = path.abspath("media\\contract\\download\\" + file_name + ".pdf")
    convert(docx_file, pdf_file)

    return FileResponse(open(pdf_file, 'rb'), content_type='application/pdf')

Esempio n. 15

0

Mostra file

def proses():

    rasma = asma.get()
    rref = ref.get()
    rttl = ttl.get()
    rttt= ttt.get()
    rprau = prau.get()
    rdowo = dowo.get()
    recdis=str(selhas())

    tpl = DocxTemplate('Python.docx')
    context = {1:{  "nama":"%s" %str(rasma),
                    "TTL":"%s" %str(rttl),
                    "ref":"Ref: CPA-2021-FTR-%s"%str(rref),
                    "TTT": "%s" %str(rttt),
                    "ecdis": "ECDIS Model %s" % str(recdis),
                    "ship":"Onboard %s" %str(rprau),
                    "dura": "%s" % str(rdowo)}
                }

    sref= str(rref)
    sasma = str(rasma)
    sprau = str(rprau)
    jenber = " "+ sref + " "+ sasma + " " + sprau

    tpl.render(context[1])
    tpl.save("CPA2021FTR%s.docx" %jenber)

    convert("CPA2021FTR%s.docx" %jenber, "C:/Users/QylaMeisya/Documents/Sertifikat Training Familiarrisasi ECDIS Photosop/sertfampy" )

    label = teka.Label(cen_ut, text="Sert. %s Selesai ! Input Entry lagi / Tutup Program !" %str(rasma))
    label.pack()

Esempio n. 16

0

Mostra file

File: doc2pdf_variable_text.py Progetto: diganthdr/python_bootcamp

def make_custom_report(input_map, template):

    #fill the template:
    replace_words_in_document(input_map, template)

    #convert to pdf.
    convert(TEMP_REPLACED_DOC, PDF_FILE_NAME)

Esempio n. 17

0

Mostra file

def certificate(name, fio, date1, date2, choose):
    f = fio.split("\r\n")
    print(f)
    zipObj = ZipFile('sample.zip', 'w')
    if choose == "Base":
        for person in f:
            doc = DocxTemplate("Sertifikat_ryzhiiy2.docx")
            context = {
                'Program': name,
                'Name': person.rstrip(),
                'Date1': date1,
                'Date2': date2,
                'Choose': choose
            }
            doc.render(context)
            doc.save("{}_base.docx".format(person.rstrip()))
            convert("{}_base.docx".format(person.rstrip()))
            zipObj.write('{}_base.pdf'.format(person.rstrip()))

    else:
        for person in f:
            doc = DocxTemplate("Sertifikat_ryzhiiy2.docx")
            context = {
                'Program': name,
                'Name': person.rstrip(),
                'Date1': date1,
                'Date2': date2,
                'Choose': choose
            }
            doc.render(context)
            doc.save("{}_project.docx".format(person.rstrip()))
            convert("{}_project.docx".format(person.rstrip()))
            zipObj.write('{}_project.pdf'.format(person.rstrip()))

    zipObj.close()

Esempio n. 18

0

Mostra file

def docxToPdf(inDir,file):
    convertDir = inDir+"/converted"
    if not os.path.exists(convertDir):
        os.makedirs(convertDir)
    opFileName = file.split(".")[0]+".pdf"
    convert(os.path.join(inDir, file), os.path.join(convertDir, opFileName))
    return os.path.join(convertDir, opFileName)

Esempio n. 19

0

Mostra file

def word2pdf(files_path):
    """对于给定的文件夹，转换文件夹内所有docx文件为同名的pdf文件"""
    files = os.listdir(files_path)
    for f in files:
        if f.endswith('docx') and '转让登记表' in f:
            f_new = os.path.splitext(f)[0] + ".pdf"
            convert(os.path.join(files_path, f),
                    os.path.join(files_path, f_new))

Esempio n. 20

0

Mostra file

File: 5.word文件批量转pdf.py Progetto: hong96206/python

def convert_single(src_file, dst_file):
    """
    单个文件实现 word->pdf 转换
    :param src_file: 源文件 xxx.docx
    :param dst_file: 目标文件 xxx.pdf
    :return:
    """
    docx2pdf.convert(src_file, dst_file)

Esempio n. 21

0

Mostra file

def convert_doc_to_pdf(doc_file):
    # Use a breakpoint in the code line below to debug your script.
    # Press Ctrl+F8 to toggle the breakpoint.
    filename, _ = os.path.splitext(doc_file)
    pdf_file = filename + '.pdf'
    docx2pdf.convert(doc_file, pdf_file)

    return pdf_file

Esempio n. 22

0

Mostra file

File: MysticsCardFiller.py Progetto: Jet170/MysticsCardFiller

def wordToPdf(requireDocPause):
    print("Converting from Word doc to pdf...")
    if (requireDocPause):
        input(
            "Please open " + outputDocName +
            ", save over the original output file, then close it and press enter"
        )
    convert(outputDocName, outputPDFName)

Esempio n. 23

0

Mostra file

 def doc_pdf(self):
     """
     :return: converts document to pdf
     """
     if self.dst == "":
         convert(self.src)
     else:
         convert(self.src, self.dst)

Esempio n. 24

0

Mostra file

def convert_pdf(input_dir="output/", output_dir="output_pdf/"):
    """
    docxファイルの保存されたフォルダを指定して、フォルダ格納データを全てpdfにして、指定フォルダに保存する
    :param input_dir: dir_name, default:output/,  outputフォルダを利用
    :param output_dir: dir_name, default:output_pdf/, output_pdfフォルダを利用
    :return: output_pdfフォルダにoutputフォルダのpdfが全て保存される
    """
    convert(input_dir, output_dir)

Esempio n. 25

0

Mostra file

File: main.py Progetto: lrbeauty/pdfgenerator

def making_a_doc_function(request):
    #plot from uploaded data now need to make chart from live data that has been uploaded to the site. this will be done by either doing pandas crunching all over again to get the numbers that you want or by reading numbers tht have already been put in one of the tables. most ikley a combination of both

    doc = docx.Document()
    pk = 3
    if not saf_defect_table.objects.filter(
            pk=pk).exists():  #this accesses the saf_defect_table
        doc.add_heading("no text")
        doc.save('thisisdoc.docx')
    else:
        saf_defect_table_variable = saf_defect_table.objects.get(pk=pk)

        doc.add_heading(str(saf_defect_table_variable.saf_number_in_table))
        doc.add_heading(str(saf_defect_table_variable.defect_number_in_table))

        #making a plot from a csv file that was uploaded to DB table
        if FileUpload.objects.filter(
                attribution_file_upload='pftest4.csv').exists():
            life3 = pd.read_csv(
                FileUpload.objects.get(attribution_file_upload='pftest4.csv').
                attribution_file_upload)
            life3.plot(kind='bar', x='status', y='item')
            plt.title('my plot title')
            plt.xlabel('years')
            plt.ylabel('Age')
            memfile = io.BytesIO(
            )  #this is needed in order to save the file to a temporary memory section
            plt.savefig(memfile)
            doc.add_picture(memfile, width=Inches(4))
            memfile.close()
            plt.clf()  #this shuts down the plot so then you can make a new.

        #making a plot out of numbers that are already stored in saf defect table DB table
        y1 = saf_defect_table_variable.saf_number_in_table
        y2 = saf_defect_table_variable.defect_number_in_table
        korea_scores = (y1, y2)
        col_count = 2
        bar_width = .2
        index = np.arange(col_count)
        plt.barh(index, korea_scores, bar_width, alpha=.4, label="Korea")
        memfile2 = io.BytesIO()
        plt.savefig(memfile2)
        doc.add_picture(memfile2, width=Inches(4))
        memfile2.close()

    doc.save('thisisdoc.docx')

    #converting the generated docx into a pdf file
    convert("thisisdoc.docx", "output.pdf")
    pdf = open('output.pdf', 'rb')
    response = FileResponse(pdf)

    # Report_File_Upload_Table.objects.create(generated_report_file_upload=output.pdf)
    return response
    #return render(request, 'doc.html', response)


#----------------end of section 2--------------------------------------------

Esempio n. 26

0

Mostra file

File: AufgabenK.py Progetto: niha1020/AufgabenK

    def get_path_value(self):
        #print(self.path_value.get())
        self.path = self.path_value.get()
        self.folder_name = self.path.rsplit("\\",1)[1]
        #print(self.folder_name) 

        #self.directory = self.path
        for folder_entry in os.scandir(self.path): #directory):
            self.folder_name = Path(folder_entry).stem
            #print(folder_entry.path)
            mergedObject = PdfFileMerger()

            for file_entry in os.scandir(folder_entry):
                self.file_name = Path(file_entry).stem
                print("Filenname", self.file_name)


                if not (file_entry.path.endswith(".jpg")
                        or  file_entry.path.endswith(".jpeg")
                        or file_entry.path.endswith(".png")
                        #or file_entry.path.endswith(".doc")
                        or file_entry.path.endswith(".docx")
                        or file_entry.path.endswith(".pdf")
                        )and file_entry.is_file():
                        print("Was ist das? Konvertier ich nicht  " + file_entry.path)
                        
                #if (file_entry.path.endswith("") and file_entry.is_file()):
                #        print("nothing")

                

                        

                if (file_entry.path.endswith(".jpg") or  file_entry.path.endswith(".jpeg") or file_entry.path.endswith(".png")) and file_entry.is_file():
                        #print(file_entry.path) 

                        image = Image.open(file_entry.path)
                        i = image.convert('RGB')
                        i.save(os.path.splitext(file_entry.path)[0] + ".pdf")

               # if (file_entry.path.endswith(".doc") ) and file_entry.is_file():
               #         convert(file_entry)
	                        

                if (file_entry.path.endswith(".docx")) and file_entry.is_file():
                        convert(file_entry)

            for file_entry in os.scandir(folder_entry):    
                if (file_entry.path.endswith(".pdf") and file_entry.is_file()):
                    #print(file_entry.path + ".pdf")
                    
                    new_pdf = Pdf.new()
                    with Pdf.open(file_entry.path, allow_overwriting_input=True) as pdf:
                        pdf.save(file_entry.path)
                        
                    mergedObject.append(PdfFileReader(file_entry.path, "rb"))

            mergedObject.write(self.path + "\\" + Path(folder_entry).stem + " - " +Path(self.path).stem  + ".pdf")

Esempio n. 27

0

Mostra file

File: doc_functions.py Progetto: HeenaBajaj/documentum

def ConvertToPdfFromFile(file_path, output_path):
    img_type = file_path.split(".")[1]
    if img_type == "jpg" or img_type == "jpeg" or img_type == "png":
        from PIL import Image
        image = Image.open(file_path)
        pdf_bytes = img2pdf.convert(image.filename)
        file = open(output_path, "wb")
        file.write(pdf_bytes)
        image.close()
        file.close()
    elif img_type == "doc" or img_type == "docx":
        from docx2pdf import convert
        convert(file_path, output_path)
    elif img_type == "txt":
        pdf = FPDF()
        # Add a page
        pdf.add_page()
        # set style and size of font
        # that you want in the pdf
        pdf.set_font("Arial", size=15)
        # open the text file in read mode
        f = open(file_path, "r")
        # insert the texts in pdf
        for x in f:
            pdf.cell(200, 10, txt=x, ln=1, align='C')
        # save the pdf with name .pdf
        pdf.output(output_path)

    elif img_type == "csv":
        config = pdfkit.configuration(
            wkhtmltopdf=
            r'C:\Users\A118090\AppData\Local\Programs\Python\Python36\Lib\site-packages\wkhtmltopdf'
        )
        pdfkit.from_file(file_path, output_path, configuration=config)

    elif img_type == "xlsx" or img_type == "xlsm" or img_type == "xls":
        from win32com import client
        xlApp = client.Dispatch("Excel.Application")
        books = xlApp.Workbooks.Open(file_path)
        # ws = books.Worksheets[0]
        # ws.Visible = 1
        # ws.ExportAsFixedFormat(0, output_path)
        ws_index_list = []
        r1 = 1
        while (r1 <= books.Worksheets.Count):

            ws_index_list.append(r1)
            r1 += 1
        # print(ws_index_list)
        books.WorkSheets(ws_index_list).Select()
        # # Save
        books.ActiveSheet.ExportAsFixedFormat(0, output_path)
        books.Close(True, file_path)
        print("file_path closed..")
    else:
        text = "file format does not match"

    print("Converted file: " + file_path + "\n\tto: " + output_path)

Esempio n. 28

0

Mostra file

def docx2pdf():
	resultlab.configure(text= 'Please Wait... Converting Docx to PDF')
	print('Converting Docx to PDF')
	sleep(1)
	destvar = sourcevar.replace('.docx','.pdf')
	convert(sourcevar , destvar)
	print('\nConverted Successfully!!\n')
	print(f'File Sucessfully Saved as {destvar}')
	resultlab.configure(text= f'File Sucessfully Saved as {destvar}')

Esempio n. 29

0

Mostra file

    def convertToPdf(self, path=None):
        """Convert word document to pdf"""

        if path:
            path.replace('.docx', '.pdf')
            convert(path)
        else:
            self.path.replace('.docx', '.pdf')
            convert(self.path)

Esempio n. 30

0

Mostra file

def convertAndDelete():
    directory = os.getcwd()
    convert(str(directory), str(directory) + "/dataPDF")
    files_in_directory = os.listdir(directory)
    docxFiles = [file for file in files_in_directory if file.endswith(".docx")]

    for file in docxFiles:
        path_to_file = os.path.join(directory, file)
        os.remove(path_to_file)