首页 > 解决方案 > 使用 PyPDF2 和 Openpyxl 在 excel 文件上设置值的问题

问题描述

我有下一个代码:

import PyPDF2
import openpyxl
from openpyxl import Workbook
from openpyxl import load_workbook
from openpyxl.worksheet.cell_range import CellRange

#Definir Archivo Excel
file = 'C:\\Users\\Desktop\\PYTHON_PDF\\PRUEBA_PDF.xlsx'
wb = openpyxl.load_workbook(file)#define workook
ws = wb['Hoja1']#define sheet1
#define max values for columns
max_row_for_a = max((a.row for a in ws['A'] if a.value is not None))
max_row_for_b = max((b.row for b in ws['B'] if b.value is not None))

#LOOP
for row in ws.iter_rows(min_row=2, max_col=1, max_row=max_row_for_a):
    pdf=  row[0].value
    print (pdf)
    for row2 in ws.iter_rows(min_row=2, max_col=2, max_row=max_row_for_b, min_col=2):
        extracto = row2[0].value
        pdfselect=open(pdf,"rb")
        leer = PyPDF2.PdfFileReader(pdfselect)
        pagina = leer.getPage(0)  
        extracto =  pagina.extractText()
        print(extracto)
        wb.save("PRUEBA_PDF2.xlsx")
        wb.close

这个想法是用pdf的名称读取excel的A列并在B列中写入pdf提取的内容,但是当我执行代码时不显示任何内容,甚至不显示错误。我尝试使用这样的最小案例,但没有问题:

#pdfselect=open("ejemplo.pdf","rb")
#leer = PyPDF2.PdfFileReader(pdfselect)
#pagina = leer.getPage(0)   
#sheet =   wb.active 
#ws['B2'] = pagina.extractText()
#wb.save("PRUEBA_PDF2.xlsx")
#wb.close

我做错了什么?问候!

标签: pythonexcelpdfopenpyxlpypdf2

解决方案


我发现了问题。正确的代码必须是这样的:

import PyPDF2
import openpyxl
from openpyxl import Workbook
from openpyxl import load_workbook
from openpyxl.worksheet.cell_range import CellRange

#Definir Archivo Excel

file = 'C:\\Users\\lorrego\\Desktop\\PYTHON_PDF\\PRUEBA_PDF.xlsx'
wb = openpyxl.load_workbook(file)#define workook
ws = wb['Hoja1']#define la hoja 1
max_row_for_a = max((a.row for a in ws['A'] if a.value is not None))



for row in ws.iter_rows(min_row=2, max_col=2, max_row=max_row_for_a):

    pdf=  row[0].value  
    pdfselected=open(pdf,"rb")
    leer = PyPDF2.PdfFileReader(pdfselected)
    pagina = leer.getPage(0)  
    ws.cell(row=row[0].row, column=2).value = pagina.extractText()
    wb.save("C:\\Users\\Desktop\\PYTHON_PDF\\PRUEBA_PDF.xlsx")
    wb.close

推荐阅读