# receipt_loader.py (638 B)

  1. '''
  2. Created on Jun 25, 2020 @author: vnc-console
  3. '''
  4. import fitz
  5. import pypdf
  6. from receipt import Receipts
  7. loader = Receipts()
  8. # for pdf in loader.filter_files('.pdf', 'RECIPISEMAI2020/'):
  9. # print(pdf)
  10. # loader.pdf_reader('RECIPISEMAI2020/' + pdf)
  11. loader.xling('recipise', 'recipise', '.pdf', 'y', path='RECIPISEMAI2020/')
  12. # pdf = PyPDF2.PdfFileReader('RECIPISEMAI2020/213947068_12760778_D300_5_2020.pdf')
  13. # pdf = fitz.open('RECIPISEMAI2020/ABCONSULT.PDF')
  14. # fitz.Page.getTextPage(self, flags)
  15. # page = pdf.loadPage(0)
  16. # text = page.getText('text')
  17. # print(text)
  18. # cnt = page.extractText()
  19. # print(cnt)