nelsonjq committed on
Commit
38a37b1
·
verified ·
1 Parent(s): a9d9c73

Update utils.py

Browse files
Files changed (1) hide show
  1. utils.py +6 -2
utils.py CHANGED
@@ -1,6 +1,10 @@
1
- def pdf_to_text(pdf_path: str) -> str:
2
- from PyPDF2 import PdfReader
 
 
3
 
 
 
4
  text = ""
5
  with open(pdf_path, "rb") as file:
6
  reader = PdfReader(file)
 
1
+ import os
2
+ import pandas as pd
3
+ from lingtrain_aligner import preprocessor, splitter, aligner, resolver, reader, vis_helper
4
+ from PyPDF2 import PdfReader
5
 
6
+ def pdf_to_text(pdf_path: str) -> str:
7
+
8
  text = ""
9
  with open(pdf_path, "rb") as file:
10
  reader = PdfReader(file)