File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 22dist /
33TextSpitter.egg-info /
44v * /
5+ git_push.bat
Original file line number Diff line number Diff line change @@ -15,8 +15,8 @@ def PdfFileRead(file):
1515 those characters get filtered out.'''
1616
1717 try :
18- with file .open (). read () as f :
19- pdf_file = fitz .Document (stream = f , filetype = 'pdf' )
18+ with file .open () as f :
19+ pdf_file = fitz .Document (stream = f . read () , filetype = 'pdf' )
2020 raw_text = [ele .getText ('text' ) for ele in pdf_file ]
2121 text = '' .join (raw_text )
2222 # else:
@@ -29,8 +29,8 @@ def PdfFileRead(file):
2929
3030
3131def DocxFileRead (file ):
32- with file .open (). read () as f :
33- f_stream = BytesIO (f )
32+ with file .open () as f :
33+ f_stream = BytesIO (f . read () )
3434 document = Document (f_stream )
3535 raw_text = [p .text for p in document .paragraphs ]
3636 text = '\n ' .join (raw_text )
Original file line number Diff line number Diff line change @@ -17,7 +17,7 @@ def file_load(self):
1717 if file_type == file_types_tup [0 ]:
1818 text = PdfFileRead (self .name )
1919 elif file_type == file_types_tup [1 ]:
20- text = DocxFileRead (self .text )
20+ text = DocxFileRead (self .name )
2121 # elif file_type == file_types_tup[2]:
2222 # text = DocFileRead(self.text)
2323 else :
You can’t perform that action at this time.
0 commit comments