heymenn committed on
Commit
ef3ecaa
1 Parent(s): e086aec

Update scrape_3gpp.py

Browse files
Files changed (1) hide show
  1. scrape_3gpp.py +1 -0
scrape_3gpp.py CHANGED
@@ -453,6 +453,7 @@ def extractionPrincipale(url, excel_file=None, status_list=None, progress=gr.Pro
453
  tabLine = []
454
  file = pdfReader
455
  pdfNumberPages = len(file.pages)
 
456
  for pdfPage in range(0, pdfNumberPages):
457
 
458
  load_page = file.get_page(pdfPage)
 
453
  tabLine = []
454
  file = pdfReader
455
  pdfNumberPages = len(file.pages)
456
+ words_limit = 1000
457
  for pdfPage in range(0, pdfNumberPages):
458
 
459
  load_page = file.get_page(pdfPage)