Skip to content

Commit

Permalink
daily limit detectLanguage consideration
Browse files Browse the repository at this point in the history
Ugliest way to fix it... Do not hesitate to provide better code here
  • Loading branch information
Patent2net committed Jul 10, 2021
1 parent e47f40d commit 6a7b17e
Showing 1 changed file with 23 additions and 4 deletions.
27 changes: 23 additions & 4 deletions Patent2Net/P2N-Indexer.py
Original file line number Diff line number Diff line change
Expand Up @@ -274,23 +274,42 @@ def GenereListeFichiers(rep):
contenu = fichier.read()
if len(contenu) > 0:
phrase = contenu.split('.')[0]

if len(phrase) > 0 and len(phrase.split()) > 5: # more than 5 words
try:
lang = detectlanguage.simple_detect(phrase)
if detectlanguage.user_status()['requests'] < detectlanguage.user_status() ['daily_requests_limit'] -1:
lang = detectlanguage.simple_detect(phrase)
else:
time.sleep(86400) # wait ONE day!
lang = detectlanguage.simple_detect(phrase)
except:
time.sleep(2)
try:
lang = detectlanguage.simple_detect(phrase)
if detectlanguage.user_status()['requests'] < detectlanguage.user_status()[
'daily_requests_limit'] - 1:
lang = detectlanguage.simple_detect(phrase)
else:
time.sleep(86400) # wait ONE day!
lang = detectlanguage.simple_detect(phrase)
except:
lang = ''
else:
phrase = contenu.split('.')[1]
try:
lang = detectlanguage.simple_detect(phrase)
if detectlanguage.user_status()['requests'] < detectlanguage.user_status()[
'daily_requests_limit'] - 1:
lang = detectlanguage.simple_detect(phrase)
else:
time.sleep(86400) # wait ONE day!
lang = detectlanguage.simple_detect(phrase)
except:
time.sleep(2)
try:
lang = detectlanguage.simple_detect(phrase)
if detectlanguage.user_status()['requests'] < detectlanguage.user_status()['daily_requests_limit'] - 1:
lang = detectlanguage.simple_detect(phrase)
else:
time.sleep(86400) # wait ONE day!
lang = detectlanguage.simple_detect(phrase)
except:
lang = ''
if len(lang) > 0:
Expand Down

0 comments on commit 6a7b17e

Please sign in to comment.