Till Fischer
committed on
Commit
·
c7ad5e5
1
Parent(s):
cca703d
Update all changes
Browse files
- analyze_aspects.py +2 -1
analyze_aspects.py
CHANGED
@@ -94,7 +94,8 @@ def analyze_quickwin(db_path: Path, isbn: str, device: int = -1, languages: list
|
|
94 |
logger.info(f"Review ID {review_id} ({lang}) wird verarbeitet.")
|
95 |
|
96 |
lang_map = {'de': 'german', 'en': 'english'}
|
97 |
-
|
|
|
98 |
|
99 |
if lang == 'de':
|
100 |
aspect_map = ASPECT_LABEL_MAP
|
|
|
94 |
logger.info(f"Review ID {review_id} ({lang}) wird verarbeitet.")
|
95 |
|
96 |
lang_map = {'de': 'german', 'en': 'english'}
|
97 |
+
tokenizer = nltk.data.load(f"tokenizers/punkt/{lang_map.get(lang, 'english')}.pickle")
|
98 |
+
sentences = tokenizer.tokenize(text)
|
99 |
|
100 |
if lang == 'de':
|
101 |
aspect_map = ASPECT_LABEL_MAP
|