Skip to content

Commit

Permalink
Do not print skipped compound words
Browse files Browse the repository at this point in the history
  • Loading branch information
BigNerd committed Oct 1, 2020
1 parent 311b00f commit 0267eaa
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion justmltools/nlp/word_embedder.py
Original file line number Diff line number Diff line change
Expand Up @@ -155,7 +155,8 @@ def __create_word_index_dict_and_embedding_matrix(
embedding_matrix[next_word_index] = np.asarray(tokens[1:], dtype='float32')
next_word_index += 1
else:
- print(f"skipping line with compound word {word} because it splits into {word_sequence}")
+ #print(f"skipping line with compound word {word} because it splits into {word_sequence}")
+ pass
embedding_file.close()
print(f"loaded {next_word_index - 1} word embeddings")
non_lower_case_percentage: float = 100 * number_of_non_lower_case_words / max(next_word_index, 1)
Expand Down

0 comments on commit 0267eaa

Please sign in to comment.