-
Notifications
You must be signed in to change notification settings - Fork 0
/
corpus_adder.py
26 lines (22 loc) · 1.02 KB
/
corpus_adder.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
from typing import List
from word_wheel_solver import WordWheelSolver
class CorpusAdder:
    """Feed words into a solver from tagged corpora or plain word-list files.

    Entries of a tagged corpus are indexed as ``entry[0]`` (the word) and
    ``entry[1]`` (the tag). Entries whose tag is in ``excluded_tags`` are
    skipped by the tag-aware methods.
    """

    def __init__(self, excluded_tags=None):
        """Create an adder that skips entries carrying any of *excluded_tags*.

        Args:
            excluded_tags: Collection of tags to filter out. When omitted (or
                ``None``), nothing is excluded. A collection passed in is
                stored as-is, not copied.
        """
        # A literal ``[]`` default would be created once and shared by every
        # instance constructed without arguments; build a fresh list instead.
        self.excluded_tags = [] if excluded_tags is None else excluded_tags

    def add_tagged_corpus_to_solver(
        self, corpus: List[tuple], solver: "WordWheelSolver"
    ):
        """Add the word of every non-excluded corpus entry to *solver*.

        Args:
            corpus: Entries indexed as ``entry[0]`` (word) and ``entry[1]``
                (tag).
            solver: Object receiving each kept word through
                ``add_word_to_dictionary``.
        """
        for entry in corpus:
            if entry[1] not in self.excluded_tags:
                solver.add_word_to_dictionary(entry[0])

    def add_corpus_from_file(self, file_path: str, solver: "WordWheelSolver"):
        """Add every line of the text file at *file_path* to *solver*.

        The trailing newline of each line is removed before the line is
        handed to ``solver.add_word_to_dictionary``. No tag filtering is
        applied. Blank lines are passed through as empty strings.

        Args:
            file_path: Path of the file to read, one word per line.
            solver: Object receiving each line through
                ``add_word_to_dictionary``.
        """
        with open(file_path, 'r') as file:
            # Stream the file instead of loading every line up front.
            for line in file:
                solver.add_word_to_dictionary(line.rstrip('\n'))

    def write_unique_words_to_file(self, file_path: str, corpus: List[tuple]):
        """Write every non-excluded corpus entry to *file_path*, one per line.

        Each kept entry is written as ``str(entry)`` followed by a newline.
        The file is opened in ``'w'`` mode, so existing content is replaced.

        NOTE(review): despite the method name, entries are not deduplicated
        and the whole entry (not just the word) is written -- confirm whether
        that is intended before relying on the output format.

        Args:
            file_path: Path of the file to write.
            corpus: Entries indexed as ``entry[0]`` (word) and ``entry[1]``
                (tag).
        """
        with open(file_path, 'w') as file:
            for entry in corpus:
                if entry[1] not in self.excluded_tags:
                    file.write(str(entry) + '\n')