|
import csv |
|
|
|
def load_word_database(database_filename):
    """Load the word list stored in ``database_filename``.

    The file is read as UTF-8 text, one entry per line. Each entry has its
    surrounding whitespace stripped and is lower-cased.

    Args:
        database_filename: Path of the text file to read.

    Returns:
        A set containing the normalised, non-empty entries.
    """
    with open(database_filename, mode='r', encoding='utf-8') as database_file:
        stripped_lines = (line.strip() for line in database_file)
        # Blank or whitespace-only lines would otherwise add '' to the set.
        return {entry.lower() for entry in stripped_lines if entry}
|
|
|
def check_generated_conversation_for_words(csv_filename, word_database):
    """Collect database words found in the 'Generated Conversation' column.

    ``csv_filename`` is read as UTF-8 CSV with a header row. For every row
    the 'Generated Conversation' value is lower-cased and split on
    whitespace, and each token that is in ``word_database`` is kept, in
    order and including duplicates. The collected tokens are then passed
    to ``save_words_to_csv``.

    Args:
        csv_filename: Path of the CSV file to scan.
        word_database: Container of words tested with ``in``. Tokens are
            lower-cased before the test, so only lower-case entries can
            match.

    Returns:
        None.
    """
    words = []
    with open(csv_filename, mode='r', newline='', encoding='utf-8') as csv_file:
        for row in csv.DictReader(csv_file):
            # DictReader fills the missing fields of a short row with None,
            # so a .get() default alone does not guarantee a string here.
            generated_conversation = (row.get('Generated Conversation') or '').lower()
            # NOTE: tokens are whitespace-delimited, so a word with
            # punctuation attached (e.g. "hello,") is compared as-is.
            words.extend(
                token
                for token in generated_conversation.split()
                if token in word_database
            )
    save_words_to_csv(words)
|
|
|
def save_words_to_csv(words, output_csv_filename="text.csv"):
    """Write ``words`` to a CSV file, one word per single-column row.

    Args:
        words: Iterable of values to write; each becomes its own row.
        output_csv_filename: Destination path. Defaults to "text.csv",
            the location that was previously hard-coded. The file is
            opened in write mode, so existing content is replaced.

    Returns:
        None.
    """
    with open(output_csv_filename, mode='w', newline='', encoding='utf-8') as output_csv_file:
        csv_writer = csv.writer(output_csv_file)
        # Stream the rows to the writer instead of building a temporary list.
        csv_writer.writerows([word] for word in words)
|
|
|
def main():
    """Run the scan: load the word database, then check the CSV against it.

    The word list is read from 'word_database.txt' and the conversations
    from 'info.csv'; both paths are relative to the working directory.
    """
    known_words = load_word_database('word_database.txt')
    check_generated_conversation_for_words('info.csv', known_words)
|
|
|
# Run the scan only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()
|
|