Spaces:

mskov
/

Speech-Trigger-Detection

Runtime error

mskov committed on Sep 18, 2023

Commit

77c21f6

•

1 Parent(s): a7827a1

Update replace_explitives.py

Files changed (1) hide show

replace_explitives.py CHANGED Viewed

@@ -1,28 +1,40 @@
 import regex as re
 # Pre-commit version of sub_explitives; the lines marked "-" are the ones this
 # commit removed. It replaces one hard-coded word, chosen by `selection`, with
 # "person" inside the string `textfile` and returns the resulting string.
 def sub_explitives(textfile, selection):
     # Replacement text substituted for every match.
     replacetext = "person"
     # text = word_tokenize(textfile)
     # print(text)
     # sentences = sent_tokenize(textfile)
     # Each selection maps to a single regex; \b...\b restricts it to whole words.
     if selection == "B-Word":
-        target_word = r"\bbitch\b"
     elif selection == "N-Word":
-        target_word = r"\bnigga\b"
     elif selection == "All Explitives":
-        target_word = r"\bshit\b"
     else:
         # Unknown selection: no pattern, so the text is returned unchanged below.
-        target_word = None
     print("selection:", selection, "target_word:", target_word)
     if target_word:
         # NOTE(review): this prints whenever a pattern was selected, before any
         # search has run; it does not mean the word occurs in the text.
         print("target word was found, ", target_word)
         print(textfile)
         # Case-insensitive substitution of every whole-word occurrence.
-        textfile = re.sub(target_word, replacetext, textfile, flags=re.IGNORECASE)
     return textfile

 import regex as re
+import nltk
def load_words_from_file(file_path):
    """Read a word list from a UTF-8 text file with one entry per line.

    Args:
        file_path: Path of the text file to read.

    Returns:
        A list of the file's lines with surrounding whitespace stripped, in
        file order. Blank and whitespace-only lines are skipped.

    Raises:
        OSError: If the file cannot be opened.
    """
    with open(file_path, "r", encoding="utf-8") as f:
        # Iterate the file directly instead of materialising readlines().
        stripped_lines = (line.strip() for line in f)
        # An empty entry is never a real word; used in a \b...\b regex it
        # would match at every word boundary, so it is dropped here.
        words = [word for word in stripped_lines if word]
    return words
 def sub_explitives(textfile, selection):
     """Replace the words of the selected category in ``textfile`` with "person".

     Args:
         textfile: The text to filter. Despite the name it is used as a string
             (it is passed straight to ``re.sub``), not as a file object.
         selection: "B-Word", "N-Word" or "All Explitives". Any other value
             selects no word list and the text is returned unchanged.

     Returns:
         The text with every whole-word, case-insensitive occurrence of a
         listed word replaced by "person".

     Raises:
         Whatever ``load_words_from_file`` raises for the selected list, e.g.
         ``OSError`` when the word file cannot be opened.
     """
     replacetext = "person"
     # Pick the word-list file for this selection. Only that file is read, so
     # a missing list for another category cannot break the call.
     if selection == "B-Word":
         word_file = "b_word.txt"
     elif selection == "N-Word":
         word_file = "n_word.txt"
     elif selection == "All Explitives":
         word_file = "expletives.txt"
     else:
         word_file = None
     target_word = load_words_from_file(word_file) if word_file else []
     # An empty entry would become an empty alternative that matches at every
     # word boundary, so blanks are dropped before the pattern is built.
     target_word = [word for word in target_word if word]
     print("selection:", selection, "target_word:", target_word)
     if target_word:
         print("target word was found, ", target_word)
         print(textfile)
         # re.escape() accepts a single string, not a list: escape each word
         # and join them into one alternation. Longest entries go first so a
         # longer entry is tried before a shorter one that is its prefix.
         ordered = sorted(target_word, key=len, reverse=True)
         pattern = r"\b(?:" + "|".join(re.escape(word) for word in ordered) + r")\b"
         textfile = re.sub(pattern, replacetext, textfile, flags=re.IGNORECASE)
     return textfile