new changes to textedit

2019-05-31 09:43:04 +02:00 · 2019-05-31 09:43:04 +02:00 · 0af0e230c7
commit 0af0e230c7
parent 9fc5375862
1 changed files with 2 additions and 2 deletions
--- a/textedit.py
+++ b/textedit.py
@ -10,7 +10,7 @@ PART 1
 We create the dictionary and save it.
 """

-stopws = [",", ".", "?","!",":","(",")",">","<","@","#","``","/","–","''","‘","-","’", "DOCTYPE", "html", "!", "'", "<br>", "<br />", "/body", "/html", "/head", "h2", "/h2", "h1", "/h1","”","“"]
+stopws = [",", ".", "?","!",":","(",")",">","<","@","#","``","/","–","''","‘","-","’", "DOCTYPE", "html", "!", "'", "<br>", "<br />", "/body", "/html", "/head", "h2", "/h2", "h1", "/h1","”","“", "o", "Ca", "/"]

 path = "static/files/"
 for path, subdirs, files in os.walk(path):
@ -55,7 +55,7 @@ def analysis(the_word, file_name):
    # print(re_word)
    # print(the_word)
    for sent_token in sent_tokens:
-        if re.search(re_word, sent_token):
+        if re.search(re_word, sent_token, re.IGNORECASE):
            new_sent_tokens.append({'id': id, 'sentence': sent_token.replace('\n', ' ').strip("'<>()“”")})
    if the_word in sentences_w_word: # if this is not the first iteration
        previous_sent_tokens = sentences_w_word[the_word]