improved smart

2020-01-10 21:15:10 +01:00 · 2020-01-10 21:15:10 +01:00 · 8f70e65b92
commit 8f70e65b92
parent 72f6bb2fd3
1 changed files with 53 additions and 40 deletions
--- a/api/thesaurus.py
+++ b/api/thesaurus.py
@ -1,11 +1,20 @@
 import requests
 import re, random
 import nltk
+import threading, queue
 from util import logging, config

 key = config.settings["api_keys"]["thesaurus"]
 url = f"http://thesaurus.altervista.org/thesaurus/v1?key={key}&language=en_US&output=json&word="

+def start_thread(target, args):
+    q = queue.Queue()
+    def wrapper():
+        q.put(target(args))
+    t = threading.Thread(target=wrapper)
+    t.start()
+    return q
+
 def thesaurufy_sentence(sentence):
    symbols = nltk.word_tokenize(sentence)
    tags = nltk.pos_tag(symbols)
@ -13,47 +22,51 @@ def thesaurufy_sentence(sentence):
    if len(symbols) == 0:
        return ""
    
+    queues = []
    for i in range(0, len(symbols)):
-        if not symbols[i].isalpha():
-            continue
-
-        if tags[i][1] != "NN" and tags[i][1] != "VB" and tags[i][1] != "VBG" and tags[i][1] != "VBP" and tags[i][1] != "JJ" and tags[i][1] != "RB":
-            symbols[i] = " " + symbols[i]
-            continue
-
-        response = requests.get(url + symbols[i])
-        if not response.ok:
-            # logging.warning(f"Thesaurus API returned {response.status_code} ({url + symbols[i]})")
-            symbols[i] = " " + symbols[i]
-            continue
+        queues.append(start_thread(target = handle_token, args=(tags[i])))
        
-        responses = response.json()["response"]
-        condition = ""
-        if tags[i][1] == "JJ":
-            condition = "(adj)"
-        elif tags[i][1] == "RB":
-            condition = "(adv)"
-        elif tags[i][1] == "NN":
-            condition = "(noun)"
-        else:
-            condition = "(verb)"
-
-        try:
-            words = random.choice([a for a in responses if a["list"]["category"] == condition])["list"]["synonyms"].split("|")
-        except:
-            symbols[i] = " " + symbols[i]
-            continue
-        
-        # print(words)
-        word = words[random.randint(0, len(words) - 1)]
-        
-        if "(" in word:
-            if "antonym" in word.split("(")[1].lower():
-                symbols[i] = " " + symbols[i]
-                continue
-
-            word = word.split("(")[0][:-1]
-
-        symbols[i] = " " + word
+    for i in range(0, len(symbols)):
+        symbols[i] = queues[i].get()

    return "".join(symbols)
+
+def handle_token(args):
+    token = args
+    if not token[0].isalpha():
+        return token[0]
+
+    if token[1] != "NN" and token[1] != "VB" and token[1] != "VBG" and token[1] != "VBP" and token[1] != "JJ" and token[1] != "RB":
+        return (" " + token[0])
+
+    response = requests.get(url + token[0])
+    if not response.ok:
+        # logging.warning(f"Thesaurus API returned {response.status_code} ({url + token[0]})")
+        return (" " + token[0])
+    
+    responses = response.json()["response"]
+    condition = ""
+    if token[1] == "JJ":
+        condition = "(adj)"
+    elif token[1] == "RB":
+        condition = "(adv)"
+    elif token[1] == "NN":
+        condition = "(noun)"
+    else:
+        condition = "(verb)"
+
+    try:
+        words = random.choice([a for a in responses if a["list"]["category"] == condition])["list"]["synonyms"].split("|")
+    except:
+        return (" " + token[0])
+    
+    # print(words)
+    word = words[random.randint(0, len(words) - 1)]
+    
+    if "(" in word:
+        if "antonym" in word.split("(")[1].lower():
+            return (" " + token[0])
+
+        word = word.split("(")[0][:-1]
+
+    return (" " + word)