mhezarei · hamedkhaledi · Mar 5, 2021 · Mar 6, 2021
diff --git a/test.py → Code/API_voice/__init__.py b/test.py → Code/API_voice/__init__.py
diff --git a/aryana.py → Code/API_voice/aryana.py b/aryana.py → Code/API_voice/aryana.py
diff --git a/deepmine.py → Code/API_voice/deepmine.py b/deepmine.py → Code/API_voice/deepmine.py
diff --git a/nevisa.py → Code/API_voice/nevisa.py b/nevisa.py → Code/API_voice/nevisa.py
diff --git a/speechRec.py → Code/API_voice/speechRec.py b/speechRec.py → Code/API_voice/speechRec.py
diff --git a/Code/__init__.py b/Code/__init__.py
diff --git a/aibot.py → Code/aibot.py b/aibot.py → Code/aibot.py
@@ -1,15 +1,14 @@
-import time
-
+import os
 from transformers import AutoTokenizer, AutoModelForTokenClassification
 
-from answer_per_question import answer_per_question
-from aryana import aryana
-from auto_correct import auto_correct
-from find_dates import reformat_date
-from find_events_in_sentence import find_events_in_sentence
-from find_time import reformat_date_time
-from speechRec import google
-from split import split
+from .answer_per_question import answer_per_question
+from .API_voice.aryana import aryana
+from .auto_correct import auto_correct
+from .arguments.find_dates import reformat_date
+from .arguments.find_events_in_sentence import find_events_in_sentence
+from .arguments.find_time import reformat_date_time
+from .API_voice.speechRec import google
+from .split import split
 
 
 class BOT:
@@ -35,8 +34,9 @@ def AIBOT(self, Question):
         answer_set = {'type': set(), 'city': set(), 'date': set(),
                       'time': set(), 'religious_time': set(), 'calendar_type': set(),
                       'event': set(), 'api_url': set(), 'result': []}
-        # Question = auto_correct(Question)
+
         try:
+            Question = auto_correct(Question)
             Question = reformat_date_time(Question)
         except:
             pass
@@ -45,12 +45,11 @@ def AIBOT(self, Question):
             Question = reformat_date(Question)
         except:
             pass
-
-        '/var/www/AIBot/media/codes/[email protected]/bert-base-parsbert-ner-uncased'
+        p = os.path.dirname(os.path.abspath(__file__))
         tokenizer = AutoTokenizer.from_pretrained(
-            '/var/www/AIBot/media/codes/[email protected]/bert-base-parsbert-ner-uncased')
+            p + '/../bert-base-parsbert-ner-uncased')
         model = AutoModelForTokenClassification.from_pretrained(
-            '/var/www/AIBot/media/codes/[email protected]/bert-base-parsbert-ner-uncased')
+            p + '/../bert-base-parsbert-ner-uncased')
 
         try:
             events, event_keys = find_events_in_sentence(Question)
@@ -60,6 +59,7 @@ def AIBOT(self, Question):
 
         try:
             Questions = split(Question, events)
+            print('Questions : ' + str(Questions))
         except:
             Questions = [Question]
             pass
@@ -83,6 +83,11 @@ def AIBOT(self, Question):
             answer[key] = list(answer_set[key])
         final_answer = final_answer + " ."
 
+        response = aryana(final_answer)
+
+        with open("response.wav", mode='bw') as f:
+            f.write(response.content)
+
         return answer, final_answer
 
     '''

diff --git a/answer_per_question.py → Code/answer_per_question.py b/answer_per_question.py → Code/answer_per_question.py
@@ -3,16 +3,16 @@
 import dateparser
 from persiantools.jdatetime import JalaliDate
 
-from find import find
-from find_fit_word import find_fit_word
-from find_time_from_religious import find_time_from_religious
-from find_weather_from_city_date import find_weather_from_city_date
-from learning import predict
-from mhr_time import Time
-from output_sentences import religion_sentence, time_sentence, date_sentence, unknown_sentence, weather_sentence, \
+from .arguments.find import find
+from .arguments.find_fit_word import find_fit_word
+from .arguments.find_time_from_religious import find_time_from_religious
+from .arguments.find_weather_from_city_date import find_weather_from_city_date
+from .learning import predict
+from .mhr_time import Time
+from .output_sentences import religion_sentence, time_sentence, date_sentence, unknown_sentence, weather_sentence, \
     weather_logical_sentence
-from utility import convert_date
-from weather_difference import weather_difference
+from .utility import convert_date
+from .weather_difference import weather_difference
 
 
 def answer_per_question(Question, model, tokenizer, all_events, all_event_keys):

diff --git a/Code/argument_corpse.py b/Code/argument_corpse.py
@@ -0,0 +1,21 @@
+import os
+
+# Build the de-duplicated vocabulary of single words from the argument corpus.
+# The path is anchored to this file (not the working directory) so the script
+# behaves the same wherever it is launched from.
+p = os.path.dirname(os.path.abspath(__file__))
+corpus_path = os.path.join(p, "../Data/auto_correct/argument_corpse.txt")
+
+# NOTE(review): utf-8 is assumed for the corpus file -- confirm.
+with open(corpus_path, encoding="utf-8") as f:
+    # Drop every empty line; list.remove('') raised ValueError when the file
+    # contained no empty line and removed only the first one otherwise.
+    words = [w for w in f.read().split('\n') if w]
+
+# str.split() with no arguments breaks multi-word entries into single words and
+# leaves one-word entries as a one-element list, so no special case is needed.
+new = []
+for w in words:
+    new += w.split()
+
+new = list(set(new))
diff --git a/Code/arguments/__init__.py b/Code/arguments/__init__.py
diff --git a/find.py → Code/arguments/find.py b/find.py → Code/arguments/find.py
@@ -1,14 +1,14 @@
 from __future__ import unicode_literals
 
-from find_calendar_types import find_calendar_types
-from find_cities import find_cities
-from find_dates import find_dates
-from find_events import find_events
-from find_religious_time import find_religious_time
-from find_time import find_date_time
-from find_weather_method import find_weather_method
-from pipeline_sentence import pipeline_sentence
-from tokens_in_sentence import find_tokens_in_sentence
+from .find_calendar_types import find_calendar_types
+from .find_cities import find_cities
+from .find_dates import find_dates
+from .find_events import find_events
+from .find_religious_time import find_religious_time
+from .find_time import find_date_time
+from .find_weather_method import find_weather_method
+from ..pipeline_sentence import pipeline_sentence
+from ..tokens_in_sentence import find_tokens_in_sentence
 
 
 # If you don't have model -> Comment 7, 8, 23, 24 lines and Uncomment 27, 28, 29 lines

diff --git a/find_calendar_types.py → Code/arguments/find_calendar_types.py b/find_calendar_types.py → Code/arguments/find_calendar_types.py
diff --git a/find_cities.py → Code/arguments/find_cities.py b/find_cities.py → Code/arguments/find_cities.py
diff --git a/find_dates.py → Code/arguments/find_dates.py b/find_dates.py → Code/arguments/find_dates.py
diff --git a/find_events.py → Code/arguments/find_events.py b/find_events.py → Code/arguments/find_events.py
@@ -13,7 +13,7 @@ def find_events(sentence, dates, all_events, all_event_keys):
         event_month = dates[0].split('-')[1]
         event_day = dates[0].split('-')[2]
         new_dates = dates
-        url1 = os.path.join(p, event_year + ".csv")
+        url1 = p + "/../../Data/events/" + event_year + ".csv"
         df2 = pd.read_csv(url1)
         for idx, row in df2.iterrows():
             if str(row["month"]) == event_month and str(row["day"]) == str(event_day):
@@ -35,7 +35,7 @@ def find_events(sentence, dates, all_events, all_event_keys):
         new_dates = []
         if len(events) > 0 and len(dates) > 0:
             year = dates[0].split('-')[0]
-            url1 = os.path.join(p, year + ".csv")
+            url1 = p + "/../../Data/events/" + year + ".csv"
             df2 = pd.read_csv(url1)
 
             for idx, row in df2.iterrows():

diff --git a/find_events_in_sentence.py → Code/arguments/find_events_in_sentence.py b/find_events_in_sentence.py → Code/arguments/find_events_in_sentence.py
@@ -5,7 +5,7 @@
 
 def find_events_in_sentence(sentence):
     p = os.path.dirname(os.path.abspath(__file__))
-    url1 = os.path.join(p, "find important events.csv")
+    url1 = os.path.join(p, "../../Data/events/find important events.csv")
     df1 = pd.read_csv(url1)
     important_events = df1['event']
     important_events_key = df1['event_key']

diff --git a/find_fit_word.py → Code/arguments/find_fit_word.py b/find_fit_word.py → Code/arguments/find_fit_word.py
diff --git a/find_religious_time.py → Code/arguments/find_religious_time.py b/find_religious_time.py → Code/arguments/find_religious_time.py
diff --git a/find_time.py → Code/arguments/find_time.py b/find_time.py → Code/arguments/find_time.py
@@ -2,7 +2,7 @@
 
 from unidecode import unidecode
 
-from persian_num_change import persian_num_change
+from ..persian_num_change import persian_num_change
 
 
 def find_date_time(tokens_lem, sentence):

diff --git a/find_time_from_religious.py → Code/arguments/find_time_from_religious.py b/find_time_from_religious.py → Code/arguments/find_time_from_religious.py
@@ -1,5 +1,5 @@
-from religious_time import ReligiousTime
-from utility import convert_date
+from ..religious_time import ReligiousTime
+from ..utility import convert_date
 
 
 def find_time_from_religious(answer):

diff --git a/find_weather_from_city_date.py → .../arguments/find_weather_from_city_date.py b/find_weather_from_city_date.py → .../arguments/find_weather_from_city_date.py
@@ -1,6 +1,6 @@
 from datetime import datetime
 
-from weather import Weather
+from ..weather import Weather
 
 
 def find_weather_from_city_date(Question, city, greg_date):

diff --git a/find_weather_method.py → Code/arguments/find_weather_method.py b/find_weather_method.py → Code/arguments/find_weather_method.py
diff --git a/auto_correct.py → Code/auto_correct.py b/auto_correct.py → Code/auto_correct.py
@@ -44,7 +44,8 @@ def lv(s, t):
 
 
 def correct(word: str) -> str:
-    with open('new_argument_corpse.txt') as f:
+    p = os.path.dirname(os.path.abspath(__file__))
+    with open(p + '/../Data/auto_correct/new_argument_corpse.txt') as f:
         data = f.read().split('\n')
         data.remove('')
 
@@ -71,29 +72,8 @@ def correct(word: str) -> str:
     return word
 
 
-def load_lists():
-    p = os.path.dirname(os.path.abspath(__file__))
-    url = os.path.join(p, "fa_cities_final2.csv")
-    df = pd.read_csv(url)
-    cities = df['city-fa']
-
-    url = os.path.join(p, "important_words.csv")
-    df = pd.read_csv(url)
-    important_words = df['words']
-
-    url = os.path.join(p, "find important events.csv")
-    df = pd.read_csv(url)
-    events = df['event']
-
-    url = os.path.join(p, "countries.csv")
-    df = pd.read_csv(url)
-    countries = df['country']
-    return cities, important_words, events, countries
-
-
 def auto_correct(sentence: str):
     start = time.time()
-    cities, important_word, events, countries = load_lists()
 
     symbols = "!\"#$%&()*+-./;<=>?@[\\]^_`{|}~\n،,؟؛"
     for i in symbols:
@@ -114,4 +94,3 @@ def auto_correct(sentence: str):
     return new_sen[:-1]
 
 
-auto_correct("اذان ژهر به در حال حاضر افق تران کی است؟")
diff --git a/capitals.py → Code/capitals.py b/capitals.py → Code/capitals.py
diff --git a/date.py → Code/date.py b/date.py → Code/date.py
diff --git a/learning.py → Code/learning.py b/learning.py → Code/learning.py
@@ -6,7 +6,7 @@
 os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
 import numpy as np
 import pandas as pd
-from rule_based import rule_based_score
+from .rule_based import rule_based_score
 from tensorflow.keras.models import Sequential
 from tensorflow.keras.layers import Embedding, Dense, LSTM
 from sklearn.model_selection import train_test_split
@@ -20,7 +20,8 @@
            3: "date",
            4: "unknown"}
 
-df = pd.read_csv("questions and data.csv", index_col=0)
+p = os.path.dirname(os.path.abspath(__file__))
+df = pd.read_csv(p + "/../Data/intent/questions and data.csv", index_col=0)
 df_x = df["questions"].values
 df_y = df["class0"].values
 # df = pd.read_csv("mh_clean.csv")
@@ -60,12 +61,13 @@ def train_model():
 # print("Saved model to disk")
 
 def predict(sent: str) -> int:
-    json_file = open('all_lstm_model.json', 'r')
+    p = os.path.dirname(os.path.abspath(__file__))
+    json_file = open(p + '/../Models/all_lstm_model.json', 'r')
 
     model = json_file.read()
     json_file.close()
     model = model_from_json(model)
-    model.load_weights("all_lstm_model_weights.h5")
+    model.load_weights(p + "/../Models/all_lstm_model_weights.h5")
 
     unk = 5
     enc = tokenizer.texts_to_sequences(np.array([sent]))

diff --git a/mhr_time.py → Code/mhr_time.py b/mhr_time.py → Code/mhr_time.py
@@ -3,7 +3,7 @@
 import requests
 from bs4 import BeautifulSoup
 
-from utility import get_english_names
+from .utility import get_english_names
 
 
 class Time:

diff --git a/output_sentences.py → Code/output_sentences.py b/output_sentences.py → Code/output_sentences.py
@@ -5,7 +5,7 @@
 import num2fawords
 from persiantools.jdatetime import JalaliDate
 
-from capitals import capital_to_country
+from .capitals import capital_to_country
 
 
 def convert_month(month: int) -> str:

diff --git a/persian_num_change.py → Code/persian_num_change.py b/persian_num_change.py → Code/persian_num_change.py
diff --git a/pipeline_sentence.py → Code/pipeline_sentence.py b/pipeline_sentence.py → Code/pipeline_sentence.py
@@ -1,7 +1,7 @@
 from hazm import word_tokenize, Lemmatizer, Normalizer
 from transformers import pipeline
 
-from capitals import capital_dictionary_keys, country_to_capital
+from .capitals import capital_dictionary_keys, country_to_capital
 
 
 def pipeline_sentence(sentence, model, tokenizer):

diff --git a/religious_time.py → Code/religious_time.py b/religious_time.py → Code/religious_time.py
@@ -1,6 +1,6 @@
 import requests
 
-from utility import get_english_names, split_date
+from .utility import get_english_names, split_date
 
 REL_TIME_CONVERSION = {
 	"امساک": "Imsak",

diff --git a/rule_based.py → Code/rule_based.py b/rule_based.py → Code/rule_based.py
@@ -30,15 +30,15 @@ def get_list_from(filename: str) -> list:
 def parse_shamsi_events() -> list:
 	# this is only needed for date category so we can
 	# only check the whole combination and not the words
-	f = os.path.join(p, 'shamsi_events.csv')
+	f = os.path.join(p, '../Data/events/shamsi_events.csv')
 	events = pd.read_csv(f, encoding="utf-8")
 	temp_combs = events["event"].tolist()
 	return list(set(temp_combs))
 
 
 def initialize() -> Tuple[list, list]:
-	used_words = get_list_from(os.path.join(p, 'used_words.txt'))
-	used_combs = get_list_from(os.path.join(p, 'used_combs.txt'))
+	used_words = get_list_from(os.path.join(p, '../Data/intent/used_words.txt'))
+	used_combs = get_list_from(os.path.join(p, '../Data/intent/used_combs.txt'))
 
 	c = parse_shamsi_events()
 	used_combs[3] += c

diff --git a/split.py → Code/split.py b/split.py → Code/split.py
@@ -2,15 +2,16 @@
 # coding: utf-8
 
 # In[1]:
-
+import os
 
 from hazm import *
 
 # In[2]:
 
 
 combs = []
-with open("split_combs", "r") as a_file:
+p = os.path.dirname(os.path.abspath(__file__))
+with open(p + "/../Data/split/split_combs", "r") as a_file:
     for line in a_file:
         combs.append(line.strip())
 

diff --git a/tf_idf_with_max_padding.py → Code/tf_idf_with_max_padding.py b/tf_idf_with_max_padding.py → Code/tf_idf_with_max_padding.py
@@ -6,9 +6,9 @@
 from hazm import *
 
 p = os.path.dirname(os.path.abspath(__file__))
-f = os.path.join(p, "answers_clean.csv")
+f = os.path.join(p, "../Data/intent/answers_clean.csv")
 answers_clean = pd.read_csv(p, index_col=0)
-f = os.path.join(p, "stop_words_short.txt")
+f = os.path.join(p, "../Data/split/stop_words_short.txt")
 text_file = open(f,
                  encoding="utf8")  # I'm not really sure about removing stop words
 stop_words = text_file.read().split("\n")
@@ -95,7 +95,7 @@ def main():
 	padded = max_padding(vectors, max_tokens_per_line)
 	df = pd.DataFrame(padded)
 	p = os.path.dirname(os.path.abspath(__file__))
-	f = os.path.join(p, "tf_idf_padded.csv")
+	f = os.path.join(p, "../Data/intent/tf_idf_padded.csv")
 	df.to_csv(f)
 
 

diff --git a/tokens_in_sentence.py → Code/tokens_in_sentence.py b/tokens_in_sentence.py → Code/tokens_in_sentence.py
diff --git a/utility.py → Code/utility.py b/utility.py → Code/utility.py
@@ -9,7 +9,7 @@
 
 def get_english_names(city: str) -> Tuple[str, str]:
     p = os.path.dirname(os.path.abspath(__file__))
-    f = os.path.join(p, "cities15000.txt")
+    f = os.path.join(p, "../Data/cities/cities15000.txt")
     df = pd.read_csv(f,
                      usecols=[1, 2, 3, 8, 14], sep='\t',
                      encoding="utf-8", header=None)
@@ -19,7 +19,7 @@ def get_english_names(city: str) -> Tuple[str, str]:
     cc = target_row[8]
 
     p = os.path.dirname(os.path.abspath(__file__))
-    f = os.path.join(p, "IP2LOCATION-COUNTRY-MULTILINGUAL.CSV")
+    f = os.path.join(p, "../Data/cities/IP2LOCATION-COUNTRY-MULTILINGUAL.CSV")
     df = pd.read_csv(f,
                      encoding="utf-8",
                      header=None, skiprows=3736, nrows=249)
@@ -29,7 +29,7 @@ def get_english_names(city: str) -> Tuple[str, str]:
 
 def get_lat_lon(eng_city: str) -> Tuple[float, float]:
     p = os.path.dirname(os.path.abspath(__file__))
-    f = os.path.join(p, "cities15000.txt")
+    f = os.path.join(p, "../Data/cities/cities15000.txt")
     df = pd.read_csv(f, usecols=[2, 4, 5, 14],
                      sep='\t',
                      encoding="utf-8", header=None)

diff --git a/weather.py → Code/weather.py b/weather.py → Code/weather.py
@@ -1,6 +1,6 @@
 import requests
 
-from utility import *
+from .utility import *
 
 
 class Weather: