-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathmain.py
31 lines (30 loc) · 856 Bytes
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
from hazm import *
import pickle
# Sample Persian queries that the script expands with synonyms.
listt = [
    "تلفات جاده آمار",
    "انرژي هسته قوانين",
    "مربي فوتبال ايران",
    "تحريم اقتصادي ايران",
    "باغباني گل آموزش",
]


def _load_synonyms(path='data.pkl'):
    """Load and return the synonym table stored in the pickle file *path*.

    The table is indexed by token and each value is passed to
    ``word_tokenize``, so it is presumably a ``dict`` mapping a term to a
    whitespace-separated string of synonyms -- TODO confirm against the
    code that produces ``data.pkl``.
    """
    # NOTE(security): unpickling can execute arbitrary code; only load a
    # data.pkl that comes from a trusted source.
    with open(path, 'rb') as pkl_file:
        return pickle.load(pkl_file)


def _expand_query(query, synonyms, normalizer, stemmer):
    """Return the terms of *query*, each followed by its known synonyms.

    The query is normalized, stemmed and tokenized; every token is emitted
    once, immediately followed by the synonyms found for it in *synonyms*.
    Terms that were already emitted are not repeated, and first-seen order
    is preserved.
    """
    # NOTE(review): as in the original script, the stemmer runs on the whole
    # normalized string before tokenizing, so only the end of the query is
    # stemmed. Confirm whether per-token stemming was intended before
    # changing this: the keys of the synonym table may depend on it.
    tokens = word_tokenize(stemmer.stem(normalizer.normalize(query)))

    # A dict is used as an insertion-ordered set of output terms.
    expanded = {}
    for token in tokens:
        expanded[token] = None
        try:
            entry = synonyms[token]
        except KeyError:
            # No synonyms recorded for this token; keep the token alone.
            continue
        for synonym in word_tokenize(entry):
            expanded[synonym] = None
    return list(expanded)


# Load the table and build the hazm helpers once instead of once per query.
dic = _load_synonyms()
normalizer = Normalizer()
stemmer = Stemmer()

for input_query in listt:
    print(' '.join(_expand_query(input_query, dic, normalizer, stemmer)))