-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathlexiPersTags.py
28 lines (21 loc) · 842 Bytes
/
lexiPersTags.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
# Location the function historically read from; kept as the default so that
# existing zero-argument calls behave exactly as before.
_DEFAULT_LEXIPERS_XML = (
    '/home/ashkan/Documents/PycharmProjects/sentiment_analysis/'
    'LexiPersV1.0/Data/adj-final.xml'
)


def addLexiPers(xml_path=_DEFAULT_LEXIPERS_XML):
    """Load a LexiPers XML file into a word-level sentiment DataFrame.

    Every ``Synset`` element that is a direct child of the XML root
    contributes its ``Sense`` attribute (a comma-separated list of entries)
    and its ``Label`` attribute (parsed as an integer). Each comma-separated
    entry becomes one output row carrying the label of its synset.

    If the exact same ``Sense`` string occurs on several synsets, it is
    emitted once, at the position of its first occurrence, with the label of
    its last occurrence.

    Args:
        xml_path: Path (or file object) handed to ``ElementTree.parse``.
            Defaults to the original hard-coded LexiPers location.

    Returns:
        A pandas DataFrame with the columns
        ``'Persian Translation (Google Translate)'`` (one entry of a
        ``Sense`` list, not whitespace-stripped) and ``'sentiment'``
        (the integer label).

    Raises:
        OSError: If ``xml_path`` cannot be opened.
        xml.etree.ElementTree.ParseError: If the file is not well-formed XML.
        TypeError: If a ``Synset`` has no ``Label`` attribute.
        ValueError: If a ``Label`` attribute is not an integer literal.
        AttributeError: If a ``Synset`` has no ``Sense`` attribute.
    """
    # Imports stay function-local, as in the original, so merely importing
    # this module does not pull in pandas.
    import xml.etree.ElementTree as ET

    import pandas as pd

    root = ET.parse(xml_path).getroot()

    # A dict keeps first-seen key order while later duplicates overwrite the
    # value, which is exactly how repeated Sense strings were collapsed before.
    label_by_sense = {
        synset.get('Sense'): int(synset.get('Label'))
        for synset in root.findall('Synset')
    }

    # Fan each comma-separated Sense out into one (entry, label) row.
    rows = [
        (entry, label)
        for sense, label in label_by_sense.items()
        for entry in sense.split(',')
    ]

    return pd.DataFrame(
        rows,
        columns=['Persian Translation (Google Translate)', 'sentiment'],
    )