forked from cltl/OpenDutchWordnet
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathle.py
123 lines (99 loc) · 3.33 KB
/
le.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
class Le():
'''
class from XML element LexicalEntry
.. highlight::
<LexicalEntry id="havenplaats-n-1">
<Lemma partOfSpeech="noun" writtenForm="havenplaats"/>
<Sense id="o_n-109910434"
provenance="cdb2.2_Auto"
synset="eng-30-08633957-n/>
'''
def __init__(self,le_el,lexicon_el):
self.le_el = le_el
self.sense_el = self.le_el.find("Sense")
self.lexicon_el = lexicon_el
def get_id(self):
'''
return identifier of lexical entry
by returning attribute "id"
:rtype: str
:return: identifier of lexical entry
'''
return self.le_el.get("id")
def get_lemma(self):
'''
return lemma of le by returning attribute "writtenForm"
from child "Lemma"
:rtype: str
:return: lemma of le
'''
self.lemma_el = self.le_el.find("Lemma")
if self.lemma_el is not None:
return self.lemma_el.get("writtenForm")
else:
return None
def get_pos(self):
'''
return pos (noun | verb) of lexical entry
by returning attribute "partOfSpeech"
:rtype: str
:return: noun | verb. None if not found.
'''
return self.le_el.get("partOfSpeech")
def get_sense_id(self):
'''
return sense id from open referentie bestand nederlands
by returning attribute "id" from child element "Sense"
:rtype: str
:return: sense id from open referentie bestand nederlands.
None if not found
'''
return self.sense_el.get("id")
def get_annotator(self):
'''
return manual annotator (default is '')
by returning attribute 'annotator' from child element 'Sense'
:rtype: str
:return: manual annotator (default '')
'''
return self.sense_el.get('annotator')
def get_sense_number(self):
'''
return sense number
by returning attribute "senseId" from child element "Sense"
:rtype: int
:return: sense number, None if not found
'''
return self.sense_el.get("senseId")
def get_provenance(self):
'''
get provenance of lexical entry by returning
attribute "provenance" from child element "Sense"
:rtype: str
:return: provenance (source concatenated by "+")
'''
return self.sense_el.get("provenance")
def get_definition(self):
'''
get definition of lexical entry by returning
attribute 'definition' from child element 'Sense'
:rtype: str
:return: definition
'''
return self.sense_el.get('definition')
def get_synset_id(self):
'''
return synset identifier to which lexical entry belongs
:rtype: str
:return: synset identifier. None if not found
'''
return self.sense_el.get("synset")
def remove_me(self):
'''
remove lexical entry element
'''
try:
self.lexicon_el.remove(self.le_el)
return (True,'')
except ValueError:
return (False,'could not remove %s' % self.get_id())