-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathPatternUtil.py
58 lines (51 loc) · 1.94 KB
/
PatternUtil.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
class Triplets :
def __init__(self, sentenceId, beginPos, endPos) :
self.sentenceId = sentenceId
self.beginPos = beginPos
self.endPos = endPos
def __str__(self):
return "( "+str(self.sentenceId)+","+str(self.beginPos)+","+str(self.endPos)+" )"
def __repr__(self):
return self.__str__()
class Pattern:
def __init__(self,tree,patternId,alignment,triplets, patternString):
self.patternId = patternId
self.tree = tree
self.patternString = patternString
self.alignment = alignment
self.triplets = triplets
def getPattern(self):
return self.tree
# 1- 1 |BT| (NP (NP (NN 0)) (PP (IN 0) (S (VP (VP (VBG 0) (NP (NP (DT 0)))))))) |ET|
def getPartsTree(line) :
id = int(line.split('- ',1)[0])
rest = line.split('- ',1)[1]
alignment = int(rest.split(' ',1)[0])
tree = rest.split(' ',1)[1]
return [id, alignment, tree]
def getPartsPattern(line) :
id = int(line.split('- ',1)[0])
rest = line.split('- ',1)[1]
triplets = rest[rest.rfind(': ')+2:]
triplets = triplets.split(")(")
triplets[0] = triplets[0][1:]
triplets[len(triplets)-1] = triplets[len(triplets)-1][:-1]
triplets = [Triplets(int(i.split(',')[0]), int(i.split(',')[1]), int(i.split(',')[2])) for i in triplets]
pattern = rest[0 : rest.rfind(': ')]
return [id, triplets, pattern]
def loadPatterns(loadTreeString, loadPatternString) :
patternobjectList = []
f_loadTreeString = open(loadTreeString)
f_loadPatternString = open(loadPatternString)
treeList = f_loadTreeString.readlines()
patternList = f_loadPatternString.readlines()
for i in range(0, len(treeList)) :
partsTree = getPartsTree(treeList[i].rstrip('\n'))
partsPattern = getPartsPattern(patternList[i].rstrip('\n'))
patternobjectList.append(Pattern(partsTree[2], partsPattern[0], partsTree[1], partsPattern[1], partsPattern[2]))
return patternobjectList
def toDictionary(patternList) :
patternDictionary = {}
for pattern in patternList :
patternDictionary[pattern.patternId] = pattern
return patternDictionary