Skip to content

Commit 6d49aa9

Browse files
committed
Adding properties param for tokensregex, semgrex and regex
1 parent 4c9bd82 commit 6d49aa9

File tree

2 files changed

13 additions and 7 deletions (lines changed)

2 files changed

13 additions and 7 deletions (lines changed)

example.py

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -14,3 +14,8 @@
1414
print(output)
1515
output = nlp.semgrex(text, pattern='{tag: VBD}', filter=False)
1616
print(output)
17+
output = nlp.semgrex(text, pattern='{ner: PERS}', filter=False, properties={
18+
'annotators': 'tokenize,ssplit,ner,depparse',
19+
'pipelineLanguage': 'en',
20+
})
21+
print(output)

pycorenlp/corenlp.py

Lines changed: 8 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -36,21 +36,22 @@ def annotate(self, text, properties=None):
3636
pass
3737
return output
3838

39-
def tokensregex(self, text, pattern, filter):
40-
return self.regex('/tokensregex', text, pattern, filter)
39+
def tokensregex(self, text, pattern, filter, properties = None):
40+
return self.regex('/tokensregex', text, pattern, filter, properties)
4141

42-
def semgrex(self, text, pattern, filter):
43-
return self.regex('/semgrex', text, pattern, filter)
42+
def semgrex(self, text, pattern, filter, properties = None):
43+
return self.regex('/semgrex', text, pattern, filter, properties)
4444

45-
def regex(self, endpoint, text, pattern, filter):
45+
def regex(self, endpoint, text, pattern, filter, properties = None):
4646
r = requests.get(
4747
self.server_url + endpoint, params={
48-
'pattern': pattern,
48+
'pattern': pattern,
49+
'properties': str(properties or {}),
4950
'filter': filter
5051
}, data=text)
5152
output = r.text
5253
try:
53-
output = json.loads(r.text)
54+
output = json.loads(r.text, encoding='utf-8', strict=True)
5455
except:
5556
pass
5657
return output

0 commit comments

Comments (0)