diff --git a/nlp-tools2/v1/lemma.ini b/nlp-tools2/v1/lemma.ini
index 3ca8a9b..b31a3c0 100644
--- a/nlp-tools2/v1/lemma.ini
+++ b/nlp-tools2/v1/lemma.ini
@@ -24,8 +24,8 @@ plugin = @ezs/analytics
 [JSONParse]
-legacy = false
-separator = $
+#legacy = false
+#separator = $
 [expand]
 path = env('path', 'value')
diff --git a/nlp-tools2/v1/ws_lemmatization.py b/nlp-tools2/v1/ws_lemmatization.py
index bcd912b..6b28cd8 100644
--- a/nlp-tools2/v1/ws_lemmatization.py
+++ b/nlp-tools2/v1/ws_lemmatization.py
@@ -14,12 +14,13 @@ for line in sys.stdin:
     data=json.loads(line)
     i=data['value']
-    if type(i)==str and len(i.split(' '))==1:
-
+    if type(i)==str and (len(i.split(' '))==1 and len(i.split('/'))==1):
+        i=i.replace("*"," ").strip()
         data["value"]=nlp(i)[0].lemma_
     elif type(i)==list:
         ll=list()
         for j in i:
+            j=j.replace('*',' ').strip()
             if len(j.split())==1:
                 ll.append(nlp(j)[0].lemma_)
             else:
@@ -27,6 +28,7 @@
         data['value']=ll
     else:
+        i=i.replace('*',' ').strip()
         sent=' '.join([w.lemma_ for w in nlp(i)])
         data['value']=sent