From db62194db1d2a644b51c2f9b877ce18fd6ef0dc4 Mon Sep 17 00:00:00 2001 From: guoyuankai Date: Mon, 11 Jan 2021 10:38:52 +0800 Subject: [PATCH] fix blank-bug in post processing --- minlp-tokenizer/minlptokenizer/tokenizer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/minlp-tokenizer/minlptokenizer/tokenizer.py b/minlp-tokenizer/minlptokenizer/tokenizer.py index 63bced23..1052bf02 100644 --- a/minlp-tokenizer/minlptokenizer/tokenizer.py +++ b/minlp-tokenizer/minlptokenizer/tokenizer.py @@ -125,7 +125,7 @@ def tag2words(self, text, y_pred_result): word = '' if word: words.append(word) - return regex.split(r'\s+', ' '.join(words)) + return words def set_interfere_factor(self, interfere_factor): """