From 75d593702ad0f4f42a910aebfee5de8b6c4c8bd1 Mon Sep 17 00:00:00 2001
From: yunfan
Date: Wed, 18 Mar 2020 11:26:00 +0800
Subject: [PATCH] [update] multi criteria cws

---
 reproduction/multi-criteria-cws/data-prepare.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/reproduction/multi-criteria-cws/data-prepare.py b/reproduction/multi-criteria-cws/data-prepare.py
index 1d6e89b5..2c28e3b6 100644
--- a/reproduction/multi-criteria-cws/data-prepare.py
+++ b/reproduction/multi-criteria-cws/data-prepare.py
@@ -51,7 +51,7 @@ def preprocess(text):
 def to_sentence_list(text, split_long_sentence=False):
     text = preprocess(text)
     delimiter = set()
-    delimiter.update("。!?:;…、,(),;!?、,\"'")
+    delimiter.update("。!?:;…、,(),;!?、.\"'")
     delimiter.add("……")
     sent_list = []
     sent = []