diff --git a/reproduction/multi-criteria-cws/data-prepare.py b/reproduction/multi-criteria-cws/data-prepare.py index 1d6e89b5..2c28e3b6 100644 --- a/reproduction/multi-criteria-cws/data-prepare.py +++ b/reproduction/multi-criteria-cws/data-prepare.py @@ -51,7 +51,7 @@ def preprocess(text): def to_sentence_list(text, split_long_sentence=False): text = preprocess(text) delimiter = set() - delimiter.update("。!?:;…、,(),;!?、,\"'") + delimiter.update("。!?:;…、,(),;!?、.\"'") delimiter.add("……") sent_list = [] sent = []