| @@ -239,7 +239,7 @@ class SeqLabelPreprocess(BasePreprocess): | |||||
| label2index: dict of {str, int} | label2index: dict of {str, int} | ||||
| """ | """ | ||||
| # In seq labeling, both word seq and label seq need to be padded to the same length in a mini-batch. | # In seq labeling, both word seq and label seq need to be padded to the same length in a mini-batch. | ||||
| label2index = DEFAULT_WORD_TO_INDEX.copy() | |||||
| label2index = {} # DEFAULT_WORD_TO_INDEX.copy() | |||||
| word2index = DEFAULT_WORD_TO_INDEX.copy() | word2index = DEFAULT_WORD_TO_INDEX.copy() | ||||
| for example in data: | for example in data: | ||||
| for word, label in zip(example[0], example[1]): | for word, label in zip(example[0], example[1]): | ||||
| @@ -297,7 +297,7 @@ class ClassPreprocess(BasePreprocess): | |||||
| # build vocabulary from scratch if nothing exists | # build vocabulary from scratch if nothing exists | ||||
| word2index = DEFAULT_WORD_TO_INDEX.copy() | word2index = DEFAULT_WORD_TO_INDEX.copy() | ||||
| label2index = DEFAULT_WORD_TO_INDEX.copy() | |||||
| label2index = {} # DEFAULT_WORD_TO_INDEX.copy() | |||||
| # collect every word and label | # collect every word and label | ||||
| for sent, label in data: | for sent, label in data: | ||||