|
@@ -280,6 +280,8 @@ class StaticEmbedding(TokenEmbedding): |
|
|
found_unknown = True |
|
|
found_unknown = True |
|
|
if word in vocab: |
|
|
if word in vocab: |
|
|
index = vocab.to_index(word) |
|
|
index = vocab.to_index(word) |
|
|
|
|
|
if index in matrix: |
|
|
|
|
|
warnings.warn(f"Word:{word} occurs again in line:{idx}(starts from 0)") |
|
|
matrix[index] = torch.from_numpy(np.fromstring(' '.join(nums), sep=' ', dtype=dtype, count=dim)) |
|
|
matrix[index] = torch.from_numpy(np.fromstring(' '.join(nums), sep=' ', dtype=dtype, count=dim)) |
|
|
if self.only_norm_found_vector: |
|
|
if self.only_norm_found_vector: |
|
|
matrix[index] = matrix[index] / np.linalg.norm(matrix[index]) |
|
|
matrix[index] = matrix[index] / np.linalg.norm(matrix[index]) |
|
|