|
@@ -28,15 +28,15 @@ class CoreferencePipe(Pipe): |
|
|
.. csv-table:: |
|
|
.. csv-table:: |
|
|
:header: "raw_key", "raw_speaker","raw_words","raw_clusters" |
|
|
:header: "raw_key", "raw_speaker","raw_words","raw_clusters" |
|
|
|
|
|
|
|
|
"bc/cctv/00/cctv_0000_0", "[["Speaker#1", "Speaker#1"],[]]","[["I","am"],[]]","[[[2,3],[6,7]],[[10,12],[20,22]]]" |
|
|
|
|
|
"bc/cctv/00/cctv_0000_1"", "[["Speaker#1", "Speaker#1"],[]]","[["He","is"],[]]","[[[2,3],[6,7]],[[10,12],[20,22]]]" |
|
|
|
|
|
|
|
|
"bc/cctv/00/cctv_0000_0", "[['Speaker#1', 'Speaker#1'],[]]","[['I','am'],[]]","[[[2,3],[6,7]],[[10,12],[20,22]]]" |
|
|
|
|
|
"bc/cctv/00/cctv_0000_1", "[['Speaker#1', 'Speaker#1'],[]]","[['He','is'],[]]","[[[2,3],[6,7]],[[10,12],[20,22]]]" |
|
|
"[...]", "[...]","[...]","[...]" |
|
|
"[...]", "[...]","[...]","[...]" |
|
|
|
|
|
|
|
|
处理完成后数据包含文章类别、speaker信息、句子信息、句子对应的index、char、句子长度、target: |
|
|
处理完成后数据包含文章类别、speaker信息、句子信息、句子对应的index、char、句子长度、target: |
|
|
.. csv-table:: |
|
|
.. csv-table:: |
|
|
:header: "words1", "words2","words3","words4","chars","seq_len","target" |
|
|
:header: "words1", "words2","words3","words4","chars","seq_len","target" |
|
|
|
|
|
|
|
|
"bc", "[[0,0],[1,1]]","[["I","am"],[]]",[[1,2],[]],[[[1],[2,3]],[]],[2,3],"[[[2,3],[6,7]],[[10,12],[20,22]]]" |
|
|
|
|
|
|
|
|
"bc", "[[0,0],[1,1]]","[['I','am'],[]]","[[1,2],[]]","[[[1],[2,3]],[]]","[2,3]","[[[2,3],[6,7]],[[10,12],[20,22]]]" |
|
|
"[...]", "[...]","[...]","[...]","[...]","[...]","[...]" |
|
|
"[...]", "[...]","[...]","[...]","[...]","[...]","[...]" |
|
|
|
|
|
|
|
|
|
|
|
|
|
|