ENSEMBLEModule: 12 models (new) ENSEMBLEModule: 12 models (new) MSPE_v18_branchy27 date_duration_module_4 arithmetic_module_3 ================================================================================ Dataset: question_dev_result.json total: 247, correct: 182, accuracy: 0.737 Question Type (QTYPE) => --基礎題 (portion:0.623, count:154, errors: 29, accuracy: 0.812) -- D007Q02, D007Q03, D031Q01, D031Q02, D061Q04, D073Q06, D079Q07, D085Q01, D085Q05, D091Q03, D091Q11, D103Q04, D127Q01, D181Q02, D181Q05, D211Q05, D241Q07, D247Q01, D247Q02, D247Q05, D253Q01, D283Q04, D289Q08, D295Q02, D301Q04, D301Q05, D307Q03, D325Q03, D325Q04, --進階題 (portion:0.356, count:88, errors: 31, accuracy: 0.648) -- D007Q04, D013Q01, D013Q02, D037Q04, D037Q05, D037Q06, D037Q12, D037Q17, D037Q18, D049Q03, D073Q04, D073Q07, D073Q09, D073Q11, D085Q07, D085Q08, D115Q02, D115Q03, D115Q04, D115Q07, D127Q06, D127Q07, D247Q07, D247Q08, D247Q09, D253Q07, D283Q01, D301Q06, D313Q04, D313Q05, D325Q05, --申論 (portion:0.020, count:5, errors: 5, accuracy: 0.000) -- D001Q11, D049Q04, D073Q12, D103Q07, D289Q07, Answer Type (ATYPE) => --ATYPE Prediction: YesNo (portion:0.113, count:28, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Kinship (portion:0.121, count:30, errors: 1, accuracy: 0.967) -- D289Q10, --ATYPE Prediction: Num-Measure (portion:0.109, count:27, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Person (portion:0.105, count:26, errors: 1, accuracy: 0.962) -- D325Q03, --ATYPE Prediction: Date-Duration (portion:0.109, count:27, errors: 1, accuracy: 0.963) -- D307Q03, --ATYPE Prediction: Location (portion:0.126, count:31, errors: 1, accuracy: 0.968) -- D241Q08, --ATYPE Prediction: Organization (portion:0.085, count:21, errors: 2, accuracy: 0.905) -- D259Q01, D283Q02, --ATYPE Prediction: Object (portion:0.206, count:51, errors: 6, accuracy: 0.882) -- D049Q04, D103Q07, D241Q09, D289Q07, D313Q01, D313Q02, --ATYPE Prediction: Event (portion:0.020, count:5, errors: 4, accuracy: 0.200) -- D073Q10, D073Q11, D073Q12, D115Q06, --ATYPE Prediction: Misc (portion:0.004, count:1, errors: 1, accuracy: 0.000) -- D001Q11, --ATYPE Prediction Accuracy: 0.931 Answer Mode (AMODE) => -- AMODE Prediction: YesNo (portion:0.113, count:28, errors: 0, accuracy: 1.000) -- -- Answer Prediction: YesNo (portion:0.113, count:28, errors: 9, accuracy: 0.679) -- D037Q17, D037Q18, D115Q02, D127Q06, D253Q07, D301Q06, D313Q04, D313Q05, D325Q05, -- AMODE Prediction: Kinship (portion:0.012, count:3, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Kinship (portion:0.012, count:3, errors: 2, accuracy: 0.333) -- D037Q05, D037Q06, -- AMODE Prediction: Multi-Spans-Extraction (portion:0.085, count:21, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Multi-Spans-Extraction (portion:0.085, count:21, errors: 7, accuracy: 0.667) -- D007Q04, D013Q02, D073Q06, D073Q07, D073Q09, D085Q07, D127Q07, -- AMODE Prediction: Single-Span-Extraction (portion:0.632, count:156, errors: 9, accuracy: 0.942) -- D037Q03, D037Q04, D037Q12, D091Q08, D091Q09, D091Q10, D091Q11, D115Q04, D115Q07, -- Answer Prediction: Single-Span-Extraction (portion:0.632, count:156, errors: 31, accuracy: 0.801) -- D007Q02, D007Q03, D013Q01, D031Q01, D031Q02, D037Q04, D037Q12, D073Q11, D079Q07, D085Q05, D091Q03, D091Q11, D115Q03, D115Q04, D115Q07, D127Q01, D181Q02, D181Q05, D211Q05, D241Q07, D247Q02, D247Q05, D247Q09, D253Q01, D283Q04, D289Q08, D295Q02, D301Q04, D301Q05, D325Q03, D325Q04, ----Single-Span-Extraction module (portion:0.632, count:156, errors: 47, accuracy: 0.699) ---- D007Q02, D007Q03, D013Q01, D031Q01, D031Q02, D037Q01, D037Q02, D037Q03, D037Q04, D037Q07, D037Q08, D037Q09, D037Q10, D037Q12, D037Q13, D037Q14, D037Q15, D037Q16, D073Q11, D079Q07, D085Q05, D091Q03, D091Q05, D091Q06, D091Q08, D091Q09, D091Q10, D091Q11, D091Q12, D103Q05, D115Q03, D115Q04, D115Q07, D127Q01, D181Q02, D181Q05, D211Q05, D247Q02, D247Q09, D253Q01, D283Q04, D289Q08, D295Q02, D301Q04, D301Q05, D325Q03, D325Q04, -- AMODE Prediction: Date-Duration (portion:0.101, count:25, errors: 1, accuracy: 0.960) -- D307Q03, -- Answer Prediction: Date-Duration (portion:0.101, count:25, errors: 4, accuracy: 0.840) -- D061Q04, D103Q04, D247Q08, D307Q03, -- AMODE Prediction: Arithmetic-Operations (portion:0.036, count:9, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Arithmetic-Operations (portion:0.036, count:9, errors: 7, accuracy: 0.222) -- D049Q03, D073Q04, D085Q01, D085Q08, D247Q01, D247Q07, D283Q01, -- AMODE Prediction: Summarize (portion:0.020, count:5, errors: 5, accuracy: 0.000) -- D001Q11, D049Q04, D073Q12, D103Q07, D289Q07, -- Answer Prediction: Summarize (portion:0.020, count:5, errors: 5, accuracy: 0.000) -- D001Q11, D049Q04, D073Q12, D103Q07, D289Q07, --AMODE Prediction Accuracy: 0.939 ================================================================================ Dataset: question_test_result.json total: 193, correct: 136, accuracy: 0.705 Question Type (QTYPE) => --基礎題 (portion:0.720, count:139, errors: 30, accuracy: 0.784) -- D015Q05, D015Q06, D033Q07, D033Q08, D033Q12, D039Q01, D039Q02, D039Q03, D039Q04, D039Q05, D039Q06, D045Q02, D045Q04, D069Q04, D093Q07, D105Q05, D117Q02, D117Q04, D183Q02, D255Q12, D255Q13, D261Q04, D267Q02, D267Q07, D285Q04, D291Q03, D291Q05, D303Q01, D303Q05, D303Q06, --進階題 (portion:0.264, count:51, errors: 24, accuracy: 0.529) -- D003Q03, D009Q04, D033Q01, D033Q03, D033Q04, D033Q05, D033Q06, D069Q05, D069Q11, D069Q12, D069Q13, D087Q03, D087Q04, D093Q04, D105Q04, D117Q01, D117Q08, D201Q05, D255Q07, D303Q03, D309Q02, D309Q05, D315Q02, D315Q06, --申論 (portion:0.016, count:3, errors: 3, accuracy: 0.000) -- D009Q03, D321Q03, D321Q04, Answer Type (ATYPE) => --ATYPE Prediction: YesNo (portion:0.130, count:25, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Kinship (portion:0.062, count:12, errors: 1, accuracy: 0.917) -- D309Q04, --ATYPE Prediction: Num-Measure (portion:0.083, count:16, errors: 1, accuracy: 0.938) -- D183Q03, --ATYPE Prediction: Person (portion:0.088, count:17, errors: 3, accuracy: 0.824) -- D255Q10, D291Q08, D291Q09, --ATYPE Prediction: Date-Duration (portion:0.181, count:35, errors: 5, accuracy: 0.857) -- D117Q01, D117Q02, D117Q03, D117Q06, D273Q01, --ATYPE Prediction: Location (portion:0.140, count:27, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Organization (portion:0.104, count:20, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Object (portion:0.197, count:38, errors: 7, accuracy: 0.816) -- D117Q04, D309Q05, D315Q03, D315Q04, D315Q09, D321Q03, D321Q04, --ATYPE Prediction: Event (portion:0.010, count:2, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Misc (portion:0.005, count:1, errors: 1, accuracy: 0.000) -- D009Q03, --ATYPE Prediction Accuracy: 0.907 Answer Mode (AMODE) => -- AMODE Prediction: YesNo (portion:0.130, count:25, errors: 0, accuracy: 1.000) -- -- Answer Prediction: YesNo (portion:0.130, count:25, errors: 7, accuracy: 0.720) -- D069Q11, D117Q08, D201Q05, D255Q07, D291Q03, D291Q05, D315Q06, -- AMODE Prediction: Multi-Spans-Extraction (portion:0.104, count:20, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Multi-Spans-Extraction (portion:0.104, count:20, errors: 11, accuracy: 0.450) -- D003Q03, D009Q04, D045Q02, D087Q03, D087Q04, D093Q04, D105Q05, D117Q04, D303Q06, D309Q05, D315Q02, -- AMODE Prediction: Single-Span-Extraction (portion:0.580, count:112, errors: 8, accuracy: 0.929) -- D015Q05, D015Q06, D039Q01, D039Q02, D039Q03, D039Q04, D039Q05, D039Q06, -- Answer Prediction: Single-Span-Extraction (portion:0.580, count:112, errors: 27, accuracy: 0.759) -- D015Q05, D015Q06, D033Q01, D033Q03, D033Q04, D033Q05, D033Q06, D033Q07, D033Q08, D033Q12, D039Q01, D039Q02, D039Q03, D039Q04, D039Q05, D039Q06, D045Q04, D069Q12, D093Q07, D183Q02, D255Q12, D255Q13, D261Q04, D267Q02, D303Q01, D303Q03, D309Q02, ----Single-Span-Extraction module (portion:0.580, count:112, errors: 28, accuracy: 0.750) ---- D015Q05, D015Q06, D033Q01, D033Q03, D033Q04, D033Q05, D033Q06, D033Q07, D033Q08, D033Q12, D039Q01, D039Q02, D039Q03, D039Q04, D039Q05, D039Q06, D045Q04, D069Q12, D093Q03, D093Q07, D183Q02, D255Q12, D255Q13, D261Q04, D267Q02, D303Q01, D303Q03, D309Q02, -- AMODE Prediction: Date-Duration (portion:0.161, count:31, errors: 4, accuracy: 0.871) -- D117Q01, D117Q02, D117Q03, D117Q06, -- Answer Prediction: Date-Duration (portion:0.161, count:31, errors: 7, accuracy: 0.774) -- D069Q04, D069Q05, D105Q04, D117Q01, D117Q02, D267Q07, D303Q05, -- AMODE Prediction: Arithmetic-Operations (portion:0.010, count:2, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Arithmetic-Operations (portion:0.010, count:2, errors: 2, accuracy: 0.000) -- D069Q13, D285Q04, -- AMODE Prediction: Summarize (portion:0.016, count:3, errors: 3, accuracy: 0.000) -- D009Q03, D321Q03, D321Q04, -- Answer Prediction: Summarize (portion:0.016, count:3, errors: 3, accuracy: 0.000) -- D009Q03, D321Q03, D321Q04, --AMODE Prediction Accuracy: 0.922 ================================================================================ Dataset: question_train_result.json total: 882, correct: 721, accuracy: 0.817 Question Type (QTYPE) => --基礎題 (portion:0.721, count:636, errors: 62, accuracy: 0.903) -- D002Q04, D004Q02, D004Q07, D010Q06, D035Q01, D035Q03, D036Q15, D036Q18, D040Q14, D042Q15, D046Q02, D070Q11, D071Q08, D072Q05, D078Q07, D082Q02, D086Q01, D086Q02, D092Q12, D096Q02, D096Q03, D100Q01, D106Q03, D108Q05, D108Q07, D113Q05, D116Q03, D116Q04, D116Q05, D116Q08, D120Q07, D124Q05, D126Q01, D179Q04, D210Q01, D215Q10, D244Q05, D251Q05, D252Q01, D252Q05, D256Q01, D256Q05, D260Q01, D263Q05, D270Q05, D275Q06, D275Q09, D278Q04, D278Q06, D281Q03, D282Q04, D282Q08, D282Q12, D282Q14, D292Q02, D292Q07, D298Q05, D302Q02, D304Q01, D310Q03, D311Q01, D324Q03, --進階題 (portion:0.271, count:239, errors: 92, accuracy: 0.615) -- D002Q02, D004Q03, D008Q06, D011Q05, D014Q04, D014Q05, D016Q02, D016Q04, D032Q02, D032Q10, D035Q06, D035Q08, D035Q09, D035Q10, D040Q13, D040Q15, D042Q09, D042Q10, D042Q11, D046Q06, D048Q01, D058Q10, D058Q14, D064Q08, D068Q02, D070Q02, D070Q07, D071Q06, D071Q07, D071Q14, D072Q08, D072Q09, D076Q02, D076Q03, D076Q07, D076Q08, D076Q09, D077Q01, D082Q01, D082Q07, D083Q02, D083Q05, D088Q06, D089Q04, D092Q01, D092Q02, D092Q05, D094Q04, D094Q06, D095Q02, D100Q02, D100Q07, D104Q01, D104Q03, D107Q01, D107Q02, D108Q06, D113Q07, D124Q07, D126Q05, D126Q06, D204Q04, D214Q05, D215Q05, D215Q07, D238Q07, D242Q03, D245Q04, D246Q08, D248Q04, D248Q09, D252Q02, D252Q06, D272Q09, D274Q01, D278Q02, D278Q08, D282Q10, D282Q11, D296Q05, D305Q05, D310Q05, D310Q07, D312Q01, D312Q02, D312Q03, D312Q06, D314Q04, D318Q04, D322Q01, D322Q02, D322Q05, --申論 (portion:0.008, count:7, errors: 7, accuracy: 0.000) -- D006Q02, D048Q09, D086Q03, D094Q01, D245Q05, D288Q12, D322Q07, Answer Type (ATYPE) => --ATYPE Prediction: YesNo (portion:0.099, count:87, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Kinship (portion:0.067, count:59, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Num-Measure (portion:0.080, count:71, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Person (portion:0.101, count:89, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Date-Duration (portion:0.179, count:158, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Location (portion:0.136, count:120, errors: 1, accuracy: 0.992) -- D245Q05, --ATYPE Prediction: Organization (portion:0.095, count:84, errors: 0, accuracy: 1.000) -- --ATYPE Prediction: Object (portion:0.209, count:184, errors: 1, accuracy: 0.995) -- D288Q12, --ATYPE Prediction: Event (portion:0.017, count:15, errors: 1, accuracy: 0.933) -- D322Q07, --ATYPE Prediction: Misc (portion:0.017, count:15, errors: 2, accuracy: 0.867) -- D006Q02, D094Q01, --ATYPE Prediction Accuracy: 0.994 Answer Mode (AMODE) => -- AMODE Prediction: YesNo (portion:0.099, count:87, errors: 0, accuracy: 1.000) -- -- Answer Prediction: YesNo (portion:0.099, count:87, errors: 2, accuracy: 0.977) -- D116Q05, D116Q08, -- AMODE Prediction: Kinship (portion:0.006, count:5, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Kinship (portion:0.006, count:5, errors: 5, accuracy: 0.000) -- D036Q15, D036Q18, D040Q14, D282Q10, D282Q11, -- AMODE Prediction: Multi-Spans-Extraction (portion:0.083, count:73, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Multi-Spans-Extraction (portion:0.083, count:73, errors: 33, accuracy: 0.548) -- D004Q02, D008Q06, D014Q05, D016Q02, D016Q04, D042Q09, D046Q06, D058Q10, D064Q08, D070Q02, D071Q06, D071Q07, D071Q08, D072Q08, D072Q09, D086Q01, D088Q06, D092Q01, D092Q02, D094Q04, D095Q02, D096Q02, D107Q01, D107Q02, D113Q07, D126Q01, D126Q05, D126Q06, D215Q07, D275Q09, D282Q08, D296Q05, D322Q02, -- AMODE Prediction: Single-Span-Extraction (portion:0.619, count:546, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Single-Span-Extraction (portion:0.619, count:546, errors: 61, accuracy: 0.888) -- D002Q04, D004Q03, D004Q07, D010Q06, D011Q05, D032Q02, D035Q03, D035Q06, D040Q13, D040Q15, D042Q15, D046Q02, D058Q14, D070Q11, D072Q05, D076Q09, D078Q07, D082Q02, D086Q02, D089Q04, D092Q12, D100Q07, D104Q03, D106Q03, D116Q03, D116Q04, D120Q07, D124Q05, D179Q04, D204Q04, D210Q01, D242Q03, D244Q05, D251Q05, D252Q01, D256Q01, D260Q01, D263Q05, D270Q05, D272Q09, D275Q06, D278Q02, D278Q04, D278Q06, D278Q08, D281Q03, D282Q04, D282Q12, D282Q14, D292Q02, D292Q07, D298Q05, D302Q02, D305Q05, D311Q01, D312Q06, D314Q04, D318Q04, D322Q01, D322Q05, D324Q03, ----Single-Span-Extraction module (portion:0.619, count:546, errors: 56, accuracy: 0.897) ---- D002Q04, D004Q03, D004Q07, D010Q04, D010Q06, D011Q05, D032Q02, D035Q06, D040Q01, D040Q13, D040Q15, D042Q13, D058Q14, D068Q04, D070Q11, D072Q05, D076Q09, D078Q07, D078Q08, D082Q02, D089Q04, D092Q12, D100Q07, D104Q03, D106Q03, D116Q03, D120Q07, D124Q05, D179Q03, D204Q04, D242Q03, D244Q05, D251Q05, D252Q01, D256Q01, D263Q05, D268Q03, D270Q05, D272Q09, D275Q06, D278Q02, D278Q04, D278Q06, D278Q08, D282Q12, D282Q14, D298Q05, D302Q02, D305Q05, D311Q01, D312Q06, D314Q04, D318Q04, D322Q01, D322Q05, D324Q03, -- AMODE Prediction: Date-Duration (portion:0.166, count:146, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Date-Duration (portion:0.166, count:146, errors: 36, accuracy: 0.753) -- D002Q02, D032Q10, D035Q01, D035Q08, D035Q09, D035Q10, D042Q10, D042Q11, D068Q02, D070Q07, D071Q14, D077Q01, D082Q01, D082Q07, D083Q02, D092Q05, D100Q01, D100Q02, D104Q01, D108Q05, D108Q07, D124Q07, D214Q05, D215Q05, D215Q10, D238Q07, D252Q05, D256Q05, D274Q01, D304Q01, D310Q03, D310Q05, D310Q07, D312Q01, D312Q02, D312Q03, -- AMODE Prediction: Arithmetic-Operations (portion:0.018, count:16, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Arithmetic-Operations (portion:0.018, count:16, errors: 16, accuracy: 0.000) -- D014Q04, D048Q01, D076Q02, D076Q03, D076Q07, D076Q08, D083Q05, D094Q06, D096Q03, D113Q05, D245Q04, D246Q08, D248Q04, D248Q09, D252Q02, D252Q06, -- AMODE Prediction: Comparing-Members (portion:0.002, count:2, errors: 0, accuracy: 1.000) -- -- Answer Prediction: Comparing-Members (portion:0.002, count:2, errors: 1, accuracy: 0.500) -- D108Q06, -- AMODE Prediction: Summarize (portion:0.008, count:7, errors: 7, accuracy: 0.000) -- D006Q02, D048Q09, D086Q03, D094Q01, D245Q05, D288Q12, D322Q07, -- Answer Prediction: Summarize (portion:0.008, count:7, errors: 7, accuracy: 0.000) -- D006Q02, D048Q09, D086Q03, D094Q01, D245Q05, D288Q12, D322Q07, --AMODE Prediction Accuracy: 0.992