dispatcher: model_dir3/epoch_18 ENSEMBLEModule: 12 models (new) MSPE_v18_branchy27 date_duration_module_4 arithmetic_module_4 kiwiQA X ================================================================================ Dataset: question_dev_result.json total: 247, correct: 184, accuracy: 0.745 Question Type (QTYPE) => --基礎題 (portion:0.623, count:154, errors: 30, accuracy: 0.805) -- D007Q02, D007Q03, D031Q01, D031Q02, D061Q04, D073Q06, D079Q07, D085Q01, D085Q05, D091Q03, D091Q11, D103Q04, D127Q01, D181Q02, D181Q05, D211Q05, D241Q07, D247Q01, D247Q02, D247Q05, D253Q01, D283Q04, D289Q08, D295Q02, D301Q04, D301Q05, D307Q03, D313Q01, D313Q02, D325Q03, --進階題 (portion:0.356, count:88, errors: 28, accuracy: 0.682) -- D007Q04, D013Q01, D013Q02, D037Q04, D037Q11, D037Q12, D037Q17, D037Q18, D049Q03, D073Q07, D073Q09, D073Q11, D085Q07, D085Q08, D115Q02, D115Q03, D115Q04, D115Q07, D127Q06, D127Q07, D247Q08, D247Q09, D253Q07, D283Q01, D301Q06, D313Q04, D313Q05, D325Q05, --申論 (portion:0.020, count:5, errors: 5, accuracy: 0.000) -- D001Q11, D049Q04, D073Q12, D103Q07, D289Q07, Answer Type (ATYPE) Prediction => -- YesNo Top1: (portion:0.113, count:28, errors: 0, accuracy: 1.000) -- -- YesNo Top2: (portion:0.113, count:28, errors: 0, accuracy: 1.000) -- -- Kinship Top1: (portion:0.121, count:30, errors: 1, accuracy: 0.967) -- D289Q10, -- Kinship Top2: (portion:0.121, count:30, errors: 1, accuracy: 0.967) -- D289Q10, -- Num-Measure Top1: (portion:0.109, count:27, errors: 0, accuracy: 1.000) -- -- Num-Measure Top2: (portion:0.109, count:27, errors: 0, accuracy: 1.000) -- -- Person Top1: (portion:0.130, count:32, errors: 5, accuracy: 0.844) -- D001Q11, D049Q07, D259Q01, D295Q06, D325Q03, -- Person Top2: (portion:0.130, count:32, errors: 5, accuracy: 0.844) -- D001Q11, D049Q07, D259Q01, D295Q06, D325Q03, -- Date-Duration Top1: (portion:0.109, count:27, errors: 1, accuracy: 0.963) -- D307Q03, -- Date-Duration Top2: (portion:0.109, count:27, errors: 1, accuracy: 0.963) -- D307Q03, -- Location Top1: (portion:0.130, count:32, errors: 2, accuracy: 0.938) -- D241Q05, D295Q04, -- Location Top2: (portion:0.130, count:32, errors: 0, accuracy: 1.000) -- -- Organization Top1: (portion:0.077, count:19, errors: 1, accuracy: 0.947) -- D283Q02, -- Organization Top2: (portion:0.077, count:19, errors: 1, accuracy: 0.947) -- D283Q02, -- Object Top1: (portion:0.198, count:49, errors: 6, accuracy: 0.878) -- D049Q04, D103Q07, D115Q06, D289Q07, D313Q01, D313Q02, -- Object Top2: (portion:0.198, count:49, errors: 4, accuracy: 0.918) -- D049Q04, D103Q07, D115Q06, D289Q07, -- Event Top1: (portion:0.004, count:1, errors: 0, accuracy: 1.000) -- -- Event Top2: (portion:0.004, count:1, errors: 0, accuracy: 1.000) -- -- Misc Top1: (portion:0.008, count:2, errors: 0, accuracy: 1.000) -- -- Misc Top2: (portion:0.008, count:2, errors: 0, accuracy: 1.000) -- -- ATYPE Accuracy: Top-1 0.935 Top-2 0.951 Answer Mode (AMODE) Prediction => -- YesNo AMODE Top1: (portion:0.113, count:28, errors: 0, accuracy: 1.000) -- -- YesNo AMODE Top2: (portion:0.113, count:28, errors: 0, accuracy: 1.000) -- -- YesNo Answer: (portion:0.113, count:28, errors: 9, accuracy: 0.679) -- D037Q17, D037Q18, D115Q02, D127Q06, D253Q07, D301Q06, D313Q04, D313Q05, D325Q05, -- Kinship AMODE Top1: (portion:0.093, count:23, errors: 0, accuracy: 1.000) -- -- Kinship AMODE Top2: (portion:0.093, count:23, errors: 0, accuracy: 1.000) -- -- Kinship Answer: (portion:0.093, count:23, errors: 5, accuracy: 0.783) -- D037Q04, D037Q11, D037Q12, D091Q03, D091Q11, -- Multi-Spans-Extraction AMODE Top1: (portion:0.085, count:21, errors: 0, accuracy: 1.000) -- -- Multi-Spans-Extraction AMODE Top2: (portion:0.085, count:21, errors: 0, accuracy: 1.000) -- -- Multi-Spans-Extraction Answer: (portion:0.085, count:21, errors: 7, accuracy: 0.667) -- D007Q04, D013Q02, D073Q06, D073Q07, D073Q09, D085Q07, D127Q07, -- Single-Span-Extraction AMODE Top1: (portion:0.514, count:127, errors: 4, accuracy: 0.969) -- D115Q04, D115Q07, D313Q01, D313Q02, -- Single-Span-Extraction AMODE Top2: (portion:0.514, count:127, errors: 0, accuracy: 1.000) -- -- Single-Span-Extraction Answer: (portion:0.514, count:127, errors: 25, accuracy: 0.803) -- D007Q02, D007Q03, D013Q01, D031Q01, D031Q02, D073Q11, D079Q07, D085Q05, D115Q03, D115Q04, D115Q07, D127Q01, D181Q02, D181Q05, D211Q05, D247Q02, D253Q01, D283Q04, D289Q08, D295Q02, D301Q04, D301Q05, D313Q01, D313Q02, D325Q03, ---- Single-Span-Extraction module (portion:0.514, count:127, errors: 30, accuracy: 0.764) ---- D007Q02, D007Q03, D013Q01, D031Q01, D031Q02, D037Q07, D037Q08, D037Q09, D037Q10, D073Q11, D079Q07, D085Q05, D115Q03, D115Q04, D115Q07, D127Q01, D181Q02, D181Q05, D211Q05, D247Q02, D253Q01, D283Q04, D289Q08, D295Q02, D301Q04, D301Q05, D313Q01, D313Q02, D325Q03, D325Q04, -- Date-Duration AMODE Top1: (portion:0.093, count:23, errors: 1, accuracy: 0.957) -- D307Q03, -- Date-Duration AMODE Top2: (portion:0.093, count:23, errors: 0, accuracy: 1.000) -- -- Date-Duration Answer: (portion:0.093, count:23, errors: 4, accuracy: 0.826) -- D061Q04, D103Q04, D247Q08, D307Q03, -- Arithmetic-Operations AMODE Top1: (portion:0.081, count:20, errors: 0, accuracy: 1.000) -- -- Arithmetic-Operations AMODE Top2: (portion:0.081, count:20, errors: 0, accuracy: 1.000) -- -- Arithmetic-Operations Answer: (portion:0.081, count:20, errors: 8, accuracy: 0.600) -- D049Q03, D085Q01, D085Q08, D241Q07, D247Q01, D247Q05, D247Q09, D283Q01, -- Summarize AMODE Top1: (portion:0.020, count:5, errors: 5, accuracy: 0.000) -- D001Q11, D049Q04, D073Q12, D103Q07, D289Q07, -- Summarize AMODE Top2: (portion:0.020, count:5, errors: 3, accuracy: 0.400) -- D073Q12, D103Q07, D289Q07, -- Summarize Answer: (portion:0.020, count:5, errors: 5, accuracy: 0.000) -- D001Q11, D049Q04, D073Q12, D103Q07, D289Q07, -- AMODE Accuracy: Top-1 0.960 Top-2 0.988 ================================================================================ Dataset: question_test_result.json total: 193, correct: 138, accuracy: 0.715 Question Type (QTYPE) => --基礎題 (portion:0.720, count:139, errors: 29, accuracy: 0.791) -- D015Q05, D033Q07, D033Q08, D033Q12, D039Q03, D039Q04, D039Q05, D039Q06, D045Q02, D045Q04, D069Q04, D093Q07, D105Q05, D117Q02, D117Q04, D183Q02, D255Q12, D255Q13, D261Q04, D267Q02, D267Q07, D285Q04, D291Q03, D291Q05, D303Q01, D303Q04, D303Q05, D303Q06, D315Q03, --進階題 (portion:0.264, count:51, errors: 23, accuracy: 0.549) -- D003Q03, D009Q04, D033Q01, D033Q03, D033Q04, D033Q05, D033Q06, D069Q05, D069Q11, D069Q12, D069Q13, D087Q03, D087Q04, D093Q04, D105Q04, D117Q08, D201Q05, D255Q07, D303Q03, D309Q02, D309Q05, D315Q02, D315Q06, --申論 (portion:0.016, count:3, errors: 3, accuracy: 0.000) -- D009Q03, D321Q03, D321Q04, Answer Type (ATYPE) Prediction => -- YesNo Top1: (portion:0.130, count:25, errors: 0, accuracy: 1.000) -- -- YesNo Top2: (portion:0.130, count:25, errors: 0, accuracy: 1.000) -- -- Kinship Top1: (portion:0.062, count:12, errors: 1, accuracy: 0.917) -- D303Q04, -- Kinship Top2: (portion:0.062, count:12, errors: 1, accuracy: 0.917) -- D303Q04, -- Num-Measure Top1: (portion:0.109, count:21, errors: 2, accuracy: 0.905) -- D183Q03, D309Q04, -- Num-Measure Top2: (portion:0.109, count:21, errors: 2, accuracy: 0.905) -- D183Q03, D309Q04, -- Person Top1: (portion:0.078, count:15, errors: 2, accuracy: 0.867) -- D255Q10, D291Q09, -- Person Top2: (portion:0.078, count:15, errors: 1, accuracy: 0.933) -- D291Q09, -- Date-Duration Top1: (portion:0.155, count:30, errors: 0, accuracy: 1.000) -- -- Date-Duration Top2: (portion:0.155, count:30, errors: 0, accuracy: 1.000) -- -- Location Top1: (portion:0.140, count:27, errors: 0, accuracy: 1.000) -- -- Location Top2: (portion:0.140, count:27, errors: 0, accuracy: 1.000) -- -- Organization Top1: (portion:0.109, count:21, errors: 1, accuracy: 0.952) -- D105Q07, -- Organization Top2: (portion:0.109, count:21, errors: 1, accuracy: 0.952) -- D105Q07, -- Object Top1: (portion:0.202, count:39, errors: 8, accuracy: 0.795) -- D003Q07, D117Q04, D309Q05, D315Q03, D315Q04, D315Q09, D321Q03, D321Q04, -- Object Top2: (portion:0.202, count:39, errors: 6, accuracy: 0.846) -- D003Q07, D117Q04, D309Q05, D315Q04, D321Q03, D321Q04, -- Event Top1: (portion:0.010, count:2, errors: 0, accuracy: 1.000) -- -- Event Top2: (portion:0.010, count:2, errors: 0, accuracy: 1.000) -- -- Misc Top1: (portion:0.005, count:1, errors: 1, accuracy: 0.000) -- D009Q03, -- Misc Top2: (portion:0.005, count:1, errors: 0, accuracy: 1.000) -- -- ATYPE Accuracy: Top-1 0.922 Top-2 0.943 Answer Mode (AMODE) Prediction => -- YesNo AMODE Top1: (portion:0.130, count:25, errors: 0, accuracy: 1.000) -- -- YesNo AMODE Top2: (portion:0.130, count:25, errors: 0, accuracy: 1.000) -- -- YesNo Answer: (portion:0.130, count:25, errors: 7, accuracy: 0.720) -- D069Q11, D117Q08, D201Q05, D255Q07, D291Q03, D291Q05, D315Q06, -- Kinship AMODE Top1: (portion:0.026, count:5, errors: 0, accuracy: 1.000) -- -- Kinship AMODE Top2: (portion:0.026, count:5, errors: 0, accuracy: 1.000) -- -- Kinship Answer: (portion:0.026, count:5, errors: 4, accuracy: 0.200) -- D039Q03, D039Q04, D039Q05, D039Q06, -- Multi-Spans-Extraction AMODE Top1: (portion:0.119, count:23, errors: 1, accuracy: 0.957) -- D315Q03, -- Multi-Spans-Extraction AMODE Top2: (portion:0.119, count:23, errors: 0, accuracy: 1.000) -- -- Multi-Spans-Extraction Answer: (portion:0.119, count:23, errors: 12, accuracy: 0.478) -- D003Q03, D009Q04, D045Q02, D087Q03, D087Q04, D093Q04, D105Q05, D117Q04, D303Q06, D309Q05, D315Q02, D315Q03, -- Single-Span-Extraction AMODE Top1: (portion:0.503, count:97, errors: 1, accuracy: 0.990) -- D267Q07, -- Single-Span-Extraction AMODE Top2: (portion:0.503, count:97, errors: 0, accuracy: 1.000) -- -- Single-Span-Extraction Answer: (portion:0.503, count:97, errors: 20, accuracy: 0.794) -- D033Q01, D033Q03, D033Q04, D033Q05, D033Q06, D033Q07, D033Q08, D033Q12, D045Q04, D069Q12, D093Q07, D183Q02, D255Q12, D255Q13, D261Q04, D267Q02, D267Q07, D303Q01, D303Q03, D303Q04, ---- Single-Span-Extraction module (portion:0.503, count:97, errors: 20, accuracy: 0.794) ---- D033Q01, D033Q03, D033Q04, D033Q05, D033Q06, D033Q07, D033Q08, D033Q12, D045Q04, D069Q07, D069Q12, D093Q07, D183Q02, D255Q12, D255Q13, D261Q04, D267Q02, D267Q07, D303Q01, D303Q03, -- Date-Duration AMODE Top1: (portion:0.124, count:24, errors: 0, accuracy: 1.000) -- -- Date-Duration AMODE Top2: (portion:0.124, count:24, errors: 0, accuracy: 1.000) -- -- Date-Duration Answer: (portion:0.124, count:24, errors: 4, accuracy: 0.833) -- D069Q04, D069Q05, D105Q04, D303Q05, -- Arithmetic-Operations AMODE Top1: (portion:0.083, count:16, errors: 1, accuracy: 0.938) -- D309Q04, -- Arithmetic-Operations AMODE Top2: (portion:0.083, count:16, errors: 0, accuracy: 1.000) -- -- Arithmetic-Operations Answer: (portion:0.083, count:16, errors: 5, accuracy: 0.688) -- D015Q05, D069Q13, D117Q02, D285Q04, D309Q02, -- Summarize AMODE Top1: (portion:0.016, count:3, errors: 3, accuracy: 0.000) -- D009Q03, D321Q03, D321Q04, -- Summarize AMODE Top2: (portion:0.016, count:3, errors: 2, accuracy: 0.333) -- D321Q03, D321Q04, -- Summarize Answer: (portion:0.016, count:3, errors: 3, accuracy: 0.000) -- D009Q03, D321Q03, D321Q04, -- AMODE Accuracy: Top-1 0.969 Top-2 0.990 ================================================================================ Dataset: question_train_result.json total: 882, correct: 720, accuracy: 0.816 Question Type (QTYPE) => --基礎題 (portion:0.721, count:636, errors: 64, accuracy: 0.899) -- D002Q04, D004Q02, D004Q07, D010Q06, D035Q01, D035Q03, D036Q15, D036Q18, D040Q14, D042Q15, D046Q07, D048Q05, D070Q11, D071Q08, D072Q05, D078Q07, D082Q02, D086Q01, D086Q02, D092Q12, D096Q02, D096Q03, D096Q06, D100Q01, D106Q03, D108Q05, D108Q07, D116Q03, D116Q04, D116Q05, D116Q08, D120Q07, D124Q05, D126Q01, D126Q04, D138Q06, D179Q04, D215Q10, D251Q05, D252Q01, D252Q05, D256Q01, D256Q05, D260Q01, D263Q05, D270Q05, D275Q06, D275Q09, D278Q04, D278Q06, D281Q03, D282Q04, D282Q08, D282Q12, D282Q14, D292Q02, D292Q07, D298Q05, D302Q02, D304Q01, D304Q09, D310Q03, D311Q01, D324Q03, --進階題 (portion:0.271, count:239, errors: 91, accuracy: 0.619) -- D002Q02, D004Q03, D008Q06, D011Q05, D014Q04, D014Q05, D016Q02, D016Q04, D032Q02, D032Q10, D035Q06, D035Q08, D035Q09, D035Q10, D040Q15, D042Q09, D042Q10, D042Q11, D046Q06, D048Q01, D058Q10, D058Q14, D064Q08, D068Q02, D070Q02, D070Q07, D071Q06, D071Q07, D071Q14, D072Q08, D072Q09, D076Q02, D076Q03, D076Q07, D076Q08, D076Q09, D077Q01, D082Q01, D082Q07, D083Q02, D088Q06, D089Q01, D089Q02, D089Q03, D089Q04, D089Q05, D092Q01, D092Q02, D092Q05, D094Q04, D095Q02, D100Q02, D100Q07, D104Q01, D107Q01, D107Q02, D113Q07, D124Q07, D126Q05, D126Q06, D204Q04, D214Q05, D215Q05, D215Q07, D238Q07, D245Q04, D248Q04, D252Q02, D252Q06, D272Q09, D274Q01, D278Q02, D278Q08, D282Q10, D282Q11, D296Q05, D299Q03, D305Q05, D310Q05, D310Q07, D312Q01, D312Q02, D312Q03, D312Q04, D312Q06, D312Q08, D314Q04, D318Q04, D322Q01, D322Q02, D322Q05, --申論 (portion:0.008, count:7, errors: 7, accuracy: 0.000) -- D006Q02, D048Q09, D086Q03, D094Q01, D245Q05, D288Q12, D322Q07, Answer Type (ATYPE) Prediction => -- YesNo Top1: (portion:0.099, count:87, errors: 0, accuracy: 1.000) -- -- YesNo Top2: (portion:0.099, count:87, errors: 0, accuracy: 1.000) -- -- Kinship Top1: (portion:0.067, count:59, errors: 0, accuracy: 1.000) -- -- Kinship Top2: (portion:0.067, count:59, errors: 0, accuracy: 1.000) -- -- Num-Measure Top1: (portion:0.080, count:71, errors: 0, accuracy: 1.000) -- -- Num-Measure Top2: (portion:0.080, count:71, errors: 0, accuracy: 1.000) -- -- Person Top1: (portion:0.101, count:89, errors: 0, accuracy: 1.000) -- -- Person Top2: (portion:0.101, count:89, errors: 0, accuracy: 1.000) -- -- Date-Duration Top1: (portion:0.179, count:158, errors: 0, accuracy: 1.000) -- -- Date-Duration Top2: (portion:0.179, count:158, errors: 0, accuracy: 1.000) -- -- Location Top1: (portion:0.136, count:120, errors: 1, accuracy: 0.992) -- D245Q05, -- Location Top2: (portion:0.136, count:120, errors: 1, accuracy: 0.992) -- D245Q05, -- Organization Top1: (portion:0.095, count:84, errors: 0, accuracy: 1.000) -- -- Organization Top2: (portion:0.095, count:84, errors: 0, accuracy: 1.000) -- -- Object Top1: (portion:0.209, count:184, errors: 1, accuracy: 0.995) -- D288Q12, -- Object Top2: (portion:0.209, count:184, errors: 1, accuracy: 0.995) -- D288Q12, -- Event Top1: (portion:0.017, count:15, errors: 1, accuracy: 0.933) -- D322Q07, -- Event Top2: (portion:0.017, count:15, errors: 1, accuracy: 0.933) -- D322Q07, -- Misc Top1: (portion:0.017, count:15, errors: 2, accuracy: 0.867) -- D006Q02, D094Q01, -- Misc Top2: (portion:0.017, count:15, errors: 2, accuracy: 0.867) -- D006Q02, D094Q01, -- ATYPE Accuracy: Top-1 0.994 Top-2 0.994 Answer Mode (AMODE) Prediction => -- YesNo AMODE Top1: (portion:0.099, count:87, errors: 0, accuracy: 1.000) -- -- YesNo AMODE Top2: (portion:0.099, count:87, errors: 0, accuracy: 1.000) -- -- YesNo Answer: (portion:0.099, count:87, errors: 2, accuracy: 0.977) -- D116Q05, D116Q08, -- Kinship AMODE Top1: (portion:0.063, count:56, errors: 0, accuracy: 1.000) -- -- Kinship AMODE Top2: (portion:0.063, count:56, errors: 0, accuracy: 1.000) -- -- Kinship Answer: (portion:0.063, count:56, errors: 7, accuracy: 0.875) -- D036Q15, D036Q18, D040Q14, D040Q15, D078Q07, D282Q10, D282Q11, -- Multi-Spans-Extraction AMODE Top1: (portion:0.094, count:83, errors: 1, accuracy: 0.988) -- D126Q04, -- Multi-Spans-Extraction AMODE Top2: (portion:0.094, count:83, errors: 0, accuracy: 1.000) -- -- Multi-Spans-Extraction Answer: (portion:0.094, count:83, errors: 40, accuracy: 0.518) -- D004Q02, D008Q06, D014Q05, D016Q02, D016Q04, D042Q09, D046Q06, D046Q07, D048Q05, D058Q10, D064Q08, D070Q02, D071Q06, D071Q07, D071Q08, D072Q08, D072Q09, D076Q09, D086Q01, D088Q06, D092Q01, D092Q02, D094Q04, D095Q02, D096Q02, D107Q01, D107Q02, D113Q07, D126Q01, D126Q04, D126Q05, D126Q06, D179Q04, D215Q07, D275Q09, D282Q08, D296Q05, D318Q04, D322Q01, D322Q02, -- Single-Span-Extraction AMODE Top1: (portion:0.540, count:476, errors: 0, accuracy: 1.000) -- -- Single-Span-Extraction AMODE Top2: (portion:0.540, count:476, errors: 0, accuracy: 1.000) -- -- Single-Span-Extraction Answer: (portion:0.540, count:476, errors: 58, accuracy: 0.878) -- D002Q04, D004Q03, D004Q07, D010Q06, D011Q05, D032Q02, D035Q03, D035Q06, D042Q15, D058Q14, D070Q11, D072Q05, D082Q02, D086Q02, D089Q01, D089Q02, D089Q03, D089Q04, D089Q05, D092Q12, D100Q07, D106Q03, D116Q03, D116Q04, D120Q07, D124Q05, D138Q06, D204Q04, D251Q05, D252Q01, D256Q01, D260Q01, D263Q05, D270Q05, D272Q09, D274Q01, D278Q02, D278Q04, D278Q06, D278Q08, D281Q03, D282Q04, D282Q12, D282Q14, D292Q02, D292Q07, D298Q05, D299Q03, D302Q02, D304Q09, D305Q05, D311Q01, D312Q04, D312Q06, D312Q08, D314Q04, D322Q05, D324Q03, ---- Single-Span-Extraction module (portion:0.540, count:476, errors: 45, accuracy: 0.905) ---- D002Q04, D004Q03, D004Q07, D010Q04, D010Q06, D011Q05, D032Q02, D035Q06, D058Q14, D070Q11, D072Q05, D082Q02, D089Q04, D092Q12, D100Q07, D104Q03, D106Q03, D116Q03, D120Q07, D124Q05, D179Q03, D204Q04, D244Q05, D251Q05, D252Q01, D256Q01, D263Q05, D268Q03, D270Q05, D272Q09, D278Q02, D278Q04, D278Q06, D278Q08, D282Q12, D282Q14, D298Q05, D299Q03, D302Q02, D305Q05, D311Q01, D312Q06, D314Q04, D322Q05, D324Q03, -- Date-Duration AMODE Top1: (portion:0.156, count:138, errors: 0, accuracy: 1.000) -- -- Date-Duration AMODE Top2: (portion:0.156, count:138, errors: 0, accuracy: 1.000) -- -- Date-Duration Answer: (portion:0.156, count:138, errors: 35, accuracy: 0.746) -- D002Q02, D032Q10, D035Q01, D035Q08, D035Q09, D035Q10, D042Q10, D042Q11, D068Q02, D070Q07, D071Q14, D077Q01, D082Q01, D082Q07, D083Q02, D092Q05, D100Q01, D100Q02, D104Q01, D108Q05, D108Q07, D124Q07, D214Q05, D215Q05, D215Q10, D238Q07, D252Q05, D256Q05, D304Q01, D310Q03, D310Q05, D310Q07, D312Q01, D312Q02, D312Q03, -- Arithmetic-Operations AMODE Top1: (portion:0.040, count:35, errors: 0, accuracy: 1.000) -- -- Arithmetic-Operations AMODE Top2: (portion:0.040, count:35, errors: 0, accuracy: 1.000) -- -- Arithmetic-Operations Answer: (portion:0.040, count:35, errors: 13, accuracy: 0.629) -- D014Q04, D048Q01, D076Q02, D076Q03, D076Q07, D076Q08, D096Q03, D096Q06, D245Q04, D248Q04, D252Q02, D252Q06, D275Q06, -- Summarize AMODE Top1: (portion:0.008, count:7, errors: 7, accuracy: 0.000) -- D006Q02, D048Q09, D086Q03, D094Q01, D245Q05, D288Q12, D322Q07, -- Summarize AMODE Top2: (portion:0.008, count:7, errors: 3, accuracy: 0.571) -- D048Q09, D288Q12, D322Q07, -- Summarize Answer: (portion:0.008, count:7, errors: 7, accuracy: 0.000) -- D006Q02, D048Q09, D086Q03, D094Q01, D245Q05, D288Q12, D322Q07, -- AMODE Accuracy: Top-1 0.991 Top-2 0.997