From 557083a156c3dd67ac79e22b4202e9b69b6b00f4 Mon Sep 17 00:00:00 2001 From: Yan Shu <570533048@qq.com> Date: Mon, 8 Jul 2024 16:56:50 +0800 Subject: [PATCH] Add files via upload --- .../mlvu/__pycache__/utils.cpython-310.pyc | Bin 0 -> 3207 bytes lmms_eval/tasks/mlvu/mlvu.yaml | 21 +++ lmms_eval/tasks/mlvu/utils.py | 124 ++++++++++++++++++ 3 files changed, 145 insertions(+) create mode 100644 lmms_eval/tasks/mlvu/__pycache__/utils.cpython-310.pyc create mode 100644 lmms_eval/tasks/mlvu/mlvu.yaml create mode 100644 lmms_eval/tasks/mlvu/utils.py diff --git a/lmms_eval/tasks/mlvu/__pycache__/utils.cpython-310.pyc b/lmms_eval/tasks/mlvu/__pycache__/utils.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..1a9fda0f2b70ce7af4bbcc1868a64d7c8e67571d GIT binary patch literal 3207 zcmZ`*-E$ka5eIO`*_PaPf+llwI)Kzk z_d(;1w8c4g+Hv~ShxR=mL-noyME?-H=E?tpXENz7j*{&pJ@NqT-eLjl{&pAH>}-?3 z6MyrM?k8x_Dx5T_S^9AMC#DX{roaw@i&&bb$8?GDv5LUw~eT!<(vwt!yl$yBPKkbXYcO`<%HvefTJv4n5-!=Tvf*xLSm zlo#6m2&QQFLB9ZzAl9`%q%Z(6C(e33sX7hL9&c;5xy{)hceu6nXj8L$+uVBiXp>tz zJ9jzTd;srVUBCaafB(TJ_eP6r>wj5a3xjY^uI~+cy(sNnpc!Fw0pd>fjA?9&M=tinEGV_E{j zR>+uD+>(|IxD{1{F;y2zpi9=HJEU+Xbphiq0dZej=(CF7vA1}07zvsAX^_a#j2U}< zu-V4wf+sSWdudj9@)=m~n%9pd?AwE*h6f#2vn?Kmd7<*9zo?Y4iQfEs+ZXnuyGLSj?dvw0} zAdL^bUNn?mu_wJ<;Cq=t;967D=BWMKSDX!R)ttUlQ!A+Ee3A(n`*~l6Q8xv^7rDn=iZ^H~e(;dX|F$WE4^r`cxZSHlW6!KYd8@M^8)9kOrezTQ6zn1!B9ybS*Db)Yr8r z74jK?fadB7d;ugWDXPtyZJQl0!zNV_7Jdj=fL^NHSF$Ic{Tim^EofZo(k7jQz1vKo ztKM*=1B{ax`Tz*n;WTPW_MCzvjZ?vS;Mf&X+9h&qaC7Y|dt4JvS&JZkI`z?in;txy z5U(3%gcQJQ!wbA9&5IxnrI&S$hY^(CG{#S4mCPY!`HL0Q`IU9WsV*;wz>~0a;&+o>oS)uQkSW9Am6}e1HZ#- z@cA*EG9qJI5U5v;F%#fz!M?~5mUw?}b1~+grQYeMzs3&OR8zWg(8ehf;Mjm0;vxWFYo@fW`6g{t zwH5DGz8NYDC)crN$I-5`k+Si^qn2>!K$?NekiztoT8fL55Q)h|%g>B&N-LtWqN`g>U-)jV>W@>xGf#UPhTEg-|r`ZCq7Z|;4* zubn>J9nwP6u5Kt9h&W1Ru3Z&8^)U(YMjmvf8R~|FO_=+mrjfQ$5)xw{^a)*w#aSTK z8QjuYZ1B2Z3Z=<>CM6jozvjnR70kT@C43Oe4>1AfA41bIHLG$LR 0 else 0 : .1f}%") + + total_correct = 0 + total_answered = 0 + for k, v in category2score.items(): + total_correct += v["correct"] + total_answered += v["answered"] + eval_logger.info(f"Overall Performance: {100 * total_correct / total_answered if total_answered > 0 else 0 : .1f}%") + + return 100 * total_correct / total_answered if total_answered > 0 else 0