Advertisement
outeai

Untitled

Jul 28th, 2024 (edited)
181
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 6.05 KB | None | 0 0
  1. | Tasks |Version|Filter|n-shot|Metric| |Value | |Stderr|
  2. |---------------------------------------|------:|------|-----:|------|---|-----:|---|-----:|
  3. |mmlu | 1|none | |acc |↑ |0.2305|± |0.0035|
  4. | - humanities | 1|none | |acc |↑ |0.2427|± |0.0062|
  5. | - formal_logic | 0|none | 0|acc |↑ |0.2778|± |0.0401|
  6. | - high_school_european_history | 0|none | 0|acc |↑ |0.2242|± |0.0326|
  7. | - high_school_us_history | 0|none | 0|acc |↑ |0.2500|± |0.0304|
  8. | - high_school_world_history | 0|none | 0|acc |↑ |0.2700|± |0.0289|
  9. | - international_law | 0|none | 0|acc |↑ |0.2397|± |0.0390|
  10. | - jurisprudence | 0|none | 0|acc |↑ |0.2685|± |0.0428|
  11. | - logical_fallacies | 0|none | 0|acc |↑ |0.2209|± |0.0326|
  12. | - moral_disputes | 0|none | 0|acc |↑ |0.2486|± |0.0233|
  13. | - moral_scenarios | 0|none | 0|acc |↑ |0.2413|± |0.0143|
  14. | - philosophy | 0|none | 0|acc |↑ |0.1865|± |0.0221|
  15. | - prehistory | 0|none | 0|acc |↑ |0.2160|± |0.0229|
  16. | - professional_law | 0|none | 0|acc |↑ |0.2458|± |0.0110|
  17. | - world_religions | 0|none | 0|acc |↑ |0.3158|± |0.0357|
  18. | - other | 1|none | |acc |↑ |0.2414|± |0.0077|
  19. | - business_ethics | 0|none | 0|acc |↑ |0.3100|± |0.0465|
  20. | - clinical_knowledge | 0|none | 0|acc |↑ |0.2151|± |0.0253|
  21. | - college_medicine | 0|none | 0|acc |↑ |0.2139|± |0.0313|
  22. | - global_facts | 0|none | 0|acc |↑ |0.1800|± |0.0386|
  23. | - human_aging | 0|none | 0|acc |↑ |0.3139|± |0.0311|
  24. | - management | 0|none | 0|acc |↑ |0.1748|± |0.0376|
  25. | - marketing | 0|none | 0|acc |↑ |0.2991|± |0.0300|
  26. | - medical_genetics | 0|none | 0|acc |↑ |0.2900|± |0.0456|
  27. | - miscellaneous | 0|none | 0|acc |↑ |0.2375|± |0.0152|
  28. | - nutrition | 0|none | 0|acc |↑ |0.2157|± |0.0236|
  29. | - professional_accounting | 0|none | 0|acc |↑ |0.2340|± |0.0253|
  30. | - professional_medicine | 0|none | 0|acc |↑ |0.2022|± |0.0244|
  31. | - virology | 0|none | 0|acc |↑ |0.2831|± |0.0351|
  32. | - social sciences | 1|none | |acc |↑ |0.2174|± |0.0074|
  33. | - econometrics | 0|none | 0|acc |↑ |0.2368|± |0.0400|
  34. | - high_school_geography | 0|none | 0|acc |↑ |0.1768|± |0.0272|
  35. | - high_school_government_and_politics| 0|none | 0|acc |↑ |0.1969|± |0.0287|
  36. | - high_school_macroeconomics | 0|none | 0|acc |↑ |0.2026|± |0.0204|
  37. | - high_school_microeconomics | 0|none | 0|acc |↑ |0.2101|± |0.0265|
  38. | - high_school_psychology | 0|none | 0|acc |↑ |0.1927|± |0.0169|
  39. | - human_sexuality | 0|none | 0|acc |↑ |0.2595|± |0.0384|
  40. | - professional_psychology | 0|none | 0|acc |↑ |0.2516|± |0.0176|
  41. | - public_relations | 0|none | 0|acc |↑ |0.2182|± |0.0396|
  42. | - security_studies | 0|none | 0|acc |↑ |0.1878|± |0.0250|
  43. | - sociology | 0|none | 0|acc |↑ |0.2438|± |0.0304|
  44. | - us_foreign_policy | 0|none | 0|acc |↑ |0.2800|± |0.0451|
  45. | - stem | 1|none | |acc |↑ |0.2141|± |0.0073|
  46. | - abstract_algebra | 0|none | 0|acc |↑ |0.2200|± |0.0416|
  47. | - anatomy | 0|none | 0|acc |↑ |0.1852|± |0.0336|
  48. | - astronomy | 0|none | 0|acc |↑ |0.1711|± |0.0306|
  49. | - college_biology | 0|none | 0|acc |↑ |0.2778|± |0.0375|
  50. | - college_chemistry | 0|none | 0|acc |↑ |0.2000|± |0.0402|
  51. | - college_computer_science | 0|none | 0|acc |↑ |0.2400|± |0.0429|
  52. | - college_mathematics | 0|none | 0|acc |↑ |0.2100|± |0.0409|
  53. | - college_physics | 0|none | 0|acc |↑ |0.2157|± |0.0409|
  54. | - computer_security | 0|none | 0|acc |↑ |0.3100|± |0.0465|
  55. | - conceptual_physics | 0|none | 0|acc |↑ |0.2638|± |0.0288|
  56. | - electrical_engineering | 0|none | 0|acc |↑ |0.2414|± |0.0357|
  57. | - elementary_mathematics | 0|none | 0|acc |↑ |0.2143|± |0.0211|
  58. | - high_school_biology | 0|none | 0|acc |↑ |0.1806|± |0.0219|
  59. | - high_school_chemistry | 0|none | 0|acc |↑ |0.1626|± |0.0260|
  60. | - high_school_computer_science | 0|none | 0|acc |↑ |0.2500|± |0.0435|
  61. | - high_school_mathematics | 0|none | 0|acc |↑ |0.2000|± |0.0244|
  62. | - high_school_physics | 0|none | 0|acc |↑ |0.1921|± |0.0322|
  63. | - high_school_statistics | 0|none | 0|acc |↑ |0.1528|± |0.0245|
  64. | - machine_learning | 0|none | 0|acc |↑ |0.3214|± |0.0443|
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement