| arithmetic-reasoning-on-gsm8k | PaLM 2 (few-shot, k=8, CoT) | |
| arithmetic-reasoning-on-gsm8k | PaLM 2 (few-shot, k=8, SC) | |
| code-generation-on-mbpp | PaLM 2-S* (few-shot) | |
| common-sense-reasoning-on-arc-challenge | PaLM 2-S (1-shot) | |
| common-sense-reasoning-on-arc-challenge | PaLM 2 (few-shot, CoT, SC) | |
| common-sense-reasoning-on-arc-challenge | PaLM 2-M (1-shot) | |
| common-sense-reasoning-on-arc-challenge | PaLM 2-L (1-shot) | |
| common-sense-reasoning-on-arc-easy | PaLM 2-S (1-shot) | |
| common-sense-reasoning-on-arc-easy | PaLM 2-L (1-shot) | |
| common-sense-reasoning-on-arc-easy | PaLM 2-M (1-shot) | |
| common-sense-reasoning-on-big-bench | PaLM 2 (few-shot, k=3, CoT) | |
| common-sense-reasoning-on-big-bench | PaLM 2 (few-shot, k=3, Direct) | |
| common-sense-reasoning-on-big-bench-causal | PaLM 2 (few-shot, k=3, Direct) | |
| common-sense-reasoning-on-big-bench-causal | PaLM 2 (few-shot, k=3, CoT) | |
| common-sense-reasoning-on-big-bench-date | PaLM 2 (few-shot, k=3, CoT) | |
| common-sense-reasoning-on-big-bench-date | PaLM 2 (few-shot, k=3, Direct) | |
| common-sense-reasoning-on-big-bench-sports | PaLM 2 (few-shot, k=3, CoT) | |
| common-sense-reasoning-on-big-bench-sports | PaLM 2 (few-shot, k=3, Direct) | |
| common-sense-reasoning-on-commonsenseqa | PaLM 2 (few-shot, CoT, SC) | |
| common-sense-reasoning-on-record | PaLM 2-L (one-shot) | |
| common-sense-reasoning-on-record | PaLM 2-M (one-shot) | |
| common-sense-reasoning-on-record | PaLM 2-S (one-shot) | |
| common-sense-reasoning-on-winogrande | PaLM 2-S (1-shot) | |
| common-sense-reasoning-on-winogrande | PaLM 2-M (1-shot) | |
| common-sense-reasoning-on-winogrande | PaLM 2-L (1-shot) | |
| coreference-resolution-on-winograd-schema | PaLM 2-M (1-shot) | |
| coreference-resolution-on-winograd-schema | PaLM 2-S (1-shot) | |
| coreference-resolution-on-winograd-schema | PaLM 2-L (1-shot) | |
| cross-lingual-question-answering-on-tydiqa | PaLM 2-M (one-shot) | |
| cross-lingual-question-answering-on-tydiqa | PaLM 2-S (one-shot) | |
| cross-lingual-question-answering-on-tydiqa | PaLM 2-L (one-shot) | |
| cross-lingual-transfer-on-xcopa | PaLM 2 (few-shot) | |
| language-modelling-on-lambada | PaLM 2-M (one-shot) | |
| language-modelling-on-lambada | PaLM 2-L (one-shot) | |
| language-modelling-on-lambada | PaLM 2-S (one-shot) | |
| logical-reasoning-on-big-bench-formal | PaLM 2 (few-shot, k=3, Direct) | |
| logical-reasoning-on-big-bench-formal | PaLM 2 (few-shot, k=3, CoT) | |
| logical-reasoning-on-big-bench-logic-grid | PaLM-62B (few-shot, k=5) | |
| logical-reasoning-on-big-bench-logic-grid | PaLM-540B (few-shot, k=5) | |
| logical-reasoning-on-big-bench-penguins-in-a | PaLM 2 (few-shot, k=3, CoT) | |
| logical-reasoning-on-big-bench-penguins-in-a | PaLM 2 (few-shot, k=3, Direct) | |
| logical-reasoning-on-big-bench-reasoning | PaLM 2 (few-shot, k=3, Direct) | |
| logical-reasoning-on-big-bench-reasoning | PaLM 2 (few-shot, k=3, CoT) | |
| logical-reasoning-on-big-bench-temporal | PaLM 2 (few-shot, k=3, CoT) | |
| logical-reasoning-on-big-bench-temporal | PaLM 2 (few-shot, k=3, Direct) | |
| machine-translation-on-frmt-chinese-mainland | Google Translate | |
| machine-translation-on-frmt-chinese-mainland | PaLM 2 | |
| machine-translation-on-frmt-chinese-mainland | PaLM | |
| machine-translation-on-frmt-chinese-taiwan | PaLM 2 | |
| machine-translation-on-frmt-chinese-taiwan | Google Translate | |
| machine-translation-on-frmt-chinese-taiwan | PaLM | |
| machine-translation-on-frmt-portuguese | PaLM 2 | |
| machine-translation-on-frmt-portuguese | PaLM | |
| machine-translation-on-frmt-portuguese | Google Translate | |
| machine-translation-on-frmt-portuguese-brazil | Google Translate | |
| machine-translation-on-frmt-portuguese-brazil | PaLM | |
| machine-translation-on-frmt-portuguese-brazil | PaLM 2 | |
| math-word-problem-solving-on-math | PaLM 2 (few-shot, k=4, CoT) | |
| math-word-problem-solving-on-math | PaLM 2 (few-shot, k=4, SC) | |
| multi-task-language-understanding-on-mgsm | PaLM 2 (few-shot, k=8, SC) | |
| multi-task-language-understanding-on-mgsm | PaLM 2 (8-shot, CoT) | |
| multiple-choice-question-answering-mcqa-on-27 | PaLM 2 (few-shot, k=3, Direct) | |
| multiple-choice-question-answering-mcqa-on-27 | PaLM 2 (few-shot, k=3, CoT) | |
| multiple-choice-question-answering-mcqa-on-28 | PaLM 2 (few-shot, k=3, Direct) | |
| multiple-choice-question-answering-mcqa-on-28 | PaLM 2 (few-shot, k=3, CoT) | |
| multiple-choice-question-answering-mcqa-on-29 | PaLM 2 (few-shot, k=3, Direct) | |
| multiple-choice-question-answering-mcqa-on-29 | PaLM 2 (few-shot, k=3, CoT) | |
| multiple-choice-question-answering-mcqa-on-30 | PaLM 2 (few-shot, k=3, CoT) | |
| multiple-choice-question-answering-mcqa-on-30 | PaLM 2 (few-shot, k=3, Direct) | |
| natural-language-inference-on-anli-test | PaLM 2-S (one-shot) | |
| natural-language-inference-on-anli-test | PaLM 2-L (one-shot) | |
| natural-language-inference-on-anli-test | PaLM 2-M (one-shot) | |
| natural-language-inference-on-commitmentbank | PaLM 2-S (one-shot) | |
| natural-language-inference-on-commitmentbank | PaLM 2-M (one-shot) | |
| natural-language-inference-on-commitmentbank | PaLM 2-L (one-shot) | |
| natural-language-inference-on-rte | PaLM 2-L (1-shot) | |
| natural-language-inference-on-rte | PaLM 2-S (1-shot) | |
| natural-language-inference-on-rte | PaLM 2-M (1-shot) | |
| question-answering-on-boolq | PaLM 2-S (1-shot) | |
| question-answering-on-boolq | PaLM 2-L (1-shot) | |
| question-answering-on-boolq | PaLM 2-M (1-shot) | |
| question-answering-on-copa | PaLM 2-M (1-shot) | |
| question-answering-on-copa | PaLM 2-S (1-shot) | |
| question-answering-on-copa | PaLM 2-L (1-shot) | |
| question-answering-on-drop-test | PaLM 2 (few-shot) | |
| question-answering-on-multirc | PaLM 2-S (one-shot) | |
| question-answering-on-multirc | PaLM 2-M (one-shot) | |
| question-answering-on-multirc | PaLM 2-L (one-shot) | |
| question-answering-on-natural-questions | PaLM 2-S (one-shot) | |
| question-answering-on-natural-questions | PaLM 2-M (one-shot) | |
| question-answering-on-natural-questions | PaLM 2-L (one-shot) | |
| question-answering-on-openbookqa | PaLM 2-L (1-shot) | |
| question-answering-on-openbookqa | PaLM 2-M (1-shot) | |
| question-answering-on-openbookqa | PaLM 2-S (1-shot) | |
| question-answering-on-piqa | PaLM 2-M (1-shot) | |
| question-answering-on-piqa | PaLM 2-S (1-shot) | |
| question-answering-on-piqa | PaLM 2-L (1-shot) | |
| question-answering-on-story-cloze | PaLM 2-M (one-shot) | |
| question-answering-on-story-cloze | PaLM 2-S (one-shot) | |
| question-answering-on-story-cloze | PaLM 2-L (one-shot) | |
| question-answering-on-strategyqa | PaLM 2 (few-shot, CoT, SC) | |
| question-answering-on-triviaqa | PaLM 2-S (one-shot) | |
| question-answering-on-triviaqa | PaLM 2-M (one-shot) | |
| question-answering-on-triviaqa | PaLM 2-L (one-shot) | |
| question-answering-on-webquestions | PaLM 2-S (one-shot) | |
| question-answering-on-webquestions | PaLM 2-L (one-shot) | |
| question-answering-on-webquestions | PaLM 2-M (one-shot) | |
| sarcasm-detection-on-big-bench-snarks | PaLM 2 (few-shot, k=3, Direct) | |
| sarcasm-detection-on-big-bench-snarks | PaLM 2 (few-shot, k=3, CoT) | |
| text-summarization-on-x-sum | PaLM 2-S (one-shot) | |
| text-summarization-on-x-sum | PaLM 2-L (one-shot) | |
| text-summarization-on-x-sum | PaLM 2-M (one-shot) | |
| toxic-comment-classification-on-civil | PaLM 2 (zero-shot) | |
| toxic-comment-classification-on-civil | PaLM 2 (few-shot, k=10) | |
| word-sense-disambiguation-on-words-in-context | PaLM 2-L (one-shot) | |
| word-sense-disambiguation-on-words-in-context | PaLM 2-S (one-shot) | |
| word-sense-disambiguation-on-words-in-context | PaLM 2-M (one-shot) | |