Raw Runs

RunAdaptation method
babi_qa:task=15,model=AlephAlpha_luminous-basegeneration
babi_qa:task=15,model=AlephAlpha_luminous-extendedgeneration
babi_qa:task=15,model=AlephAlpha_luminous-supremegeneration
babi_qa:task=15,model=ai21_j1-grandegeneration
babi_qa:task=15,model=ai21_j1-grande-v2-betageneration
babi_qa:task=15,model=ai21_j1-jumbogeneration
babi_qa:task=15,model=ai21_j1-largegeneration
babi_qa:task=15,model=ai21_j2-grandegeneration
babi_qa:task=15,model=ai21_j2-jumbogeneration
babi_qa:task=15,model=ai21_j2-largegeneration
babi_qa:task=15,model=anthropic_stanford-online-all-v4-s3generation
babi_qa:task=15,model=cohere_command-medium-betageneration
babi_qa:task=15,model=cohere_command-xlarge-betageneration
babi_qa:task=15,model=cohere_large-20220720generation
babi_qa:task=15,model=cohere_medium-20220720generation
babi_qa:task=15,model=cohere_medium-20221108generation
babi_qa:task=15,model=cohere_small-20220720generation
babi_qa:task=15,model=cohere_xlarge-20220609generation
babi_qa:task=15,model=cohere_xlarge-20221108generation
babi_qa:task=15,model=microsoft_TNLGv2_530Bgeneration
babi_qa:task=15,model=microsoft_TNLGv2_7Bgeneration
babi_qa:task=15,model=openai_adageneration
babi_qa:task=15,model=openai_babbagegeneration
babi_qa:task=15,model=openai_code-cushman-001generation
babi_qa:task=15,model=openai_code-davinci-002generation
babi_qa:task=15,model=openai_curiegeneration
babi_qa:task=15,model=openai_davincigeneration
babi_qa:task=15,model=openai_gpt-3.5-turbo-0301generation
babi_qa:task=15,model=openai_text-ada-001generation
babi_qa:task=15,model=openai_text-babbage-001generation
babi_qa:task=15,model=openai_text-curie-001generation
babi_qa:task=15,model=openai_text-davinci-002generation
babi_qa:task=15,model=openai_text-davinci-003generation
babi_qa:task=15,model=together_bloomgeneration
babi_qa:task=15,model=together_glm,stop=hashgeneration
babi_qa:task=15,model=together_gpt-j-6bgeneration
babi_qa:task=15,model=together_gpt-neox-20bgeneration
babi_qa:task=15,model=together_opt-175bgeneration
babi_qa:task=15,model=together_opt-66bgeneration
babi_qa:task=15,model=together_redpajama-incite-base-3b-v1generation
babi_qa:task=15,model=together_t0pp,stop=hashgeneration
babi_qa:task=15,model=together_t5-11b,stop=hashgeneration
babi_qa:task=15,model=together_ul2,stop=hash,global_prefix=nlggeneration
babi_qa:task=15,model=together_yalmgeneration
babi_qa:task=15,model=writer_palmyra-instruct-30generation
babi_qa:task=15,model=writer_palmyra-xgeneration
babi_qa:task=19,model=AlephAlpha_luminous-basegeneration
babi_qa:task=19,model=AlephAlpha_luminous-extendedgeneration
babi_qa:task=19,model=AlephAlpha_luminous-supremegeneration
babi_qa:task=19,model=ai21_j1-grandegeneration
babi_qa:task=19,model=ai21_j1-grande-v2-betageneration
babi_qa:task=19,model=ai21_j1-jumbogeneration
babi_qa:task=19,model=ai21_j1-largegeneration
babi_qa:task=19,model=ai21_j2-grandegeneration
babi_qa:task=19,model=ai21_j2-jumbogeneration
babi_qa:task=19,model=ai21_j2-largegeneration
babi_qa:task=19,model=anthropic_stanford-online-all-v4-s3generation
babi_qa:task=19,model=cohere_command-medium-betageneration
babi_qa:task=19,model=cohere_command-xlarge-betageneration
babi_qa:task=19,model=cohere_large-20220720generation
babi_qa:task=19,model=cohere_medium-20220720generation
babi_qa:task=19,model=cohere_medium-20221108generation
babi_qa:task=19,model=cohere_small-20220720generation
babi_qa:task=19,model=cohere_xlarge-20220609generation
babi_qa:task=19,model=cohere_xlarge-20221108generation
babi_qa:task=19,model=microsoft_TNLGv2_530Bgeneration
babi_qa:task=19,model=microsoft_TNLGv2_7Bgeneration
babi_qa:task=19,model=openai_adageneration
babi_qa:task=19,model=openai_babbagegeneration
babi_qa:task=19,model=openai_code-cushman-001generation
babi_qa:task=19,model=openai_code-davinci-002generation
babi_qa:task=19,model=openai_curiegeneration
babi_qa:task=19,model=openai_davincigeneration
babi_qa:task=19,model=openai_gpt-3.5-turbo-0301generation
babi_qa:task=19,model=openai_text-ada-001generation
babi_qa:task=19,model=openai_text-babbage-001generation
babi_qa:task=19,model=openai_text-curie-001generation
babi_qa:task=19,model=openai_text-davinci-002generation
babi_qa:task=19,model=openai_text-davinci-003generation
babi_qa:task=19,model=together_bloomgeneration
babi_qa:task=19,model=together_glm,stop=hashgeneration
babi_qa:task=19,model=together_gpt-j-6bgeneration
babi_qa:task=19,model=together_gpt-neox-20bgeneration
babi_qa:task=19,model=together_opt-175bgeneration
babi_qa:task=19,model=together_opt-66bgeneration
babi_qa:task=19,model=together_redpajama-incite-base-3b-v1generation
babi_qa:task=19,model=together_t0pp,stop=hashgeneration
babi_qa:task=19,model=together_t5-11b,stop=hashgeneration
babi_qa:task=19,model=together_ul2,stop=hash,global_prefix=nlggeneration
babi_qa:task=19,model=together_yalmgeneration
babi_qa:task=19,model=writer_palmyra-instruct-30generation
babi_qa:task=19,model=writer_palmyra-xgeneration
babi_qa:task=3,model=AlephAlpha_luminous-basegeneration
babi_qa:task=3,model=AlephAlpha_luminous-extendedgeneration
babi_qa:task=3,model=AlephAlpha_luminous-supremegeneration
babi_qa:task=3,model=ai21_j1-grandegeneration
babi_qa:task=3,model=ai21_j1-grande-v2-betageneration
babi_qa:task=3,model=ai21_j1-jumbogeneration
babi_qa:task=3,model=ai21_j1-largegeneration
babi_qa:task=3,model=ai21_j2-grandegeneration
babi_qa:task=3,model=ai21_j2-jumbogeneration
babi_qa:task=3,model=ai21_j2-largegeneration
babi_qa:task=3,model=anthropic_stanford-online-all-v4-s3generation
babi_qa:task=3,model=cohere_command-medium-betageneration
babi_qa:task=3,model=cohere_command-xlarge-betageneration
babi_qa:task=3,model=cohere_large-20220720generation
babi_qa:task=3,model=cohere_medium-20220720generation
babi_qa:task=3,model=cohere_medium-20221108generation
babi_qa:task=3,model=cohere_small-20220720generation
babi_qa:task=3,model=cohere_xlarge-20220609generation
babi_qa:task=3,model=cohere_xlarge-20221108generation
babi_qa:task=3,model=microsoft_TNLGv2_530Bgeneration
babi_qa:task=3,model=microsoft_TNLGv2_7Bgeneration
babi_qa:task=3,model=openai_adageneration
babi_qa:task=3,model=openai_babbagegeneration
babi_qa:task=3,model=openai_code-cushman-001generation
babi_qa:task=3,model=openai_code-davinci-002generation
babi_qa:task=3,model=openai_curiegeneration
babi_qa:task=3,model=openai_davincigeneration
babi_qa:task=3,model=openai_gpt-3.5-turbo-0301generation
babi_qa:task=3,model=openai_text-ada-001generation
babi_qa:task=3,model=openai_text-babbage-001generation
babi_qa:task=3,model=openai_text-curie-001generation
babi_qa:task=3,model=openai_text-davinci-002generation
babi_qa:task=3,model=openai_text-davinci-003generation
babi_qa:task=3,model=together_bloomgeneration
babi_qa:task=3,model=together_glm,stop=hashgeneration
babi_qa:task=3,model=together_gpt-j-6bgeneration
babi_qa:task=3,model=together_gpt-neox-20bgeneration
babi_qa:task=3,model=together_opt-175bgeneration
babi_qa:task=3,model=together_opt-66bgeneration
babi_qa:task=3,model=together_redpajama-incite-base-3b-v1generation
babi_qa:task=3,model=together_t0pp,stop=hashgeneration
babi_qa:task=3,model=together_t5-11b,stop=hashgeneration
babi_qa:task=3,model=together_ul2,stop=hash,global_prefix=nlggeneration
babi_qa:task=3,model=together_yalmgeneration
babi_qa:task=3,model=writer_palmyra-instruct-30generation
babi_qa:task=3,model=writer_palmyra-xgeneration
babi_qa:task=all,model=AlephAlpha_luminous-basegeneration
babi_qa:task=all,model=AlephAlpha_luminous-extendedgeneration
babi_qa:task=all,model=AlephAlpha_luminous-supremegeneration
babi_qa:task=all,model=ai21_j1-grandegeneration
babi_qa:task=all,model=ai21_j1-grande-v2-betageneration
babi_qa:task=all,model=ai21_j1-jumbogeneration
babi_qa:task=all,model=ai21_j1-largegeneration
babi_qa:task=all,model=ai21_j2-grandegeneration
babi_qa:task=all,model=ai21_j2-jumbogeneration
babi_qa:task=all,model=ai21_j2-largegeneration
babi_qa:task=all,model=anthropic_stanford-online-all-v4-s3generation
babi_qa:task=all,model=cohere_command-medium-betageneration
babi_qa:task=all,model=cohere_command-xlarge-betageneration
babi_qa:task=all,model=cohere_large-20220720generation
babi_qa:task=all,model=cohere_medium-20220720generation
babi_qa:task=all,model=cohere_medium-20221108generation
babi_qa:task=all,model=cohere_small-20220720generation
babi_qa:task=all,model=cohere_xlarge-20220609generation
babi_qa:task=all,model=cohere_xlarge-20221108generation
babi_qa:task=all,model=microsoft_TNLGv2_530Bgeneration
babi_qa:task=all,model=microsoft_TNLGv2_7Bgeneration
babi_qa:task=all,model=openai_adageneration
babi_qa:task=all,model=openai_babbagegeneration
babi_qa:task=all,model=openai_code-cushman-001generation
babi_qa:task=all,model=openai_code-davinci-002generation
babi_qa:task=all,model=openai_curiegeneration
babi_qa:task=all,model=openai_davincigeneration
babi_qa:task=all,model=openai_gpt-3.5-turbo-0301generation
babi_qa:task=all,model=openai_text-ada-001generation
babi_qa:task=all,model=openai_text-babbage-001generation
babi_qa:task=all,model=openai_text-curie-001generation
babi_qa:task=all,model=openai_text-davinci-002generation
babi_qa:task=all,model=openai_text-davinci-003generation
babi_qa:task=all,model=together_bloomgeneration
babi_qa:task=all,model=together_glm,stop=hashgeneration
babi_qa:task=all,model=together_gpt-j-6bgeneration
babi_qa:task=all,model=together_gpt-neox-20bgeneration
babi_qa:task=all,model=together_opt-175bgeneration
babi_qa:task=all,model=together_opt-66bgeneration
babi_qa:task=all,model=together_redpajama-incite-base-3b-v1generation
babi_qa:task=all,model=together_t0pp,stop=hashgeneration
babi_qa:task=all,model=together_t5-11b,stop=hashgeneration
babi_qa:task=all,model=together_ul2,stop=hash,global_prefix=nlggeneration
babi_qa:task=all,model=together_yalmgeneration
babi_qa:task=all,model=writer_palmyra-instruct-30generation
babi_qa:task=all,model=writer_palmyra-xgeneration
bbq:subject=all,method=multiple_choice_joint,model=AlephAlpha_luminous-basemultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=AlephAlpha_luminous-extendedmultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=AlephAlpha_luminous-suprememultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=ai21_j1-grandemultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=ai21_j1-grande-v2-betamultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=ai21_j1-jumbomultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=ai21_j1-largemultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=ai21_j2-grandemultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=ai21_j2-jumbomultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=ai21_j2-largemultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=anthropic_stanford-online-all-v4-s3multiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=anthropic_stanford-online-all-v4-s3,groups=ablation_multiple_choicemultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=cohere_command-medium-betamultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=cohere_command-xlarge-betamultiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=cohere_large-20220720multiple_choice_joint
bbq:subject=all,method=multiple_choice_joint,model=cohere_medium-20220720multiple_choice_joint