bash install.sh
Prepare Datasets
bash ./scripts/data/process_data_[DATASETNAME].sh
Inference (e.g., in-domain test)
bash ./scripts/model/[MODELNAME]/in-domain/inference_[DATASETNAME].sh [NUM_INDOMAIN_LIST] [RATIONALE_LIST] [MAX_PROMPT_LENGTH]
-
in-domain: CommonsenseQA / out-domain: GSM8K / seed: [1 10 20 30 40 50 60] / test: [-9,-1] / both / max prompt token: 2048
-
in-domain: GSM8K / out-domain: CommonsenseQA / seed: [1 10 20 30 40 50 60] / test: [-9,-1] / both / max prompt token: 2048
-
in-domain: CommonsenseQA / out-domain: None / seed: [1 10 20 30 40 50 60] / test: [0,9] / both / max prompt token: 2048
-
in-domain: CommonsenseQA / out-domain: GSM8K / seed: [1 10 20 30 40 50 60] / test: [-25,-10] / Without rationale / max prompt token: 2048
-
in-domain: CommonsenseQA / out-domain: None / seed: [1 10 20 30] / test: [0,9] / both / max prompt token: 4096
-
in-domain: CommonsenseQA / out-domain: None / seed: [1 10 20 30] / test: [10,17] / With rationale / max prompt token: 4096
-
in-domain: GSM8K / out-domain: CommonsenseQA / seed: [1 10 20 30] / test: {-8,-4,-2,-1} / Without rationale / max prompt token: 4096
-
in-domain: GSM8K / out-domain: CommonsenseQA / seed: [1 10 20 30] / test: [-9,-1] / With rationale / max prompt token: 4096
-
in-domain: CommonsenseQA / out-domain: GSM8K / seed: [1 10 20 30] / test: [-10,-1] / With rationale / max prompt token: 4096
-
in-domain: CommonsenseQA / out-domain: GSM8K / seed: [1 10 20 30] / test: [-20,-11] / With rationale / max prompt token: 4096
-
in-domain: CommonsenseQA / out-domain: GSM8K / seed: [1 10 20 30] / test: [-25,-1] / Without rationale / max prompt token: 4096
-
in-domain: CommonsenseQA / out-domain: MathQA / seed: [1 10 20 30] / test: {-19, -17, ..., -1} / both / max prompt token: 4096
-
in-domain: CommonsenseQA / out-domain: GSM8K / seed: [1 10 20 30] / test: [-25,-1] / Without rationale / max prompt token: 4096