-
Notifications
You must be signed in to change notification settings - Fork 54
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #8 from Muennighoff/sgptcepy
Add CE script
- Loading branch information
Showing
5 changed files
with
556 additions
and
4 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,27 @@ | ||
#!/bin/bash
#
# Slurm batch job: launches examples/training/nli/training_nli_v2.py through
# `accelerate launch` on a single node with 8 GPUs, using
# EleutherAI/gpt-neo-2.7B as the base model.
#
# Required environment:
#   six_ALL_CCFRWORK  directory that holds the start-tr13f-6B3-ml-t0 script
# Optional environment:
#   WANDB_API_KEY     Weights & Biases key; falls back to the YOUR_KEY
#                     placeholder when not provided
#SBATCH --job-name=muennighoffs
#SBATCH --partition=gpu_p5
#SBATCH --constraint=a100
#SBATCH --reservation=hug
#SBATCH --qos=qos_gpu-gc # up to 100h
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1 # crucial - only 1 task per dist per node!
#SBATCH --cpus-per-task=64 # number of cores per tasks
#SBATCH --hint=nomultithread # we get physical cores not logical
#SBATCH --gres=gpu:8 # number of gpus
#SBATCH --time 100:00:00 # maximum execution time (HH:MM:SS)
#SBATCH --output=%x-%j.out # output file name
#SBATCH --account=six@a100

set -x -e

# Abort with a clear message instead of sourcing "/start-..." when the
# variable is missing. (`set -u` is deliberately not enabled: the sourced
# environment scripts are outside this file and may read unset variables.)
: "${six_ALL_CCFRWORK:?six_ALL_CCFRWORK must be set}"

source "${six_ALL_CCFRWORK}/start-tr13f-6B3-ml-t0"
conda activate muennighoffs
echo "START TIME: $(date)"

cd /gpfsscratch/rech/six/commun/experiments/muennighoff/sgpt/biencoder/nli_msmarco/sentence-transformers

# Assign the API key with tracing switched off so that `set -x` does not copy
# it into the job's output file.
set +x
export WANDB_API_KEY="${WANDB_API_KEY:-YOUR_KEY}"
set -x

# Remaining Weights & Biases settings and the GPUs visible to the launcher.
export WANDB_MODE="dryrun"
export WANDB_BASE_URL=https://api.wandb.ai
export WANDB_ENTITY=muennighoff
export WANDB_PROJECT="sgpt"
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

accelerate launch \
  --config_file /gpfsscratch/rech/six/commun/experiments/muennighoff/sgpt/accelerate_config_fp32 \
  examples/training/nli/training_nli_v2.py \
  --model_name EleutherAI/gpt-neo-2.7B \
  --train_batch_size 128 \
  --lr 32e-5 \
  --pooling weightedmean \
  --wandb \
  --wandbwatchlog gradients \
  --gradcache \
  --chunksize 16

# Only reached when every step above succeeded (set -e).
echo "DONE"
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,46 @@ | ||
#!/bin/bash
#
# Slurm array job: runs sgptce.py on one dataset per array task.
#
# The dataset is selected from DATASETS by SLURM_ARRAY_TASK_ID, so the job has
# to be submitted as an array whose indices fall inside that list, e.g.
#   sbatch --array=0-8 <this script>
#
# Required environment:
#   six_ALL_CCFRWORK  directory that holds the start-prod script
#SBATCH --job-name=run-array-a100 # job name
#SBATCH --ntasks=1 # number of MP tasks
#SBATCH --nodes=1
#SBATCH --gres=gpu:1
#SBATCH --cpus-per-task=8 # number of cores per tasks
#SBATCH --hint=nomultithread # we get physical cores not logical
#SBATCH --time 100:00:00 # maximum execution time (HH:MM:SS)
#SBATCH --output=%x-%j.out # output file name
#SBATCH --account=six@a100
#SBATCH --reservation=hug
#SBATCH --constraint=a100
#SBATCH --partition=gpu_p5
#SBATCH --qos=qos_gpu-gc # up to 100h

set -x -e

# Abort with a clear message instead of sourcing "/start-prod" when the
# variable is missing. (`set -u` is deliberately not enabled: the sourced
# environment scripts are outside this file and may read unset variables.)
: "${six_ALL_CCFRWORK:?six_ALL_CCFRWORK must be set}"

source "${six_ALL_CCFRWORK}/start-prod"
conda activate muennighoffmtb

echo "START TIME: $(date)"

cd /gpfswork/rech/six/commun/code/tr13f-6B3-ml-t0/sgptce/

# Datasets currently left out of the run:
#"fever"
#"climate-fever"
#"nq"
#"hotpotqa"
DATASETS=(
  "trec-covid"
  "webis-touche2020"
  "nfcorpus"
  "scifact"
  "fiqa"
  "dbpedia-entity"
  "quora"
  "arguana"
  "scidocs"
)

# Validate the array index before using it: a missing or out-of-range ID would
# otherwise surface as an obscure subscript error or an empty --dataset value.
task_id="${SLURM_ARRAY_TASK_ID:-}"
if [[ ! "$task_id" =~ ^[0-9]+$ ]]; then
  echo "SLURM_ARRAY_TASK_ID must be a non-negative integer (got '${task_id}'); submit with: sbatch --array=0-$(( ${#DATASETS[@]} - 1 ))" >&2
  exit 1
fi

# Force base 10 so an ID with leading zeros is not parsed as octal.
task_index=$(( 10#$task_id ))
if (( task_index >= ${#DATASETS[@]} )); then
  echo "SLURM_ARRAY_TASK_ID=${task_id} is out of range; valid indices are 0-$(( ${#DATASETS[@]} - 1 ))" >&2
  exit 1
fi

dataset="${DATASETS[task_index]}"

python sgptce.py \
  --batchsize 128 \
  --dataset "$dataset" \
  --modelpath /gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3/bloom-6b3
Oops, something went wrong.