File size: 717 Bytes
be45db4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
# Data paths and options when using EleutherAI cluster
{
  "train-data-paths": ["/fsx/pile/pile_20B_tokenizer_text_document"],
  "valid-data-paths": ["/fsx/pile/pile_20B_tokenizer_text_document"],
  "test-data-paths": ["/fsx/pile/pile_20B_tokenizer_text_document"],

  "tokenizer_type": "HFTokenizer",
  "vocab-file": "/fsx/pile/20B_tokenizer.json",

  "save": "/fsx/shiv/gpt-neox/runs/checkpoints/pythia/13b",
  "load": "/fsx/shiv/gpt-neox/runs/checkpoints/pythia/13b",
  "tensorboard-dir": "/fsx/shiv/gpt-neox/runs/tensorboard",
  "log-dir": "/fsx/shiv/gpt-neox/runs/logs",

  "wandb_team": "eleutherai",
  "wandb_project": "pythia",
  "wandb_group": "13B Decay",
  "launcher": "openmpi",
  "deepspeed_mpi": true
}