forked from NVIDIA/Megatron-LM
-
Notifications
You must be signed in to change notification settings - Fork 0
/
launch.json
50 lines (47 loc) · 1.99 KB
/
launch.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
{
    // Use IntelliSense to learn about possible attributes.
    // Hover to view descriptions of existing attributes.
    // For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387
    "version": "0.2.0",
    "configurations": [
        {
            // Launches pretrain_bert.py under the debugger via the torch.distributed.run module.
            "name": "Bert Debug",
            // NOTE(review): recent VS Code Python debugger releases use "debugpy" as the
            // type name; confirm "python" is still accepted by the installed extension.
            "type": "python",
            "request": "launch",
            // Environment variables set for the launched process.
            "env": {
                "CUDA_DEVICE_MAX_CONNECTIONS": "1"
            },
            "module": "torch.distributed.run",
            // The first entry is the training script; the remaining entries are its
            // command-line options. No launcher options precede the script path, so
            // torch.distributed.run runs with its own defaults.
            "args": [
                "/workspace/megatron/pretrain_bert.py",

                // Model size and sequence limits.
                "--num-layers", "12",
                "--hidden-size", "1024",
                "--num-attention-heads", "16",
                "--seq-length", "512",
                "--max-position-embeddings", "512",

                // Batch sizes.
                "--micro-batch-size", "4",
                "--global-batch-size", "8",

                // Optimisation schedule.
                // NOTE(review): --lr-decay-iters (990000) is far larger than
                // --train-iters (20000); confirm this is intended for a debug run.
                "--lr", "0.0001",
                "--train-iters", "20000",
                "--lr-decay-iters", "990000",
                "--lr-decay-style", "linear",
                "--min-lr", "0.00001",
                "--weight-decay", "1e-2",
                "--lr-warmup-fraction", ".01",
                "--clip-grad", "1.0",
                "--fp16",

                // Dataset and vocabulary locations inside the /workspace tree.
                "--data-path", "/workspace/dataset/europarl/europarl-bert_text_sentence",
                "--vocab-file", "/workspace/checkpoints/BERT-345M-uncased/bert-large-uncased-vocab.txt",
                "--split", "949,50,1",

                // Logging, evaluation and checkpoint cadence.
                "--log-interval", "100",
                "--save-interval", "500",
                "--eval-interval", "500",
                "--eval-iters", "10",
                "--log-throughput",

                // Save and load use the same directory.
                // NOTE(review): presumably so a debug run resumes from its own
                // checkpoints; verify against the training script's behaviour.
                "--save", "/workspace/checkpoints/debug",
                "--load", "/workspace/checkpoints/debug"
            ],
            "console": "integratedTerminal",
            "justMyCode": true
        }
    ]
}