-
Notifications
You must be signed in to change notification settings - Fork 527
Expand file tree
/
Copy pathlaunch.json
More file actions
97 lines (97 loc) · 3.55 KB
/
launch.json
File metadata and controls
97 lines (97 loc) · 3.55 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
{
  "version": "0.2.0",
  "configurations": [
    {
      "name": "Debug MaxText Decode (llama2-7b-int8)",
      "type": "debugpy",
      "request": "launch",
      "console": "integratedTerminal",
      "justMyCode": false,
      "python": "python3",
      "module": "maxtext.inference.decode",
      "args": [
        "src/maxtext/configs/base.yml",
        "run_name=runner_$(date +%Y-%m-%d-%H-%M)",
        "base_output_directory=gs://test-maxtext-output",
        "dataset_path=gs://test-maxtext-dataset",
        "model_name=llama2-7b",
        "load_parameters_path=gs://msingh-bkt/checkpoints/quant_llama2-7b-chat/20241120034012/int8_",
        "tokenizer_path=src/maxtext/assets/tokenizers/tokenizer.llama2",
        "per_device_batch_size=8",
        "max_prefill_predict_length=8",
        "max_target_length=20",
        "weight_dtype=bfloat16",
        "ici_fsdp_parallelism=1",
        "ici_tensor_parallelism=-1",
        "scan_layers=false",
        "quantization=int8",
        "checkpoint_is_quantized=true",
        "attention=dot_product",
        "autoregressive_decode_assert=travel and explore new places"
      ]
    },
    {
      "name": "Debug MaxText Decode (Test)",
      "type": "debugpy",
      "request": "launch",
      "console": "integratedTerminal",
      "justMyCode": false,
      "python": "python3",
      "module": "maxtext.inference.decode",
      "args": [
        "src/maxtext/configs/base.yml",
        "run_name=runner_$(date +%Y-%m-%d-%H-%M)",
        "base_output_directory=gs://test-maxtext-output",
        "dataset_path=gs://test-maxtext-dataset",
        "steps=2",
        "attention=dot_product",
        "enable_checkpointing=false"
      ]
    },
    {
      "name": "Debug MaxText Train",
      "type": "debugpy",
      "request": "launch",
      "console": "integratedTerminal",
      "justMyCode": false,
      "python": "python3",
      "module": "maxtext.trainers.pre_train.train",
      "args": [
        "src/maxtext/configs/base.yml",
        "run_name=runner_$(date +%Y-%m-%d-%H-%M)",
        "base_output_directory=gs://test-maxtext-output",
        "dataset_path=gs://test-maxtext-dataset",
        "steps=2",
        "enable_checkpointing=false"
      ]
    },
    {
      "name": "Debug MaxText Inference Microbenchmark",
      "type": "debugpy",
      "request": "launch",
      "console": "integratedTerminal",
      "justMyCode": false,
      "python": "python3",
      "module": "maxtext.inference.inference_microbenchmark",
      "args": [
        "src/maxtext/configs/base.yml",
        "model_name=llama2-7b",
        "tokenizer_path=src/maxtext/assets/tokenizers/tokenizer.llama2",
        "weight_dtype=bfloat16",
        "scan_layers=false",
        "attention=dot_product",
        "max_prefill_predict_length=1024",
        "max_target_length=2048",
        "ici_fsdp_parallelism=1",
        "ici_tensor_parallelism=-1",
        "ici_autoregressive_parallelism=1",
        "inference_microbenchmark_prefill_lengths=32,64,128,256,512,1024",
        "inference_microbenchmark_stages=generate",
        "inference_microbenchmark_loop_iters=1",
        "run_name=runner_$(date +%Y-%m-%d-%H-%M)",
        "base_output_directory=gs://test-maxtext-output",
        "prefill_cache_axis_order=0,2,1,3",
        "ar_cache_axis_order=0,2,1,3",
        "compute_axis_order=0,2,1,3",
        "reshape_q=true",
        "per_device_batch_size=24",
        "quantization=int8",
        "quantize_kvcache=true"
      ]
    }
  ]
}