We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 37b25d8 commit 52924eaCopy full SHA for 52924ea
1 file changed
tutorials/profiling/configs/distributed_8B_model_profiling.yaml
@@ -6,7 +6,26 @@ settings:
6
benchmark:
7
sequence_length: 4096
8
vocab_size: 50304
9
- batch_size: 2
+ batch_size: 1
10
+ paths:
11
+ experiment_root_path: ${modalities_env:config_folder_path}
12
+
13
+profiler:
14
+ component_key: steppable_profiler
15
+ variant_key: kernel_tracing
16
+ config:
17
+ num_wait_steps: 5
18
+ num_warmup_steps: 5
19
+ num_active_steps: 3
20
+ profiler_activities: [CPU, CUDA]
21
+ record_shapes: false
22
+ profile_memory: false
23
+ with_stack: false
24
+ with_flops: false
25
+ with_modules: false
26
+ tracked_ranks: [0, 1]
27
+ output_folder_path: ${settings.paths.experiment_root_path}/kernel_traces
28
29
30
steppable_component:
31
component_key: steppable_component
0 commit comments