Initial commit
This commit is contained in:
26
configs/h100.yaml
Normal file
26
configs/h100.yaml
Normal file
@@ -0,0 +1,26 @@
# H100 configuration: GPU identity plus the default attention backend.
gpu_type: h100
# Human-readable model name; quoted because it contains spaces and digits.
gpu_model: 'NVIDIA H100 80GB'

# Default attention implementation
# NOTE(review): the value is an identifier resolved by the consumer of this
# file; confirm it matches a registered implementation name.
default_attention: flash_attention_3_hopper

# Pretraining defaults
# All settings below are children of `pretrain`; they must stay indented,
# otherwise `pretrain` becomes null and the keys land at the top level.
pretrain:
  batch_size: 8
  # NOTE(review): presumably measured in tokens; confirm with the consumer.
  sequence_length: 8192
  num_steps: 10
  # NOTE(review): relationship to num_steps (included vs. additional) is not
  # visible here; verify against the code that reads this file.
  warmup_steps: 3

# Inference defaults
# All settings below are children of `inference`; they must stay indented,
# otherwise `inference` becomes null and the keys land at the top level.
inference:
  num_requests: 10
  # NOTE(review): prompt/generation lengths are presumably token counts;
  # confirm with the consumer.
  prompt_length: 512
  generation_length: 100
  # NOTE(review): relationship to num_requests (included vs. additional) is
  # not visible here; verify against the code that reads this file.
  warmup_requests: 2

# Hardware specs (for reference)
# All values below are children of `hardware`; units are carried in the key
# names (gigabytes, watts).
hardware:
  memory_gb: 80
  tdp_watts: 700
  # Kept as a quoted string: an unquoted 9.0 would be parsed as a float.
  compute_capability: '9.0'
Reference in New Issue
Block a user