Learn how to convert legacy YAMLs into the new Trainer YAML configuration.

To convert a legacy YAML file, run:

    cszoo config convert_legacy /path/to/v1.yaml -o /path/to/v2.yaml
eval_input
    eval_input:
      ...
eval_input.micro_batch_size
    eval_input:
      micro_batch_size: ...
model
    model:
      ...
model.compression
    model:
      compression:
        ...
model.fp16_type
    model:
      fp16_type: ...
model.lora_params
    model:
      lora_params: ...
model.mixed_precision
    model:
      mixed_precision: ...
model.selective_grad
    model:
      selective_grad: ...
optimizer
    optimizer:
      ...
optimizer.grad_accum_steps
    optimizer:
      grad_accum_steps: ...
optimizer.initial_loss_scale
    optimizer:
      initial_loss_scale: ...
optimizer.learning_rate
    optimizer:
      learning_rate:
        ...
optimizer.log_summaries
    optimizer:
      log_summaries: ...
optimizer.loss_scaling_factor
    optimizer:
      loss_scaling_factor: ...
optimizer.max_gradient_norm
    optimizer:
      max_gradient_norm: ...
optimizer.max_gradient_value
    optimizer:
      max_gradient_value: ...
optimizer.max_loss_scale
    optimizer:
      max_loss_scale: ...
optimizer.min_loss_scale
    optimizer:
      min_loss_scale: ...
optimizer.steps_per_increase
    optimizer:
      steps_per_increase: ...
runconfig.act_memory_gi
    runconfig:
      act_memory_gi: ...
runconfig.autoload_last_checkpoint
    runconfig:
      autoload_last_checkpoint: ...
runconfig.check_loss_values
    runconfig:
      check_loss_values: ...
runconfig.checkpoint_path
    runconfig:
      checkpoint_path: ...
runconfig.checkpoint_steps
    runconfig:
      checkpoint_steps: ...
runconfig.cmd_memory_gi
    runconfig:
      cmd_memory_gi: ...
runconfig.compile_crd_memory_gi
    runconfig:
      compile_crd_memory_gi: ...
runconfig.compile_dir
    runconfig:
      compile_dir: ...
runconfig.compile_only
    runconfig:
      compile_only: ...
runconfig.credentials_path
    runconfig:
      credentials_path: ...
runconfig.debug_args
    runconfig:
      debug_args:
        ...
runconfig.debug_args_path
    runconfig:
      debug_args_path: ...
runconfig.disable_strict_checkpoint_loading
    runconfig:
      disable_strict_checkpoint_loading: ...
runconfig.disable_version_check
    runconfig:
      disable_version_check: ...
runconfig.dist_backend
    runconfig:
      dist_backend: ...
runconfig.drop_data
    runconfig:
      drop_data: ...
runconfig.dump_activations
    runconfig:
      dump_activations: ...
runconfig.enable_act_frequency
    runconfig:
      enable_act_frequency: ...
runconfig.enable_distributed
    runconfig:
      enable_distributed: ...
runconfig.eval_frequency
    runconfig:
      eval_frequency: ...
runconfig.eval_steps
    runconfig:
      eval_steps: ...
runconfig.execute_crd_memory_gi
    runconfig:
      execute_crd_memory_gi: ...
runconfig.experimental.listeners
    runconfig:
      experimental:
        listeners:
          ...
runconfig.init_method
    runconfig:
      init_method: ...
runconfig.job_labels
    runconfig:
      job_labels:
        ...
runconfig.job_priority
    runconfig:
      job_priority: ...
runconfig.job_time_sec
    runconfig:
      job_time_sec: ...
runconfig.lazy_initialization
    runconfig:
      lazy_initialization: ...
runconfig.load_checkpoint_states
    runconfig:
      load_checkpoint_states: ...
runconfig.log_initialization
    runconfig:
      log_initialization: ...
runconfig.log_input_summaries
    runconfig:
      log_input_summaries: ...
runconfig.log_steps
    runconfig:
      log_steps: ...
runconfig.logging
    runconfig:
      logging: ...
runconfig.main_process_id
    runconfig:
      main_process_id: ...
runconfig.max_checkpoints
    runconfig:
      max_checkpoints: ...
runconfig.max_steps
    runconfig:
      max_steps: ...
runconfig.mgmt_address
    runconfig:
      mgmt_address: ...
runconfig.mgmt_namespace
    runconfig:
      mgmt_namespace: ...
runconfig.model_dir
    runconfig:
      model_dir: ...
runconfig.mount_dirs
    runconfig:
      mount_dirs:
        ...
runconfig.num_act_servers
    runconfig:
      num_act_servers: ...
runconfig.num_csx
    runconfig:
      num_csx: ...
runconfig.num_epochs
    runconfig:
      num_epochs: ...
runconfig.num_steps
    runconfig:
      num_steps: ...
runconfig.num_wgt_servers
    runconfig:
      num_wgt_servers: ...
runconfig.num_workers_per_csx
    runconfig:
      num_workers_per_csx: ...
runconfig.op_profiler_config
    runconfig:
      op_profiler_config:
        ...
runconfig.precision_opt_level
    runconfig:
      precision_opt_level: ...
runconfig.python_paths
    runconfig:
      python_paths:
        ...
runconfig.retrace_every_iteration
    runconfig:
      retrace_every_iteration: ...
runconfig.save_initial_checkpoint
    runconfig:
      save_initial_checkpoint: ...
runconfig.seed
    runconfig:
      seed: ...
runconfig.steps_per_epoch
    runconfig:
      steps_per_epoch: ...
runconfig.sync_batchnorm
    runconfig:
      sync_batchnorm: ...
runconfig.target_device
    runconfig:
      target_device: ...
runconfig.transfer_processes
    runconfig:
      transfer_processes: ...
runconfig.validate_only
    runconfig:
      validate_only: ...
runconfig.wgt_memory_gi
    runconfig:
      wgt_memory_gi: ...
runconfig.wrk_memory_gi
    runconfig:
      wrk_memory_gi: ...
runconfig.wsc_log_level
    runconfig:
      wsc_log_level:
        ...
sparsity
    sparsity:
      ...
sparsity.add_summaries
    sparsity:
      add_summaries: ...
train_input
    train_input:
      ...
train_input.micro_batch_size
    train_input:
      micro_batch_size: ...
wandb.group
    wandb:
      group: ...
wandb.job_type
    wandb:
      job_type: ...
wandb.project
    wandb:
      project: ...
wandb.resume
    wandb:
      resume: ...
wandb.run_id
    wandb:
      run_id: ...
wandb.run_name
    wandb:
      run_name: ...
wandb.tags
    wandb:
      tags: ...