tinker_cookbook.distillation.Config
class tinker_cookbook.distillation.Config(**)
Fields:
- learning_rate (float)
- dataset_configs (list[DistillationDatasetConfig])
- model_name (str)
- renderer_name (str | None) – Default: None
- max_tokens (int)
- temperature (float) – Default: 1.0
- compute_post_kl (bool) – Default: False
- evaluator_builders (list[SamplingClientEvaluatorBuilder]) – Default: []
- lora_rank (int) – Default: 32
- kl_penalty_coef (float) – Default: 1.0
- kl_discount_factor (float) – Default: 0.0
- loss_fn (LossFnType) – See https://tinker-docs.thinkingmachines.ai/losses Default: 'importance_sampling'.
- loss_fn_config (dict[str, Any] | None) – Default: None
- num_substeps (int) – Useful for very large batch sizes. Default: 1.
- wandb_project (str | None) – Default: None
- wandb_name (str | None) – Default: None
- log_path (str)
- base_url (str | None) – Default: None
- enable_trace (bool) – Default: False
- span_chart_every (int) – Default: 0
- eval_every (int) – Default: 20
- save_every (int) – Default: 20
- load_checkpoint_path (str | None) – Default: None
- max_steps (int | None) – Maximum number of training steps. If None, train on the full dataset. Default: None.