Skip to content

Commit d8c2f8c

Browse files
added required keys
Signed-off-by: Grzegorz Karch <gkarch@nvidia.com>
1 parent 6e08b13 commit d8c2f8c

1 file changed

Lines changed: 7 additions & 0 deletions

File tree

examples/puzzletron/configs/llama-3_1-8B_pruneffn_memory/pruning/attn_pruning.yaml

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,15 @@
11
defaults:
22
- pruning_defaults
33

4+
hook_class: ${get_object:modelopt.torch.prune.importance_hooks.base_hooks.IndependentKvHeadContributionHook}
5+
46
activations_log_dir: ${puzzle_dir}/pruning/pruning_scores/attn_${pruning.activation_hooks_kwargs.method}/${pruning.experiment_id}
57

8+
pruning_mixin:
9+
_target_: modelopt.torch.puzzletron.pruning.kv_heads_pruning_mixin.KVHeadsPruningMixIn
10+
layer_descriptor:
11+
_target_: modelopt.torch.puzzletron.anymodel.models.llama.llama_model_descriptor.LlamaKVHeadsLayerDescriptor
12+
613
activation_hooks_kwargs:
714
method: independent_kv_head_contribution
815
optimize_for: memory # IndependentKvHeadContributionHook implementation that consumes less memory

0 commit comments

Comments (0)