diff --git a/src/brevitas_examples/llm/config/sample_config.yaml b/src/brevitas_examples/llm/config/sample_config.yaml deleted file mode 100644 index 1c294e22b..000000000 --- a/src/brevitas_examples/llm/config/sample_config.yaml +++ /dev/null @@ -1,78 +0,0 @@ -act_calibration: false -act_equalization: null -act_equalization_alpha: 0.2 -bias_corr: false -checkpoint_name: null -convert_layernorm_to_rmsnorm: false -dataset: wikitext2 -eval: true -export_prefix: null -export_target: null -few_shot_compile: false -few_shot_eval: lighteval -few_shot_limit: null -few_shot_tasks: -- leaderboard|arc:challenge|0|0 -- leaderboard|winogrande|0|0 -- lighteval|arc:easy|0|0 -- leaderboard|hellaswag|0|0 -- lighteval|piqa|0|0 -few_shot_override_batch_size: 64 -few_shot_zeroshot: true -functional_sdpa_quant: false -fuse_sequences: false -gpfq: false -gptq: false -gpxq_act_order: true -gpxq_block_name: model.layers -gpxq_create_weight_orig: false -gpxq_max_accumulator_bit_width: null -gpxq_max_accumulator_tile_size: null -gpxq_use_quant_activations: false -input_bit_width: 4 -input_group_size: 32 -input_param_method: stats -input_quant_format: int -input_quant_granularity: per_row -input_quant_type: asym -input_scale_precision: float_scale -input_scale_type: dynamic -learned_round: null -learned_round_fast_update: true -learned_round_iters: 200 -learned_round_lr: 0.005 -learned_round_scale: false -learned_round_scale_lr: 0.01 -learned_round_scale_momentum: 0.9 -ln_affine_merge: false -load_awq: null -load_checkpoint: false -model: HuggingfaceTB/SmolLM2-135M -dtype: float32 -no_quantize: false -nsamples: 128 -quant_sdpa: false -quantize_input_zero_point: false -quantize_last_layer: false -quantize_weight_zero_point: false -replace_mha: false -replace_rmsnorm: true -rotation: fused_no_fx -rotation_sdpa_regions: true -rotation_mode: had -rotation_orphan_sink: true -rotation_layers_to_expand: -- down_proj -scale_rounding_func_type: null -scaling_min_val: 0.0001 -seed: 0 -seqlen: 2048 -weight_bit_width: 4 -weight_equalization: false -weight_group_dim: null -weight_group_size: null -weight_param_method: mse -weight_quant_format: int -weight_quant_granularity: per_channel -weight_quant_type: sym -weight_scale_precision: float_scale