| cluster_args: | |
| cluster_description: null | |
| cluster_method: agglomerative | |
| compression_ratio: 0.1,0.2,0.3,0.4,0.5 | |
| expert_sim: ttm | |
| frequency_penalty: true | |
| linkage_method: average | |
| max_cluster_size: null | |
| multi_layer: null | |
| num_clusters: null | |
| singleton_outlier_experts: false | |
| singleton_super_experts: false | |
| softmax_temperature: null | |
| ds_args: | |
| dataset_config_name: all | |
| dataset_name: combined | |
| dataset_test_split: test | |
| shuffle: true | |
| split: train | |
| eval_args: | |
| evalplus_tasks: | |
| - mbpp | |
| - humaneval | |
| greedy: true | |
| lm_eval_tasks: | |
| - winogrande | |
| - arc_challenge | |
| - arc_easy | |
| - boolq | |
| - hellaswag | |
| - mmlu | |
| - openbookqa | |
| - rte | |
| min_p: 0.0 | |
| parallel_tasks: 32 | |
| results_dir: null | |
| run_evalplus: false | |
| run_livecodebench: false | |
| run_lm_eval: false | |
| run_math: false | |
| run_wildbench: false | |
| server_log_file_name: server.log | |
| temperature: 0.7 | |
| top_k: 20 | |
| top_p: 0.8 | |
| use_server: true | |
| vllm_port: 8000 | |
| model_args: | |
| model_name: MiniMaxAI/MiniMax-M2.5 | |
| num_experts_per_tok_override: null | |
| obs_args: | |
| distance_measure: cosine | |
| load_in_4bit: true | |
| load_observer_state: artifacts/MiniMax-M2.5/combined/all/observations_1024_cosine.pt | |
| model_max_length: 8 | |
| output_file_name: observations_1024_cosine.pt | |
| overwrite_observations: false | |
| record_pruning_metrics_only: false | |
| renormalize_router_weights: false | |
| return_vllm_tokens_prompt: false | |
| samples_per_category: 50 | |
| select_only_categories: null | |
| split_by_category: false | |
| truncate: false | |
| prune_args: | |
| n_experts_to_prune: null | |
| overwrite_pruned_model: false | |
| perserve_outliers: false | |
| perserve_super_experts: false | |
| prune_method: reap | |
| reap_args: | |
| debug: false | |
| discord_webhook: https://discord.com/api/webhooks/REDACTED | |
| do_eval: false | |
| plot_clusters: false | |
| profile: true | |
| run_observer_only: false | |
| seed: 42 | |
| smoke_test: true | |
| upload_calibration_to_hf: false | |
| upload_pruned_to_hf: true | |
| verify_model_config: true | |