# MiniMax-M2-5-REAP-19 / reap_args.yaml
# Akicou's picture
# Upload folder using huggingface_hub
# 89a0b74 verified
# Clustering options. Children are nested under `cluster_args` so the section
# parses as a mapping; without the indentation the section key is null and
# every option below becomes a top-level key.
cluster_args:
  cluster_description: null
  cluster_method: agglomerative
  # Comma-separated list held in one string. Quoted so the type is explicit
  # and no parser tries to read it as a number.
  compression_ratio: "0.1,0.2,0.3,0.4,0.5"
  expert_sim: ttm
  frequency_penalty: true
  linkage_method: average
  max_cluster_size: null
  multi_layer: null
  num_clusters: null
  singleton_outlier_experts: false
  singleton_super_experts: false
  softmax_temperature: null
# Dataset selection options. Children are nested under `ds_args` so the
# section parses as a mapping rather than a null key followed by unrelated
# top-level keys.
ds_args:
  dataset_config_name: all
  dataset_name: combined
  dataset_test_split: test
  shuffle: true
  split: train
# Evaluation options. Children are nested under `eval_args`; the two task
# lists are indented beneath their own keys so each list is unambiguous.
eval_args:
  evalplus_tasks:
    - mbpp
    - humaneval
  greedy: true
  lm_eval_tasks:
    - winogrande
    - arc_challenge
    - arc_easy
    - boolq
    - hellaswag
    - mmlu
    - openbookqa
    - rte
  min_p: 0.0
  parallel_tasks: 32
  results_dir: null
  # Every run_* switch in this section is false.
  run_evalplus: false
  run_livecodebench: false
  run_lm_eval: false
  run_math: false
  run_wildbench: false
  server_log_file_name: server.log
  # NOTE(review): sampling values are set while `greedy` is true; confirm
  # which one the consumer honours.
  temperature: 0.7
  top_k: 20
  top_p: 0.8
  use_server: true
  vllm_port: 8000
# Model selection options. Children are nested under `model_args` so the
# section parses as a mapping.
model_args:
  model_name: MiniMaxAI/MiniMax-M2.5
  num_experts_per_tok_override: null
# Observation options. Children are nested under `obs_args` so the section
# parses as a mapping.
obs_args:
  distance_measure: cosine
  load_in_4bit: true
  load_observer_state: artifacts/MiniMax-M2.5/combined/all/observations_1024_cosine.pt
  # NOTE(review): this is 8 while both observation file names contain
  # "1024"; confirm the value is intentional.
  model_max_length: 8
  output_file_name: observations_1024_cosine.pt
  overwrite_observations: false
  record_pruning_metrics_only: false
  renormalize_router_weights: false
  return_vllm_tokens_prompt: false
  samples_per_category: 50
  select_only_categories: null
  split_by_category: false
  truncate: false
# Pruning options. Children are nested under `prune_args` so the section
# parses as a mapping.
prune_args:
  n_experts_to_prune: null
  overwrite_pruned_model: false
  # The `perserve_` spelling is kept exactly as written. Presumably the
  # consumer looks these keys up by name, so renaming them here alone would
  # break the lookup; verify against the consumer before changing.
  perserve_outliers: false
  perserve_super_experts: false
  prune_method: reap
# Top-level run options. Children are nested under `reap_args` so the section
# parses as a mapping.
reap_args:
  debug: false
  # SECURITY: this held a full Discord webhook URL, which embeds the webhook
  # token, so anyone who can read the file could post to that channel. The
  # value is removed here; rotate the exposed webhook and supply the new one
  # outside version control. `null` follows how other unset options in this
  # file are written. TODO: confirm the consumer treats null as "no webhook".
  discord_webhook: null
  do_eval: false
  plot_clusters: false
  profile: true
  run_observer_only: false
  seed: 42
  # NOTE(review): smoke_test is true while upload_pruned_to_hf is also true;
  # confirm that a smoke-test run is meant to upload its output.
  smoke_test: true
  upload_calibration_to_hf: false
  upload_pruned_to_hf: true
  verify_model_config: true