Loading...
Loading...
Compare original and translation side by side
hf_memhf_memuvuvxHF_TOKEN--hf-tokenuvuvxHF_TOKEN--hf-token--model-idmodel.safetensorsmodel.safetensors.index.jsonmodel_index.jsonuvx hf-mem --model-id <model-id> --json-output--gguf-fileuvx hf-mem --model-id <model-id> --gguf-file <file-or-path> --json-outputhf-mem--experimental...ForCausalLM...ForConditionalGeneration--max-model-len--kv-cache-dtypeuvx hf-mem --model-id <model-id> --experimental [--max-model-len N] [--batch-size N] [--kv-cache-dtype auto|bfloat16|fp8|fp8_ds_mla|fp8_e4m3|fp8_e5m2|fp8_inc] --json-outputuvx hf-mem --model-id <model-id> --gguf-file <file-or-path> --experimental [--max-model-len N] [--batch-size N] [--kv-cache-dtype auto|F32|F16|Q4_0|Q4_1|Q5_0|Q5_1|Q8_0|Q8_1|Q2_K|Q3_K|Q4_K|Q5_K|Q6_K|Q8_K|IQ2_XXS|IQ2_XS|IQ3_XXS|IQ1_S|IQ4_NL|IQ3_S|IQ2_S|IQ4_XS|I8|I16|I32|I64|F64|IQ1_M|BF16|TQ1_0|TQ2_0|MXFP4] --json-output--model-idmodel.safetensorsmodel.safetensors.index.jsonmodel_index.jsonuvx hf-mem --model-id <model-id> --json-output--gguf-fileuvx hf-mem --model-id <model-id> --gguf-file <file-or-path> --json-outputhf-mem--experimental...ForCausalLM...ForConditionalGeneration--max-model-len--kv-cache-dtypeuvx hf-mem --model-id <model-id> --experimental [--max-model-len N] [--batch-size N] [--kv-cache-dtype auto|bfloat16|fp8|fp8_ds_mla|fp8_e4m3|fp8_e5m2|fp8_inc] --json-outputuvx hf-mem --model-id <model-id> --gguf-file <file-or-path> --experimental [--max-model-len N] [--batch-size N] [--kv-cache-dtype auto|F32|F16|Q4_0|Q4_1|Q5_0|Q5_1|Q8_0|Q8_1|Q2_K|Q3_K|Q4_K|Q5_K|Q6_K|Q8_K|IQ2_XXS|IQ2_XS|IQ3_XXS|IQ1_S|IQ4_NL|IQ3_S|IQ2_S|IQ4_XS|I8|I16|I32|I64|F64|IQ1_M|BF16|TQ1_0|TQ2_0|MXFP4] --json-outputuvx hf-mem --model-id MiniMaxAI/MiniMax-M2 --json-outputuvx hf-mem --model-id Qwen/Qwen-Image --json-outputuvx hf-mem --model-id google/embeddinggemma-300m --json-output--experimentaluvx hf-mem --model-id mistralai/Mistral-7B-v0.1 --experimental --json-outputuvx hf-mem --model-id unsloth/Qwen3.5-397B-A17B-GGUF --gguf-file Q4_K_M --experimental --json-outputuvx hf-mem --model-id MiniMaxAI/MiniMax-M2 --json-outputuvx hf-mem --model-id Qwen/Qwen-Image --json-outputuvx hf-mem --model-id google/embeddinggemma-300m --json-output--experimentaluvx hf-mem --model-id mistralai/Mistral-7B-v0.1 --experimental --json-outputuvx hf-mem --model-id unsloth/Qwen3.5-397B-A17B-GGUF --gguf-file Q4_K_M --experimental --json-output