llm from nas
This commit is contained in:
parent
ea0aa3043f
commit
c467c76188
1 changed files with 59 additions and 0 deletions
59
justfile
59
justfile
|
@ -125,3 +125,62 @@ clean_lmstudio hf_url quant lm_studio_path org="mlx-community" type="":
|
|||
for q in {{quant}}; do
|
||||
rm -r {{lm_studio_path}}/{{org}}/${repo_name}-${q}bit{{type}} || true
|
||||
done
|
||||
|
||||
process_single_model hf_url:
|
||||
#!/usr/bin/env bash
|
||||
export HF_HUB_CACHE="/Volumes/hf-cache/huggingface/hub"
|
||||
# Store original HF_HUB_CACHE
|
||||
ORIGINAL_HF_HUB_CACHE="${HF_HUB_CACHE:-}"
|
||||
|
||||
model="{{hf_url}}"
|
||||
echo "Processing model: $model"
|
||||
|
||||
# Convert model path to cache directory format (org--model)
|
||||
model_cache_name=$(echo "$model" | sed 's/\//--/g' | sed 's/^/models--/')
|
||||
|
||||
echo "Copying $model_cache_name from NAS..."
|
||||
rclone copyto -P --fast-list --copy-links --transfers 32 --multi-thread-streams 32 \
|
||||
"tower:hf-cache/huggingface/hub/$model_cache_name" \
|
||||
"$HOME/.cache/huggingface/hub/$model_cache_name"
|
||||
|
||||
# Set HF_HUB_CACHE to local cache
|
||||
export HF_HUB_CACHE="$HOME/.cache/huggingface/hub"
|
||||
|
||||
echo "Processing quantizations for $model..."
|
||||
just mlx_create "$model" "3 4 5 6 8" "/Users/elijahmcmorris/.cache/lm-studio/models" NexVeridian true true
|
||||
|
||||
rclone copyto -P --fast-list --copy-links --transfers 32 --multi-thread-streams 32 \
|
||||
"$HOME/.cache/huggingface/hub/$model_cache_name" \
|
||||
"tower:hf-cache/huggingface/hub/$model_cache_name"
|
||||
|
||||
# Clean up local model cache
|
||||
echo "Cleaning up local cache for $model..."
|
||||
rm -rf "$HOME/.cache/huggingface/hub/$model_cache_name"
|
||||
just clean_hf
|
||||
|
||||
# Reset HF_HUB_CACHE to original value
|
||||
if [[ -n "$ORIGINAL_HF_HUB_CACHE" ]]; then
|
||||
export HF_HUB_CACHE="$ORIGINAL_HF_HUB_CACHE"
|
||||
else
|
||||
unset HF_HUB_CACHE
|
||||
fi
|
||||
|
||||
echo "Completed processing $model"
|
||||
|
||||
create_all:
|
||||
#!/usr/bin/env bash
|
||||
# List of models to process
|
||||
models=(
|
||||
# "Qwen/Qwen3-Coder-30B-A3B-Instruct"
|
||||
# "Qwen/Qwen3-Coder-480B-A35B-Instruct"
|
||||
# "moonshotai/Kimi-Dev-72B"
|
||||
# "zai-org/GLM-4.5-Air"
|
||||
# "openai/gpt-oss-20b"
|
||||
# "openai/gpt-oss-120b"
|
||||
"rednote-hilab/dots.llm1.inst"
|
||||
)
|
||||
|
||||
for model in "${models[@]}"; do
|
||||
echo "Processing model: $model"
|
||||
just process_single_model "$model"
|
||||
done
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue