llm from nas

2025-08-14 11:16:44 -07:00 · 2025-08-14 11:16:44 -07:00 · c467c76188
commit c467c76188
parent ea0aa3043f
1 changed files with 59 additions and 0 deletions
--- a/59
+++ b/59
@ -125,3 +125,62 @@ clean_lmstudio hf_url quant lm_studio_path org="mlx-community" type="":
    for q in {{quant}}; do
        rm -r {{lm_studio_path}}/{{org}}/${repo_name}-${q}bit{{type}} || true
    done
+
+process_single_model hf_url:
+    #!/usr/bin/env bash
+    export HF_HUB_CACHE="/Volumes/hf-cache/huggingface/hub"
+    # Store original HF_HUB_CACHE
+    ORIGINAL_HF_HUB_CACHE="${HF_HUB_CACHE:-}"
+
+    model="{{hf_url}}"
+    echo "Processing model: $model"
+
+    # Convert model path to cache directory format (org--model)
+    model_cache_name=$(echo "$model" | sed 's/\//--/g' | sed 's/^/models--/')
+
+    echo "Copying $model_cache_name from NAS..."
+    rclone copyto -P --fast-list --copy-links --transfers 32 --multi-thread-streams 32 \
+        "tower:hf-cache/huggingface/hub/$model_cache_name" \
+        "$HOME/.cache/huggingface/hub/$model_cache_name"
+
+    # Set HF_HUB_CACHE to local cache
+    export HF_HUB_CACHE="$HOME/.cache/huggingface/hub"
+
+    echo "Processing quantizations for $model..."
+    just mlx_create "$model" "3 4 5 6 8" "/Users/elijahmcmorris/.cache/lm-studio/models" NexVeridian true true
+
+    rclone copyto -P --fast-list --copy-links --transfers 32 --multi-thread-streams 32 \
+        "$HOME/.cache/huggingface/hub/$model_cache_name" \
+        "tower:hf-cache/huggingface/hub/$model_cache_name"
+
+    # Clean up local model cache
+    echo "Cleaning up local cache for $model..."
+    rm -rf "$HOME/.cache/huggingface/hub/$model_cache_name"
+    just clean_hf
+
+    # Reset HF_HUB_CACHE to original value
+    if [[ -n "$ORIGINAL_HF_HUB_CACHE" ]]; then
+        export HF_HUB_CACHE="$ORIGINAL_HF_HUB_CACHE"
+    else
+        unset HF_HUB_CACHE
+    fi
+
+    echo "Completed processing $model"
+
+create_all:
+    #!/usr/bin/env bash
+    # List of models to process
+    models=(
+        # "Qwen/Qwen3-Coder-30B-A3B-Instruct"
+        # "Qwen/Qwen3-Coder-480B-A35B-Instruct"
+        # "moonshotai/Kimi-Dev-72B"
+        # "zai-org/GLM-4.5-Air"
+        # "openai/gpt-oss-20b"
+        # "openai/gpt-oss-120b"
+        "rednote-hilab/dots.llm1.inst"
+    )
+
+    for model in "${models[@]}"; do
+        echo "Processing model: $model"
+        just process_single_model "$model"
+    done