Spaces:
Running
Running
Oleg Shulyakov
committed on
Commit
·
1ed03c8
1
Parent(s):
7ea3df7
Skip imatrix re-generation
Browse files
- hf-quantize.sh +24 -16
hf-quantize.sh
CHANGED
@@ -135,6 +135,7 @@ else
|
|
135 |
|
136 |
if [ $? -ne 0 ]; then
|
137 |
echo "Error: Failed to download model '$MODEL_ID'."
|
|
|
138 |
exit 1
|
139 |
fi
|
140 |
|
@@ -154,6 +155,7 @@ else
|
|
154 |
|
155 |
if [ $? -ne 0 ]; then
|
156 |
echo "Error: Failed to convert model to FP16 GGUF."
|
|
|
157 |
exit 1
|
158 |
fi
|
159 |
echo "FP16 GGUF model created at '$FP16_MODEL_PATH'."
|
@@ -161,23 +163,28 @@ fi
|
|
161 |
|
162 |
# --- Step 4: (Optional) Generate Imatrix ---
|
163 |
if [ "$USE_IMATRIX" = "true" ]; then
|
164 |
-
|
165 |
-
|
166 |
-
|
167 |
-
|
168 |
-
|
169 |
-
|
170 |
-
|
171 |
-
|
172 |
-
|
173 |
-
|
174 |
-
|
175 |
-
|
176 |
-
|
177 |
-
|
178 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
179 |
fi
|
180 |
-
echo "Imatrix generated at '$IMATRIX_FILE_PATH'."
|
181 |
fi
|
182 |
|
183 |
# --- Step 5: Quantize the GGUF Model ---
|
@@ -211,6 +218,7 @@ echo "Running command: ${QUANTIZE_CMD[*]}"
|
|
211 |
|
212 |
if [ $? -ne 0 ]; then
|
213 |
echo "Error: Failed to quantize model."
|
|
|
214 |
exit 1
|
215 |
fi
|
216 |
echo "Model quantized successfully to '$QUANTIZED_MODEL_PATH'."
|
|
|
135 |
|
136 |
if [ $? -ne 0 ]; then
|
137 |
echo "Error: Failed to download model '$MODEL_ID'."
|
138 |
+
rm -rf "$MODEL_DOWNLOAD_DIR"
|
139 |
exit 1
|
140 |
fi
|
141 |
|
|
|
155 |
|
156 |
if [ $? -ne 0 ]; then
|
157 |
echo "Error: Failed to convert model to FP16 GGUF."
|
158 |
+
rm -f "$FP16_MODEL_PATH"
|
159 |
exit 1
|
160 |
fi
|
161 |
echo "FP16 GGUF model created at '$FP16_MODEL_PATH'."
|
|
|
163 |
|
164 |
# --- Step 4: (Optional) Generate Imatrix ---
|
165 |
if [ "$USE_IMATRIX" = "true" ]; then
|
166 |
+
if [ -f "$IMATRIX_FILE_PATH" ]; then
|
167 |
+
echo "Imatrix file '$IMATRIX_FILE_PATH' already exists. Skipping generation."
|
168 |
+
else
|
169 |
+
echo "Generating importance matrix (imatrix)..."
|
170 |
+
IMATRIX_CMD=(
|
171 |
+
llama-imatrix
|
172 |
+
-m "$FP16_MODEL_PATH"
|
173 |
+
-f "$CALIBRATION_FILE_PATH"
|
174 |
+
-ngl 99
|
175 |
+
--output-frequency 10
|
176 |
+
-o "$IMATRIX_FILE_PATH"
|
177 |
+
)
|
178 |
+
echo "Running command: ${IMATRIX_CMD[*]}"
|
179 |
+
"${IMATRIX_CMD[@]}"
|
180 |
+
|
181 |
+
if [ $? -ne 0 ]; then
|
182 |
+
echo "Error: Failed to generate imatrix."
|
183 |
+
rm -f "$IMATRIX_FILE_PATH"
|
184 |
+
exit 1
|
185 |
+
fi
|
186 |
+
echo "Imatrix generated at '$IMATRIX_FILE_PATH'."
|
187 |
fi
|
|
|
188 |
fi
|
189 |
|
190 |
# --- Step 5: Quantize the GGUF Model ---
|
|
|
218 |
|
219 |
if [ $? -ne 0 ]; then
|
220 |
echo "Error: Failed to quantize model."
|
221 |
+
rm -f "$QUANTIZED_MODEL_PATH"
|
222 |
exit 1
|
223 |
fi
|
224 |
echo "Model quantized successfully to '$QUANTIZED_MODEL_PATH'."
|