Spaces:

broadfield-dev
/

AMOP

Paused

App Files Community

broadfield-dev committed on Sep 14

Commit

de1d3bb

verified ·

1 Parent(s): 7f89b69

Update app.py

Browse files

Files changed (1) hide show

app.py +4 -4

app.py CHANGED Viewed

@@ -27,8 +27,8 @@ os.makedirs(OUTPUT_DIR, exist_ok=True)
 # --- LLAMA.CPP SETUP ---
 LLAMA_CPP_DIR = Path("llama.cpp")
-## FINAL FIX: The script is now named 'convert.py' again in the latest llama.cpp version.
-LLAMA_CPP_CONVERT_SCRIPT = LLAMA_CPP_DIR / "convert.py"
 LLAMA_CPP_QUANTIZE_SCRIPT = LLAMA_CPP_DIR / "quantize"
 def setup_llama_cpp():
@@ -92,7 +92,7 @@ def stage_2_prune_model(model, prune_percentage: float):
 def stage_3_4_onnx_quantize(model_path_or_id: str, onnx_quant_type: str, calibration_data_path: str):
     log_stream = "[STAGE 3 & 4] Converting to ONNX and Quantizing...\n"
-    run_id = datetime.now().strftime("%Ym%d-%H%M%S")
     model_name = model_path_or_id.split('/')[-1]
     onnx_path = os.path.join(OUTPUT_DIR, f"{model_name}-{run_id}-onnx")
@@ -224,7 +224,7 @@ def run_amop_pipeline(model_id: str, pipeline_type: str, do_prune: bool, prune_p
         full_log += log
         full_log += "Packaging & Uploading...\n"; yield {final_output: "Packaging & Uploading (4/5)", log_output: full_log}
-        final_message, log = stage_5_package_and_upload(model_id, optimized_model_path, full_log, options)
         full_log += log
         yield {final_output: gr.update(value="SUCCESS", label="Status"), log_output: full_log, success_box: gr.Markdown(f"✅ **Success!** Model available: [{repo_id_for_link}](https://huggingface.co/{repo_id_for_link})", visible=True), run_button: gr.Button(interactive=True, value="Run Optimization Pipeline", variant="primary"), analyze_button: gr.Button(interactive=True, value="Analyze Model")}

 # --- LLAMA.CPP SETUP ---
 LLAMA_CPP_DIR = Path("llama.cpp")
+## FINAL FIX: The correct, stable script is in the 'tools' subdirectory.
+LLAMA_CPP_CONVERT_SCRIPT = LLAMA_CPP_DIR / "tools" / "convert-hf-to-gguf.py"
 LLAMA_CPP_QUANTIZE_SCRIPT = LLAMA_CPP_DIR / "quantize"
 def setup_llama_cpp():
 def stage_3_4_onnx_quantize(model_path_or_id: str, onnx_quant_type: str, calibration_data_path: str):
     log_stream = "[STAGE 3 & 4] Converting to ONNX and Quantizing...\n"
+    run_id = datetime.now().strftime("%Y%m%d-%H%M%S")
     model_name = model_path_or_id.split('/')[-1]
     onnx_path = os.path.join(OUTPUT_DIR, f"{model_name}-{run_id}-onnx")
         full_log += log
         full_log += "Packaging & Uploading...\n"; yield {final_output: "Packaging & Uploading (4/5)", log_output: full_log}
+        final_message, log = stage_5_package_and_upload(model_id, optimized_path, full_log, options)
         full_log += log
         yield {final_output: gr.update(value="SUCCESS", label="Status"), log_output: full_log, success_box: gr.Markdown(f"✅ **Success!** Model available: [{repo_id_for_link}](https://huggingface.co/{repo_id_for_link})", visible=True), run_button: gr.Button(interactive=True, value="Run Optimization Pipeline", variant="primary"), analyze_button: gr.Button(interactive=True, value="Analyze Model")}