Spaces:
Runtime error
Runtime error
| from pathlib import Path | |
| from subprocess import run | |
def convert(model_id: str, precision: str, quantization: bool) -> Path:
    """Convert a model to a ggml file with the bloomz.cpp tooling.

    Runs ``./bloomz.cpp/convert-hf-to-ggml.py`` for ``model_id`` and, when
    requested, ``./bloomz.cpp/quantize`` on the converted file. All paths are
    relative to the current working directory.

    Args:
        model_id: Model identifier handed to the conversion script,
            e.g. ``"bigscience/bloomz-560m"``. The part after the last ``/``
            is used as the model name in the output file names.
        precision: ``"FP32"`` passes ``--use-fp32`` to the conversion script
            and selects the ``f32`` file suffix; any other value selects
            ``f16``.
        quantization: When true, additionally run the ``quantize`` binary
            on the converted file.

    Returns:
        Path of the final model file: the ``-q4_0`` file when
        ``quantization`` is true, otherwise the converted ``f16``/``f32`` file.

    Raises:
        ValueError: If no model name can be derived from ``model_id``.
        subprocess.CalledProcessError: If a subprocess exits with a non-zero
            status.
        AssertionError: If an expected output file is missing after its step.
    """
    use_fp32 = precision == "FP32"
    f_suffix = "f32" if use_fp32 else "f16"

    # Derive the name before the (slow) conversion so a malformed id fails
    # fast. NOTE(review): assumes the conversion script names its output after
    # the last path component of the id -- confirm against the script.
    model_name = model_id.rpartition("/")[-1]
    if not model_name:
        raise ValueError(f"Cannot derive a model name from model_id={model_id!r}")

    # Conversion
    cmd = [
        "python",
        "./bloomz.cpp/convert-hf-to-ggml.py",
        model_id,  # bigscience/bloomz-560m
        "./bloomz.cpp/models",
    ]
    if use_fp32:
        cmd.append("--use-fp32")
    run(cmd, check=True)

    # Model file should exist. Raised explicitly (instead of a bare `assert`)
    # so the check is not stripped under `python -O`; the exception type is
    # kept as AssertionError for existing callers.
    converted = f"./bloomz.cpp/models/ggml-model-{model_name}-{f_suffix}.bin"
    model_path = Path(converted)
    if not model_path.is_file():
        raise AssertionError(f"Converted model file not found: {model_path}")

    # Quantization
    if quantization:
        quantized = f"./bloomz.cpp/models/ggml-model-{model_name}-{f_suffix}-q4_0.bin"
        cmd = [
            "./bloomz.cpp/quantize",
            converted,
            quantized,
            "2",  # presumably the q4_0 type id -- confirm against quantize usage
        ]
        run(cmd, check=True)
        # Return (and verify) the quantized file, not the unquantized input.
        model_path = Path(quantized)
        if not model_path.is_file():
            raise AssertionError(f"Quantized model file not found: {model_path}")

    # Return
    return model_path