Docs
API
# Example: load a GGUF model file through a disk-backed tensor.
fn = "Meta-Llama-3-8B-Instruct.Q4_0.gguf"

# Create a uint8 tensor with one element per byte of the file (sized via
# os.stat), placed on the "disk:<path>" device, then move it to the default
# compute device.
gguf_tensor = Tensor.empty(
    os.stat(fn).st_size,
    dtype=dtypes.uint8,
    device=f"disk:{fn}",
).to(Device.DEFAULT)

# gguf_load returns two values; presumably the GGUF key/value metadata and the
# name -> tensor state dict -- confirm against the gguf_load documentation.
kv_data, state_dict = gguf_load(gguf_tensor)