-
Notifications
You must be signed in to change notification settings - Fork 248
Open
Labels
bug: Something isn't working
Description
Issue Description
In the README, the following command is suggested for trying mlx-lm:
ramalama --runtime=mlx serve hf://mlx-community/Unsloth-Phi-4-4bit
But it fails:
>>> ramalama --runtime=mlx serve hf://mlx-community/Unsloth-Phi-4-4bit
Error: Safetensor models are not supported. Please convert it to GGUF via:
$ ramalama convert --gguf=<quantization> hf://mlx-community/Unsloth-Phi-4-4bit <oci-name>
$ ramalama run <oci-name>
Steps to reproduce the issue
.
Describe the results you received
.
Describe the results you expected
.
ramalama info output
{
"Accelerator": "none",
"Config": {},
"Engine": {
"Info": {
"Client": {
"APIVersion": "5.6.0",
"Built": 315532800,
"BuiltTime": "Mon Dec 31 19:00:00 1979",
"GitCommit": "",
"GoVersion": "go1.24.5",
"Os": "darwin",
"OsArch": "darwin/arm64",
"Version": "5.6.0"
},
"host": {
"arch": "arm64",
"buildahVersion": "1.40.1",
"cgroupControllers": [
"cpu",
"io",
"memory",
"pids"
],
"cgroupManager": "systemd",
"cgroupVersion": "v2",
"conmon": {
"package": "conmon-2.1.12-3.fc41.aarch64",
"path": "/usr/bin/conmon",
"version": "conmon version 2.1.12, commit: "
},
"cpuUtilization": {
"idlePercent": 98.96,
"systemPercent": 0.53,
"userPercent": 0.52
},
"cpus": 5,
"databaseBackend": "sqlite",
"distribution": {
"distribution": "fedora",
"variant": "coreos",
"version": "41"
},
"eventLogger": "journald",
"freeLocks": 2046,
"hostname": "localhost.localdomain",
"idMappings": {
"gidmap": [
{
"container_id": 0,
"host_id": 1000,
"size": 1
},
{
"container_id": 1,
"host_id": 100000,
"size": 1000000
}
],
"uidmap": [
{
"container_id": 0,
"host_id": 501,
"size": 1
},
{
"container_id": 1,
"host_id": 100000,
"size": 1000000
}
]
},
"kernel": "6.12.13-200.fc41.aarch64",
"linkmode": "dynamic",
"logDriver": "journald",
"memFree": 5012045824,
"memTotal": 8294567936,
"networkBackend": "netavark",
"networkBackendInfo": {
"backend": "netavark",
"dns": {
"package": "aardvark-dns-1.14.0-1.fc41.aarch64",
"path": "/usr/libexec/podman/aardvark-dns",
"version": "aardvark-dns 1.14.0"
},
"package": "netavark-1.14.0-1.fc41.aarch64",
"path": "/usr/libexec/podman/netavark",
"version": "netavark 1.14.0"
},
"ociRuntime": {
"name": "crun",
"package": "crun-1.20-2.fc41.aarch64",
"path": "/usr/bin/crun",
"version": "crun version 1.20\ncommit: 9c9a76ac11994701dd666c4f0b869ceffb599a66\nrundir: /run/user/501/crun\nspec: 1.0.0\n+SYSTEMD +SELINUX +APPARMOR +CAP +SECCOMP +EBPF +CRIU +LIBKRUN +WASM:wasmedge +YAJL"
},
"os": "linux",
"pasta": {
"executable": "/usr/bin/pasta",
"package": "passt-0^20250121.g4f2c8e7-2.fc41.aarch64",
"version": "pasta 0^20250121.g4f2c8e7-2.fc41.aarch64-pasta\nCopyright Red Hat\nGNU General Public License, version 2 or later\n <https://www.gnu.org/licenses/old-licenses/gpl-2.0.html>\nThis is free software: you are free to change and redistribute it.\nThere is NO WARRANTY, to the extent permitted by law.\n"
},
"remoteSocket": {
"exists": true,
"path": "unix:///run/user/501/podman/podman.sock"
},
"rootlessNetworkCmd": "pasta",
"security": {
"apparmorEnabled": false,
"capabilities": "CAP_CHOWN,CAP_DAC_OVERRIDE,CAP_FOWNER,CAP_FSETID,CAP_KILL,CAP_NET_BIND_SERVICE,CAP_SETFCAP,CAP_SETGID,CAP_SETPCAP,CAP_SETUID,CAP_SYS_CHROOT",
"rootless": true,
"seccompEnabled": true,
"seccompProfilePath": "/usr/share/containers/seccomp.json",
"selinuxEnabled": true
},
"serviceIsRemote": true,
"slirp4netns": {
"executable": "/usr/bin/slirp4netns",
"package": "slirp4netns-1.3.1-1.fc41.aarch64",
"version": "slirp4netns version 1.3.1\ncommit: e5e368c4f5db6ae75c2fce786e31eef9da6bf236\nlibslirp: 4.8.0\nSLIRP_CONFIG_VERSION_MAX: 5\nlibseccomp: 2.5.5"
},
"swapFree": 0,
"swapTotal": 0,
"uptime": "0h 23m 45.00s",
"variant": "v8"
},
"plugins": {
"authorization": null,
"log": [
"k8s-file",
"none",
"passthrough",
"journald"
],
"network": [
"bridge",
"macvlan",
"ipvlan"
],
"volume": [
"local"
]
},
"registries": {
"search": [
"docker.io"
]
},
"store": {
"configFile": "/var/home/core/.config/containers/storage.conf",
"containerStore": {
"number": 2,
"paused": 0,
"running": 0,
"stopped": 2
},
"graphDriverName": "overlay",
"graphOptions": {},
"graphRoot": "/var/home/core/.local/share/containers/storage",
"graphRootAllocated": 106415992832,
"graphRootUsed": 15204184064,
"graphStatus": {
"Backing Filesystem": "xfs",
"Native Overlay Diff": "true",
"Supports d_type": "true",
"Supports shifting": "false",
"Supports volatile": "true",
"Using metacopy": "false"
},
"imageCopyTmpDir": "/var/tmp",
"imageStore": {
"number": 20
},
"runRoot": "/run/user/501/containers",
"transientStore": false,
"volumePath": "/var/home/core/.local/share/containers/storage/volumes"
},
"version": {
"APIVersion": "5.5.2",
"BuildOrigin": "Copr: packit/containers-podman-26503",
"Built": 1750723200,
"BuiltTime": "Mon Jun 23 20:00:00 2025",
"GitCommit": "e7d8226745ba07a64b7176a7f128e4ef53225a0e",
"GoVersion": "go1.23.10",
"Os": "linux",
"OsArch": "linux/arm64",
"Version": "5.5.2"
}
},
"Name": "podman"
},
"Image": "quay.io/ramalama/ramalama:latest",
"Runtime": "llama.cpp",
"Selinux": false,
"Shortnames": {
"Files": [],
"Names": {}
},
"Store": "/Users/ihrachyshka/.local/share/ramalama",
"UseContainer": true,
"Version": "0.12.1"
}
Upstream Latest Release
Yes
Additional environment details
No response
Additional information
No response
Metadata
Metadata
Assignees
Labels
bug: Something isn't working