Skip to content

README suggests a command for mlx-lm that doesn't work (using Safetensors model) #1883

@booxter

Description

@booxter

Issue Description

In the README, the following command is suggested for trying mlx-lm: ramalama --runtime=mlx serve hf://mlx-community/Unsloth-Phi-4-4bit

But it fails:

>>> ramalama --runtime=mlx serve hf://mlx-community/Unsloth-Phi-4-4bit
Error: Safetensor models are not supported. Please convert it to GGUF via:
$ ramalama convert --gguf=<quantization> hf://mlx-community/Unsloth-Phi-4-4bit <oci-name>
$ ramalama run <oci-name>

Steps to reproduce the issue

.

Describe the results you received

.

Describe the results you expected

.

ramalama info output

{
    "Accelerator": "none",
    "Config": {},
    "Engine": {
        "Info": {
            "Client": {
                "APIVersion": "5.6.0",
                "Built": 315532800,
                "BuiltTime": "Mon Dec 31 19:00:00 1979",
                "GitCommit": "",
                "GoVersion": "go1.24.5",
                "Os": "darwin",
                "OsArch": "darwin/arm64",
                "Version": "5.6.0"
            },
            "host": {
                "arch": "arm64",
                "buildahVersion": "1.40.1",
                "cgroupControllers": [
                    "cpu",
                    "io",
                    "memory",
                    "pids"
                ],
                "cgroupManager": "systemd",
                "cgroupVersion": "v2",
                "conmon": {
                    "package": "conmon-2.1.12-3.fc41.aarch64",
                    "path": "/usr/bin/conmon",
                    "version": "conmon version 2.1.12, commit: "
                },
                "cpuUtilization": {
                    "idlePercent": 98.96,
                    "systemPercent": 0.53,
                    "userPercent": 0.52
                },
                "cpus": 5,
                "databaseBackend": "sqlite",
                "distribution": {
                    "distribution": "fedora",
                    "variant": "coreos",
                    "version": "41"
                },
                "eventLogger": "journald",
                "freeLocks": 2046,
                "hostname": "localhost.localdomain",
                "idMappings": {
                    "gidmap": [
                        {
                            "container_id": 0,
                            "host_id": 1000,
                            "size": 1
                        },
                        {
                            "container_id": 1,
                            "host_id": 100000,
                            "size": 1000000
                        }
                    ],
                    "uidmap": [
                        {
                            "container_id": 0,
                            "host_id": 501,
                            "size": 1
                        },
                        {
                            "container_id": 1,
                            "host_id": 100000,
                            "size": 1000000
                        }
                    ]
                },
                "kernel": "6.12.13-200.fc41.aarch64",
                "linkmode": "dynamic",
                "logDriver": "journald",
                "memFree": 5012045824,
                "memTotal": 8294567936,
                "networkBackend": "netavark",
                "networkBackendInfo": {
                    "backend": "netavark",
                    "dns": {
                        "package": "aardvark-dns-1.14.0-1.fc41.aarch64",
                        "path": "/usr/libexec/podman/aardvark-dns",
                        "version": "aardvark-dns 1.14.0"
                    },
                    "package": "netavark-1.14.0-1.fc41.aarch64",
                    "path": "/usr/libexec/podman/netavark",
                    "version": "netavark 1.14.0"
                },
                "ociRuntime": {
                    "name": "crun",
                    "package": "crun-1.20-2.fc41.aarch64",
                    "path": "/usr/bin/crun",
                    "version": "crun version 1.20\ncommit: 9c9a76ac11994701dd666c4f0b869ceffb599a66\nrundir: /run/user/501/crun\nspec: 1.0.0\n+SYSTEMD +SELINUX +APPARMOR +CAP +SECCOMP +EBPF +CRIU +LIBKRUN +WASM:wasmedge +YAJL"
                },
                "os": "linux",
                "pasta": {
                    "executable": "/usr/bin/pasta",
                    "package": "passt-0^20250121.g4f2c8e7-2.fc41.aarch64",
                    "version": "pasta 0^20250121.g4f2c8e7-2.fc41.aarch64-pasta\nCopyright Red Hat\nGNU General Public License, version 2 or later\n  <https://www.gnu.org/licenses/old-licenses/gpl-2.0.html>\nThis is free software: you are free to change and redistribute it.\nThere is NO WARRANTY, to the extent permitted by law.\n"
                },
                "remoteSocket": {
                    "exists": true,
                    "path": "unix:///run/user/501/podman/podman.sock"
                },
                "rootlessNetworkCmd": "pasta",
                "security": {
                    "apparmorEnabled": false,
                    "capabilities": "CAP_CHOWN,CAP_DAC_OVERRIDE,CAP_FOWNER,CAP_FSETID,CAP_KILL,CAP_NET_BIND_SERVICE,CAP_SETFCAP,CAP_SETGID,CAP_SETPCAP,CAP_SETUID,CAP_SYS_CHROOT",
                    "rootless": true,
                    "seccompEnabled": true,
                    "seccompProfilePath": "/usr/share/containers/seccomp.json",
                    "selinuxEnabled": true
                },
                "serviceIsRemote": true,
                "slirp4netns": {
                    "executable": "/usr/bin/slirp4netns",
                    "package": "slirp4netns-1.3.1-1.fc41.aarch64",
                    "version": "slirp4netns version 1.3.1\ncommit: e5e368c4f5db6ae75c2fce786e31eef9da6bf236\nlibslirp: 4.8.0\nSLIRP_CONFIG_VERSION_MAX: 5\nlibseccomp: 2.5.5"
                },
                "swapFree": 0,
                "swapTotal": 0,
                "uptime": "0h 23m 45.00s",
                "variant": "v8"
            },
            "plugins": {
                "authorization": null,
                "log": [
                    "k8s-file",
                    "none",
                    "passthrough",
                    "journald"
                ],
                "network": [
                    "bridge",
                    "macvlan",
                    "ipvlan"
                ],
                "volume": [
                    "local"
                ]
            },
            "registries": {
                "search": [
                    "docker.io"
                ]
            },
            "store": {
                "configFile": "/var/home/core/.config/containers/storage.conf",
                "containerStore": {
                    "number": 2,
                    "paused": 0,
                    "running": 0,
                    "stopped": 2
                },
                "graphDriverName": "overlay",
                "graphOptions": {},
                "graphRoot": "/var/home/core/.local/share/containers/storage",
                "graphRootAllocated": 106415992832,
                "graphRootUsed": 15204184064,
                "graphStatus": {
                    "Backing Filesystem": "xfs",
                    "Native Overlay Diff": "true",
                    "Supports d_type": "true",
                    "Supports shifting": "false",
                    "Supports volatile": "true",
                    "Using metacopy": "false"
                },
                "imageCopyTmpDir": "/var/tmp",
                "imageStore": {
                    "number": 20
                },
                "runRoot": "/run/user/501/containers",
                "transientStore": false,
                "volumePath": "/var/home/core/.local/share/containers/storage/volumes"
            },
            "version": {
                "APIVersion": "5.5.2",
                "BuildOrigin": "Copr: packit/containers-podman-26503",
                "Built": 1750723200,
                "BuiltTime": "Mon Jun 23 20:00:00 2025",
                "GitCommit": "e7d8226745ba07a64b7176a7f128e4ef53225a0e",
                "GoVersion": "go1.23.10",
                "Os": "linux",
                "OsArch": "linux/arm64",
                "Version": "5.5.2"
            }
        },
        "Name": "podman"
    },
    "Image": "quay.io/ramalama/ramalama:latest",
    "Runtime": "llama.cpp",
    "Selinux": false,
    "Shortnames": {
        "Files": [],
        "Names": {}
    },
    "Store": "/Users/ihrachyshka/.local/share/ramalama",
    "UseContainer": true,
    "Version": "0.12.1"
}

Upstream Latest Release

Yes

Additional environment details

No response

Additional information

No response

Metadata

Metadata

Assignees

No one assigned

    Labels

    bug: Something isn't working

    Type

    No type

    Projects

    No projects

    Milestone

    No milestone

    Relationships

    None yet

    Development

    No branches or pull requests

    Issue actions