[GH-ISSUE #15161] Unable to load Qwen3-VL-Embedding. #35464

Closed
opened 2026-04-22 19:57:53 -05:00 by GiteaMirror · 1 comment
Owner

Originally created by @jclab-joseph on GitHub (Mar 31, 2026).
Original GitHub issue: https://github.com/ollama/ollama/issues/15161

What is the issue?

I attempted to generate embeddings with hf.co/DevQuasar/Qwen.Qwen3-VL-Embedding-2B-GGUF:Q8_0, but it failed.

The suggestion in https://github.com/ollama/ollama/issues/14503#issuecomment-4133511574 does not work.

Relevant log output

...
load_hparams: model size:         781.42 MiB
load_hparams: metadata size:      0.11 MiB
load_tensors: loaded 316 tensors from /home/joseph/.ollama/models/blobs/sha256-3f89a7768ffa6606935319f71bf56bb71871249ba549bf1080a0caea7a088613
warmup: warmup with image size = 1472 x 1472
alloc_compute_meta:        CPU compute buffer size =   322.49 MiB
alloc_compute_meta: graph splits = 1, nodes = 766
warmup: flash attention is enabled
time=2026-03-31T12:01:30.210+09:00 level=INFO source=server.go:1390 msg="llama runner started in 1.53 seconds"
time=2026-03-31T12:01:30.210+09:00 level=INFO source=sched.go:561 msg="loaded runners" count=1
time=2026-03-31T12:01:30.210+09:00 level=INFO source=server.go:1352 msg="waiting for llama runner to start responding"
time=2026-03-31T12:01:30.211+09:00 level=INFO source=server.go:1390 msg="llama runner started in 1.53 seconds"
llama-context.cpp:1238: GGML_ASSERT((n_outputs_prev + n_outputs)*n_embd <= (int64_t) embd_size) failed
[New LWP 2711968]
[New LWP 2711967]
[New LWP 2711966]
[New LWP 2711965]
[New LWP 2711964]
[New LWP 2711963]
[New LWP 2711962]
[New LWP 2711961]
[Thread debugging using libthread_db enabled]
Using host libthread_db library "/lib/x86_64-linux-gnu/libthread_db.so.1".
0x00006521ac926143 in ?? ()
#0  0x00006521ac926143 in ?? ()
#1  0x00006521ac8e2110 in ?? ()
#2  0x00006521aee060a0 in ?? ()
#3  0x0000000000000080 in ?? ()
#4  0x0000000000000000 in ?? ()
[Inferior 1 (process 2711960) detached]
SIGABRT: abort
PC=0x7937b569eb2c m=7 sigcode=18446744073709551610
signal arrived during cgo execution

goroutine 51 gp=0xc000582fc0 m=7 mp=0xc000580008 [syscall]:
runtime.cgocall(0x6521ada15630, 0xc0000a1b88)
        runtime/cgocall.go:167 +0x4b fp=0xc0000a1b60 sp=0xc0000a1b28 pc=0x6521ac918dcb
github.com/ollama/ollama/llama._Cfunc_llama_decode(0x79373e68dd20, {0x3, 0x79373c013810, 0x0, 0x79373c00dd30, 0x79373c010bf0, 0x79373cade2a0, 0x79373cb3c4a0})
        _cgo_gotypes.go:685 +0x4a fp=0xc0000a1b88 sp=0xc0000a1b60 pc=0x6521acddab0a
github.com/ollama/ollama/llama.(*Context).Decode.func1(...)
        github.com/ollama/ollama/llama/llama.go:173
github.com/ollama/ollama/llama.(*Context).Decode(0xc000379740?, 0x1?)
        github.com/ollama/ollama/llama/llama.go:173 +0xed fp=0xc0000a1c70 sp=0xc0000a1b88 pc=0x6521acdddc2d
github.com/ollama/ollama/runner/llamarunner.(*Server).processBatch(0xc0004dd4a0, 0xc0006b1d60, 0xc0006b1db0)
        github.com/ollama/ollama/runner/llamarunner/runner.go:494 +0x250 fp=0xc0000a1ee8 sp=0xc0000a1c70 pc=0x6521ace95870
github.com/ollama/ollama/runner/llamarunner.(*Server).run(0xc0004dd4a0, {0x6521ae392350, 0xc0006b1770})
        github.com/ollama/ollama/runner/llamarunner/runner.go:387 +0x1d5 fp=0xc0000a1fb8 sp=0xc0000a1ee8 pc=0x6521ace954b5
github.com/ollama/ollama/runner/llamarunner.Execute.gowrap1()
        github.com/ollama/ollama/runner/llamarunner/runner.go:981 +0x28 fp=0xc0000a1fe0 sp=0xc0000a1fb8 pc=0x6521ace9a888
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc0000a1fe8 sp=0xc0000a1fe0 pc=0x6521ac924341
created by github.com/ollama/ollama/runner/llamarunner.Execute in goroutine 1
        github.com/ollama/ollama/runner/llamarunner/runner.go:981 +0x4c5

goroutine 1 gp=0xc000002380 m=nil [IO wait]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000127778 sp=0xc000127758 pc=0x6521ac91c24e
runtime.netpollblock(0xc0001277c8?, 0xac8b5806?, 0x21?)
        runtime/netpoll.go:575 +0xf7 fp=0xc0001277b0 sp=0xc000127778 pc=0x6521ac8e13f7
internal/poll.runtime_pollWait(0x7937b58b96d0, 0x72)
        runtime/netpoll.go:351 +0x85 fp=0xc0001277d0 sp=0xc0001277b0 pc=0x6521ac91b465
internal/poll.(*pollDesc).wait(0xc0004c4980?, 0x900000036?, 0x0)
        internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc0001277f8 sp=0xc0001277d0 pc=0x6521ac9a3967
internal/poll.(*pollDesc).waitRead(...)
        internal/poll/fd_poll_runtime.go:89
internal/poll.(*FD).Accept(0xc0004c4980)
        internal/poll/fd_unix.go:620 +0x295 fp=0xc0001278a0 sp=0xc0001277f8 pc=0x6521ac9a8d35
net.(*netFD).accept(0xc0004c4980)
        net/fd_unix.go:172 +0x29 fp=0xc000127958 sp=0xc0001278a0 pc=0x6521aca1c229
net.(*TCPListener).accept(0xc000379340)
        net/tcpsock_posix.go:159 +0x1b fp=0xc0001279a8 sp=0xc000127958 pc=0x6521aca3213b
net.(*TCPListener).Accept(0xc000379340)
        net/tcpsock.go:380 +0x30 fp=0xc0001279d8 sp=0xc0001279a8 pc=0x6521aca30ff0
net/http.(*onceCloseListener).Accept(0xc0004da510?)
        <autogenerated>:1 +0x24 fp=0xc0001279f0 sp=0xc0001279d8 pc=0x6521acc58604
net/http.(*Server).Serve(0xc00046b700, {0x6521ae38f900, 0xc000379340})
        net/http/server.go:3424 +0x30c fp=0xc000127b20 sp=0xc0001279f0 pc=0x6521acc2fecc
github.com/ollama/ollama/runner/llamarunner.Execute({0xc000034260, 0x4, 0x4})
        github.com/ollama/ollama/runner/llamarunner/runner.go:1002 +0x8f5 fp=0xc000127cf0 sp=0xc000127b20 pc=0x6521ace9a615
github.com/ollama/ollama/runner.Execute({0xc000034250?, 0x0?, 0x0?})
        github.com/ollama/ollama/runner/runner.go:25 +0x190 fp=0xc000127d30 sp=0xc000127cf0 pc=0x6521ad01e1d0
github.com/ollama/ollama/cmd.NewCLI.func3(0xc00046b300?, {0x6521add5b25f?, 0x4?, 0x6521add5b263?})
        github.com/ollama/ollama/cmd/cmd.go:2273 +0x45 fp=0xc000127d58 sp=0xc000127d30 pc=0x6521ad849e85
github.com/spf13/cobra.(*Command).execute(0xc0004dfb08, {0xc000379180, 0x4, 0x4})
        github.com/spf13/cobra@v1.7.0/command.go:940 +0x85c fp=0xc000127e78 sp=0xc000127d58 pc=0x6521aca961bc
github.com/spf13/cobra.(*Command).ExecuteC(0xc0006dd508)
        github.com/spf13/cobra@v1.7.0/command.go:1068 +0x3a5 fp=0xc000127f30 sp=0xc000127e78 pc=0x6521aca96a05
github.com/spf13/cobra.(*Command).Execute(...)
        github.com/spf13/cobra@v1.7.0/command.go:992
github.com/spf13/cobra.(*Command).ExecuteContext(...)
        github.com/spf13/cobra@v1.7.0/command.go:985
main.main()
        github.com/ollama/ollama/main.go:12 +0x4d fp=0xc000127f50 sp=0xc000127f30 pc=0x6521ad84b92d
runtime.main()
        runtime/proc.go:283 +0x29d fp=0xc000127fe0 sp=0xc000127f50 pc=0x6521ac8e8a7d
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000127fe8 sp=0xc000127fe0 pc=0x6521ac924341

goroutine 2 gp=0xc000002e00 m=nil [force gc (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00008efa8 sp=0xc00008ef88 pc=0x6521ac91c24e
runtime.goparkunlock(...)
        runtime/proc.go:441
runtime.forcegchelper()
        runtime/proc.go:348 +0xb8 fp=0xc00008efe0 sp=0xc00008efa8 pc=0x6521ac8e8db8
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00008efe8 sp=0xc00008efe0 pc=0x6521ac924341
created by runtime.init.7 in goroutine 1
        runtime/proc.go:336 +0x1a

goroutine 3 gp=0xc000003340 m=nil [GC sweep wait]:
runtime.gopark(0x1?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00008f780 sp=0xc00008f760 pc=0x6521ac91c24e
runtime.goparkunlock(...)
        runtime/proc.go:441
runtime.bgsweep(0xc00004a080)
        runtime/mgcsweep.go:316 +0xdf fp=0xc00008f7c8 sp=0xc00008f780 pc=0x6521ac8d355f
runtime.gcenable.gowrap1()
        runtime/mgc.go:204 +0x25 fp=0xc00008f7e0 sp=0xc00008f7c8 pc=0x6521ac8c7945
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00008f7e8 sp=0xc00008f7e0 pc=0x6521ac924341
created by runtime.gcenable in goroutine 1
        runtime/mgc.go:204 +0x66

goroutine 4 gp=0xc000003500 m=nil [GC scavenge wait]:
runtime.gopark(0x10000?, 0x6521adf81528?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00008ff78 sp=0xc00008ff58 pc=0x6521ac91c24e
runtime.goparkunlock(...)
        runtime/proc.go:441
runtime.(*scavengerState).park(0x6521aee00120)
        runtime/mgcscavenge.go:425 +0x49 fp=0xc00008ffa8 sp=0xc00008ff78 pc=0x6521ac8d0fa9
runtime.bgscavenge(0xc00004a080)
        runtime/mgcscavenge.go:658 +0x59 fp=0xc00008ffc8 sp=0xc00008ffa8 pc=0x6521ac8d1539
runtime.gcenable.gowrap2()
        runtime/mgc.go:205 +0x25 fp=0xc00008ffe0 sp=0xc00008ffc8 pc=0x6521ac8c78e5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00008ffe8 sp=0xc00008ffe0 pc=0x6521ac924341
created by runtime.gcenable in goroutine 1
        runtime/mgc.go:205 +0xa5

goroutine 5 gp=0xc000003dc0 m=nil [finalizer wait]:
runtime.gopark(0x1b8?, 0xc000002380?, 0x1?, 0x23?, 0xc00008e688?)
        runtime/proc.go:435 +0xce fp=0xc00008e630 sp=0xc00008e610 pc=0x6521ac91c24e
runtime.runfinq()
        runtime/mfinal.go:196 +0x107 fp=0xc00008e7e0 sp=0xc00008e630 pc=0x6521ac8c6907
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00008e7e8 sp=0xc00008e7e0 pc=0x6521ac924341
created by runtime.createfing in goroutine 1
        runtime/mfinal.go:166 +0x3d

goroutine 6 gp=0xc0001ea8c0 m=nil [chan receive]:
runtime.gopark(0xc000193cc0?, 0xc000692018?, 0x60?, 0x7?, 0x6521aca02d88?)
        runtime/proc.go:435 +0xce fp=0xc000090718 sp=0xc0000906f8 pc=0x6521ac91c24e
runtime.chanrecv(0xc0000c4310, 0x0, 0x1)
        runtime/chan.go:664 +0x445 fp=0xc000090790 sp=0xc000090718 pc=0x6521ac8b83e5
runtime.chanrecv1(0x0?, 0x0?)
        runtime/chan.go:506 +0x12 fp=0xc0000907b8 sp=0xc000090790 pc=0x6521ac8b7f72
runtime.unique_runtime_registerUniqueMapCleanup.func2(...)
        runtime/mgc.go:1796
runtime.unique_runtime_registerUniqueMapCleanup.gowrap1()
        runtime/mgc.go:1799 +0x2f fp=0xc0000907e0 sp=0xc0000907b8 pc=0x6521ac8caaef
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc0000907e8 sp=0xc0000907e0 pc=0x6521ac924341
created by unique.runtime_registerUniqueMapCleanup in goroutine 1
        runtime/mgc.go:1794 +0x85

goroutine 7 gp=0xc0001eac40 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000090f38 sp=0xc000090f18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc000090fc8 sp=0xc000090f38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc000090fe0 sp=0xc000090fc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000090fe8 sp=0xc000090fe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 18 gp=0xc000102380 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00008a738 sp=0xc00008a718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc00008a7c8 sp=0xc00008a738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc00008a7e0 sp=0xc00008a7c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00008a7e8 sp=0xc00008a7e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 19 gp=0xc000102540 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00008af38 sp=0xc00008af18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc00008afc8 sp=0xc00008af38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc00008afe0 sp=0xc00008afc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00008afe8 sp=0xc00008afe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 20 gp=0xc000102700 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00008b738 sp=0xc00008b718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc00008b7c8 sp=0xc00008b738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc00008b7e0 sp=0xc00008b7c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00008b7e8 sp=0xc00008b7e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 34 gp=0xc000504000 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00050a738 sp=0xc00050a718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc00050a7c8 sp=0xc00050a738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc00050a7e0 sp=0xc00050a7c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00050a7e8 sp=0xc00050a7e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 8 gp=0xc0001eae00 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000091738 sp=0xc000091718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc0000917c8 sp=0xc000091738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc0000917e0 sp=0xc0000917c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc0000917e8 sp=0xc0000917e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 9 gp=0xc0001eafc0 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000091f38 sp=0xc000091f18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc000091fc8 sp=0xc000091f38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc000091fe0 sp=0xc000091fc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000091fe8 sp=0xc000091fe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 10 gp=0xc0001eb180 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000506738 sp=0xc000506718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc0005067c8 sp=0xc000506738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc0005067e0 sp=0xc0005067c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc0005067e8 sp=0xc0005067e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 11 gp=0xc0001eb340 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000506f38 sp=0xc000506f18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc000506fc8 sp=0xc000506f38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc000506fe0 sp=0xc000506fc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000506fe8 sp=0xc000506fe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 12 gp=0xc0001eb500 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000507738 sp=0xc000507718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc0005077c8 sp=0xc000507738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc0005077e0 sp=0xc0005077c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc0005077e8 sp=0xc0005077e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 13 gp=0xc0001eb6c0 m=nil [GC worker (idle)]:
runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000507f38 sp=0xc000507f18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc000507fc8 sp=0xc000507f38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc000507fe0 sp=0xc000507fc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000507fe8 sp=0xc000507fe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 14 gp=0xc0001eb880 m=nil [GC worker (idle)]:
runtime.gopark(0x6521aeed6140?, 0x1?, 0x10?, 0x1e?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000508738 sp=0xc000508718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc0005087c8 sp=0xc000508738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc0005087e0 sp=0xc0005087c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc0005087e8 sp=0xc0005087e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 15 gp=0xc0001eba40 m=nil [GC worker (idle)]:
runtime.gopark(0x6521aeed6140?, 0x1?, 0x4f?, 0x29?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000508f38 sp=0xc000508f18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc000508fc8 sp=0xc000508f38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc000508fe0 sp=0xc000508fc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000508fe8 sp=0xc000508fe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 16 gp=0xc0001ebc00 m=nil [GC worker (idle)]:
runtime.gopark(0x28037b5299897?, 0x3?, 0x52?, 0xc6?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000509738 sp=0xc000509718 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc0005097c8 sp=0xc000509738 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc0005097e0 sp=0xc0005097c8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc0005097e8 sp=0xc0005097e0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 50 gp=0xc0001ebdc0 m=nil [GC worker (idle)]:
runtime.gopark(0x6521aeed6140?, 0x1?, 0xe9?, 0x9b?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc000509f38 sp=0xc000509f18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc000509fc8 sp=0xc000509f38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc000509fe0 sp=0xc000509fc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000509fe8 sp=0xc000509fe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 35 gp=0xc0005041c0 m=nil [GC worker (idle)]:
runtime.gopark(0x28037b5299869?, 0x1?, 0xde?, 0x64?, 0x0?)
        runtime/proc.go:435 +0xce fp=0xc00050af38 sp=0xc00050af18 pc=0x6521ac91c24e
runtime.gcBgMarkWorker(0xc0000c5730)
        runtime/mgc.go:1423 +0xe9 fp=0xc00050afc8 sp=0xc00050af38 pc=0x6521ac8c9e09
runtime.gcBgMarkStartWorkers.gowrap1()
        runtime/mgc.go:1339 +0x25 fp=0xc00050afe0 sp=0xc00050afc8 pc=0x6521ac8c9ce5
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00050afe8 sp=0xc00050afe0 pc=0x6521ac924341
created by runtime.gcBgMarkStartWorkers in goroutine 1
        runtime/mgc.go:1339 +0x105

goroutine 52 gp=0xc000583180 m=nil [chan receive]:
runtime.gopark(0x6521ac922354?, 0xc0000578d0?, 0x90?, 0xbd?, 0xc0000578b8?)
        runtime/proc.go:435 +0xce fp=0xc000057898 sp=0xc000057878 pc=0x6521ac91c24e
runtime.chanrecv(0xc000463490, 0xc000057a70, 0x1)
        runtime/chan.go:664 +0x445 fp=0xc000057910 sp=0xc000057898 pc=0x6521ac8b83e5
runtime.chanrecv1(0xc00011c9c0?, 0xc0004c4c00?)
        runtime/chan.go:506 +0x12 fp=0xc000057938 sp=0xc000057910 pc=0x6521ac8b7f72
github.com/ollama/ollama/runner/llamarunner.(*Server).embeddings(0xc0004dd4a0, {0x6521ae38fae0, 0xc0006c5b20}, 0xc0004d7540)
        github.com/ollama/ollama/runner/llamarunner/runner.go:807 +0x72d fp=0xc000057ac0 sp=0xc000057938 pc=0x6521ace983cd
github.com/ollama/ollama/runner/llamarunner.(*Server).embeddings-fm({0x6521ae38fae0?, 0xc0006c5b20?}, 0xc000057b40?)
        <autogenerated>:1 +0x36 fp=0xc000057af0 sp=0xc000057ac0 pc=0x6521ace9ac16
net/http.HandlerFunc.ServeHTTP(0xc0006b8780?, {0x6521ae38fae0?, 0xc0006c5b20?}, 0xc000057b60?)
        net/http/server.go:2294 +0x29 fp=0xc000057b18 sp=0xc000057af0 pc=0x6521acc2c509
net/http.(*ServeMux).ServeHTTP(0x6521ac8c0e25?, {0x6521ae38fae0, 0xc0006c5b20}, 0xc0004d7540)
        net/http/server.go:2822 +0x1c4 fp=0xc000057b68 sp=0xc000057b18 pc=0x6521acc2e404
net/http.serverHandler.ServeHTTP({0x6521ae38bb70?}, {0x6521ae38fae0?, 0xc0006c5b20?}, 0x1?)
        net/http/server.go:3301 +0x8e fp=0xc000057b98 sp=0xc000057b68 pc=0x6521acc4be8e
net/http.(*conn).serve(0xc0004da510, {0x6521ae392318, 0xc0004d9590})
        net/http/server.go:2102 +0x625 fp=0xc000057fb8 sp=0xc000057b98 pc=0x6521acc2aa05
net/http.(*Server).Serve.gowrap3()
        net/http/server.go:3454 +0x28 fp=0xc000057fe0 sp=0xc000057fb8 pc=0x6521acc302c8
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc000057fe8 sp=0xc000057fe0 pc=0x6521ac924341
created by net/http.(*Server).Serve in goroutine 1
        net/http/server.go:3454 +0x485

goroutine 59 gp=0xc0005836c0 m=nil [IO wait]:
runtime.gopark(0x0?, 0x0?, 0xa0?, 0xf1?, 0xb?)
        runtime/proc.go:435 +0xce fp=0xc00050bdd8 sp=0xc00050bdb8 pc=0x6521ac91c24e
runtime.netpollblock(0x6521ac93fc78?, 0xac8b5806?, 0x21?)
        runtime/netpoll.go:575 +0xf7 fp=0xc00050be10 sp=0xc00050bdd8 pc=0x6521ac8e13f7
internal/poll.runtime_pollWait(0x7937b58b95b8, 0x72)
        runtime/netpoll.go:351 +0x85 fp=0xc00050be30 sp=0xc00050be10 pc=0x6521ac91b465
internal/poll.(*pollDesc).wait(0xc0004c4a00?, 0xc0004d9691?, 0x0)
        internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc00050be58 sp=0xc00050be30 pc=0x6521ac9a3967
internal/poll.(*pollDesc).waitRead(...)
        internal/poll/fd_poll_runtime.go:89
internal/poll.(*FD).Read(0xc0004c4a00, {0xc0004d9691, 0x1, 0x1})
        internal/poll/fd_unix.go:165 +0x27a fp=0xc00050bef0 sp=0xc00050be58 pc=0x6521ac9a4c5a
net.(*netFD).Read(0xc0004c4a00, {0xc0004d9691?, 0xc000379418?, 0xc00050bf70?})
        net/fd_posix.go:55 +0x25 fp=0xc00050bf38 sp=0xc00050bef0 pc=0x6521aca1a285
net.(*conn).Read(0xc000160610, {0xc0004d9691?, 0x0?, 0xc0000c53b0?})
        net/net.go:194 +0x45 fp=0xc00050bf80 sp=0xc00050bf38 pc=0x6521aca28645
net/http.(*connReader).backgroundRead(0xc0004d9680)
        net/http/server.go:690 +0x37 fp=0xc00050bfc8 sp=0xc00050bf80 pc=0x6521acc248d7
net/http.(*connReader).startBackgroundRead.gowrap2()
        net/http/server.go:686 +0x25 fp=0xc00050bfe0 sp=0xc00050bfc8 pc=0x6521acc24805
runtime.goexit({})
        runtime/asm_amd64.s:1700 +0x1 fp=0xc00050bfe8 sp=0xc00050bfe0 pc=0x6521ac924341
created by net/http.(*connReader).startBackgroundRead in goroutine 52
        net/http/server.go:686 +0xb6

rax    0x0
rbx    0x29619e
rcx    0x7937b569eb2c
rdx    0x6
rdi    0x296198
rsi    0x29619e
rbp    0x7937673feec0
rsp    0x7937673fee80
r8     0x0
r9     0x7
r10    0x8
r11    0x246
r12    0x6
r13    0x6521adfeb92c
r14    0x16
r15    0x1
rip    0x7937b569eb2c
rflags 0x246
cs     0x33
fs     0x0
gs     0x0
time=2026-03-31T12:01:30.772+09:00 level=ERROR source=server.go:304 msg="llama runner terminated" error="exit status 2"
[GIN] 2026/03/31 - 12:01:30 | 400 |  2.485840802s |       127.0.0.1 | POST     "/api/embed"

OS

Linux

GPU

Other

CPU

Intel

Ollama version

0.18.3

Originally created by @jclab-joseph on GitHub (Mar 31, 2026). Original GitHub issue: https://github.com/ollama/ollama/issues/15161 ### What is the issue? I attempted to embedding with hf.co/DevQuasar/Qwen.Qwen3-VL-Embedding-2B-GGUF:Q8_0 but it failed. https://github.com/ollama/ollama/issues/14503#issuecomment-4133511574 does not work. ### Relevant log output ```shell ... load_hparams: model size: 781.42 MiB load_hparams: metadata size: 0.11 MiB load_tensors: loaded 316 tensors from /home/joseph/.ollama/models/blobs/sha256-3f89a7768ffa6606935319f71bf56bb71871249ba549bf1080a0caea7a088613 warmup: warmup with image size = 1472 x 1472 alloc_compute_meta: CPU compute buffer size = 322.49 MiB alloc_compute_meta: graph splits = 1, nodes = 766 warmup: flash attention is enabled time=2026-03-31T12:01:30.210+09:00 level=INFO source=server.go:1390 msg="llama runner started in 1.53 seconds" time=2026-03-31T12:01:30.210+09:00 level=INFO source=sched.go:561 msg="loaded runners" count=1 time=2026-03-31T12:01:30.210+09:00 level=INFO source=server.go:1352 msg="waiting for llama runner to start responding" time=2026-03-31T12:01:30.211+09:00 level=INFO source=server.go:1390 msg="llama runner started in 1.53 seconds" llama-context.cpp:1238: GGML_ASSERT((n_outputs_prev + n_outputs)*n_embd <= (int64_t) embd_size) failed [New LWP 2711968] [New LWP 2711967] [New LWP 2711966] [New LWP 2711965] [New LWP 2711964] [New LWP 2711963] [New LWP 2711962] [New LWP 2711961] [Thread debugging using libthread_db enabled] Using host libthread_db library "/lib/x86_64-linux-gnu/libthread_db.so.1". 0x00006521ac926143 in ?? () #0 0x00006521ac926143 in ?? () #1 0x00006521ac8e2110 in ?? () #2 0x00006521aee060a0 in ?? () #3 0x0000000000000080 in ?? () #4 0x0000000000000000 in ?? 
() [Inferior 1 (process 2711960) detached] SIGABRT: abort PC=0x7937b569eb2c m=7 sigcode=18446744073709551610 signal arrived during cgo execution goroutine 51 gp=0xc000582fc0 m=7 mp=0xc000580008 [syscall]: runtime.cgocall(0x6521ada15630, 0xc0000a1b88) runtime/cgocall.go:167 +0x4b fp=0xc0000a1b60 sp=0xc0000a1b28 pc=0x6521ac918dcb github.com/ollama/ollama/llama._Cfunc_llama_decode(0x79373e68dd20, {0x3, 0x79373c013810, 0x0, 0x79373c00dd30, 0x79373c010bf0, 0x79373cade2a0, 0x79373cb3c4a0}) _cgo_gotypes.go:685 +0x4a fp=0xc0000a1b88 sp=0xc0000a1b60 pc=0x6521acddab0a github.com/ollama/ollama/llama.(*Context).Decode.func1(...) github.com/ollama/ollama/llama/llama.go:173 github.com/ollama/ollama/llama.(*Context).Decode(0xc000379740?, 0x1?) github.com/ollama/ollama/llama/llama.go:173 +0xed fp=0xc0000a1c70 sp=0xc0000a1b88 pc=0x6521acdddc2d github.com/ollama/ollama/runner/llamarunner.(*Server).processBatch(0xc0004dd4a0, 0xc0006b1d60, 0xc0006b1db0) github.com/ollama/ollama/runner/llamarunner/runner.go:494 +0x250 fp=0xc0000a1ee8 sp=0xc0000a1c70 pc=0x6521ace95870 github.com/ollama/ollama/runner/llamarunner.(*Server).run(0xc0004dd4a0, {0x6521ae392350, 0xc0006b1770}) github.com/ollama/ollama/runner/llamarunner/runner.go:387 +0x1d5 fp=0xc0000a1fb8 sp=0xc0000a1ee8 pc=0x6521ace954b5 github.com/ollama/ollama/runner/llamarunner.Execute.gowrap1() github.com/ollama/ollama/runner/llamarunner/runner.go:981 +0x28 fp=0xc0000a1fe0 sp=0xc0000a1fb8 pc=0x6521ace9a888 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc0000a1fe8 sp=0xc0000a1fe0 pc=0x6521ac924341 created by github.com/ollama/ollama/runner/llamarunner.Execute in goroutine 1 github.com/ollama/ollama/runner/llamarunner/runner.go:981 +0x4c5 goroutine 1 gp=0xc000002380 m=nil [IO wait]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000127778 sp=0xc000127758 pc=0x6521ac91c24e runtime.netpollblock(0xc0001277c8?, 0xac8b5806?, 0x21?) 
runtime/netpoll.go:575 +0xf7 fp=0xc0001277b0 sp=0xc000127778 pc=0x6521ac8e13f7 internal/poll.runtime_pollWait(0x7937b58b96d0, 0x72) runtime/netpoll.go:351 +0x85 fp=0xc0001277d0 sp=0xc0001277b0 pc=0x6521ac91b465 internal/poll.(*pollDesc).wait(0xc0004c4980?, 0x900000036?, 0x0) internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc0001277f8 sp=0xc0001277d0 pc=0x6521ac9a3967 internal/poll.(*pollDesc).waitRead(...) internal/poll/fd_poll_runtime.go:89 internal/poll.(*FD).Accept(0xc0004c4980) internal/poll/fd_unix.go:620 +0x295 fp=0xc0001278a0 sp=0xc0001277f8 pc=0x6521ac9a8d35 net.(*netFD).accept(0xc0004c4980) net/fd_unix.go:172 +0x29 fp=0xc000127958 sp=0xc0001278a0 pc=0x6521aca1c229 net.(*TCPListener).accept(0xc000379340) net/tcpsock_posix.go:159 +0x1b fp=0xc0001279a8 sp=0xc000127958 pc=0x6521aca3213b net.(*TCPListener).Accept(0xc000379340) net/tcpsock.go:380 +0x30 fp=0xc0001279d8 sp=0xc0001279a8 pc=0x6521aca30ff0 net/http.(*onceCloseListener).Accept(0xc0004da510?) <autogenerated>:1 +0x24 fp=0xc0001279f0 sp=0xc0001279d8 pc=0x6521acc58604 net/http.(*Server).Serve(0xc00046b700, {0x6521ae38f900, 0xc000379340}) net/http/server.go:3424 +0x30c fp=0xc000127b20 sp=0xc0001279f0 pc=0x6521acc2fecc github.com/ollama/ollama/runner/llamarunner.Execute({0xc000034260, 0x4, 0x4}) github.com/ollama/ollama/runner/llamarunner/runner.go:1002 +0x8f5 fp=0xc000127cf0 sp=0xc000127b20 pc=0x6521ace9a615 github.com/ollama/ollama/runner.Execute({0xc000034250?, 0x0?, 0x0?}) github.com/ollama/ollama/runner/runner.go:25 +0x190 fp=0xc000127d30 sp=0xc000127cf0 pc=0x6521ad01e1d0 github.com/ollama/ollama/cmd.NewCLI.func3(0xc00046b300?, {0x6521add5b25f?, 0x4?, 0x6521add5b263?}) github.com/ollama/ollama/cmd/cmd.go:2273 +0x45 fp=0xc000127d58 sp=0xc000127d30 pc=0x6521ad849e85 github.com/spf13/cobra.(*Command).execute(0xc0004dfb08, {0xc000379180, 0x4, 0x4}) github.com/spf13/cobra@v1.7.0/command.go:940 +0x85c fp=0xc000127e78 sp=0xc000127d58 pc=0x6521aca961bc github.com/spf13/cobra.(*Command).ExecuteC(0xc0006dd508) 
github.com/spf13/cobra@v1.7.0/command.go:1068 +0x3a5 fp=0xc000127f30 sp=0xc000127e78 pc=0x6521aca96a05 github.com/spf13/cobra.(*Command).Execute(...) github.com/spf13/cobra@v1.7.0/command.go:992 github.com/spf13/cobra.(*Command).ExecuteContext(...) github.com/spf13/cobra@v1.7.0/command.go:985 main.main() github.com/ollama/ollama/main.go:12 +0x4d fp=0xc000127f50 sp=0xc000127f30 pc=0x6521ad84b92d runtime.main() runtime/proc.go:283 +0x29d fp=0xc000127fe0 sp=0xc000127f50 pc=0x6521ac8e8a7d runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000127fe8 sp=0xc000127fe0 pc=0x6521ac924341 goroutine 2 gp=0xc000002e00 m=nil [force gc (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc00008efa8 sp=0xc00008ef88 pc=0x6521ac91c24e runtime.goparkunlock(...) runtime/proc.go:441 runtime.forcegchelper() runtime/proc.go:348 +0xb8 fp=0xc00008efe0 sp=0xc00008efa8 pc=0x6521ac8e8db8 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00008efe8 sp=0xc00008efe0 pc=0x6521ac924341 created by runtime.init.7 in goroutine 1 runtime/proc.go:336 +0x1a goroutine 3 gp=0xc000003340 m=nil [GC sweep wait]: runtime.gopark(0x1?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc00008f780 sp=0xc00008f760 pc=0x6521ac91c24e runtime.goparkunlock(...) runtime/proc.go:441 runtime.bgsweep(0xc00004a080) runtime/mgcsweep.go:316 +0xdf fp=0xc00008f7c8 sp=0xc00008f780 pc=0x6521ac8d355f runtime.gcenable.gowrap1() runtime/mgc.go:204 +0x25 fp=0xc00008f7e0 sp=0xc00008f7c8 pc=0x6521ac8c7945 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00008f7e8 sp=0xc00008f7e0 pc=0x6521ac924341 created by runtime.gcenable in goroutine 1 runtime/mgc.go:204 +0x66 goroutine 4 gp=0xc000003500 m=nil [GC scavenge wait]: runtime.gopark(0x10000?, 0x6521adf81528?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc00008ff78 sp=0xc00008ff58 pc=0x6521ac91c24e runtime.goparkunlock(...) 
runtime/proc.go:441 runtime.(*scavengerState).park(0x6521aee00120) runtime/mgcscavenge.go:425 +0x49 fp=0xc00008ffa8 sp=0xc00008ff78 pc=0x6521ac8d0fa9 runtime.bgscavenge(0xc00004a080) runtime/mgcscavenge.go:658 +0x59 fp=0xc00008ffc8 sp=0xc00008ffa8 pc=0x6521ac8d1539 runtime.gcenable.gowrap2() runtime/mgc.go:205 +0x25 fp=0xc00008ffe0 sp=0xc00008ffc8 pc=0x6521ac8c78e5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00008ffe8 sp=0xc00008ffe0 pc=0x6521ac924341 created by runtime.gcenable in goroutine 1 runtime/mgc.go:205 +0xa5 goroutine 5 gp=0xc000003dc0 m=nil [finalizer wait]: runtime.gopark(0x1b8?, 0xc000002380?, 0x1?, 0x23?, 0xc00008e688?) runtime/proc.go:435 +0xce fp=0xc00008e630 sp=0xc00008e610 pc=0x6521ac91c24e runtime.runfinq() runtime/mfinal.go:196 +0x107 fp=0xc00008e7e0 sp=0xc00008e630 pc=0x6521ac8c6907 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00008e7e8 sp=0xc00008e7e0 pc=0x6521ac924341 created by runtime.createfing in goroutine 1 runtime/mfinal.go:166 +0x3d goroutine 6 gp=0xc0001ea8c0 m=nil [chan receive]: runtime.gopark(0xc000193cc0?, 0xc000692018?, 0x60?, 0x7?, 0x6521aca02d88?) runtime/proc.go:435 +0xce fp=0xc000090718 sp=0xc0000906f8 pc=0x6521ac91c24e runtime.chanrecv(0xc0000c4310, 0x0, 0x1) runtime/chan.go:664 +0x445 fp=0xc000090790 sp=0xc000090718 pc=0x6521ac8b83e5 runtime.chanrecv1(0x0?, 0x0?) runtime/chan.go:506 +0x12 fp=0xc0000907b8 sp=0xc000090790 pc=0x6521ac8b7f72 runtime.unique_runtime_registerUniqueMapCleanup.func2(...) runtime/mgc.go:1796 runtime.unique_runtime_registerUniqueMapCleanup.gowrap1() runtime/mgc.go:1799 +0x2f fp=0xc0000907e0 sp=0xc0000907b8 pc=0x6521ac8caaef runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc0000907e8 sp=0xc0000907e0 pc=0x6521ac924341 created by unique.runtime_registerUniqueMapCleanup in goroutine 1 runtime/mgc.go:1794 +0x85 goroutine 7 gp=0xc0001eac40 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) 
runtime/proc.go:435 +0xce fp=0xc000090f38 sp=0xc000090f18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc000090fc8 sp=0xc000090f38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc000090fe0 sp=0xc000090fc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000090fe8 sp=0xc000090fe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 18 gp=0xc000102380 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc00008a738 sp=0xc00008a718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc00008a7c8 sp=0xc00008a738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc00008a7e0 sp=0xc00008a7c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00008a7e8 sp=0xc00008a7e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 19 gp=0xc000102540 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc00008af38 sp=0xc00008af18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc00008afc8 sp=0xc00008af38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc00008afe0 sp=0xc00008afc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00008afe8 sp=0xc00008afe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 20 gp=0xc000102700 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) 
runtime/proc.go:435 +0xce fp=0xc00008b738 sp=0xc00008b718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc00008b7c8 sp=0xc00008b738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc00008b7e0 sp=0xc00008b7c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00008b7e8 sp=0xc00008b7e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 34 gp=0xc000504000 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc00050a738 sp=0xc00050a718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc00050a7c8 sp=0xc00050a738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc00050a7e0 sp=0xc00050a7c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00050a7e8 sp=0xc00050a7e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 8 gp=0xc0001eae00 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000091738 sp=0xc000091718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc0000917c8 sp=0xc000091738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc0000917e0 sp=0xc0000917c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc0000917e8 sp=0xc0000917e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 9 gp=0xc0001eafc0 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) 
runtime/proc.go:435 +0xce fp=0xc000091f38 sp=0xc000091f18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc000091fc8 sp=0xc000091f38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc000091fe0 sp=0xc000091fc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000091fe8 sp=0xc000091fe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 10 gp=0xc0001eb180 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000506738 sp=0xc000506718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc0005067c8 sp=0xc000506738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc0005067e0 sp=0xc0005067c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc0005067e8 sp=0xc0005067e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 11 gp=0xc0001eb340 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000506f38 sp=0xc000506f18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc000506fc8 sp=0xc000506f38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc000506fe0 sp=0xc000506fc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000506fe8 sp=0xc000506fe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 12 gp=0xc0001eb500 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) 
runtime/proc.go:435 +0xce fp=0xc000507738 sp=0xc000507718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc0005077c8 sp=0xc000507738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc0005077e0 sp=0xc0005077c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc0005077e8 sp=0xc0005077e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 13 gp=0xc0001eb6c0 m=nil [GC worker (idle)]: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000507f38 sp=0xc000507f18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc000507fc8 sp=0xc000507f38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc000507fe0 sp=0xc000507fc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000507fe8 sp=0xc000507fe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 14 gp=0xc0001eb880 m=nil [GC worker (idle)]: runtime.gopark(0x6521aeed6140?, 0x1?, 0x10?, 0x1e?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000508738 sp=0xc000508718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc0005087c8 sp=0xc000508738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc0005087e0 sp=0xc0005087c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc0005087e8 sp=0xc0005087e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 15 gp=0xc0001eba40 m=nil [GC worker (idle)]: runtime.gopark(0x6521aeed6140?, 0x1?, 0x4f?, 0x29?, 0x0?) 
runtime/proc.go:435 +0xce fp=0xc000508f38 sp=0xc000508f18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc000508fc8 sp=0xc000508f38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc000508fe0 sp=0xc000508fc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000508fe8 sp=0xc000508fe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 16 gp=0xc0001ebc00 m=nil [GC worker (idle)]: runtime.gopark(0x28037b5299897?, 0x3?, 0x52?, 0xc6?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000509738 sp=0xc000509718 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc0005097c8 sp=0xc000509738 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc0005097e0 sp=0xc0005097c8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc0005097e8 sp=0xc0005097e0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 50 gp=0xc0001ebdc0 m=nil [GC worker (idle)]: runtime.gopark(0x6521aeed6140?, 0x1?, 0xe9?, 0x9b?, 0x0?) runtime/proc.go:435 +0xce fp=0xc000509f38 sp=0xc000509f18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc000509fc8 sp=0xc000509f38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc000509fe0 sp=0xc000509fc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000509fe8 sp=0xc000509fe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 35 gp=0xc0005041c0 m=nil [GC worker (idle)]: runtime.gopark(0x28037b5299869?, 0x1?, 0xde?, 0x64?, 0x0?) 
runtime/proc.go:435 +0xce fp=0xc00050af38 sp=0xc00050af18 pc=0x6521ac91c24e runtime.gcBgMarkWorker(0xc0000c5730) runtime/mgc.go:1423 +0xe9 fp=0xc00050afc8 sp=0xc00050af38 pc=0x6521ac8c9e09 runtime.gcBgMarkStartWorkers.gowrap1() runtime/mgc.go:1339 +0x25 fp=0xc00050afe0 sp=0xc00050afc8 pc=0x6521ac8c9ce5 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00050afe8 sp=0xc00050afe0 pc=0x6521ac924341 created by runtime.gcBgMarkStartWorkers in goroutine 1 runtime/mgc.go:1339 +0x105 goroutine 52 gp=0xc000583180 m=nil [chan receive]: runtime.gopark(0x6521ac922354?, 0xc0000578d0?, 0x90?, 0xbd?, 0xc0000578b8?) runtime/proc.go:435 +0xce fp=0xc000057898 sp=0xc000057878 pc=0x6521ac91c24e runtime.chanrecv(0xc000463490, 0xc000057a70, 0x1) runtime/chan.go:664 +0x445 fp=0xc000057910 sp=0xc000057898 pc=0x6521ac8b83e5 runtime.chanrecv1(0xc00011c9c0?, 0xc0004c4c00?) runtime/chan.go:506 +0x12 fp=0xc000057938 sp=0xc000057910 pc=0x6521ac8b7f72 github.com/ollama/ollama/runner/llamarunner.(*Server).embeddings(0xc0004dd4a0, {0x6521ae38fae0, 0xc0006c5b20}, 0xc0004d7540) github.com/ollama/ollama/runner/llamarunner/runner.go:807 +0x72d fp=0xc000057ac0 sp=0xc000057938 pc=0x6521ace983cd github.com/ollama/ollama/runner/llamarunner.(*Server).embeddings-fm({0x6521ae38fae0?, 0xc0006c5b20?}, 0xc000057b40?) <autogenerated>:1 +0x36 fp=0xc000057af0 sp=0xc000057ac0 pc=0x6521ace9ac16 net/http.HandlerFunc.ServeHTTP(0xc0006b8780?, {0x6521ae38fae0?, 0xc0006c5b20?}, 0xc000057b60?) net/http/server.go:2294 +0x29 fp=0xc000057b18 sp=0xc000057af0 pc=0x6521acc2c509 net/http.(*ServeMux).ServeHTTP(0x6521ac8c0e25?, {0x6521ae38fae0, 0xc0006c5b20}, 0xc0004d7540) net/http/server.go:2822 +0x1c4 fp=0xc000057b68 sp=0xc000057b18 pc=0x6521acc2e404 net/http.serverHandler.ServeHTTP({0x6521ae38bb70?}, {0x6521ae38fae0?, 0xc0006c5b20?}, 0x1?) 
net/http/server.go:3301 +0x8e fp=0xc000057b98 sp=0xc000057b68 pc=0x6521acc4be8e net/http.(*conn).serve(0xc0004da510, {0x6521ae392318, 0xc0004d9590}) net/http/server.go:2102 +0x625 fp=0xc000057fb8 sp=0xc000057b98 pc=0x6521acc2aa05 net/http.(*Server).Serve.gowrap3() net/http/server.go:3454 +0x28 fp=0xc000057fe0 sp=0xc000057fb8 pc=0x6521acc302c8 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc000057fe8 sp=0xc000057fe0 pc=0x6521ac924341 created by net/http.(*Server).Serve in goroutine 1 net/http/server.go:3454 +0x485 goroutine 59 gp=0xc0005836c0 m=nil [IO wait]: runtime.gopark(0x0?, 0x0?, 0xa0?, 0xf1?, 0xb?) runtime/proc.go:435 +0xce fp=0xc00050bdd8 sp=0xc00050bdb8 pc=0x6521ac91c24e runtime.netpollblock(0x6521ac93fc78?, 0xac8b5806?, 0x21?) runtime/netpoll.go:575 +0xf7 fp=0xc00050be10 sp=0xc00050bdd8 pc=0x6521ac8e13f7 internal/poll.runtime_pollWait(0x7937b58b95b8, 0x72) runtime/netpoll.go:351 +0x85 fp=0xc00050be30 sp=0xc00050be10 pc=0x6521ac91b465 internal/poll.(*pollDesc).wait(0xc0004c4a00?, 0xc0004d9691?, 0x0) internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc00050be58 sp=0xc00050be30 pc=0x6521ac9a3967 internal/poll.(*pollDesc).waitRead(...) 
internal/poll/fd_poll_runtime.go:89 internal/poll.(*FD).Read(0xc0004c4a00, {0xc0004d9691, 0x1, 0x1}) internal/poll/fd_unix.go:165 +0x27a fp=0xc00050bef0 sp=0xc00050be58 pc=0x6521ac9a4c5a net.(*netFD).Read(0xc0004c4a00, {0xc0004d9691?, 0xc000379418?, 0xc00050bf70?}) net/fd_posix.go:55 +0x25 fp=0xc00050bf38 sp=0xc00050bef0 pc=0x6521aca1a285 net.(*conn).Read(0xc000160610, {0xc0004d9691?, 0x0?, 0xc0000c53b0?}) net/net.go:194 +0x45 fp=0xc00050bf80 sp=0xc00050bf38 pc=0x6521aca28645 net/http.(*connReader).backgroundRead(0xc0004d9680) net/http/server.go:690 +0x37 fp=0xc00050bfc8 sp=0xc00050bf80 pc=0x6521acc248d7 net/http.(*connReader).startBackgroundRead.gowrap2() net/http/server.go:686 +0x25 fp=0xc00050bfe0 sp=0xc00050bfc8 pc=0x6521acc24805 runtime.goexit({}) runtime/asm_amd64.s:1700 +0x1 fp=0xc00050bfe8 sp=0xc00050bfe0 pc=0x6521ac924341 created by net/http.(*connReader).startBackgroundRead in goroutine 52 net/http/server.go:686 +0xb6 rax 0x0 rbx 0x29619e rcx 0x7937b569eb2c rdx 0x6 rdi 0x296198 rsi 0x29619e rbp 0x7937673feec0 rsp 0x7937673fee80 r8 0x0 r9 0x7 r10 0x8 r11 0x246 r12 0x6 r13 0x6521adfeb92c r14 0x16 r15 0x1 rip 0x7937b569eb2c rflags 0x246 cs 0x33 fs 0x0 gs 0x0 time=2026-03-31T12:01:30.772+09:00 level=ERROR source=server.go:304 msg="llama runner terminated" error="exit status 2" [GIN] 2026/03/31 - 12:01:30 | 400 | 2.485840802s | 127.0.0.1 | POST "/api/embed" ``` ### OS Linux ### GPU Other ### CPU Intel ### Ollama version 0.18.3
GiteaMirror added the bug label 2026-04-22 19:57:53 -05:00
Author
Owner

@rick-github commented on GitHub (Mar 31, 2026):

Ollama doesn't currently support multi-modal embedding models.

<!-- gh-comment-id:4160298633 --> @rick-github commented on GitHub (Mar 31, 2026): Ollama doesn't currently support multi-modal embedding models.
Sign in to join this conversation.
1 Participant
Notifications
Due Date
No due date set.
Dependencies

No dependencies set.

Reference: github-starred/ollama#35464