mirror of
https://github.com/ollama/ollama.git
synced 2026-05-08 00:51:34 -05:00
Closed
opened 2026-05-04 09:32:24 -05:00 by GiteaMirror
·
4 comments
No Branch/Tag Specified
main
dhiltgen/ci
dhiltgen/llama-runner
parth-launch-codex-app
hoyyeva/anthropic-local-image-path
hoyyeva/anthropic-reference-images-path
parth-anthropic-reference-images-path
brucemacd/download-before-remove
hoyyeva/editor-config-repair
parth-mlx-decode-checkpoints
hoyyeva/fix-codex-model-metadata-warning
hoyyeva/qwen
parth/hide-claude-desktop-till-release
hoyyeva/opencode-image-modality
parth-add-claude-code-autoinstall
release_v0.22.0
pdevine/manifest-list
codex/fix-codex-model-metadata-warning
pdevine/addressable-manifest
brucemacd/launch-fetch-reccomended
jmorganca/llama-compat
launch-copilot-cli
hoyyeva/opencode-thinking
release_v0.20.7
parth-auto-save-backup
parth-test
jmorganca/gemma4-audio-replacements
fix-manifest-digest-on-pull
hoyyeva/vscode-improve
brucemacd/install-server-wait
parth/update-claude-docs
brucemac/start-ap-install
pdevine/mlx-update
pdevine/qwen35_vision
drifkin/api-show-fallback
mintlify/image-generation-1773352582
hoyyeva/server-context-length-local-config
jmorganca/faster-reptition-penalties
jmorganca/convert-nemotron
parth-pi-thinking
pdevine/sampling-penalties
jmorganca/fix-create-quantization-memory
dongchen/resumable_transfer_fix
pdevine/sampling-cache-error
jessegross/mlx-usage
hoyyeva/openclaw-config
hoyyeva/app-html
pdevine/qwen3next
brucemacd/sign-sh-install
brucemacd/tui-update
brucemacd/usage-api
jmorganca/launch-empty
fix-app-dist-embed
mxyng/mlx-compile
mxyng/mlx-quant
mxyng/mlx-glm4.7
mxyng/mlx
brucemacd/simplify-model-picker
jmorganca/qwen3-concurrent
fix-glm-4.7-flash-mla-config
drifkin/qwen3-coder-opening-tag
brucemacd/usage-cli
fix-cuda12-fattn-shmem
ollama-imagegen-docs
parth/fix-multiline-inputs
brucemacd/config-docs
mxyng/model-files
mxyng/simple-execute
fix-imagegen-ollama-models
mxyng/async-upload
jmorganca/lazy-no-dtype-changes
imagegen-auto-detect-create
parth/decrease-concurrent-download-hf
fix-mlx-quantize-init
jmorganca/x-cleanup
usage
imagegen-readme
jmorganca/glm-image
mlx-gpu-cd
jmorganca/imagegen-modelfile
parth/agent-skills
parth/agent-allowlist
parth/signed-in-offline
parth/agents
parth/fix-context-chopping
improve-cloud-flow
parth/add-models-websearch
parth/prompt-renderer-mcp
jmorganca/native-settings
jmorganca/download-stream-hash
jmorganca/client2-rebased
brucemacd/oai-chat-req-multipart
jessegross/multi_chunk_reserve
grace/additional-omit-empty
grace/mistral-3-large
mxyng/tokenizer2
mxyng/tokenizer
jessegross/flash
hoyyeva/windows-nacked-app
mxyng/cleanup-attention
grace/deepseek-parser
hoyyeva/remember-unsent-prompt
parth/add-lfs-pointer-error-conversion
parth/olmo2-test2
hoyyeva/ollama-launchagent-plist
nicole/olmo-model
parth/olmo-test
mxyng/remove-embedded
parth/render-template
jmorganca/intellect-3
parth/remove-prealloc-linter
jmorganca/cmd-eval
nicole/nomic-embed-text-fix
mxyng/lint-2
hoyyeva/add-gemini-3-pro-preview
hoyyeva/load-model-list
mxyng/expand-path
mxyng/environ-2
hoyyeva/deeplink-json-encoding
parth/improve-tool-calling-tests
hoyyeva/conversation
hoyyeva/assistant-edit-response
hoyyeva/thinking
origin/brucemacd/invalid-char-i-err
parth/improve-tool-calling
jmorganca/required-omitempty
grace/qwen3-vl-tests
mxyng/iter-client
parth/docs-readme
nicole/embed-test
pdevine/integration-benchstat
parth/remove-generate-cmd
parth/add-toolcall-id
mxyng/server-tests
jmorganca/glm-4.6
jmorganca/gin-h-compat
drifkin/stable-tool-args
pdevine/qwen3-more-thinking
parth/add-websearch-client
nicole/websearch_local
jmorganca/qwen3-coder-updates
grace/deepseek-v3-migration-tests
mxyng/fix-create
jmorganca/cloud-errors
pdevine/parser-tidy
revert-12233-parth/simplify-entrypoints-runner
parth/enable-so-gpt-oss
brucemacd/qwen3vl
jmorganca/readme-simplify
parth/gpt-oss-structured-outputs
revert-12039-jmorganca/tools-braces
mxyng/embeddings
mxyng/gguf
mxyng/benchmark
mxyng/types-null
parth/move-parsing
mxyng/gemma2
jmorganca/docs
mxyng/16-bit
mxyng/create-stdin
pdevine/authorizedkeys
mxyng/quant
parth/opt-in-error-context-window
brucemacd/cache-models
brucemacd/runner-completion
jmorganca/llama-update-6
brucemacd/benchmark-list
brucemacd/partial-read-caps
parth/deepseek-r1-tools
mxyng/omit-array
parth/tool-prefix-temp
brucemacd/runner-test
jmorganca/qwen25vl
brucemacd/model-forward-test-ext
parth/python-function-parsing
jmorganca/cuda-compression-none
drifkin/num-parallel
drifkin/chat-truncation-fix
jmorganca/sync
parth/python-tools-calling
drifkin/array-head-count
brucemacd/create-no-loop
parth/server-enable-content-stream-with-tools
qwen25omni
mxyng/v3
brucemacd/ropeconfig
jmorganca/silence-tokenizer
parth/sample-so-test
parth/sampling-structured-outputs
brucemacd/doc-go-engine
parth/constrained-sampling-json
jmorganca/mistral-wip
brucemacd/mistral-small-convert
parth/sample-unmarshal-json-for-params
brucemacd/jomorganca/mistral
pdevine/bfloat16
jmorganca/mistral
brucemacd/mistral
pdevine/logging
parth/sample-correctness-fix
parth/sample-fix-sorting
jmorgan/sample-fix-sorting-extras
jmorganca/temp-0-images
brucemacd/parallel-embed-models
brucemacd/shim-grammar
jmorganca/fix-gguf-error
bmizerany/nameswork
jmorganca/faster-releases
bmizerany/validatenames
brucemacd/err-no-vocab
brucemacd/rope-config
brucemacd/err-hint
brucemacd/qwen2_5
brucemacd/logprobs
brucemacd/new_runner_graph_bench
progress-flicker
brucemacd/forward-test
brucemacd/go_qwen2
pdevine/gemma2
jmorganca/add-missing-symlink-eval
mxyng/next-debug
parth/set-context-size-openai
brucemacd/next-bpe-bench
brucemacd/next-bpe-test
brucemacd/new_runner_e2e
brucemacd/new_runner_qwen2
pdevine/convert-cohere2
brucemacd/convert-cli
parth/log-probs
mxyng/next-mlx
mxyng/cmd-history
parth/templating
parth/tokenize-detokenize
brucemacd/check-key-register
bmizerany/grammar
jmorganca/vendor-081b29bd
mxyng/func-checks
jmorganca/fix-null-format
parth/fix-default-to-warn-json
jmorganca/qwen2vl
jmorganca/no-concat
parth/cmd-cleanup-SO
brucemacd/check-key-register-structured-err
parth/openai-stream-usage
parth/fix-referencing-so
stream-tools-stop
jmorganca/degin-1
brucemacd/install-path-clean
brucemacd/push-name-validation
brucemacd/browser-key-register
jmorganca/openai-fix-first-message
jmorganca/fix-proxy
jessegross/sample
parth/disallow-streaming-tools
dhiltgen/remove_submodule
jmorganca/ga
jmorganca/mllama
pdevine/newlines
pdevine/geems-2b
jmorganca/llama-bump
mxyng/modelname-7
mxyng/gin-slog
mxyng/modelname-6
jyan/convert-prog
jyan/quant5
paligemma-support
pdevine/import-docs
jmorganca/openai-context
jyan/paligemma
jyan/p2
jyan/palitest
bmizerany/embedspeedup
jmorganca/llama-vit
brucemacd/allow-ollama
royh/ep-methods
royh/whisper
mxyng/api-models
mxyng/fix-memory
jyan/q4_4/8
jyan/ollama-v
royh/stream-tools
roy-embed-parallel
bmizerany/hrm
revert-5963-revert-5924-mxyng/llama3.1-rope
royh/embed-viz
jyan/local2
jyan/auth
jyan/local
jyan/parse-temp
jmorganca/template-mistral
jyan/reord-g
royh-openai-suffixdocs
royh-imgembed
royh-embed-parallel
jyan/quant4
royh-precision
jyan/progress
pdevine/fix-template
jyan/quant3
pdevine/ggla
mxyng/update-registry-domain
jmorganca/ggml-static
mxyng/create-context
jyan/v0.146
mxyng/layers-from-files
build_dist
bmizerany/noseek
royh-ls
royh-name
timeout
mxyng/server-timestamp
bmizerany/nosillyggufslurps
royh-params
jmorganca/llama-cpp-7c26775
royh-openai-delete
royh-show-rigid
jmorganca/enable-fa
jmorganca/no-error-template
jyan/format
royh-testdelete
bmizerany/fastverify
language_support
pdevine/ps-glitches
brucemacd/tokenize
bruce/iq-quants
bmizerany/filepathwithcoloninhost
mxyng/split-bin
bmizerany/client-registry
jmorganca/if-none-match
native
jmorganca/native
jmorganca/batch-embeddings
jmorganca/initcmake
jmorganca/mm
pdevine/showggmlinfo
modenameenforcealphanum
bmizerany/modenameenforcealphanum
jmorganca/done-reason
jmorganca/llama-cpp-8960fe8
ollama.com
bmizerany/filepathnobuild
bmizerany/types/model/defaultfix
rmdisplaylong
nogogen
bmizerany/x
modelfile-readme
bmizerany/replacecolon
jmorganca/limit
jmorganca/execstack
jmorganca/replace-assets
mxyng/tune-concurrency
jmorganca/testing
whitespace-detection
jmorganca/options
upgrade-all
scratch
cuda-search
mattw/airenamer
mattw/allmodelsonhuggingface
mattw/quantcontext
mattw/whatneedstorun
brucemacd/llama-mem-calc
mattw/faq-context
mattw/communitylinks
mattw/noprune
mattw/python-functioncalling
rename
mxyng/install
pulse
remove-first
editor
mattw/selfqueryingretrieval
cgo
mattw/howtoquant
api
matt/streamingapi
format-config
mxyng/extra-args
shell
update-nous-hermes
cp-model
upload-progress
fix-unknown-model
fix-model-names
delete-fix
insecure-registry
ls
deletemodels
progressbar
readme-updates
license-layers
skip-list
list-models
modelpath
matt/examplemodelfiles
distribution
go-opts
v0.30.0-rc7
v0.30.0-rc6
v0.30.0-rc5
v0.23.2
v0.23.2-rc0
v0.30.0-rc4
v0.30.0-rc3
v0.30.0-rc2
v0.30.0-rc1
v0.30.0-rc0
v0.23.1
v0.23.1-rc0
v0.23.0
v0.23.0-rc0
v0.22.1
v0.22.1-rc1
v0.22.1-rc0
v0.22.0
v0.22.0-rc1
v0.21.3-rc0
v0.21.2-rc1
v0.21.2
v0.21.2-rc0
v0.21.1
v0.21.1-rc1
v0.21.1-rc0
v0.21.0
v0.21.0-rc1
v0.21.0-rc0
v0.20.8-rc0
v0.20.7
v0.20.7-rc1
v0.20.7-rc0
v0.20.6
v0.20.6-rc1
v0.20.6-rc0
v0.20.5
v0.20.5-rc2
v0.20.5-rc1
v0.20.5-rc0
v0.20.4
v0.20.4-rc2
v0.20.4-rc1
v0.20.4-rc0
v0.20.3
v0.20.3-rc0
v0.20.2
v0.20.1
v0.20.1-rc2
v0.20.1-rc1
v0.20.1-rc0
v0.20.0
v0.20.0-rc1
v0.20.0-rc0
v0.19.0
v0.19.0-rc2
v0.19.0-rc1
v0.19.0-rc0
v0.18.4-rc1
v0.18.4-rc0
v0.18.3
v0.18.3-rc2
v0.18.3-rc1
v0.18.3-rc0
v0.18.2
v0.18.2-rc1
v0.18.2-rc0
v0.18.1
v0.18.1-rc1
v0.18.1-rc0
v0.18.0
v0.18.0-rc2
v0.18.0-rc1
v0.18.0-rc0
v0.17.8-rc4
v0.17.8-rc3
v0.17.8-rc2
v0.17.8-rc1
v0.17.8-rc0
v0.17.7
v0.17.7-rc2
v0.17.7-rc1
v0.17.7-rc0
v0.17.6
v0.17.5
v0.17.4
v0.17.3
v0.17.2
v0.17.1
v0.17.1-rc2
v0.17.1-rc1
v0.17.1-rc0
v0.17.0
v0.17.0-rc2
v0.17.0-rc1
v0.17.0-rc0
v0.16.3
v0.16.3-rc2
v0.16.3-rc1
v0.16.3-rc0
v0.16.2
v0.16.2-rc0
v0.16.1
v0.16.0
v0.16.0-rc2
v0.16.0-rc0
v0.16.0-rc1
v0.15.6
v0.15.5
v0.15.5-rc5
v0.15.5-rc4
v0.15.5-rc3
v0.15.5-rc2
v0.15.5-rc1
v0.15.5-rc0
v0.15.4
v0.15.3
v0.15.2
v0.15.1
v0.15.1-rc1
v0.15.1-rc0
v0.15.0-rc6
v0.15.0
v0.15.0-rc5
v0.15.0-rc4
v0.15.0-rc3
v0.15.0-rc2
v0.15.0-rc1
v0.15.0-rc0
v0.14.3
v0.14.3-rc3
v0.14.3-rc2
v0.14.3-rc1
v0.14.3-rc0
v0.14.2
v0.14.2-rc1
v0.14.2-rc0
v0.14.1
v0.14.0-rc11
v0.14.0
v0.14.0-rc10
v0.14.0-rc9
v0.14.0-rc8
v0.14.0-rc7
v0.14.0-rc6
v0.14.0-rc5
v0.14.0-rc4
v0.14.0-rc3
v0.14.0-rc2
v0.14.0-rc1
v0.14.0-rc0
v0.13.5
v0.13.5-rc1
v0.13.5-rc0
v0.13.4-rc2
v0.13.4
v0.13.4-rc1
v0.13.4-rc0
v0.13.3
v0.13.3-rc1
v0.13.3-rc0
v0.13.2
v0.13.2-rc2
v0.13.2-rc1
v0.13.2-rc0
v0.13.1
v0.13.1-rc2
v0.13.1-rc1
v0.13.1-rc0
v0.13.0
v0.13.0-rc0
v0.12.11
v0.12.11-rc1
v0.12.11-rc0
v0.12.10
v0.12.10-rc1
v0.12.10-rc0
v0.12.9-rc0
v0.12.9
v0.12.8
v0.12.8-rc0
v0.12.7
v0.12.7-rc1
v0.12.7-rc0
v0.12.7-citest0
v0.12.6
v0.12.6-rc1
v0.12.6-rc0
v0.12.5
v0.12.5-rc0
v0.12.4
v0.12.4-rc7
v0.12.4-rc6
v0.12.4-rc5
v0.12.4-rc4
v0.12.4-rc3
v0.12.4-rc2
v0.12.4-rc1
v0.12.4-rc0
v0.12.3
v0.12.2
v0.12.2-rc0
v0.12.1
v0.12.1-rc1
v0.12.1-rc2
v0.12.1-rc0
v0.12.0
v0.12.0-rc1
v0.12.0-rc0
v0.11.11
v0.11.11-rc3
v0.11.11-rc2
v0.11.11-rc1
v0.11.11-rc0
v0.11.10
v0.11.9
v0.11.9-rc0
v0.11.8
v0.11.8-rc0
v0.11.7-rc1
v0.11.7-rc0
v0.11.7
v0.11.6
v0.11.6-rc0
v0.11.5-rc4
v0.11.5-rc3
v0.11.5
v0.11.5-rc5
v0.11.5-rc2
v0.11.5-rc1
v0.11.5-rc0
v0.11.4
v0.11.4-rc0
v0.11.3
v0.11.3-rc0
v0.11.2
v0.11.1
v0.11.0-rc0
v0.11.0-rc1
v0.11.0-rc2
v0.11.0
v0.10.2-int1
v0.10.1
v0.10.0
v0.10.0-rc4
v0.10.0-rc3
v0.10.0-rc2
v0.10.0-rc1
v0.10.0-rc0
v0.9.7-rc1
v0.9.7-rc0
v0.9.6
v0.9.6-rc0
v0.9.6-ci0
v0.9.5
v0.9.4-rc5
v0.9.4-rc6
v0.9.4
v0.9.4-rc3
v0.9.4-rc4
v0.9.4-rc1
v0.9.4-rc2
v0.9.4-rc0
v0.9.3
v0.9.3-rc5
v0.9.4-citest0
v0.9.3-rc4
v0.9.3-rc3
v0.9.3-rc2
v0.9.3-rc1
v0.9.3-rc0
v0.9.2
v0.9.1
v0.9.1-rc1
v0.9.1-rc0
v0.9.1-ci1
v0.9.1-ci0
v0.9.0
v0.9.0-rc0
v0.8.0
v0.8.0-rc0
v0.7.1-rc2
v0.7.1
v0.7.1-rc1
v0.7.1-rc0
v0.7.0
v0.7.0-rc1
v0.7.0-rc0
v0.6.9-rc0
v0.6.8
v0.6.8-rc0
v0.6.7
v0.6.7-rc2
v0.6.7-rc1
v0.6.7-rc0
v0.6.6
v0.6.6-rc2
v0.6.6-rc1
v0.6.6-rc0
v0.6.5-rc1
v0.6.5
v0.6.5-rc0
v0.6.4-rc0
v0.6.4
v0.6.3-rc1
v0.6.3
v0.6.3-rc0
v0.6.2
v0.6.2-rc0
v0.6.1
v0.6.1-rc0
v0.6.0-rc0
v0.6.0
v0.5.14-rc0
v0.5.13
v0.5.13-rc6
v0.5.13-rc5
v0.5.13-rc4
v0.5.13-rc3
v0.5.13-rc2
v0.5.13-rc1
v0.5.13-rc0
v0.5.12
v0.5.12-rc1
v0.5.12-rc0
v0.5.11
v0.5.10
v0.5.9
v0.5.9-rc0
v0.5.8-rc13
v0.5.8
v0.5.8-rc12
v0.5.8-rc11
v0.5.8-rc10
v0.5.8-rc9
v0.5.8-rc8
v0.5.8-rc7
v0.5.8-rc6
v0.5.8-rc5
v0.5.8-rc4
v0.5.8-rc3
v0.5.8-rc2
v0.5.8-rc1
v0.5.8-rc0
v0.5.7
v0.5.6
v0.5.5
v0.5.5-rc0
v0.5.4
v0.5.3
v0.5.3-rc0
v0.5.2
v0.5.2-rc3
v0.5.2-rc2
v0.5.2-rc1
v0.5.2-rc0
v0.5.1
v0.5.0
v0.5.0-rc1
v0.4.8-rc0
v0.4.7
v0.4.6
v0.4.5
v0.4.4
v0.4.3
v0.4.3-rc0
v0.4.2
v0.4.2-rc1
v0.4.2-rc0
v0.4.1
v0.4.1-rc0
v0.4.0
v0.4.0-rc8
v0.4.0-rc7
v0.4.0-rc6
v0.4.0-rc5
v0.4.0-rc4
v0.4.0-rc3
v0.4.0-rc2
v0.4.0-rc1
v0.4.0-rc0
v0.4.0-ci3
v0.3.14
v0.3.14-rc0
v0.3.13
v0.3.12
v0.3.12-rc5
v0.3.12-rc4
v0.3.12-rc3
v0.3.12-rc2
v0.3.12-rc1
v0.3.11
v0.3.11-rc4
v0.3.11-rc3
v0.3.11-rc2
v0.3.11-rc1
v0.3.10
v0.3.10-rc1
v0.3.9
v0.3.8
v0.3.7
v0.3.7-rc6
v0.3.7-rc5
v0.3.7-rc4
v0.3.7-rc3
v0.3.7-rc2
v0.3.7-rc1
v0.3.6
v0.3.5
v0.3.4
v0.3.3
v0.3.2
v0.3.1
v0.3.0
v0.2.8
v0.2.8-rc2
v0.2.8-rc1
v0.2.7
v0.2.6
v0.2.5
v0.2.4
v0.2.3
v0.2.2
v0.2.2-rc2
v0.2.2-rc1
v0.2.1
v0.2.0
v0.1.49-rc14
v0.1.49-rc13
v0.1.49-rc12
v0.1.49-rc11
v0.1.49-rc10
v0.1.49-rc9
v0.1.49-rc8
v0.1.49-rc7
v0.1.49-rc6
v0.1.49-rc4
v0.1.49-rc5
v0.1.49-rc3
v0.1.49-rc2
v0.1.49-rc1
v0.1.48
v0.1.47
v0.1.46
v0.1.45-rc5
v0.1.45
v0.1.45-rc4
v0.1.45-rc3
v0.1.45-rc2
v0.1.45-rc1
v0.1.44
v0.1.43
v0.1.42
v0.1.41
v0.1.40
v0.1.40-rc1
v0.1.39
v0.1.39-rc2
v0.1.39-rc1
v0.1.38
v0.1.37
v0.1.36
v0.1.35
v0.1.35-rc1
v0.1.34
v0.1.34-rc1
v0.1.33
v0.1.33-rc7
v0.1.33-rc6
v0.1.33-rc5
v0.1.33-rc4
v0.1.33-rc3
v0.1.33-rc2
v0.1.33-rc1
v0.1.32
v0.1.32-rc2
v0.1.32-rc1
v0.1.31
v0.1.30
v0.1.29
v0.1.28
v0.1.27
v0.1.26
v0.1.25
v0.1.24
v0.1.23
v0.1.22
v0.1.21
v0.1.20
v0.1.19
v0.1.18
v0.1.17
v0.1.16
v0.1.15
v0.1.14
v0.1.13
v0.1.12
v0.1.11
v0.1.10
v0.1.9
v0.1.8
v0.1.7
v0.1.6
v0.1.5
v0.1.4
v0.1.3
v0.1.2
v0.1.1
v0.1.0
v0.0.21
v0.0.20
v0.0.19
v0.0.18
v0.0.17
v0.0.16
v0.0.15
v0.0.14
v0.0.13
v0.0.12
v0.0.11
v0.0.10
v0.0.9
v0.0.8
v0.0.7
v0.0.6
v0.0.5
v0.0.4
v0.0.3
v0.0.2
v0.0.1
Labels
Clear labels
amd
api
app
bug
build
cli
cloud
compatibility
context-length
create
docker
documentation
embeddings
feature request
feedback wanted
good first issue
gpt-oss
gpu
harmony
help wanted
image
install
intel
js
launch
linux
macos
memory
mlx
model
needs more info
networking
nvidia
ollama.com
performance
pull-request
python
question
registry
rendering
thinking
tools
top
vulkan
windows
wsl
Mirrored from GitHub Pull Request
No Label
Milestone
No items
No Milestone
Projects
Clear projects
No project
No Assignees
Notifications
Due Date
No due date set.
Dependencies
No dependencies set.
Reference: github-starred/ollama#67138
Reference in New Issue
Block a user
Blocking a user prevents them from interacting with repositories, such as opening or commenting on pull requests or issues. Learn more about blocking a user.
Delete Branch "%!s()"
Deleting a branch is permanent. Although the deleted branch may continue to exist for a short time before it actually gets removed, it CANNOT be undone in most cases. Continue?
Originally created by @datamg-star on GitHub (Dec 5, 2024).
Original GitHub issue: https://github.com/ollama/ollama/issues/7941
[root@localhost data]# ollama run llama3.1:8b
tail -200 /var/log/messages
Dec 5 10:29:10 localhost ollama: Device 0: NVIDIA A800-SXM4-40GB, compute capability 8.0, VMM: yes
Dec 5 10:29:10 localhost ollama: llm_load_tensors: ggml ctx size = 0.27 MiB
Dec 5 10:29:11 localhost ollama: llm_load_tensors: offloading 32 repeating layers to GPU
Dec 5 10:29:11 localhost ollama: llm_load_tensors: offloading non-repeating layers to GPU
Dec 5 10:29:11 localhost ollama: llm_load_tensors: offloaded 33/33 layers to GPU
Dec 5 10:29:11 localhost ollama: llm_load_tensors: CPU buffer size = 281.81 MiB
Dec 5 10:29:11 localhost ollama: llm_load_tensors: CUDA0 buffer size = 4403.50 MiB
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: n_ctx = 8192
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: n_batch = 2048
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: n_ubatch = 512
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: flash_attn = 0
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: freq_base = 500000.0
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: freq_scale = 1
Dec 5 10:29:16 localhost ollama: llama_kv_cache_init: CUDA0 KV buffer size = 1024.00 MiB
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: KV self size = 1024.00 MiB, K (f16): 512.00 MiB, V (f16): 512.00 MiB
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: CUDA_Host output buffer size = 2.02 MiB
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: CUDA0 compute buffer size = 560.00 MiB
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: CUDA_Host compute buffer size = 24.01 MiB
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: graph nodes = 1030
Dec 5 10:29:16 localhost ollama: llama_new_context_with_model: graph splits = 2
Dec 5 10:29:16 localhost ollama: time=2024-12-05T10:29:16.838+08:00 level=INFO source=server.go:601 msg="llama runner started in 13.05 seconds"
Dec 5 10:29:16 localhost ollama: [GIN] 2024/12/05 - 10:29:16 | 200 | 13.185062523s | 127.0.0.1 | POST "/api/generate"
Dec 5 10:29:24 localhost ollama: SIGSEGV: segmentation violation
Dec 5 10:29:24 localhost ollama: PC=0x7f74e0682a00 m=4 sigcode=1 addr=0x7f74359ca7ca
Dec 5 10:29:24 localhost ollama: signal arrived during cgo execution
Dec 5 10:29:24 localhost ollama: goroutine 36 gp=0xc000104700 m=4 mp=0xc000057808 [syscall]:
Dec 5 10:29:24 localhost ollama: runtime.cgocall(0x5640ed665110, 0xc0002a8b48)
Dec 5 10:29:24 localhost ollama: runtime/cgocall.go:157 +0x4b fp=0xc0002a8b20 sp=0xc0002a8ae8 pc=0x5640ed3e63cb
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama._Cfunc_llama_decode(0x7f74893e78e0, {0x1, 0x7f74887e89a0, 0x0, 0x0, 0x7f74887ea9b0, 0x7f74887ec9c0, 0x7f74887ee9d0, 0x7f7488802480, 0x0, ...})
Dec 5 10:29:24 localhost ollama: _cgo_gotypes.go:543 +0x52 fp=0xc0002a8b48 sp=0xc0002a8b20 pc=0x5640ed4e3952
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama.(*Context).Decode.func1(0x5640ed660e0b?, 0x7f74893e78e0?)
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama/llama.go:167 +0xd8 fp=0xc0002a8c68 sp=0xc0002a8b48 pc=0x5640ed4e5f78
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama.(*Context).Decode(0x5640edc560e0?, 0x0?)
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama/llama.go:167 +0x13 fp=0xc0002a8cb0 sp=0xc0002a8c68 pc=0x5640ed4e5e13
Dec 5 10:29:24 localhost ollama: main.(*Server).processBatch(0xc00013c120, 0xc0002ac000, 0xc0002a8f10)
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama/runner/runner.go:425 +0x24d fp=0xc0002a8ed0 sp=0xc0002a8cb0 pc=0x5640ed65facd
Dec 5 10:29:24 localhost ollama: main.(*Server).run(0xc00013c120, {0x5640ed99ecc0, 0xc00017a050})
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama/runner/runner.go:333 +0x1e5 fp=0xc0002a8fb8 sp=0xc0002a8ed0 pc=0x5640ed65f545
Dec 5 10:29:24 localhost ollama: main.main.gowrap2()
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama/runner/runner.go:934 +0x28 fp=0xc0002a8fe0 sp=0xc0002a8fb8 pc=0x5640ed664148
Dec 5 10:29:24 localhost ollama: runtime.goexit({})
Dec 5 10:29:24 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc0002a8fe8 sp=0xc0002a8fe0 pc=0x5640ed44ede1
Dec 5 10:29:24 localhost ollama: created by main.main in goroutine 1
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama/runner/runner.go:934 +0xc52
Dec 5 10:29:24 localhost ollama: goroutine 1 gp=0xc0000061c0 m=nil [IO wait]:
Dec 5 10:29:24 localhost ollama: runtime.gopark(0xc000034a08?, 0x0?, 0xc0?, 0x61?, 0xc0000298b8?)
Dec 5 10:29:24 localhost ollama: runtime/proc.go:402 +0xce fp=0xc000029880 sp=0xc000029860 pc=0x5640ed41d00e
Dec 5 10:29:24 localhost ollama: runtime.netpollblock(0xc000029918?, 0xed3e5b26?, 0x40?)
Dec 5 10:29:24 localhost ollama: runtime/netpoll.go:573 +0xf7 fp=0xc0000298b8 sp=0xc000029880 pc=0x5640ed415257
Dec 5 10:29:24 localhost ollama: internal/poll.runtime_pollWait(0x7f74975fef20, 0x72)
Dec 5 10:29:24 localhost ollama: runtime/netpoll.go:345 +0x85 fp=0xc0000298d8 sp=0xc0000298b8 pc=0x5640ed449aa5
Dec 5 10:29:24 localhost ollama: internal/poll.(*pollDesc).wait(0x3?, 0x3fe?, 0x0)
Dec 5 10:29:24 localhost ollama: internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc000029900 sp=0xc0000298d8 pc=0x5640ed4999c7
Dec 5 10:29:24 localhost ollama: internal/poll.(*pollDesc).waitRead(...)
Dec 5 10:29:24 localhost ollama: internal/poll/fd_poll_runtime.go:89
Dec 5 10:29:24 localhost ollama: internal/poll.(*FD).Accept(0xc000174080)
Dec 5 10:29:24 localhost ollama: internal/poll/fd_unix.go:611 +0x2ac fp=0xc0000299a8 sp=0xc000029900 pc=0x5640ed49ae8c
Dec 5 10:29:24 localhost ollama: net.(*netFD).accept(0xc000174080)
Dec 5 10:29:24 localhost ollama: net/fd_unix.go:172 +0x29 fp=0xc000029a60 sp=0xc0000299a8 pc=0x5640ed509a09
Dec 5 10:29:24 localhost ollama: net.(*TCPListener).accept(0xc00013e1c0)
Dec 5 10:29:24 localhost ollama: net/tcpsock_posix.go:159 +0x1e fp=0xc000029a88 sp=0xc000029a60 pc=0x5640ed51a73e
Dec 5 10:29:24 localhost ollama: net.(*TCPListener).Accept(0xc00013e1c0)
Dec 5 10:29:24 localhost ollama: net/tcpsock.go:327 +0x30 fp=0xc000029ab8 sp=0xc000029a88 pc=0x5640ed519a90
Dec 5 10:29:24 localhost ollama: net/http.(*onceCloseListener).Accept(0xc00013c1b0?)
Dec 5 10:29:24 localhost ollama: :1 +0x24 fp=0xc000029ad0 sp=0xc000029ab8 pc=0x5640ed640ca4
Dec 5 10:29:24 localhost ollama: net/http.(*Server).Serve(0xc0001220f0, {0x5640ed99e680, 0xc00013e1c0})
Dec 5 10:29:24 localhost ollama: net/http/server.go:3260 +0x33e fp=0xc000029c00 sp=0xc000029ad0 pc=0x5640ed637abe
Dec 5 10:29:24 localhost ollama: main.main()
Dec 5 10:29:24 localhost ollama: github.com/ollama/ollama/llama/runner/runner.go:954 +0xfec fp=0xc000029f50 sp=0xc000029c00 pc=0x5640ed663ecc
Dec 5 10:29:24 localhost ollama: runtime.main()
Dec 5 10:29:24 localhost ollama: runtime/proc.go:271 +0x29d fp=0xc000029fe0 sp=0xc000029f50 pc=0x5640ed41cbdd
Dec 5 10:29:24 localhost ollama: runtime.goexit({})
Dec 5 10:29:24 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc000029fe8 sp=0xc000029fe0 pc=0x5640ed44ede1
Dec 5 10:29:24 localhost ollama: goroutine 2 gp=0xc000006c40 m=nil [force gc (idle)]:
Dec 5 10:29:24 localhost ollama: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
Dec 5 10:29:24 localhost ollama: runtime/proc.go:402 +0xce fp=0xc000050fa8 sp=0xc000050f88 pc=0x5640ed41d00e
Dec 5 10:29:24 localhost ollama: runtime.goparkunlock(...)
Dec 5 10:29:24 localhost ollama: runtime/proc.go:408
Dec 5 10:29:24 localhost ollama: runtime.forcegchelper()
Dec 5 10:29:24 localhost ollama: runtime/proc.go:326 +0xb8 fp=0xc000050fe0 sp=0xc000050fa8 pc=0x5640ed41ce98
Dec 5 10:29:24 localhost ollama: runtime.goexit({})
Dec 5 10:29:24 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc000050fe8 sp=0xc000050fe0 pc=0x5640ed44ede1
Dec 5 10:29:24 localhost ollama: created by runtime.init.6 in goroutine 1
Dec 5 10:29:24 localhost ollama: runtime/proc.go:314 +0x1a
Dec 5 10:29:24 localhost ollama: goroutine 18 gp=0xc00008a380 m=nil [GC sweep wait]:
Dec 5 10:29:24 localhost ollama: runtime.gopark(0x0?, 0x0?, 0x0?, 0x0?, 0x0?)
Dec 5 10:29:24 localhost ollama: runtime/proc.go:402 +0xce fp=0xc00004c780 sp=0xc00004c760 pc=0x5640ed41d00e
Dec 5 10:29:24 localhost ollama: runtime.goparkunlock(...)
Dec 5 10:29:24 localhost ollama: runtime/proc.go:408
Dec 5 10:29:24 localhost ollama: runtime.bgsweep(0xc000096000)
Dec 5 10:29:24 localhost ollama: runtime/mgcsweep.go:278 +0x94 fp=0xc00004c7c8 sp=0xc00004c780 pc=0x5640ed407b54
Dec 5 10:29:24 localhost ollama: runtime.gcenable.gowrap1()
Dec 5 10:29:24 localhost ollama: runtime/mgc.go:203 +0x25 fp=0xc00004c7e0 sp=0xc00004c7c8 pc=0x5640ed3fc685
Dec 5 10:29:24 localhost ollama: runtime.goexit({})
Dec 5 10:29:25 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc00004c7e8 sp=0xc00004c7e0 pc=0x5640ed44ede1
Dec 5 10:29:25 localhost ollama: created by runtime.gcenable in goroutine 1
Dec 5 10:29:25 localhost ollama: runtime/mgc.go:203 +0x66
Dec 5 10:29:25 localhost ollama: goroutine 19 gp=0xc00008a540 m=nil [GC scavenge wait]:
Dec 5 10:29:25 localhost ollama: runtime.gopark(0xc000096000?, 0x5640ed8a02b0?, 0x1?, 0x0?, 0xc00008a540?)
Dec 5 10:29:25 localhost ollama: runtime/proc.go:402 +0xce fp=0xc00004cf78 sp=0xc00004cf58 pc=0x5640ed41d00e
Dec 5 10:29:25 localhost ollama: runtime.goparkunlock(...)
Dec 5 10:29:25 localhost ollama: runtime/proc.go:408
Dec 5 10:29:25 localhost ollama: runtime.(*scavengerState).park(0x5640edb6d540)
Dec 5 10:29:25 localhost ollama: runtime/mgcscavenge.go:425 +0x49 fp=0xc00004cfa8 sp=0xc00004cf78 pc=0x5640ed405549
Dec 5 10:29:25 localhost ollama: runtime.bgscavenge(0xc000096000)
Dec 5 10:29:25 localhost ollama: runtime/mgcscavenge.go:653 +0x3c fp=0xc00004cfc8 sp=0xc00004cfa8 pc=0x5640ed405adc
Dec 5 10:29:25 localhost ollama: runtime.gcenable.gowrap2()
Dec 5 10:29:25 localhost ollama: runtime/mgc.go:204 +0x25 fp=0xc00004cfe0 sp=0xc00004cfc8 pc=0x5640ed3fc625
Dec 5 10:29:25 localhost ollama: runtime.goexit({})
Dec 5 10:29:25 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc00004cfe8 sp=0xc00004cfe0 pc=0x5640ed44ede1
Dec 5 10:29:25 localhost ollama: created by runtime.gcenable in goroutine 1
Dec 5 10:29:25 localhost ollama: runtime/mgc.go:204 +0xa5
Dec 5 10:29:25 localhost ollama: goroutine 34 gp=0xc000104380 m=nil [finalizer wait]:
Dec 5 10:29:25 localhost ollama: runtime.gopark(0xc000050648?, 0x5640ed3eff85?, 0xa8?, 0x1?, 0xc0000061c0?)
Dec 5 10:29:25 localhost ollama: runtime/proc.go:402 +0xce fp=0xc000050620 sp=0xc000050600 pc=0x5640ed41d00e
Dec 5 10:29:25 localhost ollama: runtime.runfinq()
Dec 5 10:29:25 localhost ollama: runtime/mfinal.go:194 +0x107 fp=0xc0000507e0 sp=0xc000050620 pc=0x5640ed3fb6c7
Dec 5 10:29:25 localhost ollama: runtime.goexit({})
Dec 5 10:29:25 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc0000507e8 sp=0xc0000507e0 pc=0x5640ed44ede1
Dec 5 10:29:25 localhost ollama: created by runtime.createfing in goroutine 1
Dec 5 10:29:25 localhost ollama: runtime/mfinal.go:164 +0x3d
Dec 5 10:29:25 localhost ollama: goroutine 32 gp=0xc000104540 m=nil [IO wait]:
Dec 5 10:29:25 localhost ollama: runtime.gopark(0x10?, 0x10?, 0xf0?, 0x5d?, 0xb?)
Dec 5 10:29:25 localhost ollama: runtime/proc.go:402 +0xce fp=0xc000185da8 sp=0xc000185d88 pc=0x5640ed41d00e
Dec 5 10:29:25 localhost ollama: runtime.netpollblock(0x5640ed483558?, 0xed3e5b26?, 0x40?)
Dec 5 10:29:25 localhost ollama: runtime/netpoll.go:573 +0xf7 fp=0xc000185de0 sp=0xc000185da8 pc=0x5640ed415257
Dec 5 10:29:25 localhost ollama: internal/poll.runtime_pollWait(0x7f74975fee28, 0x72)
Dec 5 10:29:25 localhost ollama: runtime/netpoll.go:345 +0x85 fp=0xc000185e00 sp=0xc000185de0 pc=0x5640ed449aa5
Dec 5 10:29:25 localhost ollama: internal/poll.(*pollDesc).wait(0xc000174100?, 0xc000114ee1?, 0x0)
Dec 5 10:29:25 localhost ollama: internal/poll/fd_poll_runtime.go:84 +0x27 fp=0xc000185e28 sp=0xc000185e00 pc=0x5640ed4999c7
Dec 5 10:29:25 localhost ollama: internal/poll.(*pollDesc).waitRead(...)
Dec 5 10:29:25 localhost ollama: internal/poll/fd_poll_runtime.go:89
Dec 5 10:29:25 localhost ollama: internal/poll.(*FD).Read(0xc000174100, {0xc000114ee1, 0x1, 0x1})
Dec 5 10:29:25 localhost ollama: internal/poll/fd_unix.go:164 +0x27a fp=0xc000185ec0 sp=0xc000185e28 pc=0x5640ed49a51a
Dec 5 10:29:25 localhost ollama: net.(*netFD).Read(0xc000174100, {0xc000114ee1?, 0xc000185f48?, 0x5640ed44b6d0?})
Dec 5 10:29:25 localhost ollama: net/fd_posix.go:55 +0x25 fp=0xc000185f08 sp=0xc000185ec0 pc=0x5640ed508905
Dec 5 10:29:25 localhost ollama: net.(*conn).Read(0xc000112090, {0xc000114ee1?, 0x0?, 0x5640edc560e0?})
Dec 5 10:29:25 localhost ollama: net/net.go:185 +0x45 fp=0xc000185f50 sp=0xc000185f08 pc=0x5640ed512bc5
Dec 5 10:29:25 localhost ollama: net.(*TCPConn).Read(0x5640edb2e870?, {0xc000114ee1?, 0x0?, 0x0?})
Dec 5 10:29:25 localhost ollama: :1 +0x25 fp=0xc000185f80 sp=0xc000185f50 pc=0x5640ed51e5a5
Dec 5 10:29:25 localhost ollama: net/http.(*connReader).backgroundRead(0xc000114ed0)
Dec 5 10:29:25 localhost ollama: net/http/server.go:681 +0x37 fp=0xc000185fc8 sp=0xc000185f80 pc=0x5640ed62d437
Dec 5 10:29:25 localhost ollama: net/http.(*connReader).startBackgroundRead.gowrap2()
Dec 5 10:29:25 localhost ollama: net/http/server.go:677 +0x25 fp=0xc000185fe0 sp=0xc000185fc8 pc=0x5640ed62d365
Dec 5 10:29:25 localhost ollama: runtime.goexit({})
Dec 5 10:29:25 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc000185fe8 sp=0xc000185fe0 pc=0x5640ed44ede1
Dec 5 10:29:25 localhost ollama: created by net/http.(*connReader).startBackgroundRead in goroutine 37
Dec 5 10:29:25 localhost ollama: net/http/server.go:677 +0xba
Dec 5 10:29:25 localhost ollama: goroutine 37 gp=0xc0001048c0 m=nil [select]:
Dec 5 10:29:25 localhost ollama: runtime.gopark(0xc0000d9a48?, 0x2?, 0xd8?, 0x96?, 0xc0000d97ec?)
Dec 5 10:29:25 localhost ollama: runtime/proc.go:402 +0xce fp=0xc0000d9658 sp=0xc0000d9638 pc=0x5640ed41d00e
Dec 5 10:29:25 localhost ollama: runtime.selectgo(0xc0000d9a48, 0xc0000d97e8, 0xc0002b0000?, 0x0, 0x1?, 0x1)
Dec 5 10:29:25 localhost ollama: runtime/select.go:327 +0x725 fp=0xc0000d9778 sp=0xc0000d9658 pc=0x5640ed42e3e5
Dec 5 10:29:25 localhost ollama: main.(*Server).completion(0xc00013c120, {0x5640ed99e830, 0xc0000aca80}, 0xc0000a2d80)
Dec 5 10:29:25 localhost ollama: github.com/ollama/ollama/llama/runner/runner.go:679 +0xa45 fp=0xc0000d9ab8 sp=0xc0000d9778 pc=0x5640ed6618e5
Dec 5 10:29:25 localhost ollama: main.(*Server).completion-fm({0x5640ed99e830?, 0xc0000aca80?}, 0x5640ed63bded?)
Dec 5 10:29:25 localhost ollama: :1 +0x36 fp=0xc0000d9ae8 sp=0xc0000d9ab8 pc=0x5640ed664936
Dec 5 10:29:25 localhost ollama: net/http.HandlerFunc.ServeHTTP(0xc000116d00?, {0x5640ed99e830?, 0xc0000aca80?}, 0x10?)
Dec 5 10:29:25 localhost ollama: net/http/server.go:2171 +0x29 fp=0xc0000d9b10 sp=0xc0000d9ae8 pc=0x5640ed634889
Dec 5 10:29:25 localhost ollama: net/http.(*ServeMux).ServeHTTP(0x5640ed3eff85?, {0x5640ed99e830, 0xc0000aca80}, 0xc0000a2d80)
Dec 5 10:29:25 localhost ollama: net/http/server.go:2688 +0x1ad fp=0xc0000d9b60 sp=0xc0000d9b10 pc=0x5640ed63670d
Dec 5 10:29:25 localhost ollama: net/http.serverHandler.ServeHTTP({0x5640ed99db80?}, {0x5640ed99e830?, 0xc0000aca80?}, 0x6?)
Dec 5 10:29:25 localhost ollama: net/http/server.go:3142 +0x8e fp=0xc0000d9b90 sp=0xc0000d9b60 pc=0x5640ed63772e
Dec 5 10:29:25 localhost ollama: net/http.(*conn).serve(0xc00013c1b0, {0x5640ed99ec88, 0xc000114db0})
Dec 5 10:29:25 localhost ollama: net/http/server.go:2044 +0x5e8 fp=0xc0000d9fb8 sp=0xc0000d9b90 pc=0x5640ed6334c8
Dec 5 10:29:25 localhost ollama: net/http.(*Server).Serve.gowrap3()
Dec 5 10:29:25 localhost ollama: net/http/server.go:3290 +0x28 fp=0xc0000d9fe0 sp=0xc0000d9fb8 pc=0x5640ed637ea8
Dec 5 10:29:25 localhost ollama: runtime.goexit({})
Dec 5 10:29:25 localhost ollama: runtime/asm_amd64.s:1695 +0x1 fp=0xc0000d9fe8 sp=0xc0000d9fe0 pc=0x5640ed44ede1
Dec 5 10:29:25 localhost ollama: created by net/http.(*Server).Serve in goroutine 1
Dec 5 10:29:25 localhost ollama: net/http/server.go:3290 +0x4b4
Dec 5 10:29:25 localhost ollama: rax 0x7f74600fc0e0
Dec 5 10:29:25 localhost ollama: rbx 0x7f749864b7b0
Dec 5 10:29:25 localhost ollama: rcx 0x7f74600fc0e0
Dec 5 10:29:25 localhost ollama: rdx 0x7f74e0682a00
Dec 5 10:29:25 localhost ollama: rdi 0x7f74600fc0e0
Dec 5 10:29:25 localhost ollama: rsi 0x7f74359ca7ca
Dec 5 10:29:25 localhost ollama: rbp 0x7f749864b700
Dec 5 10:29:25 localhost ollama: rsp 0x7f749864b6a8
Dec 5 10:29:25 localhost ollama: r8 0x4
Dec 5 10:29:25 localhost ollama: r9 0x4c
Dec 5 10:29:25 localhost ollama: r10 0x0
Dec 5 10:29:25 localhost ollama: r11 0x7f74e06b4750
Dec 5 10:29:25 localhost ollama: r12 0x7f7468296fd0
Dec 5 10:29:25 localhost ollama: r13 0x7f7468297910
Dec 5 10:29:25 localhost ollama: r14 0x7f74682970d0
Dec 5 10:29:25 localhost ollama: r15 0x7f746851a1e0
Dec 5 10:29:25 localhost ollama: rip 0x7f74e0682a00
Dec 5 10:29:25 localhost ollama: rflags 0x10287
Dec 5 10:29:25 localhost ollama: cs 0x33
Dec 5 10:29:25 localhost ollama: fs 0x0
Dec 5 10:29:25 localhost ollama: gs 0x0
Dec 5 10:29:25 localhost ollama: [GIN] 2024/12/05 - 10:29:25 | 200 | 2.175286662s | 127.0.0.1 | POST "/api/chat"
Dec 5 10:30:02 localhost systemd: Started Session 306 of user root.
Dec 5 10:34:30 localhost ollama: time=2024-12-05T10:34:30.066+08:00 level=WARN source=sched.go:646 msg="gpu VRAM usage didn't recover within timeout" seconds=5.032960268 model=/data/ollama/models/blobs/sha256-667b0c1932bc6ffc593ed1d03f895bf2dc8dc6df21db3042284a6f4416b06a29
Dec 5 10:34:30 localhost ollama: time=2024-12-05T10:34:30.316+08:00 level=WARN source=sched.go:646 msg="gpu VRAM usage didn't recover within timeout" seconds=5.2833089730000005 model=/data/ollama/models/blobs/sha256-667b0c1932bc6ffc593ed1d03f895bf2dc8dc6df21db3042284a6f4416b06a29
Dec 5 10:34:30 localhost ollama: time=2024-12-05T10:34:30.565+08:00 level=WARN source=sched.go:646 msg="gpu VRAM usage didn't recover within timeout" seconds=5.532611974 model=/data/ollama/models/blobs/sha256-667b0c1932bc6ffc593ed1d03f895bf2dc8dc6df21db3042284a6f4416b06a29
@Pekkari commented on GitHub (Dec 19, 2024):
I'm facing this error in the latest ollama:rocm container image: when I start a new conversation using open-webui, ollama crashes with the following output:
This used to work in earlier versions of the ollama:rocm container; it broke when I recently updated to the latest version of the container.
@ican2002 commented on GitHub (Feb 5, 2025):
Can anyone help resolve this issue? Thanks.
CPU: intel i7-6700HQ
OS: windows10
GPU: 960M
It seems the CPU and GPU are detected; the log shows "Dynamic LLM libraries" runners="[cpu_avx cpu_avx2 cuda_v11_avx cuda_v12_avx rocm_avx cpu]"
and there appear to be cgo-related problems, as the log shows:
runtime.cgocall(0x7ff6bdc60920, 0xc0003f4c10)
runtime/cgocall.go:167 +0x3e fp=0xc0003f4be8 sp=0xc0003f4b80 pc=0x7ff6bcea9c3e
It seems many people are facing this problem.
If anyone has resolved it, please reply here. Thank you.
===================================================================
2025/02/05 20:47:23 routes.go:1187: INFO server config env="map[CUDA_VISIBLE_DEVICES: GPU_DEVICE_ORDINAL: HIP_VISIBLE_DEVICES: HSA_OVERRIDE_GFX_VERSION: HTTPS_PROXY: HTTP_PROXY: NO_PROXY: OLLAMA_DEBUG:false OLLAMA_FLASH_ATTENTION:false OLLAMA_GPU_OVERHEAD:0 OLLAMA_HOST:http://127.0.0.1:11434 OLLAMA_INTEL_GPU:false OLLAMA_KEEP_ALIVE:5m0s OLLAMA_KV_CACHE_TYPE: OLLAMA_LLM_LIBRARY: OLLAMA_LOAD_TIMEOUT:5m0s OLLAMA_MAX_LOADED_MODELS:0 OLLAMA_MAX_QUEUE:512 OLLAMA_MODELS:C:\Users\can\.ollama\models OLLAMA_MULTIUSER_CACHE:false OLLAMA_NOHISTORY:false OLLAMA_NOPRUNE:false OLLAMA_NUM_PARALLEL:0 OLLAMA_ORIGINS:[http://localhost https://localhost http://localhost:* https://localhost:* http://127.0.0.1 https://127.0.0.1 http://127.0.0.1:* https://127.0.0.1:* http://0.0.0.0 https://0.0.0.0 http://0.0.0.0:* https://0.0.0.0:* app://* file://* tauri://* vscode-webview://*] OLLAMA_SCHED_SPREAD:false ROCR_VISIBLE_DEVICES:]"
time=2025-02-05T20:47:23.684+08:00 level=INFO source=images.go:432 msg="total blobs: 0"
time=2025-02-05T20:47:23.685+08:00 level=INFO source=images.go:439 msg="total unused blobs removed: 0"
time=2025-02-05T20:47:23.686+08:00 level=INFO source=routes.go:1238 msg="Listening on 127.0.0.1:11434 (version 0.5.7)"
time=2025-02-05T20:47:23.687+08:00 level=INFO source=routes.go:1267 msg="Dynamic LLM libraries" runners="[cpu_avx cpu_avx2 cuda_v11_avx cuda_v12_avx rocm_avx cpu]"
time=2025-02-05T20:47:23.687+08:00 level=INFO source=gpu.go:226 msg="looking for compatible GPUs"
time=2025-02-05T20:47:23.687+08:00 level=INFO source=gpu_windows.go:167 msg=packages count=1
time=2025-02-05T20:47:23.687+08:00 level=INFO source=gpu_windows.go:214 msg="" package=0 cores=4 efficiency=0 threads=8
Exception 0xc0000005 0x0 0x10 0x7ffcaca97983
PC=0x7ffcaca97983
signal arrived during external code execution
runtime.cgocall(0x7ff6bdc60920, 0xc0003f4c10)
runtime/cgocall.go:167 +0x3e fp=0xc0003f4be8 sp=0xc0003f4b80 pc=0x7ff6bcea9c3e
github.com/ollama/ollama/discover._Cfunc_nvml_init(0x2041ea093d0, 0xc00004f440)
_cgo_gotypes.go:573 +0x4d fp=0xc0003f4c10 sp=0xc0003f4be8 pc=0x7ff6bd476f8d
github.com/ollama/ollama/discover.loadNVMLMgmt.func2(0x2041ea093d0, 0xc00004f440)
github.com/ollama/ollama/discover/gpu.go:651 +0x4a fp=0xc0003f4c40 sp=0xc0003f4c10 pc=0x7ff6bd47e68a
github.com/ollama/ollama/discover.loadNVMLMgmt({0xc00004f400, 0x3, 0x7ff6be8b9410?})
github.com/ollama/ollama/discover/gpu.go:651 +0x245 fp=0xc0003f4d30 sp=0xc0003f4c40 pc=0x7ff6bd47e4c5
github.com/ollama/ollama/discover.initCudaHandles()
github.com/ollama/ollama/discover/gpu.go:118 +0x4fa fp=0xc0003f4f98 sp=0xc0003f4d30 pc=0x7ff6bd477a3a
github.com/ollama/ollama/discover.GetGPUInfo()
github.com/ollama/ollama/discover/gpu.go:262 +0x705 fp=0xc0003f5ae0 sp=0xc0003f4f98 pc=0x7ff6bd478b45
github.com/ollama/ollama/server.Serve({0x7ff6be099760, 0xc000608a80})
github.com/ollama/ollama/server/routes.go:1274 +0x8aa fp=0xc0003f5d18 sp=0xc0003f5ae0 pc=0x7ff6bda2e94a
github.com/ollama/ollama/cmd.RunServer(0xc00062a400?, {0x7ff6be955020?, 0x4?, 0x7ff6bdeda1ef?})
github.com/ollama/ollama/cmd/cmd.go:1033 +0x4a fp=0xc0003f5d58 sp=0xc0003f5d18 pc=0x7ff6bda5daaa
github.com/spf13/cobra.(*Command).execute(0xc0000bc608, {0x7ff6be955020, 0x0, 0x0})
github.com/spf13/cobra@v1.7.0/command.go:940 +0x862 fp=0xc0003f5e78 sp=0xc0003f5d58 pc=0x7ff6bd02c122
github.com/spf13/cobra.(*Command).ExecuteC(0xc00008b508)
github.com/spf13/cobra@v1.7.0/command.go:1068 +0x3a5 fp=0xc0003f5f30 sp=0xc0003f5e78 pc=0x7ff6bd02c965
github.com/spf13/cobra.(*Command).Execute(...)
github.com/spf13/cobra@v1.7.0/command.go:992
github.com/spf13/cobra.(*Command).ExecuteContext(...)
github.com/spf13/cobra@v1.7.0/command.go:985
main.main()
github.com/ollama/ollama/main.go:12 +0x4d fp=0xc0003f5f50 sp=0xc0003f5f30 pc=0x7ff6bda65c8d
runtime.main()
runtime/proc.go:272 +0x27d fp=0xc0003f5fe0 sp=0xc0003f5f50 pc=0x7ff6bce7dfbd
runtime.goexit({})
runtime/asm_amd64.s:1700 +0x1 fp=0xc0003f5fe8 sp=0xc0003f5fe0 pc=0x7ff6bceb8921
@jessegross commented on GitHub (Feb 6, 2025):
@ican2002 All three of these issues look different to me. Please create a new bug and include your logs there.
@ican2002 commented on GitHub (Feb 6, 2025):
@jessegross I created an issue at
https://github.com/ollama/ollama/issues/8886
Thanks.