mirror of
https://github.com/ollama/ollama.git
synced 2026-05-05 23:53:43 -05:00
* mlx: add laguna model support * convert: support fp8 safetensors import Decode HF F8_E4M3 safetensors with block scale companions into GGUF-supported tensor types, and record which output tensors came from FP8 source weights. Use that source-precision metadata during create quantization: default FP8-sourced GGUFs to Q8_0, keep non-FP8 tensors at their original precision for Q8_0, and promote non-FP8 quantizable tensors to Q8_0 for Q4_K requests. * ggml: add laguna model support * server: preserve generate logprobs with builtin parsers Generate requests were dropping logprob-only chunks whenever a builtin parser buffered visible content. Chat already handled this case, but generate only forwarded chunks with visible response, thinking, or tool-call output. Keep generate chunks that carry logprobs even when the builtin parser has not flushed visible content yet, and add a regression test that exercises the behavior with a generic thinking parser. * review comments - perf improvements * ggml: implement nemotron 3 nano omni * add poolside integration * update poolside doc * adapt to new cache setup * fix test * fix test --------- Co-authored-by: Eva Ho <hoyyeva@gmail.com>
52 lines
1.1 KiB
Go
52 lines
1.1 KiB
Go
package launch
|
|
|
|
import (
|
|
"fmt"
|
|
"os"
|
|
"os/exec"
|
|
"runtime"
|
|
|
|
"github.com/ollama/ollama/envconfig"
|
|
)
|
|
|
|
// Poolside implements Runner for Poolside's CLI.
|
|
type Poolside struct{}
|
|
|
|
var poolsideGOOS = runtime.GOOS
|
|
|
|
func (p *Poolside) String() string { return "Poolside" }
|
|
|
|
func poolsideUnsupportedError() error {
|
|
return fmt.Errorf("Warning: Poolside is not currently supported on Windows")
|
|
}
|
|
|
|
func (p *Poolside) args(model string, extra []string) []string {
|
|
var args []string
|
|
if model != "" {
|
|
args = append(args, "-m", model)
|
|
}
|
|
args = append(args, extra...)
|
|
return args
|
|
}
|
|
|
|
func (p *Poolside) Run(model string, args []string) error {
|
|
if poolsideGOOS == "windows" {
|
|
return poolsideUnsupportedError()
|
|
}
|
|
|
|
bin, err := exec.LookPath("pool")
|
|
if err != nil {
|
|
return fmt.Errorf("pool is not installed")
|
|
}
|
|
|
|
cmd := exec.Command(bin, p.args(model, args)...)
|
|
cmd.Stdin = os.Stdin
|
|
cmd.Stdout = os.Stdout
|
|
cmd.Stderr = os.Stderr
|
|
cmd.Env = append(os.Environ(),
|
|
"POOLSIDE_STANDALONE_BASE_URL="+envconfig.Host().String()+"/v1",
|
|
"POOLSIDE_API_KEY=ollama",
|
|
)
|
|
return cmd.Run()
|
|
}
|