mirror of
https://github.com/ollama/ollama.git
synced 2026-04-30 07:57:51 -05:00
Use flash attention flag for now (#4580)
* put flash attention behind flag for now * add test * remove print * up timeout for sheduler tests
This commit is contained in:
@@ -151,7 +151,7 @@ func newScenario(t *testing.T, ctx context.Context, modelName string, estimatedV
|
||||
}
|
||||
|
||||
func TestRequests(t *testing.T) {
|
||||
ctx, done := context.WithTimeout(context.Background(), 500*time.Millisecond)
|
||||
ctx, done := context.WithTimeout(context.Background(), time.Second)
|
||||
defer done()
|
||||
|
||||
// Same model, same request
|
||||
|
||||
Reference in New Issue
Block a user