From b0023dc858d9e2091b3ad29d2c5abc084ac4552f Mon Sep 17 00:00:00 2001 From: Christopher Creutzig <89011131+ccreutzi@users.noreply.github.com> Date: Tue, 20 Aug 2024 10:23:37 +0200 Subject: [PATCH] tests still unreliable with Ollama version in GitHub CI MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit These tests should work and do work locally. But they fail in GitHub CI – for an unknown reason that almost certainly is in Ollama, not in our code. --- tests/tollamaChat.m | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/tests/tollamaChat.m b/tests/tollamaChat.m index 342e7df..bdde8b9 100644 --- a/tests/tollamaChat.m +++ b/tests/tollamaChat.m @@ -50,7 +50,7 @@ function extremeTopK(testCase) %% This should work, and it does on some computers. On others, Ollama %% receives the parameter, but either Ollama or llama.cpp fails to %% honor it correctly. - % testCase.assumeTrue(false,"disabled due to Ollama/llama.cpp not honoring parameter reliably"); + testCase.assumeTrue(false,"disabled due to Ollama/llama.cpp not honoring parameter reliably"); % setting top-k to k=1 leaves no random choice, % so we expect to get a fixed response. @@ -65,7 +65,7 @@ function extremeMinP(testCase) %% This should work, and it does on some computers. On others, Ollama %% receives the parameter, but either Ollama or llama.cpp fails to %% honor it correctly. - % testCase.assumeTrue(false,"disabled due to Ollama/llama.cpp not honoring parameter reliably"); + testCase.assumeTrue(false,"disabled due to Ollama/llama.cpp not honoring parameter reliably"); % setting min-p to p=1 means only tokens with the same logit as % the most likely one can be chosen, which will almost certainly @@ -81,7 +81,7 @@ function extremeTfsZ(testCase) %% This should work, and it does on some computers. On others, Ollama %% receives the parameter, but either Ollama or llama.cpp fails to %% honor it correctly. - % testCase.assumeTrue(false,"disabled due to Ollama/llama.cpp not honoring parameter reliably"); + testCase.assumeTrue(false,"disabled due to Ollama/llama.cpp not honoring parameter reliably"); % setting tfs_z to z=0 leaves no random choice, but degrades to % greedy sampling, so we expect to get a fixed response.