Commit
Merge pull request #39 from wacunn:updates
PiperOrigin-RevId: 621196556
Change-Id: I24679b6abc732686a893b63592cdd37ed5ba9f94
Showing 2 changed files with 115 additions and 0 deletions.
@@ -0,0 +1,114 @@
# Copyright 2024 DeepMind Technologies Limited.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Ollama Language Model."""

from collections.abc import Collection, Sequence
import re

from concordia.language_model import language_model
from concordia.utils import measurements as measurements_lib
from langchain import llms
from typing_extensions import override


def _extract_choices(text):
  """Returns the first parenthesized choice letter in `text`, or None."""
  match = re.search(r"\(?(\w)\)", text)
  if match:
    return match.group(1)
  return None
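# e.g. _extract_choices("I choose (b).") returns "b"; because the opening
# parenthesis is optional in the pattern, "b)" also matches. Returns None
# when no such choice marker appears in the text.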


class OllamaLanguageModel(language_model.LanguageModel):
  """Language model that uses Ollama LLM models."""

  def __init__(
      self,
      model_name: str,
      *,
      system_message: str = "",
      measurements: measurements_lib.Measurements | None = None,
      channel: str = language_model.DEFAULT_STATS_CHANNEL,
  ) -> None:
    """Initializes the instance.

    Args:
      model_name: The language model to use. For more details, see
        https://github.com/ollama/ollama.
      system_message: System message to prefix to requests when prompting the
        model.
      measurements: The measurements object to log usage statistics to.
      channel: The channel to write the statistics to.
    """
    self._model_name = model_name
    self._system_message = system_message
    self._measurements = measurements
    self._channel = channel
    self._client = llms.Ollama(model=model_name)

  @override
  def sample_text(
      self,
      prompt: str,
      *,
      max_tokens: int = language_model.DEFAULT_MAX_TOKENS,
      max_characters: int = language_model.DEFAULT_MAX_CHARACTERS,
      terminators: Collection[str] = language_model.DEFAULT_TERMINATORS,
      temperature: float = language_model.DEFAULT_TEMPERATURE,
      timeout: float = language_model.DEFAULT_TIMEOUT_SECONDS,
      seed: int | None = None,
  ) -> str:
    # These sampling controls are accepted for interface compatibility but
    # are not supported by the langchain Ollama client used here.
    del max_tokens, max_characters, timeout, seed

    prompt_with_system_message = f"{self._system_message}\n\n{prompt}"

    response = self._client(
        prompt_with_system_message,
        stop=list(terminators),  # The langchain client expects a list.
        temperature=temperature,
    )

    if self._measurements is not None:
      self._measurements.publish_datum(
          self._channel, {"raw_text_length": len(response)}
      )
    return response

  @override
  def sample_choice(
      self,
      prompt: str,
      responses: Sequence[str],
      *,
      seed: int | None = None,
  ) -> tuple[int, str, dict[str, float]]:
    max_characters = len(max(responses, key=len))
    prompt_with_system_message = f"{self._system_message}\n\n{prompt}"
    # Sample greedily (temperature 0) so the choice is deterministic.
    sample = self.sample_text(
        prompt_with_system_message,
        max_characters=max_characters,
        temperature=0.0,
        seed=seed,
    )
    # Map the extracted choice letter back to its position in `responses`.
    answer = _extract_choices(sample)
    try:
      idx = responses.index(answer)
    except ValueError:
      raise language_model.InvalidResponseError(
          f"Invalid response: {answer}. "
          f"LLM Input: {prompt}\nLLM Output: {sample}"
      ) from None

    if self._measurements is not None:
      self._measurements.publish_datum(self._channel, {"choices_calls": 1})
    debug = {}
    return idx, responses[idx], debug
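For context, here is a minimal usage sketch of the wrapper added above. The module path and model name are assumptions for illustration (the diff does not show the file's path), and it presumes a local Ollama server with the named model already pulled:

from concordia.language_model import ollama_model  # Assumed module path.

# "mistral" is an illustrative model name; any model fetched with
# `ollama pull` on a locally running Ollama server would work.
model = ollama_model.OllamaLanguageModel(
    "mistral",
    system_message="You are a helpful, concise assistant.",
)

# Free-form sampling.
print(model.sample_text("In one sentence, what is an agent-based model?"))

# Forced choice: the model is prompted to answer with a letter such as
# "(a)", which _extract_choices maps back onto the responses sequence.
idx, choice, _ = model.sample_choice(
    "Is water wet? Answer (a) for yes or (b) for no.",
    responses=["a", "b"],
)
print(idx, choice)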