FEATURE: Tools for models from Ollama provider (#819)

Adds support for Ollama function calling
2024-10-11 07:25:53 +11:00 · 2024-10-11 07:25:53 +11:00 · 94010a5f78
parent 6c4c96e83c
commit 94010a5f78
9 changed files with 404 additions and 20 deletions
--- a/app/models/llm_model.rb
+++ b/app/models/llm_model.rb
@ -31,6 +31,7 @@ class LlmModel < ActiveRecord::Base
      },
      ollama: {
        disable_system_prompt: :checkbox,
        enable_native_tool: :checkbox,
      },
    }
  end
--- a/config/locales/client.en.yml
+++ b/config/locales/client.en.yml
@ -312,6 +312,7 @@ en:
          region: "AWS Bedrock Region"
          organization: "Optional OpenAI Organization ID"
          disable_system_prompt: "Disable system message in prompts"
          enable_native_tool: "Enable native tool support"
      related_topics:
        title: "Related Topics"
--- a/lib/completions/dialects/ollama.rb
+++ b/lib/completions/dialects/ollama.rb
@ -10,7 +10,9 @@ module DiscourseAi
          end
        end
-        # TODO: Add tool suppport
+        def native_tool_support?
          enable_native_tool?
        end
        def max_prompt_tokens
          llm_model.max_prompt_tokens
@ -18,6 +20,14 @@ module DiscourseAi
        private
        # Chooses the tool translator for this dialect. With native tool calling
        # enabled, a memoized OllamaTools built from the prompt's tools is used;
        # otherwise the parent implementation decides.
        def tools_dialect
          return super unless enable_native_tool?
          @tools_dialect ||= DiscourseAi::Completions::Dialects::OllamaTools.new(prompt.tools)
        end
        # Returns the tokenizer class reported by the LLM model.
        def tokenizer
          llm_model.tokenizer_class
        end
@ -26,8 +36,28 @@ module DiscourseAi
          { role: "assistant", content: msg[:content] }
        end
        # Translates a raw tool-call message by delegating to the active tools dialect.
        def tool_call_msg(msg)
          tools_dialect.from_raw_tool_call(msg)
        end
        # Translates a raw tool-result message by delegating to the active tools dialect.
        def tool_msg(msg)
          tools_dialect.from_raw_tool(msg)
        end
        def system_msg(msg)
-          { role: "system", content: msg[:content] }
+          msg = { role: "system", content: msg[:content] }
          if tools_dialect.instructions.present?
            msg[:content] = msg[:content].dup << "\n\n#{tools_dialect.instructions}"
          end
          msg
        end
        # Value of the model's "enable_native_tool" custom param. The lookup runs
        # once; the instance variable's existence (not its truthiness) marks the
        # result as cached, so a falsy value is remembered too.
        def enable_native_tool?
          unless instance_variable_defined?(:@enable_native_tool)
            @enable_native_tool = llm_model.lookup_custom_param("enable_native_tool")
          end
          @enable_native_tool
        end
        def user_msg(msg)
--- a/lib/completions/dialects/ollama_tools.rb
+++ b/lib/completions/dialects/ollama_tools.rb
@ -0,0 +1,58 @@
 # frozen_string_literal: true
 module DiscourseAi
  module Completions
    module Dialects
      # TODO: Define the Tool class to be inherited by all tools.
      # Converts generic tool definitions and tool-related messages into the
      # hashes used for Ollama native tool calling.
      class OllamaTools
        # tools: the tool definitions in the generic prompt format (an array of
        # hashes with :name, :description and an optional :parameters list).
        def initialize(tools)
          @raw_tools = tools
        end
        # No prompt instructions are produced by this dialect.
        def instructions
          "" # Noop. Tools are listed separately.
        end
        # Returns one { type: "function", function: ... } entry per tool. Each
        # tool's parameter list is folded into an object schema: every parameter
        # becomes a property keyed by its name, and required ones are collected
        # under :required. The input definitions are not modified.
        def translated_tools
          raw_tools.map do |definition|
            function = definition.dup
            schema = { type: "object", properties: {}, required: [] }
            definition[:parameters].to_a.each do |param|
              param_name = param[:name]
              schema[:required] << param_name if param[:required]
              # :enum is only kept when it actually lists values.
              dropped = %i[name required item_type]
              dropped << :enum if param[:enum].blank?
              schema[:properties][param_name] = param.except(*dropped)
            end
            function[:parameters] = schema
            { type: "function", function: function }
          end
        end
        # Builds the assistant message for a tool call: the JSON in :content is
        # parsed into the function details and the message's :name is added to it.
        def from_raw_tool_call(raw_message)
          function = JSON.parse(raw_message[:content], symbolize_names: true)
          function[:name] = raw_message[:name]
          tool_call = { type: "function", function: function }
          { role: "assistant", content: nil, tool_calls: [tool_call] }
        end
        # Builds the "tool" role message carrying a tool's output.
        def from_raw_tool(raw_message)
          content, name = raw_message.values_at(:content, :name)
          { role: "tool", content: content, name: name }
        end
        private
        attr_reader :raw_tools
      end
    end
  end
 end
--- a/lib/completions/endpoints/ollama.rb
+++ b/lib/completions/endpoints/ollama.rb
@ -37,11 +37,28 @@ module DiscourseAi
          URI(llm_model.url)
        end
-        def prepare_payload(prompt, model_params, _dialect)
+        def native_tool_support?
          @native_tool_support
        end
        # Returns the @has_function_call flag; the response data argument is ignored.
        def has_tool?(_response_data)
          @has_function_call
        end
        def prepare_payload(prompt, model_params, dialect)
          @native_tool_support = dialect.native_tool_support?
          # https://github.com/ollama/ollama/blob/main/docs/api.md#parameters-1
          # Ollama enforces 'stream: false' for tool calls, so instead of complicating the code
          # we simply disable streaming for all Ollama calls when native tool support is enabled.
          default_options
            .merge(model_params)
            .merge(messages: prompt)
-            .tap { |payload| payload[:stream] = false if !@streaming_mode }
+            .tap { |payload| payload[:stream] = false if @native_tool_support || !@streaming_mode }
            .tap do |payload|
              payload[:tools] = dialect.tools if @native_tool_support && dialect.tools.present?
            end
        end
        def prepare_request(payload)
@ -58,7 +75,66 @@ module DiscourseAi
          parsed = JSON.parse(response_raw, symbolize_names: true)
          return if !parsed
-          parsed.dig(:message, :content)
+          response_h = parsed.dig(:message)
          @has_function_call ||= response_h.dig(:tool_calls).present?
          @has_function_call ? response_h.dig(:tool_calls, 0) : response_h.dig(:content)
        end
        # Folds one Ollama tool call into the XML function-call buffer.
        #
        # In streaming mode the call is taken from +partial+; otherwise it is
        # taken from +payload+. When there is no call to process, the buffer is
        # returned untouched.
        #
        # function_buffer - node tree queried with #at for "invoke", "tool_name",
        #                   "tool_id", "parameters" and "function_calls".
        # payload         - tool call hash used when not streaming.
        # partial         - tool call hash used when streaming.
        #
        # Returns function_buffer.
        def add_to_function_buffer(function_buffer, payload: nil, partial: nil)
          # CGI.escapeHTML is needed below; requiring here keeps the method self-contained.
          require "cgi"
          @args_buffer ||= +""
          partial = payload if !@streaming_mode
          # Nothing to add. Without this guard a missing payload in non-streaming
          # mode failed with NoMethodError on nil.
          return function_buffer if !partial
          f_name = partial.dig(:function, :name)
          @current_function ||= function_buffer.at("invoke")
          if f_name && function_buffer.at("tool_name").content.present?
            # A previous function already fills the buffer: reset the argument
            # accumulator and append a fresh, empty invocation for this call.
            @args_buffer = +""
            @current_function =
              function_buffer.at("function_calls").add_child(
                Nokogiri::HTML5::DocumentFragment.parse(noop_function_call_text + "\n"),
              )
          end
          @current_function.at("tool_name").content = f_name if f_name
          @current_function.at("tool_id").content = partial[:id] if partial[:id]
          args = partial.dig(:function, :arguments)
          # allow for SPACE within arguments
          if args && args != ""
            @args_buffer << args.to_json
            begin
              json_args = JSON.parse(@args_buffer, symbolize_names: true)
              # Values are escaped because the fragment is parsed as markup below;
              # a raw "<" or "&" in an argument would otherwise corrupt the node.
              argument_fragments =
                json_args.reduce(+"") do |memo, (arg_name, value)|
                  memo << "\n<#{arg_name}>#{CGI.escapeHTML(value.to_s)}</#{arg_name}>"
                end
              argument_fragments << "\n"
              @current_function.at("parameters").children =
                Nokogiri::HTML5::DocumentFragment.parse(argument_fragments)
            rescue JSON::ParserError
              # The accumulated text is not valid JSON; leave the parameters as they are.
              return function_buffer
            end
          end
          function_buffer
        end
      end
    end
--- a/spec/fabricators/llm_model_fabricator.rb
+++ b/spec/fabricators/llm_model_fabricator.rb
@ -87,4 +87,5 @@ Fabricator(:ollama_model, from: :llm_model) do
  api_key "ABC"
  tokenizer "DiscourseAi::Tokenizer::Llama3Tokenizer"
  url "http://api.ollama.ai/api/chat"
  provider_params { { enable_native_tool: true } }
 end
--- a/spec/lib/completions/dialects/ollama_spec.rb
+++ b/spec/lib/completions/dialects/ollama_spec.rb
@ -7,6 +7,7 @@ RSpec.describe DiscourseAi::Completions::Dialects::Ollama do
  let(:context) { DialectContext.new(described_class, model) }
  describe "#translate" do
    context "when native tool support is enabled" do
      it "translates a prompt written in our generic format to the Ollama format" do
        ollama_version = [
          { role: "system", content: context.system_insts },
@ -17,6 +18,27 @@ RSpec.describe DiscourseAi::Completions::Dialects::Ollama do
        expect(translated).to eq(ollama_version)
      end
    end
    context "when native tool support is disabled - XML tools" do
      it "includes the instructions in the system message" do
        allow(model).to receive(:lookup_custom_param).with("enable_native_tool").and_return(false)
        DiscourseAi::Completions::Dialects::XmlTools
          .any_instance
          .stubs(:instructions)
          .returns("Instructions")
        ollama_version = [
          { role: "system", content: "#{context.system_insts}\n\nInstructions" },
          { role: "user", content: context.simple_user_input },
        ]
        translated = context.system_user_scenario
        expect(translated).to eq(ollama_version)
      end
    end
    it "trims content if it's getting too long" do
      model.max_prompt_tokens = 5000
@ -33,4 +55,40 @@ RSpec.describe DiscourseAi::Completions::Dialects::Ollama do
      expect(context.dialect(nil).max_prompt_tokens).to eq(10_000)
    end
  end
  describe "#tools" do
    context "when native tools are enabled" do
      it "returns the translated tools from the OllamaTools class" do
        tool = instance_double(DiscourseAi::Completions::Dialects::OllamaTools)
        allow(model).to receive(:lookup_custom_param).with("enable_native_tool").and_return(true)
        allow(tool).to receive(:translated_tools)
        allow(DiscourseAi::Completions::Dialects::OllamaTools).to receive(:new).and_return(tool)
        context.dialect_tools
        expect(DiscourseAi::Completions::Dialects::OllamaTools).to have_received(:new).with(
          context.prompt.tools,
        )
        expect(tool).to have_received(:translated_tools)
      end
    end
    context "when native tools are disabled" do
      it "returns the translated tools from the XmlTools class" do
        tool = instance_double(DiscourseAi::Completions::Dialects::XmlTools)
        allow(model).to receive(:lookup_custom_param).with("enable_native_tool").and_return(false)
        allow(tool).to receive(:translated_tools)
        allow(DiscourseAi::Completions::Dialects::XmlTools).to receive(:new).and_return(tool)
        context.dialect_tools
        expect(DiscourseAi::Completions::Dialects::XmlTools).to have_received(:new).with(
          context.prompt.tools,
        )
        expect(tool).to have_received(:translated_tools)
      end
    end
  end
 end
--- a/spec/lib/completions/dialects/ollama_tools_spec.rb
+++ b/spec/lib/completions/dialects/ollama_tools_spec.rb
@ -0,0 +1,112 @@
 # frozen_string_literal: true
 require_relative "dialect_context"
 RSpec.describe DiscourseAi::Completions::Dialects::OllamaTools do
  describe "#translated_tools" do
    it "translates a tool from our generic format to the Ollama format" do
      tools = [
        {
          name: "github_file_content",
          description: "Retrieves the content of specified GitHub files",
          parameters: [
            {
              name: "repo_name",
              description: "The name of the GitHub repository (e.g., 'discourse/discourse')",
              type: "string",
              required: true,
            },
            {
              name: "file_paths",
              description: "The paths of the files to retrieve within the repository",
              type: "array",
              item_type: "string",
              required: true,
            },
            {
              name: "branch",
              description: "The branch or commit SHA to retrieve the files from (default: 'main')",
              type: "string",
              required: false,
            },
          ],
        },
      ]
      ollama_tools = described_class.new(tools)
      translated_tools = ollama_tools.translated_tools
      expect(translated_tools).to eq(
        [
          {
            type: "function",
            function: {
              name: "github_file_content",
              description: "Retrieves the content of specified GitHub files",
              parameters: {
                type: "object",
                properties: {
                  "repo_name" => {
                    description: "The name of the GitHub repository (e.g., 'discourse/discourse')",
                    type: "string",
                  },
                  "file_paths" => {
                    description: "The paths of the files to retrieve within the repository",
                    type: "array",
                  },
                  "branch" => {
                    description:
                      "The branch or commit SHA to retrieve the files from (default: 'main')",
                    type: "string",
                  },
                },
                required: %w[repo_name file_paths],
              },
            },
          },
        ],
      )
    end
  end
  describe "#from_raw_tool_call" do
    # The raw message carries a tool name so the example also verifies that the
    # name is copied into the function details next to the parsed content.
    it "converts a raw tool call to the Ollama tool format" do
      raw_message = {
        name: "github_file_content",
        content: '{"repo_name":"discourse/discourse","file_paths":["README.md"],"branch":"main"}',
      }
      ollama_tools = described_class.new([])
      tool_call = ollama_tools.from_raw_tool_call(raw_message)
      expect(tool_call).to eq(
        {
          role: "assistant",
          content: nil,
          tool_calls: [
            {
              type: "function",
              function: {
                repo_name: "discourse/discourse",
                file_paths: ["README.md"],
                branch: "main",
                name: "github_file_content",
              },
            },
          ],
        },
      )
    end
  end
  describe "#from_raw_tool" do
    it "converts a raw tool to the Ollama tool format" do
      raw_message = { content: "Hello, world!", name: "github_file_content" }
      ollama_tools = described_class.new([])
      tool = ollama_tools.from_raw_tool(raw_message)
      expect(tool).to eq({ role: "tool", content: "Hello, world!", name: "github_file_content" })
    end
  end
 end
--- a/spec/lib/completions/endpoints/ollama_spec.rb
+++ b/spec/lib/completions/endpoints/ollama_spec.rb
@ -3,8 +3,13 @@
 require_relative "endpoint_compliance"
 class OllamaMock < EndpointMock
-  def response(content)
+  def response(content, tool_call: false)
-    message_content = { content: content }
+    message_content =
      if tool_call
        { content: "", tool_calls: [content] }
      else
        { content: content }
      end
    {
      created_at: "2024-09-25T06:47:21.283028Z",
@ -21,11 +26,11 @@ class OllamaMock < EndpointMock
    }
  end
-  def stub_response(prompt, response_text)
+  def stub_response(prompt, response_text, tool_call: false)
    WebMock
      .stub_request(:post, "http://api.ollama.ai/api/chat")
-      .with(body: request_body(prompt))
+      .with(body: request_body(prompt, tool_call: tool_call))
-      .to_return(status: 200, body: JSON.dump(response(response_text)))
+      .to_return(status: 200, body: JSON.dump(response(response_text, tool_call: tool_call)))
  end
  def stream_line(delta)
@ -71,14 +76,50 @@ class OllamaMock < EndpointMock
    WebMock
      .stub_request(:post, "http://api.ollama.ai/api/chat")
-      .with(body: request_body(prompt, stream: true))
+      .with(body: request_body(prompt))
      .to_return(status: 200, body: chunks)
    yield if block_given?
  end
-  def request_body(prompt, stream: false)
+  def tool_response
-    model.default_options.merge(messages: prompt).tap { |b| b[:stream] = false if !stream }.to_json
+    { function: { name: "get_weather", arguments: { location: "Sydney", unit: "c" } } }
  end
  # Tool definition the mock places under :tools in the expected request body.
  # Key order and strings are significant because the body is compared as JSON text.
  def tool_payload
    location = { type: "string", description: "the city name" }
    unit = {
      type: "string",
      description: "the unit of measurement celcius c or fahrenheit f",
      enum: %w[c f],
    }
    parameters = {
      type: "object",
      properties: {
        location: location,
        unit: unit,
      },
      required: %w[location unit],
    }
    function = {
      name: "get_weather",
      description: "Get the weather in a city",
      parameters: parameters,
    }
    { type: "function", function: function }
  end
  # JSON body the stubbed request is expected to carry: the model defaults plus
  # the messages, always with streaming off, and with the tool definition
  # attached when a tool call is being stubbed.
  def request_body(prompt, tool_call: false)
    body = model.default_options.merge(messages: prompt)
    body[:stream] = false
    body[:tools] = [tool_payload] if tool_call
    body.to_json
  end
 end
@ -100,6 +141,12 @@ RSpec.describe DiscourseAi::Completions::Endpoints::Ollama do
        compliance.regular_mode_simple_prompt(ollama_mock)
      end
    end
    context "with tools" do
      it "returns a function invocation" do
        compliance.regular_mode_tools(ollama_mock)
      end
    end
  end
  describe "when using streaming mode" do