FIX: Llm selector / forced tools / search tool (#862)

* FIX: Llm selector / forced tools / search tool


This fixes a few issues:

1. When search was not finding any semantic results we would break the tool
2. Gemini / Anthropic models did not implement forced tools previously despite it being an API option
3. Mechanics around displaying the LLM selector were not right. If the LLM selector was disabled server side, persona PMs did not work correctly.
4. Disabling native tools for Anthropic models was moved out of a site setting and into a per-model option. This deliberately does not migrate the old setting, because this feature is rarely needed now; people who had it set probably did not need it.
5. Updates anthropic model names to latest release

* linting

* fix a couple of tests I missed

* clean up conditional
This commit is contained in:
Sam 2024-10-25 06:24:53 +11:00 committed by GitHub
parent 3022d34613
commit 4923837165
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
16 changed files with 121 additions and 40 deletions

View File

@ -19,6 +19,10 @@ class LlmModel < ActiveRecord::Base
aws_bedrock: { aws_bedrock: {
access_key_id: :text, access_key_id: :text,
region: :text, region: :text,
disable_native_tools: :checkbox,
},
anthropic: {
disable_native_tools: :checkbox,
}, },
open_ai: { open_ai: {
organization: :text, organization: :text,

View File

@ -15,7 +15,7 @@ function isBotMessage(composer, currentUser) {
const reciepients = composer.targetRecipients.split(","); const reciepients = composer.targetRecipients.split(",");
return currentUser.ai_enabled_chat_bots return currentUser.ai_enabled_chat_bots
.filter((bot) => !bot.is_persona) .filter((bot) => bot.username)
.any((bot) => reciepients.any((username) => username === bot.username)); .any((bot) => reciepients.any((username) => username === bot.username));
} }
return false; return false;
@ -43,7 +43,7 @@ export default class BotSelector extends Component {
constructor() { constructor() {
super(...arguments); super(...arguments);
if (this.botOptions && this.composer) { if (this.botOptions && this.botOptions.length && this.composer) {
let personaId = this.preferredPersonaStore.getObject("id"); let personaId = this.preferredPersonaStore.getObject("id");
this._value = this.botOptions[0].id; this._value = this.botOptions[0].id;
@ -57,13 +57,18 @@ export default class BotSelector extends Component {
this.composer.metaData = { ai_persona_id: this._value }; this.composer.metaData = { ai_persona_id: this._value };
this.setAllowLLMSelector(); this.setAllowLLMSelector();
if (this.hasLlmSelector) {
let llm = this.preferredLlmStore.getObject("id"); let llm = this.preferredLlmStore.getObject("id");
const llmOption = const llmOption =
this.llmOptions.find((innerLlmOption) => innerLlmOption.id === llm) || this.llmOptions.find((innerLlmOption) => innerLlmOption.id === llm) ||
this.llmOptions[0]; this.llmOptions[0];
if (llmOption) {
llm = llmOption.id; llm = llmOption.id;
} else {
llm = "";
}
if (llm) { if (llm) {
next(() => { next(() => {
@ -71,15 +76,30 @@ export default class BotSelector extends Component {
}); });
} }
} }
next(() => {
this.resetTargetRecipients();
});
}
} }
get composer() { get composer() {
return this.args?.outletArgs?.model; return this.args?.outletArgs?.model;
} }
get hasLlmSelector() {
return this.currentUser.ai_enabled_chat_bots.any((bot) => !bot.is_persona);
}
get botOptions() { get botOptions() {
if (this.currentUser.ai_enabled_personas) { if (this.currentUser.ai_enabled_personas) {
return this.currentUser.ai_enabled_personas.map((persona) => { let enabledPersonas = this.currentUser.ai_enabled_personas;
if (!this.hasLlmSelector) {
enabledPersonas = enabledPersonas.filter((persona) => persona.username);
}
return enabledPersonas.map((persona) => {
return { return {
id: persona.id, id: persona.id,
name: persona.name, name: persona.name,
@ -106,6 +126,11 @@ export default class BotSelector extends Component {
} }
setAllowLLMSelector() { setAllowLLMSelector() {
if (!this.hasLlmSelector) {
this.allowLLMSelector = false;
return;
}
const persona = this.currentUser.ai_enabled_personas.find( const persona = this.currentUser.ai_enabled_personas.find(
(innerPersona) => innerPersona.id === this._value (innerPersona) => innerPersona.id === this._value
); );

View File

@ -329,6 +329,7 @@ en:
organization: "Optional OpenAI Organization ID" organization: "Optional OpenAI Organization ID"
disable_system_prompt: "Disable system message in prompts" disable_system_prompt: "Disable system message in prompts"
enable_native_tool: "Enable native tool support" enable_native_tool: "Enable native tool support"
disable_native_tools: "Disable native tool support (use XML based tools)"
related_topics: related_topics:
title: "Related Topics" title: "Related Topics"

View File

@ -49,7 +49,6 @@ en:
ai_openai_embeddings_url: "Custom URL used for the OpenAI embeddings API. (in the case of Azure it can be: https://COMPANY.openai.azure.com/openai/deployments/DEPLOYMENT/embeddings?api-version=2023-05-15)" ai_openai_embeddings_url: "Custom URL used for the OpenAI embeddings API. (in the case of Azure it can be: https://COMPANY.openai.azure.com/openai/deployments/DEPLOYMENT/embeddings?api-version=2023-05-15)"
ai_openai_api_key: "API key for OpenAI API. ONLY used for embeddings and Dall-E. For GPT use the LLM config tab" ai_openai_api_key: "API key for OpenAI API. ONLY used for embeddings and Dall-E. For GPT use the LLM config tab"
ai_anthropic_native_tool_call_models: "List of models that will use native tool calls vs legacy XML based tools."
ai_hugging_face_tei_endpoint: URL where the API is running for the Hugging Face text embeddings inference ai_hugging_face_tei_endpoint: URL where the API is running for the Hugging Face text embeddings inference
ai_hugging_face_tei_api_key: API key for Hugging Face text embeddings inference ai_hugging_face_tei_api_key: API key for Hugging Face text embeddings inference

View File

@ -125,16 +125,6 @@ discourse_ai:
ai_anthropic_api_key: ai_anthropic_api_key:
default: "" default: ""
hidden: true hidden: true
ai_anthropic_native_tool_call_models:
type: list
list_type: compact
default: "claude-3-sonnet|claude-3-haiku"
allow_any: false
choices:
- claude-3-opus
- claude-3-sonnet
- claude-3-haiku
- claude-3-5-sonnet
ai_cohere_api_key: ai_cohere_api_key:
default: "" default: ""
hidden: true hidden: true

View File

@ -145,6 +145,8 @@ module DiscourseAi
persona_users = AiPersona.persona_users(user: scope.user) persona_users = AiPersona.persona_users(user: scope.user)
if persona_users.present? if persona_users.present?
persona_users.filter! { |persona_user| persona_user[:username].present? }
bots_map.concat( bots_map.concat(
persona_users.map do |persona_user| persona_users.map do |persona_user|
{ {

View File

@ -61,7 +61,7 @@ module DiscourseAi
end end
def native_tool_support? def native_tool_support?
SiteSetting.ai_anthropic_native_tool_call_models_map.include?(llm_model.name) !llm_model.lookup_custom_param("disable_native_tools")
end end
private private

View File

@ -27,7 +27,7 @@ module DiscourseAi
when "claude-3-opus" when "claude-3-opus"
"claude-3-opus-20240229" "claude-3-opus-20240229"
when "claude-3-5-sonnet" when "claude-3-5-sonnet"
"claude-3-5-sonnet-20240620" "claude-3-5-sonnet-latest"
else else
llm_model.name llm_model.name
end end
@ -70,7 +70,12 @@ module DiscourseAi
payload[:system] = prompt.system_prompt if prompt.system_prompt.present? payload[:system] = prompt.system_prompt if prompt.system_prompt.present?
payload[:stream] = true if @streaming_mode payload[:stream] = true if @streaming_mode
payload[:tools] = prompt.tools if prompt.has_tools? if prompt.has_tools?
payload[:tools] = prompt.tools
if dialect.tool_choice.present?
payload[:tool_choice] = { type: "tool", name: dialect.tool_choice }
end
end
payload payload
end end

View File

@ -61,7 +61,7 @@ module DiscourseAi
when "claude-3-opus" when "claude-3-opus"
"anthropic.claude-3-opus-20240229-v1:0" "anthropic.claude-3-opus-20240229-v1:0"
when "claude-3-5-sonnet" when "claude-3-5-sonnet"
"anthropic.claude-3-5-sonnet-20240620-v1:0" "anthropic.claude-3-5-sonnet-20241022-v2:0"
else else
llm_model.name llm_model.name
end end
@ -83,7 +83,13 @@ module DiscourseAi
payload = default_options(dialect).merge(model_params).merge(messages: prompt.messages) payload = default_options(dialect).merge(model_params).merge(messages: prompt.messages)
payload[:system] = prompt.system_prompt if prompt.system_prompt.present? payload[:system] = prompt.system_prompt if prompt.system_prompt.present?
payload[:tools] = prompt.tools if prompt.has_tools?
if prompt.has_tools?
payload[:tools] = prompt.tools
if dialect.tool_choice.present?
payload[:tool_choice] = { type: "tool", name: dialect.tool_choice }
end
end
payload payload
end end

View File

@ -67,7 +67,16 @@ module DiscourseAi
} if prompt[:system_instruction].present? } if prompt[:system_instruction].present?
if tools.present? if tools.present?
payload[:tools] = tools payload[:tools] = tools
payload[:tool_config] = { function_calling_config: { mode: "AUTO" } }
function_calling_config = { mode: "AUTO" }
if dialect.tool_choice.present?
function_calling_config = {
mode: "ANY",
allowed_function_names: [dialect.tool_choice],
}
end
payload[:tool_config] = { function_calling_config: function_calling_config }
end end
payload[:generationConfig].merge!(model_params) if model_params.present? payload[:generationConfig].merge!(model_params) if model_params.present?
payload payload
@ -88,8 +97,10 @@ module DiscourseAi
end end
response_h = parsed.dig(:candidates, 0, :content, :parts, 0) response_h = parsed.dig(:candidates, 0, :content, :parts, 0)
if response_h
@has_function_call ||= response_h.dig(:functionCall).present? @has_function_call ||= response_h.dig(:functionCall).present?
@has_function_call ? response_h[:functionCall] : response_h.dig(:text) @has_function_call ? response_h.dig(:functionCall) : response_h.dig(:text)
end
end end
def partials_from(decoded_chunk) def partials_from(decoded_chunk)

View File

@ -79,7 +79,9 @@ module DiscourseAi
search = Search.new(query, { guardian: guardian }) search = Search.new(query, { guardian: guardian })
search_term = search.term search_term = search.term
return [] if search_term.nil? || search_term.length < SiteSetting.min_search_term_length if search_term.blank? || search_term.length < SiteSetting.min_search_term_length
return Post.none
end
search_embedding = hyde ? hyde_embedding(search_term) : embedding(search_term) search_embedding = hyde ? hyde_embedding(search_term) : embedding(search_term)

View File

@ -35,7 +35,8 @@ RSpec.describe DiscourseAi::Completions::Dialects::Claude do
end end
it "can properly translate a prompt (legacy tools)" do it "can properly translate a prompt (legacy tools)" do
SiteSetting.ai_anthropic_native_tool_call_models = "" llm_model.provider_params["disable_native_tools"] = true
llm_model.save!
tools = [ tools = [
{ {
@ -88,8 +89,6 @@ RSpec.describe DiscourseAi::Completions::Dialects::Claude do
end end
it "can properly translate a prompt (native tools)" do it "can properly translate a prompt (native tools)" do
SiteSetting.ai_anthropic_native_tool_call_models = "claude-3-opus"
tools = [ tools = [
{ {
name: "echo", name: "echo",

View File

@ -48,7 +48,6 @@ RSpec.describe DiscourseAi::Completions::Endpoints::Anthropic do
end end
it "does not eat spaces with tool calls" do it "does not eat spaces with tool calls" do
SiteSetting.ai_anthropic_native_tool_call_models = "claude-3-opus"
body = <<~STRING body = <<~STRING
event: message_start event: message_start
data: {"type":"message_start","message":{"id":"msg_01Ju4j2MiGQb9KV9EEQ522Y3","type":"message","role":"assistant","model":"claude-3-haiku-20240307","content":[],"stop_reason":null,"stop_sequence":null,"usage":{"input_tokens":1293,"output_tokens":1}} } data: {"type":"message_start","message":{"id":"msg_01Ju4j2MiGQb9KV9EEQ522Y3","type":"message","role":"assistant","model":"claude-3-haiku-20240307","content":[],"stop_reason":null,"stop_sequence":null,"usage":{"input_tokens":1293,"output_tokens":1}} }
@ -195,8 +194,6 @@ RSpec.describe DiscourseAi::Completions::Endpoints::Anthropic do
end end
it "supports non streaming tool calls" do it "supports non streaming tool calls" do
SiteSetting.ai_anthropic_native_tool_call_models = "claude-3-opus"
tool = { tool = {
name: "calculate", name: "calculate",
description: "calculate something", description: "calculate something",

View File

@ -28,7 +28,9 @@ RSpec.describe DiscourseAi::Completions::Endpoints::AwsBedrock do
describe "function calling" do describe "function calling" do
it "supports old school xml function calls" do it "supports old school xml function calls" do
SiteSetting.ai_anthropic_native_tool_call_models = "" model.provider_params["disable_native_tools"] = true
model.save!
proxy = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}") proxy = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}")
incomplete_tool_call = <<~XML.strip incomplete_tool_call = <<~XML.strip

View File

@ -138,6 +138,22 @@ RSpec.describe DiscourseAi::AiBot::Tools::Search do
expect(results[:args]).to eq({ search_query: "hello world, sam", status: "public" }) expect(results[:args]).to eq({ search_query: "hello world, sam", status: "public" })
expect(results[:rows].length).to eq(1) expect(results[:rows].length).to eq(1)
# it also works with no query
search =
described_class.new(
{ order: "likes", user: "sam", status: "public", search_query: "a" },
llm: llm,
bot_user: bot_user,
)
# results will be expanded by semantic search, but it will find nothing
results =
DiscourseAi::Completions::Llm.with_prepared_responses(["<ai>#{query}</ai>"]) do
search.invoke(&progress_blk)
end
expect(results[:rows].length).to eq(0)
end end
end end

View File

@ -22,13 +22,35 @@ RSpec.describe "AI chat channel summarization", type: :system, js: true do
group.add(user) group.add(user)
group.save group.save
allowed_persona = AiPersona.last
allowed_persona.update!(allowed_group_ids: [group.id], enabled: true)
visit "/latest" visit "/latest"
expect(page).to have_selector(".ai-bot-button") expect(page).to have_selector(".ai-bot-button")
find(".ai-bot-button").click find(".ai-bot-button").click
# composer is open find(".gpt-persona").click
expect(page).to have_css(".gpt-persona ul li", count: 1)
find(".llm-selector").click
expect(page).to have_css(".llm-selector ul li", count: 2)
expect(page).to have_selector(".d-editor-container") expect(page).to have_selector(".d-editor-container")
# lets disable bots but still allow 1 persona
allowed_persona.create_user!
allowed_persona.update!(default_llm: "custom:#{gpt_4.id}")
gpt_4.update!(enabled_chat_bot: false)
gpt_3_5_turbo.update!(enabled_chat_bot: false)
visit "/latest"
find(".ai-bot-button").click
find(".gpt-persona").click
expect(page).to have_css(".gpt-persona ul li", count: 1)
expect(page).not_to have_selector(".llm-selector")
SiteSetting.ai_bot_add_to_header = false SiteSetting.ai_bot_add_to_header = false
visit "/latest" visit "/latest"
expect(page).not_to have_selector(".ai-bot-button") expect(page).not_to have_selector(".ai-bot-button")