FIX: guide GPT 3.5 better (#77)
* FIX: guide GPT 3.5 better

  This limits search results to 10, because we were blowing the whole token budget on search results. It also includes a quick exchange at the start of a session to try to guide GPT 3.5 to follow instructions. Sadly, GPT 3.5 drifts off very quickly, but this does improve things a bit. The change also attempts to correct some issues with Anthropic, though that model is still surprisingly hard to ground.

* Add status:public to searches. This is a bit of a hack, but it ensures that the search works with any filter provided.

* Fix specs
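A rough Ruby sketch of the two guardrails described above (illustrative only; grounded_messages and clamp_search_limit are invented names, the real changes are in the Bot and SearchCommand diffs below):

  # Prepend a tiny example exchange so GPT-3.5 sees a !command being obeyed
  # before the real conversation starts (mirrors the unshifts added in Bot).
  def grounded_messages(system_prompt, conversation)
    [
      { role: "system", content: system_prompt },
      { role: "user", content: "please echo 1" },
      { role: "assistant", content: "!echo 1" },
    ] + conversation
  end

  # Cap search results so a single !search can't eat the whole token budget.
  def clamp_search_limit(limit)
    limit ||= 10
    limit > 10 ? 10 : limit
  end

The prepended order matches the diff: system prompt first, then the user/assistant echo pair, then the real conversation.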
parent b82fc1e692
commit d85b503ed4
@@ -15,6 +15,26 @@ module DiscourseAi
        7500 # https://console.anthropic.com/docs/prompt-design#what-is-a-prompt
      end

+     def get_delta(partial, context)
+       context[:pos] ||= 0
+
+       full = partial[:completion]
+       delta = full[context[:pos]..-1]
+       context[:pos] = full.length
+
+       if !context[:processed]
+         delta = ""
+         index = full.index("Assistant: ")
+         if index
+           delta = full[index + 11..-1]
+           context[:processed] = true
+         end
+       end
+
+       delta
+     end
+
      private

      def build_message(poster_username, content, system: false)
@@ -27,10 +47,6 @@ module DiscourseAi
        "claude-v1"
      end

-     def update_with_delta(_, partial)
-       partial[:completion]
-     end
-
      def get_updated_title(prompt)
        DiscourseAi::Inference::AnthropicCompletions.perform!(
          prompt,
@@ -3,6 +3,8 @@
module DiscourseAi
  module AiBot
    class Bot
      attr_reader :bot_user

      BOT_NOT_FOUND = Class.new(StandardError)
      MAX_COMPLETIONS = 3

@@ -50,13 +52,14 @@ module DiscourseAi
        end

        redis_stream_key = nil
-       reply = bot_reply_post ? bot_reply_post.raw : ""
+       reply = +(bot_reply_post ? bot_reply_post.raw.dup : "")
        start = Time.now

        setup_cancel = false
+       context = {}

        submit_prompt(prompt, prefer_low_cost: prefer_low_cost) do |partial, cancel|
-         reply = update_with_delta(reply, partial)
+         reply << get_delta(partial, context)

          if redis_stream_key && !Discourse.redis.get(redis_stream_key)
            cancel&.call
@@ -92,6 +95,7 @@ module DiscourseAi

        if bot_reply_post
          publish_update(bot_reply_post, done: true)

          bot_reply_post.revise(
            bot_user,
            { raw: reply },
@@ -154,6 +158,9 @@ module DiscourseAi
          memo.unshift(build_message(username, raw))
        end

+       # we need this to ground the model (especially GPT-3.5)
+       messages.unshift(build_message(bot_user.username, "!echo 1"))
+       messages.unshift(build_message("user", "please echo 1"))
        messages.unshift(build_message(bot_user.username, rendered_system_prompt, system: true))
        messages
      end
@@ -205,7 +212,9 @@ module DiscourseAi
        The participants in this conversation are: #{post.topic.allowed_users.map(&:username).join(", ")}
        The date now is: #{Time.zone.now}, much has changed since you were trained.

        You can complete some tasks using multiple steps and have access to some special commands!
        You can complete some tasks using !commands.

        NEVER ask user to issue !commands, they have no access, only you do.

        #{available_commands.map(&:desc).join("\n")}
@@ -233,9 +242,11 @@ module DiscourseAi
        raise NotImplemented
      end

      protected
+     def get_delta(partial, context)
+       raise NotImplemented
+     end

      attr_reader :bot_user
      protected

      def get_updated_title(prompt)
        raise NotImplemented
@@ -245,10 +256,6 @@ module DiscourseAi
        raise NotImplemented
      end

-     def get_delta_from(partial)
-       raise NotImplemented
-     end
-
      def conversation_context(post)
        context =
          post
@@ -29,6 +29,10 @@ module DiscourseAi
        @args = args
      end

+     def bot
+       @bot ||= DiscourseAi::AiBot::Bot.as(bot_user)
+     end
+
      def standalone?
        false
      end
@@ -81,6 +85,9 @@ module DiscourseAi

        raw << custom_raw if custom_raw.present?

+       replacement = "!#{self.class.name} #{args}"
+       raw = post.raw.sub(replacement, raw) if post.raw.include?(replacement)
+
        if chain_next_response
          post.raw = raw
          post.save!(validate: false)
@@ -93,10 +93,18 @@ module DiscourseAi::AiBot::Commands

      @last_query = search_string
      results =
-       Search.execute(search_string.to_s, search_type: :full_page, guardian: Guardian.new())
+       Search.execute(
+         search_string.to_s + " status:public",
+         search_type: :full_page,
+         guardian: Guardian.new(),
+       )
+
+     # let's be frugal with tokens, 50 results is too much and stuff gets cut off
+     limit ||= 10
+     limit = 10 if limit > 10

      posts = results&.posts || []
-     posts = posts[0..limit - 1] if limit
+     posts = posts[0..limit - 1]

      @last_num_results = posts.length
@@ -84,10 +84,6 @@ module DiscourseAi::AiBot::Commands
        false
      end

-     def bot
-       @bot ||= DiscourseAi::AiBot::Bot.as(bot_user)
-     end
-
      def summarize(data, guidance, topic)
        text = +""
        data.each do |id, post_number, raw, username|
@@ -75,8 +75,8 @@ module DiscourseAi
        "gpt-3.5-turbo"
      end

-     def update_with_delta(current_delta, partial)
-       current_delta + partial.dig(:choices, 0, :delta, :content).to_s
+     def get_delta(partial, _context)
+       partial.dig(:choices, 0, :delta, :content).to_s
      end

      def get_updated_title(prompt)
@@ -0,0 +1,27 @@
+# frozen_string_literal: true
+
+RSpec.describe DiscourseAi::AiBot::AnthropicBot do
+  describe "#update_with_delta" do
+    def bot_user
+      User.find(DiscourseAi::AiBot::EntryPoint::GPT4_ID)
+    end
+
+    subject { described_class.new(bot_user) }
+
+    describe "get_delta" do
+      it "can properly remove Assistant prefix" do
+        context = {}
+        reply = +""
+
+        reply << subject.get_delta({ completion: "\n\nAssist" }, context)
+        expect(reply).to eq("")
+
+        reply << subject.get_delta({ completion: "\n\nAssistant: test" }, context)
+        expect(reply).to eq("test")
+
+        reply << subject.get_delta({ completion: "\n\nAssistant: test\nworld" }, context)
+        expect(reply).to eq("test\nworld")
+      end
+    end
+  end
+end
@@ -43,7 +43,7 @@ RSpec.describe DiscourseAi::AiBot::Bot do
    it "can respond to !search" do
      bot.system_prompt_style!(:simple)

-     expected_response = "!search test search"
+     expected_response = "ok, searching...\n!search test search"

      prompt = bot.bot_prompt_with_topic_context(second_post)
@@ -65,12 +65,14 @@ RSpec.describe DiscourseAi::AiBot::Bot do
      bot.reply_to(second_post)

      last = second_post.topic.posts.order("id desc").first
-     expect(last.post_custom_prompt.custom_prompt.to_s).to include("We are done now")

      expect(last.raw).to include("<details>")
      expect(last.raw).to include("<summary>Search</summary>")
      expect(last.raw).not_to include("translation missing")
+     expect(last.raw).to include("ok, searching...")
      expect(last.raw).to include("We are done now")

+     expect(last.post_custom_prompt.custom_prompt.to_s).to include("We are done now")
    end
  end
@@ -13,7 +13,7 @@ RSpec.describe DiscourseAi::AiBot::Commands::SearchCommand do
      post1 = Fabricate(:post)
      search = described_class.new(bot_user, post1)

-     results = search.process("order:fake")
+     results = search.process("order:fake ABDDCDCEDGDG")
      expect(results).to eq("No results found")
    end
@@ -29,6 +29,10 @@ RSpec.describe DiscourseAi::AiBot::Commands::SearchCommand do

      # title + 2 rows
      expect(results.split("\n").length).to eq(3)
+
+     # just searching for everything
+     results = search.process("order:latest_topic")
+     expect(results.split("\n").length).to be > 1
    end
  end
end
@@ -63,7 +63,8 @@ RSpec.describe Jobs::CreateAiReply do
    end

    context "when chatting with Claude from Anthropic" do
-     let(:deltas) { expected_response.split(" ").map { |w| "#{w} " } }
+     let(:claude_response) { "Assistant: #{expected_response}" }
+     let(:deltas) { claude_response.split(" ").map { |w| "#{w} " } }

      before do
        bot_user = User.find(DiscourseAi::AiBot::EntryPoint::CLAUDE_V1_ID)
@@ -20,7 +20,7 @@ RSpec.describe DiscourseAi::AiBot::OpenAiBot do
    it "includes it in the prompt" do
      prompt_messages = subject.bot_prompt_with_topic_context(post_1)

-     post_1_message = prompt_messages[1]
+     post_1_message = prompt_messages[-1]

      expect(post_1_message[:role]).to eq("user")
      expect(post_1_message[:content]).to eq("#{post_1.user.username}: #{post_body(1)}")
@@ -33,11 +33,11 @@ RSpec.describe DiscourseAi::AiBot::OpenAiBot do
    it "trims the prompt" do
      prompt_messages = subject.bot_prompt_with_topic_context(post_1)

      expect(prompt_messages[0][:role]).to eq("system")
-     expect(prompt_messages[1][:role]).to eq("user")
+     expect(prompt_messages[-2][:role]).to eq("assistant")
+     expect(prompt_messages[-1][:role]).to eq("user")
      # trimming is tricky... it needs to account for system message as
      # well... just make sure we trim for now
-     expect(prompt_messages[1][:content].length).to be < post_1.raw.length
+     expect(prompt_messages[-1][:content].length).to be < post_1.raw.length
    end
  end
@@ -51,14 +51,15 @@ RSpec.describe DiscourseAi::AiBot::OpenAiBot do
    it "includes them in the prompt respecting the post number order" do
      prompt_messages = subject.bot_prompt_with_topic_context(post_3)

-     expect(prompt_messages[1][:role]).to eq("user")
-     expect(prompt_messages[1][:content]).to eq("#{post_1.username}: #{post_body(1)}")
+     # negative cause we may have grounding prompts
+     expect(prompt_messages[-3][:role]).to eq("user")
+     expect(prompt_messages[-3][:content]).to eq("#{post_1.username}: #{post_body(1)}")

-     expect(prompt_messages[2][:role]).to eq("assistant")
-     expect(prompt_messages[2][:content]).to eq(post_body(2))
+     expect(prompt_messages[-2][:role]).to eq("assistant")
+     expect(prompt_messages[-2][:content]).to eq(post_body(2))

-     expect(prompt_messages[3][:role]).to eq("user")
-     expect(prompt_messages[3][:content]).to eq("#{post_3.username}: #{post_body(3)}")
+     expect(prompt_messages[-1][:role]).to eq("user")
+     expect(prompt_messages[-1][:content]).to eq("#{post_3.username}: #{post_body(3)}")
    end
  end
end