discourse-ai/lib/modules/ai_bot/open_ai_bot.rb

# frozen_string_literal: true

module DiscourseAi
  module AiBot
    class OpenAiBot < Bot
      def self.can_reply_as?(bot_user)
        open_ai_bot_ids = [
          DiscourseAi::AiBot::EntryPoint::GPT4_ID,
          DiscourseAi::AiBot::EntryPoint::GPT3_5_TURBO_ID,
        ]

        open_ai_bot_ids.include?(bot_user.id)
      end
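
      # Remaining token budget for the request prompt, e.g. GPT-4: 8192 - 3500 = 4692
      # tokens (the reserved amount covers the reply max_tokens plus ~500 spare).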
      def prompt_limit
        # note GPT counts both reply and request tokens in limits...
        # also allow for an extra 500 or so spare tokens
        if bot_user.id == DiscourseAi::AiBot::EntryPoint::GPT4_ID
          8192 - 3500
        else
          16_384 - 2000
        end
      end
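
      # Default sampling parameters; GPT-4 is given a longer reply budget than GPT-3.5.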
      def reply_params
        max_tokens =
          if bot_user.id == DiscourseAi::AiBot::EntryPoint::GPT4_ID
            3000
          else
            1500
          end

        { temperature: 0.4, top_p: 0.9, max_tokens: max_tokens }
      end
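
      # Sends the prompt to OpenAI, merging any caller-supplied sampling overrides
      # into reply_params (nil overrides keep the defaults) and exposing the
      # available commands as OpenAI function definitions.
      #
      # Illustrative use (prompt shape and block signature are assumptions, not
      # defined in this file):
      #   submit_prompt(messages, temperature: 0.2) { |partial, cancel| ... }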
      def submit_prompt(
        prompt,
        prefer_low_cost: false,
        temperature: nil,
        top_p: nil,
        max_tokens: nil,
        &blk
      )
        params =
          reply_params.merge(
            temperature: temperature,
            top_p: top_p,
            max_tokens: max_tokens,
            functions: available_functions,
          ) { |key, old_value, new_value| new_value.nil? ? old_value : new_value }

        model = model_for(low_cost: prefer_low_cost)

        DiscourseAi::Inference::OpenAiCompletions.perform!(prompt, model, **params, &blk)
      end
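
      # Delegates tokenization to the OpenAI tokenizer so token counts match the model.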
      def tokenize(text)
        DiscourseAi::Tokenizer::OpenAiTokenizer.tokenize(text)
      end
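
      # Builds (and memoizes) an OpenAI function definition for every available
      # command, including each command's parameters.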
      def available_functions
        # note if defined? can be a problem in test
        # this can never be nil so it is safe
        return @available_functions if @available_functions

        functions = []

        functions =
          available_commands.map do |command|
            function =
              DiscourseAi::Inference::OpenAiCompletions::Function.new(
                name: command.name,
                description: command.desc,
              )

            command.parameters.each do |parameter|
              function.add_parameter(
                name: parameter.name,
                type: parameter.type,
                description: parameter.description,
                required: parameter.required,
              )
            end

            function
          end

        @available_functions = functions
      end
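
      # Commands the bot may invoke; some are only offered when the relevant
      # site settings are configured.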
      def available_commands
        # note: Summarize command is not ready yet, leave it out for now
        @cmds ||=
          [
            Commands::CategoriesCommand,
            Commands::TimeCommand,
            Commands::SearchCommand,
          ].tap do |cmds|
            cmds << Commands::TagsCommand if SiteSetting.tagging_enabled
            cmds << Commands::ImageCommand if SiteSetting.ai_stability_api_key.present?
            if SiteSetting.ai_google_custom_search_api_key.present? &&
                 SiteSetting.ai_google_custom_search_cx.present?
              cmds << Commands::GoogleCommand
            end
          end
      end
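
      # Picks the OpenAI model: GPT-4 for the GPT-4 bot user unless a low-cost model
      # is explicitly preferred, otherwise the 16k GPT-3.5 variant.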
      def model_for(low_cost: false)
        return "gpt-4-0613" if bot_user.id == DiscourseAi::AiBot::EntryPoint::GPT4_ID && !low_cost
        "gpt-3.5-turbo-16k"
      end
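
      # OpenAI only accepts 1-64 chars of [a-zA-Z0-9_-] in a message's name field,
      # so anything else is replaced with underscores and truncated.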
      def clean_username(username)
        if username.match?(/\A[a-zA-Z0-9_-]{1,64}\z/)
          username
        else
          # not the best in the world, but this is what we have to work with
          # if sites enable unicode usernames this can get messy
          username.gsub(/[^a-zA-Z0-9_-]/, "_")[0..63]
        end
      end

      private
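
      # Accumulates a streamed function_call: records the function name when present
      # and appends argument fragments as they arrive.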
      def populate_functions(partial, functions)
        fn = partial.dig(:choices, 0, :delta, :function_call)
        if fn
          functions.add_function(fn[:name]) if fn[:name].present?
          functions.add_argument_fragment(fn[:arguments]) if fn[:arguments].present?
        end
      end
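
      # Maps a post's author and content to an OpenAI chat message: role is
      # function/system/assistant/user depending on who wrote it, and a sanitized
      # name is attached where OpenAI allows one.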
      def build_message(poster_username, content, function: false, system: false)
        is_bot = poster_username == bot_user.username

        if function
          role = "function"
        elsif system
          role = "system"
        else
          role = is_bot ? "assistant" : "user"
        end

        result = { role: role, content: content }

        if function
          result[:name] = poster_username
        elsif !system && poster_username != bot_user.username && poster_username.present?
          # OpenAI restricts the name field to 64 chars of A-Za-z0-9_- (work around)
          result[:name] = clean_username(poster_username)
        end

        result
      end
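
      # Extracts the text fragment from a streamed completion chunk (empty string if none).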
      def get_delta(partial, _context)
        partial.dig(:choices, 0, :delta, :content).to_s
      end
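
      # Asks the model for a suggested title, capped at 40 tokens.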
      def get_updated_title(prompt)
        DiscourseAi::Inference::OpenAiCompletions.perform!(
          prompt,
          model_for,
          temperature: 0.7,
          top_p: 0.9,
          max_tokens: 40,
        ).dig(:choices, 0, :message, :content)
      end
    end
  end
end