discourse-ai/lib/completions/endpoints/cohere.rb

# frozen_string_literal: true

require "cgi"

module DiscourseAi
  module Completions
    module Endpoints
      class Cohere < Base
        class << self
          # True only when the requested endpoint name is exactly "cohere".
          def can_contact?(endpoint_name)
            endpoint_name == "cohere"
          end

          # Names of the site settings this endpoint depends on.
          def dependant_setting_names
            %w[ai_cohere_api_key]
          end

          # Whether the `ai_cohere_api_key` site setting has a value.
          # The model name argument is ignored.
          def correctly_configured?(_model_name)
            SiteSetting.ai_cohere_api_key.present?
          end

          # Label for this endpoint: "Cohere - " followed by the model name.
          def endpoint_name(model_name)
            "Cohere - #{model_name}"
          end
        end

        # Returns a copy of +model_params+ in which a truthy +:top_p+ entry has
        # been renamed to +:p+. The hash passed in is never modified; when
        # +:top_p+ is absent (or nil/false) the copy is returned unchanged.
        def normalize_model_params(model_params)
          normalized = model_params.dup
          return normalized unless normalized[:top_p]

          normalized[:p] = normalized.delete(:top_p)
          normalized
        end

        # Base request options: a hash that selects the "command-r-plus" model.
        # The +dialect+ argument is not used by this implementation.
        def default_options(dialect)
          { model: "command-r-plus" }
        end

        # Audit-log provider identifier for this endpoint
        # (the AiApiAuditLog::Provider::Cohere constant).
        def provider_id
          AiApiAuditLog::Provider::Cohere
        end

        private

        # URI the chat request is sent to.
        #
        # Uses the URL configured on +llm_model+ when there is one; otherwise
        # falls back to Cohere's public chat endpoint. A blank or
        # whitespace-only URL is treated the same as a missing one, so the
        # request never targets a host-less URI.
        #
        # @return [URI]
        def model_uri
          url = llm_model&.url.to_s.strip
          url = "https://api.cohere.ai/v1/chat" if url.empty?

          URI(url)
        end

        # Builds the request payload hash.
        #
        # Layers, later entries winning: default_options(dialect), then
        # +model_params+, then every key of +prompt+. On top of that:
        # * non-blank +prompt[:tools]+ are set and +force_single_step+ is
        #   turned off,
        # * non-blank +prompt[:tool_results]+ are set,
        # * +stream+ is switched on when @streaming_mode is truthy.
        def prepare_payload(prompt, model_params, dialect)
          tools = prompt[:tools]
          tool_results = prompt[:tool_results]

          default_options(dialect)
            .merge(model_params)
            .merge(prompt)
            .tap do |body|
              if tools.present?
                body[:tools] = tools
                body[:force_single_step] = false
              end

              body[:tool_results] = tool_results if tool_results.present?
              body[:stream] = true if @streaming_mode
            end
        end

        # Wraps +payload+ in a POST request aimed at model_uri.
        #
        # The request declares a JSON content type and authenticates with a
        # bearer token: the API key on +llm_model+ when available, otherwise
        # the +ai_cohere_api_key+ site setting. +payload+ is used as the
        # request body as-is.
        def prepare_request(payload)
          api_key = llm_model&.api_key || SiteSetting.ai_cohere_api_key
          headers = {
            "Content-Type" => "application/json",
            "Authorization" => "Bearer #{api_key}",
          }

          request = Net::HTTP::Post.new(model_uri, headers)
          request.body = payload
          request
        end

        # Parses one raw JSON response (or one streamed event) and returns the
        # piece of completion it carries.
        #
        # Non-streaming: records the billed input/output token counts and
        # returns the response text as a string ("" when there is none).
        #
        # Streaming, by +event_type+:
        # * "text-generation"       -> the event's text
        # * "tool-calls-generation" -> the tool calls serialized as JSON and
        #                              @has_tool set, or "" when the event
        #                              carries no tool calls
        # * "stream-end"            -> records billed token counts, returns nil
        # * anything else           -> nil
        def extract_completion_from(response_raw)
          parsed = JSON.parse(response_raw, symbolize_names: true)

          unless @streaming_mode
            @input_tokens = parsed.dig(:meta, :billed_units, :input_tokens)
            @output_tokens = parsed.dig(:meta, :billed_units, :output_tokens)
            return parsed[:text].to_s
          end

          case parsed[:event_type]
          when "text-generation"
            parsed[:text]
          when "tool-calls-generation"
            # The event may arrive without any actual calls in it.
            tool_calls = parsed[:tool_calls]
            return "" unless tool_calls.present?

            @has_tool = true
            tool_calls.to_json
          when "stream-end"
            @input_tokens = parsed.dig(:response, :meta, :billed_units, :input_tokens)
            @output_tokens = parsed.dig(:response, :meta, :billed_units, :output_tokens)
            nil
          end
        end

        # Returns the @has_tool flag, which extract_completion_from sets when a
        # streamed event carries tool calls. The argument is ignored; the
        # result is nil until the flag has been set.
        def has_tool?(_ignored)
          @has_tool
        end

        # Always true for this endpoint.
        def native_tool_support?
          true
        end

        # Writes the tool calls found in +partial+ into +function_buffer+.
        #
        # +partial+ is a JSON array of tool calls, each with a "name" and an
        # optional "parameters" object. Every call fills an <invoke> node: the
        # existing one while its tool_name is still blank, otherwise a fresh
        # node appended under <function_calls>. Each parameter becomes a child
        # element named after its key.
        #
        # Parameter values are HTML-escaped before being parsed into nodes, so
        # a value containing "<", ">" or "&" stays plain text instead of being
        # interpreted as markup. A call without parameters yields an empty
        # parameter list rather than raising.
        #
        # @param function_buffer the buffer to update (queried with #at)
        # @param partial [String, nil] JSON produced for a tool-calls event
        # @param payload unused by this endpoint
        # @return the same +function_buffer+
        def add_to_function_buffer(function_buffer, partial: nil, payload: nil)
          return function_buffer unless partial

          JSON
            .parse(partial)
            .each do |tool|
              name = tool["name"]
              xml_params =
                (tool["parameters"] || {})
                  .map { |key, value| "<#{key}>#{CGI.escapeHTML(value.to_s)}</#{key}>\n" }
                  .join

              current_function = function_buffer.at("invoke")
              if current_function.nil? || current_function.at("tool_name").content.present?
                current_function =
                  function_buffer.at("function_calls").add_child(
                    Nokogiri::HTML5::DocumentFragment.parse(noop_function_call_text + "\n"),
                  )
              end

              # "search_local" is reported under the name "search".
              current_function.at("tool_name").content = name == "search_local" ? "search" : name
              current_function.at("parameters").children =
                Nokogiri::HTML5::DocumentFragment.parse(xml_params)
            end

          function_buffer
        end

        # Copies the token counts captured while reading the response onto
        # +log+. A count that was never captured leaves the corresponding log
        # attribute as it was.
        def final_log_update(log)
          input_count, output_count = @input_tokens, @output_tokens

          log.request_tokens = input_count if input_count
          log.response_tokens = output_count if output_count
        end

        # Splits a decoded chunk into its newline-delimited partials.
        #
        # Blank and whitespace-only lines are dropped: they can never be a
        # valid JSON event, and String#split never produces nil, so nothing
        # else would filter them out before they reach the JSON parser.
        # Non-blank lines are returned unmodified.
        #
        # @param decoded_chunk [String]
        # @return [Array<String>]
        def partials_from(decoded_chunk)
          decoded_chunk.split("\n").reject { |line| line.strip.empty? }
        end

        # Flattens a prompt hash into a single string for token counting.
        #
        # Concatenates, in this order: the chat history entries joined by
        # newlines, then +prompt[:message]+, then +prompt[:preamble]+. Parts
        # that are missing are skipped.
        #
        # History text is read from an entry's +content+ or +message+ key
        # (symbol or string). Cohere's v1 chat history format carries the text
        # under +message+, so reading +content+ alone would leave the history
        # out of the count. Entries with neither key contribute an empty line.
        #
        # @param prompt [Hash]
        # @return [String]
        def extract_prompt_for_tokenizer(prompt)
          text = +""

          if prompt[:chat_history]
            history_lines =
              prompt[:chat_history].map do |entry|
                entry[:content] || entry["content"] || entry[:message] || entry["message"] || ""
              end
            text << history_lines.join("\n")
          end

          text << prompt[:message] if prompt[:message]
          text << prompt[:preamble] if prompt[:preamble]

          text
        end
      end
    end
  end
end
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`# frozen_string_literal: true`

			`module DiscourseAi`
			`module Completions`
			`module Endpoints`
			`class Cohere < Base`
			`class << self`
HACK: Llama3 support for summarization/AI helper. (#616) There are still some limitations to which models we can support with the `LlmModel` class. This will enable support for Llama3 while we sort those out. 2024-05-13 14:54:42 -04:00			`def can_contact?(endpoint_name)`
			`endpoint_name == "cohere"`
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`end`

			`def dependant_setting_names`
			`%w[ai_cohere_api_key]`
			`end`

HACK: Llama3 support for summarization/AI helper. (#616) There are still some limitations to which models we can support with the `LlmModel` class. This will enable support for Llama3 while we sort those out. 2024-05-13 14:54:42 -04:00			`def correctly_configured?(_model_name)`
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`SiteSetting.ai_cohere_api_key.present?`
			`end`

			`def endpoint_name(model_name)`
			`"Cohere - #{model_name}"`
			`end`
			`end`

			`def normalize_model_params(model_params)`
			`model_params = model_params.dup`
			`model_params[:p] = model_params.delete(:top_p) if model_params[:top_p]`
			`model_params`
			`end`

			`def default_options(dialect)`
FEATURE: Add native Cohere tool support (#655) Add native Cohere tool support - Introduce CohereTools class for tool translation and result processing - Update Command dialect to integrate with CohereTools - Modify Cohere endpoint to support passing tools and processing tool calls - Add spec for testing tool triggering with Cohere endpoint 2024-06-03 18:59:15 -04:00			`{ model: "command-r-plus" }`
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`end`

			`def provider_id`
			`AiApiAuditLog::Provider::Cohere`
			`end`

			`private`

			`def model_uri`
FEATURE: Set endpoint credentials directly from LlmModel. (#625) * FEATURE: Set endpoint credentials directly from LlmModel. Drop Llama2Tokenizer since we no longer use it. * Allow http for custom LLMs --------- Co-authored-by: Rafael Silva <xfalcox@gmail.com> 2024-05-16 08:50:22 -04:00			`url = llm_model&.url || "https://api.cohere.ai/v1/chat"`

			`URI(url)`
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`end`

			`def prepare_payload(prompt, model_params, dialect)`
			`payload = default_options(dialect).merge(model_params).merge(prompt)`
FEATURE: Add native Cohere tool support (#655) Add native Cohere tool support - Introduce CohereTools class for tool translation and result processing - Update Command dialect to integrate with CohereTools - Modify Cohere endpoint to support passing tools and processing tool calls - Add spec for testing tool triggering with Cohere endpoint 2024-06-03 18:59:15 -04:00			`if prompt[:tools].present?`
			`payload[:tools] = prompt[:tools]`
			`payload[:force_single_step] = false`
			`end`
			`payload[:tool_results] = prompt[:tool_results] if prompt[:tool_results].present?`
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`payload[:stream] = true if @streaming_mode`

			`payload`
			`end`

			`def prepare_request(payload)`
			`headers = {`
			`"Content-Type" => "application/json",`
FEATURE: Set endpoint credentials directly from LlmModel. (#625) * FEATURE: Set endpoint credentials directly from LlmModel. Drop Llama2Tokenizer since we no longer use it. * Allow http for custom LLMs --------- Co-authored-by: Rafael Silva <xfalcox@gmail.com> 2024-05-16 08:50:22 -04:00			`"Authorization" => "Bearer #{llm_model&.api_key || SiteSetting.ai_cohere_api_key}",`
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`}`

			`Net::HTTP::Post.new(model_uri, headers).tap { |r| r.body = payload }`
			`end`

			`def extract_completion_from(response_raw)`
			`parsed = JSON.parse(response_raw, symbolize_names: true)`

			`if @streaming_mode`
			`if parsed[:event_type] == "text-generation"`
			`parsed[:text]`
FEATURE: Add native Cohere tool support (#655) Add native Cohere tool support - Introduce CohereTools class for tool translation and result processing - Update Command dialect to integrate with CohereTools - Modify Cohere endpoint to support passing tools and processing tool calls - Add spec for testing tool triggering with Cohere endpoint 2024-06-03 18:59:15 -04:00			`elsif parsed[:event_type] == "tool-calls-generation"`
			`# could just be random thinking...`
			`if parsed.dig(:tool_calls).present?`
			`@has_tool = true`
			`parsed.dig(:tool_calls).to_json`
			`else`
			`""`
			`end`
FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`else`
			`if parsed[:event_type] == "stream-end"`
			`@input_tokens = parsed.dig(:response, :meta, :billed_units, :input_tokens)`
			`@output_tokens = parsed.dig(:response, :meta, :billed_units, :output_tokens)`
			`end`
			`nil`
			`end`
			`else`
			`@input_tokens = parsed.dig(:meta, :billed_units, :input_tokens)`
			`@output_tokens = parsed.dig(:meta, :billed_units, :output_tokens)`
			`parsed[:text].to_s`
			`end`
			`end`

FEATURE: Add native Cohere tool support (#655) Add native Cohere tool support - Introduce CohereTools class for tool translation and result processing - Update Command dialect to integrate with CohereTools - Modify Cohere endpoint to support passing tools and processing tool calls - Add spec for testing tool triggering with Cohere endpoint 2024-06-03 18:59:15 -04:00			`def has_tool?(_ignored)`
			`@has_tool`
			`end`

			`def native_tool_support?`
			`true`
			`end`

			`def add_to_function_buffer(function_buffer, partial: nil, payload: nil)`
			`if partial`
			`tools = JSON.parse(partial)`
			`tools.each do |tool|`
			`name = tool["name"]`
			`parameters = tool["parameters"]`
			`xml_params = parameters.map { |k, v| "<#{k}>#{v}</#{k}>\n" }.join`

			`current_function = function_buffer.at("invoke")`
			`if current_function.nil? || current_function.at("tool_name").content.present?`
			`current_function =`
			`function_buffer.at("function_calls").add_child(`
			`Nokogiri::HTML5::DocumentFragment.parse(noop_function_call_text + "\n"),`
			`)`
			`end`

			`current_function.at("tool_name").content = name == "search_local" ? "search" : name`
			`current_function.at("parameters").children =`
			`Nokogiri::HTML5::DocumentFragment.parse(xml_params)`
			`end`
			`end`
			`function_buffer`
			`end`

FEATURE: Cohere Command R support (#558) - Added Cohere Command models (Command, Command Light, Command R, Command R Plus) to the available model list - Added a new site setting `ai_cohere_api_key` for configuring the Cohere API key - Implemented a new `DiscourseAi::Completions::Endpoints::Cohere` class to handle interactions with the Cohere API, including: - Translating request parameters to the Cohere API format - Parsing Cohere API responses - Supporting streaming and non-streaming completions - Supporting "tools" which allow the model to call back to discourse to lookup additional information - Implemented a new `DiscourseAi::Completions::Dialects::Command` class to translate between the generic Discourse AI prompt format and the Cohere Command format - Added specs covering the new Cohere endpoint and dialect classes - Updated `DiscourseAi::AiBot::Bot.guess_model` to map the new Cohere model to the appropriate bot user In summary, this PR adds support for using the Cohere Command family of models with the Discourse AI plugin. It handles configuring API keys, making requests to the Cohere API, and translating between Discourse's generic prompt format and Cohere's specific format. Thorough test coverage was added for the new functionality. 2024-04-10 17:24:17 -04:00			`def final_log_update(log)`
			`log.request_tokens = @input_tokens if @input_tokens`
			`log.response_tokens = @output_tokens if @output_tokens`
			`end`

			`def partials_from(decoded_chunk)`
			`decoded_chunk.split("\n").compact`
			`end`

			`def extract_prompt_for_tokenizer(prompt)`
			`text = +""`
			`if prompt[:chat_history]`
			`text << prompt[:chat_history]`
			`.map { |message| message[:content] || message["content"] || "" }`
			`.join("\n")`
			`end`

			`text << prompt[:message] if prompt[:message]`
			`text << prompt[:preamble] if prompt[:preamble]`

			`text`
			`end`
			`end`
			`end`
			`end`
			`end`