discourse-ai/spec/lib/completions/endpoints/endpoint_compliance.rb

# frozen_string_literal: true

require "net/http"

# Base helper for endpoint specs. It holds canned completion payloads (plain
# text, streamed deltas and an XML tool invocation) and can temporarily swap
# FinalDestination::HTTP for a subclass whose responses stream chunk by chunk.
#
# `stub_response` and `stub_streamed_response` are called below but are not
# defined in this class; presumably each provider-specific subclass supplies
# them (verify against the subclasses).
class EndpointMock
  attr_reader :model

  # @param model [Object] stored as-is and exposed through #model.
  def initialize(model)
    @model = model
  end

  # Stubs a non-streamed completion that answers with #simple_response.
  def stub_simple_call(prompt)
    stub_response(prompt, simple_response)
  end

  # Stubs a non-streamed completion that answers with #tool_response.
  def stub_tool_call(prompt)
    stub_response(prompt, tool_response, tool_call: true)
  end

  # Stubs a streamed completion made of #streamed_simple_deltas, then yields
  # to the caller while the chunk-aware HTTP class is installed.
  def stub_streamed_simple_call(prompt)
    with_chunk_array_support do
      stub_streamed_response(prompt, streamed_simple_deltas)
      yield
    end
  end

  # Stubs a streamed completion made of #tool_deltas, then yields to the
  # caller while the chunk-aware HTTP class is installed.
  def stub_streamed_tool_call(prompt)
    with_chunk_array_support do
      stub_streamed_response(prompt, tool_deltas, tool_call: true)
      yield
    end
  end

  # Canned plain-text completion. The "\\n" sequences are a literal backslash
  # followed by "n", not newline characters.
  def simple_response
    "1. Serenity\\n2. Laughter\\n3. Adventure"
  end

  # Canned streamed completion, one array element per delta.
  def streamed_simple_deltas
    ["Mount", "ain", " ", "Tree ", "Frog"]
  end

  # Canned streamed tool call. The deltas are cut in the middle of tags
  # ("<function" / "_calls>", "</para" / "meters>", "</funct" / "ion_calls>"),
  # so the markup is only complete once the pieces are joined.
  def tool_deltas
    ["Let me use a tool for that<function", <<~REPLY.strip, <<~REPLY.strip, <<~REPLY.strip]
      _calls>
      <invoke>
      <tool_name>get_weather</tool_name>
      <parameters>
      <location>Sydney</location>
      <unit>c</unit>
      </para
      REPLY
      meters>
      </invoke>
      </funct
      REPLY
      ion_calls>
      REPLY
  end

  # The tool call as a single, non-streamed string.
  def tool_response
    tool_deltas.join
  end

  # The tool invocation text that the compliance checks compare completions
  # against. Unlike #tool_response it has no leading prose, carries a
  # <tool_id> element and ends with a newline.
  def invocation_response
    <<~TEXT
      <function_calls>
      <invoke>
      <tool_name>get_weather</tool_name>
      <parameters>
      <location>Sydney</location>
      <unit>c</unit>
      </parameters>
      <tool_id>tool_0</tool_id>
      </invoke>
      </function_calls>
    TEXT
  end

  def tool_id
    "get_weather"
  end

  # Tool definition handed to prompts in the tool-calling checks.
  def tool
    {
      name: "get_weather",
      description: "Get the weather in a city",
      parameters: [
        { name: "location", type: "string", description: "the city name", required: true },
        {
          name: "unit",
          type: "string",
          description: "the unit of measurement celcius c or fahrenheit f",
          enum: %w[c f],
          required: true,
        },
      ],
    }
  end

  # Replaces FinalDestination::HTTP with the class built by #mocked_http for
  # the duration of the block, then puts the previous class back, even when
  # the block raises. Returns the block's value.
  def with_chunk_array_support
    replacement = mocked_http

    # The displaced class lives in a local, not an instance variable, so a
    # nested call on the same instance cannot overwrite what this call has to
    # restore.
    displaced = ::FinalDestination.send(:remove_const, :HTTP)
    ::FinalDestination.send(:const_set, :HTTP, replacement)

    # The ensure only covers the period after the swap: if building the
    # replacement or removing the constant fails, nothing is "restored".
    begin
      yield
    ensure
      ::FinalDestination.send(:remove_const, :HTTP)
      ::FinalDestination.send(:const_set, :HTTP, displaced)
    end
  end

  # Convenience form for callers that only need the HTTP swap and no model.
  def self.with_chunk_array_support(&blk)
    self.new(nil).with_chunk_array_support(&blk)
  end

  protected

  # Copied from https://github.com/bblimke/webmock/issues/629
  # Workaround for stubbing a streamed response
  #
  # Builds an anonymous subclass of the current FinalDestination::HTTP whose
  # #request patches each response: read_body with a block hands every
  # element of @body to that block via #each, and without a block it falls
  # back to the response's own read_body.
  # NOTE(review): this presumes the stubbed @body responds to #each (e.g. an
  # Array of chunks) - confirm against the stub_streamed_response helpers.
  def mocked_http
    Class.new(FinalDestination::HTTP) do
      def request(*)
        super do |response|
          response.instance_eval do
            def read_body(*, &block)
              if block_given?
                @body.each(&block)
              else
                super
              end
            end
          end

          yield response if block_given?

          response
        end
      end
    end
  end
end

# Reusable checks that a provider endpoint spec runs against its endpoint.
# Each public *_mode_* method stubs the exchange through the given mock,
# performs a completion and asserts on the outcome.
class EndpointsCompliance
  attr_reader :rspec, :endpoint, :dialect_klass, :user

  # expect / eq / be_present are forwarded to the object passed in as +rspec+.
  delegate :expect, :eq, :be_present, to: :rspec

  # @param rspec [Object] receiver of the delegated expectation helpers
  # @param endpoint [Object] endpoint under test
  # @param dialect_klass [Class] instantiated with (prompt, endpoint.model)
  # @param user [Object] passed to perform_completion! and matched by id in the audit log
  def initialize(rspec, endpoint, dialect_klass, user)
    @rspec, @endpoint, @dialect_klass, @user = rspec, endpoint, dialect_klass, user
  end

  # Builds the minimal prompt every check starts from.
  def generic_prompt(tools: [])
    user_turn = { type: :user, content: "write 3 words" }

    DiscourseAi::Completions::Prompt.new("You write words", messages: [user_turn], tools: tools)
  end

  # Returns a fresh dialect instance wrapping +prompt+ on every call.
  def dialect(prompt: generic_prompt)
    dialect_klass.new(prompt, endpoint.model)
  end

  # Non-streamed completion without tools: checks the returned text and the
  # single audit log row written for it.
  def regular_mode_simple_prompt(mock)
    mock.stub_simple_call(dialect.translate)

    answer = endpoint.perform_completion!(dialect, user)
    expect(answer).to eq(mock.simple_response)

    audit = verified_single_audit_log
    expect(audit.raw_response_payload).to eq(mock.response(answer).to_json)
    expect(audit.request_tokens).to eq(endpoint.prompt_size(dialect.translate))
    expect(audit.response_tokens).to eq(endpoint.tokenizer.size(answer))
  end

  # Non-streamed completion with a tool: the result must equal the mock's
  # invocation text.
  def regular_mode_tools(mock)
    tool_dialect = dialect(prompt: generic_prompt(tools: [mock.tool]))
    mock.stub_tool_call(tool_dialect.translate)

    answer = endpoint.perform_completion!(tool_dialect, user)
    expect(answer).to eq(mock.invocation_response)
  end

  # Streamed completion without tools: cancels once two space-separated words
  # have arrived, then checks the audit log row.
  def streaming_mode_simple_prompt(mock)
    mock.stub_streamed_simple_call(dialect.translate) do
      received = +""

      endpoint.perform_completion!(dialect, user) do |partial, cancel|
        received << partial
        cancel.call if received.split(" ").length == 2
      end

      audit = verified_single_audit_log
      expect(audit.raw_response_payload).to be_present
      expect(audit.request_tokens).to eq(endpoint.prompt_size(dialect.translate))
      # The logged response is expected to cover every delta except the last.
      expect(audit.response_tokens).to eq(
        endpoint.tokenizer.size(mock.streamed_simple_deltas[0...-1].join),
      )
    end
  end

  # Streamed completion with a tool: cancels as soon as the opening
  # <function_calls> tag is seen and compares what was accumulated.
  def streaming_mode_tools(mock)
    tool_dialect = dialect(prompt: generic_prompt(tools: [mock.tool]))

    mock.stub_streamed_tool_call(tool_dialect.translate) do
      received = +""

      endpoint.perform_completion!(tool_dialect, user) do |partial, cancel|
        received << partial
        cancel.call if received.include?("<function_calls>")
      end

      expect(received).to eq(mock.invocation_response)
    end
  end

  private

  # Asserts exactly one audit log row exists, checks the fields both
  # simple-prompt modes verify first, and returns that row.
  def verified_single_audit_log
    expect(AiApiAuditLog.count).to eq(1)

    AiApiAuditLog.first.tap do |entry|
      expect(entry.provider_id).to eq(endpoint.provider_id)
      expect(entry.user_id).to eq(user.id)
      expect(entry.raw_request_payload).to be_present
    end
  end
end
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`# frozen_string_literal: true`

			`require "net/http"`

			`class EndpointMock`
			`def initialize(model)`
			`@model = model`
			`end`

			`attr_reader :model`

			`def stub_simple_call(prompt)`
			`stub_response(prompt, simple_response)`
			`end`

			`def stub_tool_call(prompt)`
			`stub_response(prompt, tool_response, tool_call: true)`
			`end`

			`def stub_streamed_simple_call(prompt)`
			`with_chunk_array_support do`
			`stub_streamed_response(prompt, streamed_simple_deltas)`
			`yield`
			`end`
			`end`

			`def stub_streamed_tool_call(prompt)`
			`with_chunk_array_support do`
			`stub_streamed_response(prompt, tool_deltas, tool_call: true)`
			`yield`
			`end`
			`end`

			`def simple_response`
			`"1. Serenity\\n2. Laughter\\n3. Adventure"`
			`end`

			`def streamed_simple_deltas`
			`["Mount", "ain", " ", "Tree ", "Frog"]`
			`end`

			`def tool_deltas`
			`["Let me use a tool for that<function", <<~REPLY.strip, <<~REPLY.strip, <<~REPLY.strip]`
			`_calls>`
			`<invoke>`
			`<tool_name>get_weather</tool_name>`
			`<parameters>`
			`<location>Sydney</location>`
			`<unit>c</unit>`
			`</para`
			`REPLY`
			`meters>`
			`</invoke>`
			`</funct`
			`REPLY`
			`ion_calls>`
			`REPLY`
			`end`

			`def tool_response`
			`tool_deltas.join`
			`end`

			`def invocation_response`
			`<<~TEXT`
			`<function_calls>`
			`<invoke>`
			`<tool_name>get_weather</tool_name>`
			`<parameters>`
			`<location>Sydney</location>`
			`<unit>c</unit>`
			`</parameters>`
FEATURE: Add GitHub Helper AI Bot persona and tools (#513) Introduces a new AI Bot persona called 'GitHub Helper' which is specialized in assisting with GitHub-related tasks and questions. It includes the following key changes: - Implements the GitHub Helper persona class with its system prompt and available tools - Adds three new AI Bot tools for GitHub interactions: - github_file_content: Retrieves content of files from a GitHub repository - github_pull_request_diff: Retrieves the diff for a GitHub pull request - github_search_code: Searches for code in a GitHub repository - Updates the AI Bot dialects to support the new GitHub tools - Implements multiple function calls for standard tool dialect 2024-03-07 14:37:23 -05:00			`<tool_id>tool_0</tool_id>`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`</invoke>`
			`</function_calls>`
			`TEXT`
			`end`

			`def tool_id`
			`"get_weather"`
			`end`

			`def tool`
			`{`
			`name: "get_weather",`
			`description: "Get the weather in a city",`
			`parameters: [`
			`{ name: "location", type: "string", description: "the city name", required: true },`
			`{`
			`name: "unit",`
			`type: "string",`
			`description: "the unit of measurement celcius c or fahrenheit f",`
			`enum: %w[c f],`
			`required: true,`
			`},`
			`],`
			`}`
			`end`

			`def with_chunk_array_support`
			`mock = mocked_http`
SECURITY: Place a SSRF protection when calling services from the plugin. (#485) The Faraday adapter and `FinalDestionation::HTTP` will protect us from admin-initiated SSRF attacks when interacting with the external services powering this plugin features.: 2024-02-21 15:14:50 -05:00			`@original_net_http = ::FinalDestination.send(:remove_const, :HTTP)`
			`::FinalDestination.send(:const_set, :HTTP, mock)`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00
			`yield`
			`ensure`
SECURITY: Place a SSRF protection when calling services from the plugin. (#485) The Faraday adapter and `FinalDestionation::HTTP` will protect us from admin-initiated SSRF attacks when interacting with the external services powering this plugin features.: 2024-02-21 15:14:50 -05:00			`::FinalDestination.send(:remove_const, :HTTP)`
			`::FinalDestination.send(:const_set, :HTTP, @original_net_http)`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`end`

FEATURE: add Claude 3 Haiku bot support (#552) it is close in performance to GPT 4 at a fraction of the cost, nice to add it to the mix. Also improves a test case to simulate streaming, I am hunting for the "calls" word that is jumping into function calls and can't quite find it. 2024-04-03 01:06:27 -04:00			`def self.with_chunk_array_support(&blk)`
			`self.new(nil).with_chunk_array_support(&blk)`
			`end`

DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`protected`

			`# Copied from https://github.com/bblimke/webmock/issues/629`
			`# Workaround for stubbing a streamed response`
			`def mocked_http`
SECURITY: Place a SSRF protection when calling services from the plugin. (#485) The Faraday adapter and `FinalDestionation::HTTP` will protect us from admin-initiated SSRF attacks when interacting with the external services powering this plugin features.: 2024-02-21 15:14:50 -05:00			`Class.new(FinalDestination::HTTP) do`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`def request(*)`
			`super do \|response\|`
			`response.instance_eval do`
			`def read_body(*, &block)`
			`if block_given?`
			`@body.each(&block)`
			`else`
			`super`
			`end`
			`end`
			`end`

			`yield response if block_given?`

			`response`
			`end`
			`end`
			`end`
			`end`
			`end`

			`class EndpointsCompliance`
			`def initialize(rspec, endpoint, dialect_klass, user)`
			`@rspec = rspec`
			`@endpoint = endpoint`
			`@dialect_klass = dialect_klass`
			`@user = user`
			`end`

			`delegate :expect, :eq, :be_present, to: :rspec`

			`def generic_prompt(tools: [])`
			`DiscourseAi::Completions::Prompt.new(`
			`"You write words",`
			`messages: [{ type: :user, content: "write 3 words" }],`
			`tools: tools,`
			`)`
			`end`

			`def dialect(prompt: generic_prompt)`
			`dialect_klass.new(prompt, endpoint.model)`
			`end`

			`def regular_mode_simple_prompt(mock)`
			`mock.stub_simple_call(dialect.translate)`

			`completion_response = endpoint.perform_completion!(dialect, user)`

			`expect(completion_response).to eq(mock.simple_response)`

			`expect(AiApiAuditLog.count).to eq(1)`
			`log = AiApiAuditLog.first`

			`expect(log.provider_id).to eq(endpoint.provider_id)`
			`expect(log.user_id).to eq(user.id)`
			`expect(log.raw_request_payload).to be_present`
			`expect(log.raw_response_payload).to eq(mock.response(completion_response).to_json)`
			`expect(log.request_tokens).to eq(endpoint.prompt_size(dialect.translate))`
			`expect(log.response_tokens).to eq(endpoint.tokenizer.size(completion_response))`
			`end`

			`def regular_mode_tools(mock)`
			`prompt = generic_prompt(tools: [mock.tool])`
			`a_dialect = dialect(prompt: prompt)`
			`mock.stub_tool_call(a_dialect.translate)`

			`completion_response = endpoint.perform_completion!(a_dialect, user)`
			`expect(completion_response).to eq(mock.invocation_response)`
			`end`

			`def streaming_mode_simple_prompt(mock)`
			`mock.stub_streamed_simple_call(dialect.translate) do`
			`completion_response = +""`

			`endpoint.perform_completion!(dialect, user) do \|partial, cancel\|`
			`completion_response << partial`
			`cancel.call if completion_response.split(" ").length == 2`
			`end`

			`expect(AiApiAuditLog.count).to eq(1)`
			`log = AiApiAuditLog.first`

			`expect(log.provider_id).to eq(endpoint.provider_id)`
			`expect(log.user_id).to eq(user.id)`
			`expect(log.raw_request_payload).to be_present`
			`expect(log.raw_response_payload).to be_present`
			`expect(log.request_tokens).to eq(endpoint.prompt_size(dialect.translate))`
			`expect(log.response_tokens).to eq(`
			`endpoint.tokenizer.size(mock.streamed_simple_deltas[0...-1].join),`
			`)`
			`end`
			`end`

			`def streaming_mode_tools(mock)`
			`prompt = generic_prompt(tools: [mock.tool])`
			`a_dialect = dialect(prompt: prompt)`

			`mock.stub_streamed_tool_call(a_dialect.translate) do`
			`buffered_partial = +""`

			`endpoint.perform_completion!(a_dialect, user) do \|partial, cancel\|`
			`buffered_partial << partial`
			`cancel.call if buffered_partial.include?("<function_calls>")`
			`end`

			`expect(buffered_partial).to eq(mock.invocation_response)`
			`end`
			`end`

			`attr_reader :rspec, :endpoint, :dialect_klass, :user`
			`end`