discourse-ai/spec/lib/completions/endpoints/gemini_spec.rb

# frozen_string_literal: true

require_relative "endpoint_compliance"

# Test double for the Gemini completion endpoint. It fabricates response
# payloads shaped like Gemini API replies and registers WebMock stubs for the
# gemini-pro generateContent / streamGenerateContent URLs.
class GeminiMock < EndpointMock
  # Builds a complete (non-streamed) response payload as a Ruby hash.
  #
  # content   - the text to return, or (when tool_call is true) a ready-made
  #             part hash such as the one returned by #tool_response.
  # tool_call - when true, content is inserted as the part verbatim instead of
  #             being wrapped in { text: ... }.
  #
  # Returns a Hash; callers serialize it themselves.
  def response(content, tool_call: false)
    part = tool_call ? content : { text: content }

    {
      candidates: [
        {
          content: {
            parts: [part],
            role: "model",
          },
          finishReason: "STOP",
          index: 0,
          safetyRatings: negligible_safety_ratings,
        },
      ],
      promptFeedback: {
        safetyRatings: negligible_safety_ratings,
      },
    }
  end

  # Registers a WebMock stub for the gemini-pro generateContent URL that only
  # matches when the request body equals #request_body for the given prompt,
  # and answers with the JSON-dumped #response payload.
  def stub_response(prompt, response_text, tool_call: false)
    endpoint_url =
      "https://generativelanguage.googleapis.com/v1beta/models/gemini-pro:generateContent?key=#{SiteSetting.ai_gemini_api_key}"

    WebMock
      .stub_request(:post, endpoint_url)
      .with(body: request_body(prompt, tool_call))
      .to_return(status: 200, body: JSON.dump(response(response_text, tool_call: tool_call)))
  end

  # Serializes a single streamed candidate to a JSON string.
  #
  # delta         - text fragment, or a part hash when tool_call is true.
  # finish_reason - value for finishReason; nil unless the caller sets it.
  #
  # Unlike #response, the payload carries no promptFeedback section.
  def stream_line(delta, finish_reason: nil, tool_call: false)
    part = tool_call ? delta : { text: delta }

    candidate = {
      content: {
        parts: [part],
        role: "model",
      },
      finishReason: finish_reason,
      index: 0,
      safetyRatings: negligible_safety_ratings,
    }

    { candidates: [candidate] }.to_json
  end

  # Registers a WebMock stub for the gemini-pro streamGenerateContent URL.
  #
  # Every delta becomes one #stream_line; only the final one is marked with
  # finishReason "STOP". The lines are wrapped as "[\n" ... "\n,\n" ... "\n]"
  # and the resulting string is broken into single characters, so the stubbed
  # body is an array of one-character strings.
  # NOTE(review): an array body is presumably replayed piecewise through
  # EndpointMock's chunk-array support - confirm against EndpointMock.
  def stub_streamed_response(prompt, deltas, tool_call: false)
    final_index = deltas.length - 1

    lines =
      deltas.each_with_index.map do |delta, position|
        stream_line(
          delta,
          finish_reason: (position == final_index ? "STOP" : nil),
          tool_call: tool_call,
        )
      end

    body_chars = "[\n#{lines.join("\n,\n")}\n]".chars

    endpoint_url =
      "https://generativelanguage.googleapis.com/v1beta/models/gemini-pro:streamGenerateContent?key=#{SiteSetting.ai_gemini_api_key}"

    WebMock
      .stub_request(:post, endpoint_url)
      .with(body: request_body(prompt, tool_call))
      .to_return(status: 200, body: body_chars)
  end

  # Function declaration for the sample "get_weather" tool that is embedded in
  # the expected request body when a tool call is being exercised.
  def tool_payload
    location_schema = { type: "string", description: "the city name" }
    unit_schema = {
      type: "string",
      description: "the unit of measurement celcius c or fahrenheit f",
      enum: %w[c f],
    }

    {
      name: "get_weather",
      description: "Get the weather in a city",
      parameters: {
        type: "object",
        required: %w[location unit],
        properties: {
          "location" => location_schema,
          "unit" => unit_schema,
        },
      },
    }
  end

  # JSON request body the stubs expect: the model's default options merged
  # with the prompt under :contents, plus a :tools entry wrapping
  # #tool_payload when tool_call is truthy.
  def request_body(prompt, tool_call)
    body = model.default_options.merge(contents: prompt)
    body[:tools] = [{ function_declarations: [tool_payload] }] if tool_call
    body.to_json
  end

  # Successive functionCall parts for "get_weather" whose args grow from empty
  # to complete; intended to be fed to #stub_streamed_response as deltas.
  def tool_deltas
    [{}, { location: "" }, { location: "Sydney", unit: "c" }].map do |args|
      { "functionCall" => { name: "get_weather", args: args } }
    end
  end

  # The complete functionCall part, equal to the last entry of #tool_deltas.
  def tool_response
    tool_deltas.last
  end

  private

  # Fresh list of safety ratings, one per harm category, all "NEGLIGIBLE".
  # A new array is built on every call so payload sections never share state.
  def negligible_safety_ratings
    %w[
      HARM_CATEGORY_SEXUALLY_EXPLICIT
      HARM_CATEGORY_HATE_SPEECH
      HARM_CATEGORY_HARASSMENT
      HARM_CATEGORY_DANGEROUS_CONTENT
    ].map { |category| { category: category, probability: "NEGLIGIBLE" } }
  end
end

# Specs for the Gemini completion endpoint: tool configuration, image
# (vision) payloads and reassembly of badly chunked streamed responses.
RSpec.describe DiscourseAi::Completions::Endpoints::Gemini do
  subject(:endpoint) { described_class.new(model) }

  fab!(:model) { Fabricate(:gemini_model, vision_enabled: true) }

  fab!(:user)

  # 100x100 JPEG fixture, uploaded on behalf of the system user.
  let(:image100x100) { plugin_file_from_fixtures("100x100.jpg") }
  let(:upload100x100) do
    UploadCreator.new(image100x100, "image.jpg").create_for(Discourse.system_user.id)
  end

  let(:gemini_mock) { GeminiMock.new(endpoint) }

  # Not referenced by any example visible in this file.
  let(:compliance) do
    EndpointsCompliance.new(self, endpoint, DiscourseAi::Completions::Dialects::Gemini, user)
  end

  let(:echo_tool) do
    {
      name: "echo",
      description: "echo something",
      parameters: [{ name: "text", type: "string", description: "text to echo", required: true }],
    }
  end

  # by default gemini is meant to use AUTO mode, however new experimental models
  # appear to require this to be explicitly set
  it "Explicitly specifies tool config" do
    prompt = DiscourseAi::Completions::Prompt.new("Hello", tools: [echo_tool])
    canned_reply = gemini_mock.response("World").to_json
    llm = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}")

    # The body matcher accepts every request and remembers the raw body so it
    # can be inspected after the call.
    captured_body = nil
    body_recorder =
      proc do |raw_body|
        captured_body = raw_body
        true
      end

    # NOTE(review): "123" is presumably the fabricated model's API key - confirm.
    stub_request(:post, "#{model.url}:generateContent?key=123").with(
      body: body_recorder,
    ).to_return(status: 200, body: canned_reply)

    completion = llm.generate(prompt, user: user)
    expect(completion).to eq("World")

    sent = JSON.parse(captured_body, symbolize_names: true)
    expect(sent[:tool_config]).to eq({ function_calling_config: { mode: "AUTO" } })
  end

  it "Supports Vision API" do
    user_message = { type: :user, id: "user1", content: "hello", upload_ids: [upload100x100.id] }
    prompt = DiscourseAi::Completions::Prompt.new("You are image bot", messages: [user_message])

    encoded = prompt.encoded_uploads(prompt.messages.last)

    canned_reply = gemini_mock.response("World").to_json
    llm = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}")

    # Accept any request body, keeping a copy for the assertion below.
    captured_body = nil
    body_recorder =
      proc do |raw_body|
        captured_body = raw_body
        true
      end

    stub_request(:post, "#{model.url}:generateContent?key=123").with(
      body: body_recorder,
    ).to_return(status: 200, body: canned_reply)

    completion = llm.generate(prompt, user: user)
    expect(completion).to eq("World")

    # Every harm category is expected to be sent with the same threshold.
    safety_settings =
      %w[
        HARM_CATEGORY_HARASSMENT
        HARM_CATEGORY_SEXUALLY_EXPLICIT
        HARM_CATEGORY_HATE_SPEECH
        HARM_CATEGORY_DANGEROUS_CONTENT
      ].map { |category| { "category" => category, "threshold" => "BLOCK_NONE" } }

    image_part = { "inlineData" => { "mimeType" => "image/jpeg", "data" => encoded[0][:base64] } }

    expected_prompt = {
      "generationConfig" => {
      },
      "safetySettings" => safety_settings,
      "contents" => [{ "role" => "user", "parts" => [{ "text" => "hello" }, image_part] }],
      "systemInstruction" => {
        "role" => "system",
        "parts" => [{ "text" => "You are image bot" }],
      },
    }

    expect(JSON.parse(captured_body)).to eq(expected_prompt)
  end

  it "Can correctly handle streamed responses even if they are chunked badly" do
    # Three events separated by "\r\n\r\ndata: ". The "|" characters mark where
    # the stream is cut into chunks, deliberately landing inside the "data: "
    # prefix and inside a JSON payload.
    events = ["Hello", " |World", " Sam"].map { |text| gemini_mock.response(text).to_json }
    raw_stream = "da|ta: |#{events.join("\r\n\r\ndata: ")}"
    chunks = raw_stream.split("|")

    llm = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}")
    stream_url = "#{model.url}:streamGenerateContent?alt=sse&key=123"

    streamed = +""
    gemini_mock.with_chunk_array_support do
      stub_request(:post, stream_url).to_return(status: 200, body: chunks)
      llm.generate("Hello", user: user) { |partial| streamed << partial }
    end

    expect(streamed).to eq("Hello World Sam")
  end
end
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`# frozen_string_literal: true`

DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`require_relative "endpoint_compliance"`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`class GeminiMock < EndpointMock`
DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`def response(content, tool_call: false)`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`{`
			`candidates: [`
			`{`
			`content: {`
DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`parts: [(tool_call ? content : { text: content })],`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`role: "model",`
			`},`
			`finishReason: "STOP",`
			`index: 0,`
			`safetyRatings: [`
			`{ category: "HARM_CATEGORY_SEXUALLY_EXPLICIT", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_HATE_SPEECH", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_HARASSMENT", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_DANGEROUS_CONTENT", probability: "NEGLIGIBLE" },`
			`],`
			`},`
			`],`
			`promptFeedback: {`
			`safetyRatings: [`
			`{ category: "HARM_CATEGORY_SEXUALLY_EXPLICIT", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_HATE_SPEECH", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_HARASSMENT", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_DANGEROUS_CONTENT", probability: "NEGLIGIBLE" },`
			`],`
			`},`
			`}`
			`end`

DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`def stub_response(prompt, response_text, tool_call: false)`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`WebMock`
			`.stub_request(`
			`:post,`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`"https://generativelanguage.googleapis.com/v1beta/models/gemini-pro:generateContent?key=#{SiteSetting.ai_gemini_api_key}",`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`)`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`.with(body: request_body(prompt, tool_call))`
DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`.to_return(status: 200, body: JSON.dump(response(response_text, tool_call: tool_call)))`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`end`

DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`def stream_line(delta, finish_reason: nil, tool_call: false)`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`{`
			`candidates: [`
			`{`
			`content: {`
DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`parts: [(tool_call ? delta : { text: delta })],`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`role: "model",`
			`},`
			`finishReason: finish_reason,`
			`index: 0,`
			`safetyRatings: [`
			`{ category: "HARM_CATEGORY_SEXUALLY_EXPLICIT", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_HATE_SPEECH", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_HARASSMENT", probability: "NEGLIGIBLE" },`
			`{ category: "HARM_CATEGORY_DANGEROUS_CONTENT", probability: "NEGLIGIBLE" },`
			`],`
			`},`
			`],`
			`}.to_json`
			`end`

DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`def stub_streamed_response(prompt, deltas, tool_call: false)`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`chunks =`
			`deltas.each_with_index.map do \|_, index\|`
			`if index == (deltas.length - 1)`
DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`stream_line(deltas[index], finish_reason: "STOP", tool_call: tool_call)`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`else`
DEV: Tool support for the LLM service. (#366) This PR adds tool support to available LLMs. We'll buffer tool invocations and return them instead of making users of this service parse the response. It also adds support for conversation context in the generic prompt. It includes bot messages, user messages, and tool invocations, which we'll trim to make sure it doesn't exceed the prompt limit, then translate them to the correct dialect. Finally, It adds some buffering when reading chunks to handle cases when streaming is extremely slow.:M 2023-12-18 16:06:01 -05:00			`stream_line(deltas[index], tool_call: tool_call)`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`end`
			`end`

FEATURE: AI Bot Gemini support. (#402) It also corrects the syntax around tool support, which was wrong. Gemini doesn't want us to include messages about previous tool invocations, so I had to shuffle around some code to send the response it generated from those invocations instead. For this, I created the "multi_turn" context, which bundles all the context involved in the interaction. 2024-01-04 16:15:34 -05:00			`chunks = chunks.join("\n,\n").prepend("[\n").concat("\n]").split("")`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00
			`WebMock`
			`.stub_request(`
			`:post,`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`"https://generativelanguage.googleapis.com/v1beta/models/gemini-pro:streamGenerateContent?key=#{SiteSetting.ai_gemini_api_key}",`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`)`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`.with(body: request_body(prompt, tool_call))`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`.to_return(status: 200, body: chunks)`
			`end`

DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`def tool_payload`
			`{`
			`name: "get_weather",`
			`description: "Get the weather in a city",`
			`parameters: {`
			`type: "object",`
			`required: %w[location unit],`
			`properties: {`
			`"location" => {`
			`type: "string",`
			`description: "the city name",`
			`},`
			`"unit" => {`
			`type: "string",`
			`description: "the unit of measurement celcius c or fahrenheit f",`
			`enum: %w[c f],`
			`},`
			`},`
			`},`
			`}`
			`end`

			`def request_body(prompt, tool_call)`
			`model`
			`.default_options`
			`.merge(contents: prompt)`
			`.tap { \|b\| b[:tools] = [{ function_declarations: [tool_payload] }] if tool_call }`
			`.to_json`
			`end`

			`def tool_deltas`
			`[`
			`{ "functionCall" => { name: "get_weather", args: {} } },`
			`{ "functionCall" => { name: "get_weather", args: { location: "" } } },`
			`{ "functionCall" => { name: "get_weather", args: { location: "Sydney", unit: "c" } } },`
			`]`
			`end`

			`def tool_response`
			`{ "functionCall" => { name: "get_weather", args: { location: "Sydney", unit: "c" } } }`
			`end`
			`end`

			`RSpec.describe DiscourseAi::Completions::Endpoints::Gemini do`
DEV: Remove old code now that features rely on LlmModels. (#729) * DEV: Remove old code now that features rely on LlmModels. * Hide old settings and migrate persona llm overrides * Remove shadowing special URL + seeding code. Use srv:// prefix instead. 2024-07-30 12:44:57 -04:00			`subject(:endpoint) { described_class.new(model) }`

			`fab!(:model) { Fabricate(:gemini_model, vision_enabled: true) }`
FEATURE: Track if a model can do vision in the llm_models table (#725) * FEATURE: Track if a model can do vision in the llm_models table * Data migration 2024-07-24 15:29:47 -04:00
DEV: Fix new Rubocop offenses 2024-03-05 10:48:28 -05:00			`fab!(:user)`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00
FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00			`let(:image100x100) { plugin_file_from_fixtures("100x100.jpg") }`
			`let(:upload100x100) do`
			`UploadCreator.new(image100x100, "image.jpg").create_for(Discourse.system_user.id)`
			`end`

FEATURE: Add GitHub Helper AI Bot persona and tools (#513) Introduces a new AI Bot persona called 'GitHub Helper' which is specialized in assisting with GitHub-related tasks and questions. It includes the following key changes: - Implements the GitHub Helper persona class with its system prompt and available tools - Adds three new AI Bot tools for GitHub interactions: - github_file_content: Retrieves content of files from a GitHub repository - github_pull_request_diff: Retrieves the diff for a GitHub pull request - github_search_code: Searches for code in a GitHub repository - Updates the AI Bot dialects to support the new GitHub tools - Implements multiple function calls for standard tool dialect 2024-03-07 14:37:23 -05:00			`let(:gemini_mock) { GeminiMock.new(endpoint) }`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00
			`let(:compliance) do`
			`EndpointsCompliance.new(self, endpoint, DiscourseAi::Completions::Dialects::Gemini, user)`
			`end`

FIX: gemini 0801 tool calls (#748) Gemini experimental model requires tool_config. Previously defaults would apply. This corrects prompts containing multiple tools on gemini. 2024-08-12 02:10:16 -04:00			`let(:echo_tool) do`
			`{`
			`name: "echo",`
			`description: "echo something",`
			`parameters: [{ name: "text", type: "string", description: "text to echo", required: true }],`
			`}`
			`end`

			`# by default gemini is meant to use AUTO mode, however new experimental models`
			`# appear to require this to be explicitly set`
			`it "Explicitly specifies tool config" do`
			`prompt = DiscourseAi::Completions::Prompt.new("Hello", tools: [echo_tool])`

			`response = gemini_mock.response("World").to_json`

			`req_body = nil`

			`llm = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}")`
			`url = "#{model.url}:generateContent?key=123"`

			`stub_request(:post, url).with(`
			`body:`
			`proc do \|_req_body\|`
			`req_body = _req_body`
			`true`
			`end,`
			`).to_return(status: 200, body: response)`

			`response = llm.generate(prompt, user: user)`

			`expect(response).to eq("World")`

			`parsed = JSON.parse(req_body, symbolize_names: true)`

			`expect(parsed[:tool_config]).to eq({ function_calling_config: { mode: "AUTO" } })`
			`end`

FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00			`it "Supports Vision API" do`
			`prompt =`
			`DiscourseAi::Completions::Prompt.new(`
			`"You are image bot",`
			`messages: [type: :user, id: "user1", content: "hello", upload_ids: [upload100x100.id]],`
			`)`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00
FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00			`encoded = prompt.encoded_uploads(prompt.messages.last)`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00
FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00			`response = gemini_mock.response("World").to_json`

			`req_body = nil`

FEATURE: Track if a model can do vision in the llm_models table (#725) * FEATURE: Track if a model can do vision in the llm_models table * Data migration 2024-07-24 15:29:47 -04:00			`llm = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}")`
DEV: Remove old code now that features rely on LlmModels. (#729) * DEV: Remove old code now that features rely on LlmModels. * Hide old settings and migrate persona llm overrides * Remove shadowing special URL + seeding code. Use srv:// prefix instead. 2024-07-30 12:44:57 -04:00			`url = "#{model.url}:generateContent?key=123"`
FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00
			`stub_request(:post, url).with(`
			`body:`
			`proc do \|_req_body\|`
			`req_body = _req_body`
			`true`
			`end,`
			`).to_return(status: 200, body: response)`

			`response = llm.generate(prompt, user: user)`

			`expect(response).to eq("World")`

			`expected_prompt = {`
			`"generationConfig" => {`
			`},`
FIX: when creating an llm we were not creating user (#685) This meant that if you toggle ai user early it surprisingly did not work. Also remove safety settings from gemini, it is overly cautious 2024-06-23 19:59:42 -04:00			`"safetySettings" => [`
			`{ "category" => "HARM_CATEGORY_HARASSMENT", "threshold" => "BLOCK_NONE" },`
			`{ "category" => "HARM_CATEGORY_SEXUALLY_EXPLICIT", "threshold" => "BLOCK_NONE" },`
			`{ "category" => "HARM_CATEGORY_HATE_SPEECH", "threshold" => "BLOCK_NONE" },`
			`{ "category" => "HARM_CATEGORY_DANGEROUS_CONTENT", "threshold" => "BLOCK_NONE" },`
			`],`
FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00			`"contents" => [`
			`{`
			`"role" => "user",`
			`"parts" => [`
			`{ "text" => "hello" },`
			`{ "inlineData" => { "mimeType" => "image/jpeg", "data" => encoded[0][:base64] } },`
			`],`
			`},`
			`],`
			`"systemInstruction" => {`
			`"role" => "system",`
			`"parts" => [{ "text" => "You are image bot" }],`
			`},`
			`}`

			`expect(JSON.parse(req_body)).to eq(expected_prompt)`
			`end`

			`it "Can correctly handle streamed responses even if they are chunked badly" do`
			`data = +""`
			`data << "da\|ta: \|"`
			`data << gemini_mock.response("Hello").to_json`
			`data << "\r\n\r\ndata: "`
			`data << gemini_mock.response(" \|World").to_json`
			`data << "\r\n\r\ndata: "`
			`data << gemini_mock.response(" Sam").to_json`

			`split = data.split("\|")`

FEATURE: Track if a model can do vision in the llm_models table (#725) * FEATURE: Track if a model can do vision in the llm_models table * Data migration 2024-07-24 15:29:47 -04:00			`llm = DiscourseAi::Completions::Llm.proxy("custom:#{model.id}")`
DEV: Remove old code now that features rely on LlmModels. (#729) * DEV: Remove old code now that features rely on LlmModels. * Hide old settings and migrate persona llm overrides * Remove shadowing special URL + seeding code. Use srv:// prefix instead. 2024-07-30 12:44:57 -04:00			`url = "#{model.url}:streamGenerateContent?alt=sse&key=123"`
FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00
			`output = +""`
			`gemini_mock.with_chunk_array_support do`
			`stub_request(:post, url).to_return(status: 200, body: split)`
			`llm.generate("Hello", user: user) { \|partial\| output << partial }`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`end`
FIX: correct gemini streaming implementation (#632) This also implements image support and gemini-flash support 2024-05-22 02:35:29 -04:00
			`expect(output).to eq("Hello World Sam")`
DEV: Stop using shared_examples for endpoint specs (#430) 2024-01-17 13:08:49 -05:00			`end`
FEATURE: Support for Gemini in AiHelper / Search / Summarization (#358) 2023-12-15 12:32:01 -05:00			`end`