# frozen_string_literal: true

RSpec.describe DiscourseAi::Summarization::Models::Discourse do
  subject(:model) { described_class.new(model_name, max_tokens: max_tokens) }

  let(:model_name) { "bart-large-cnn-samsum" }
  let(:max_tokens) { 20 }

  let(:content) do
    {
      resource_path: "/t/1/POST_NUMBER",
      content_title: "This is a title",
      contents: [{ poster: "asd", id: 1, text: "This is a text" }],
    }
  end

  before { SiteSetting.ai_summarization_discourse_service_api_endpoint = "https://test.com" }
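
  # Stubs the summarization service's /api/v1/classify endpoint so each example can
  # assert the exact prompt sent and control the summary text that comes back.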
  def stub_request(prompt, response)
    WebMock
      .stub_request(
        :post,
        "#{SiteSetting.ai_summarization_discourse_service_api_endpoint}/api/v1/classify",
      )
      .with(body: JSON.dump(model: model_name, content: prompt))
      .to_return(status: 200, body: JSON.dump(summary_text: response))
  end
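
  # Builds the prompt the model is expected to send: each post rendered as
  # "(<id> <poster> said: <text> " and concatenated in order.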
  def expected_messages(contents, opts)
    contents.reduce("") do |memo, item|
      memo += "(#{item[:id]} #{item[:poster]} said: #{item[:text]} "
    end
  end
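
  # Wraps a single post in the { ids:, summary: } chunk shape that #summarize_in_chunks receives.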
  def as_chunk(item)
    { ids: [item[:id]], summary: "(#{item[:id]} #{item[:poster]} said: #{item[:text]} " }
  end

  describe "#summarize_in_chunks" do
    context "when the content fits in a single chunk" do
      it "performs a request to summarize" do
        opts = content.except(:contents)

        stub_request(expected_messages(content[:contents], opts), "This is summary 1")

        chunks = content[:contents].map { |c| as_chunk(c) }
        summarized_chunks = model.summarize_in_chunks(chunks, opts).map { |c| c[:summary] }

        expect(summarized_chunks).to contain_exactly("This is summary 1")
      end
    end

    context "when the content fits in multiple chunks" do
      it "performs a request for each one to summarize" do
        content[:contents] << {
          poster: "asd2",
          id: 2,
          text: "This is a different text to summarize",
        }
        opts = content.except(:contents)

        content[:contents].each_with_index do |item, idx|
          stub_request(expected_messages([item], opts), "This is summary #{idx + 1}")
        end

        chunks = content[:contents].map { |c| as_chunk(c) }
        summarized_chunks = model.summarize_in_chunks(chunks, opts).map { |c| c[:summary] }

        expect(summarized_chunks).to contain_exactly("This is summary 1", "This is summary 2")
      end
    end
  end

  describe "#concatenate_summaries" do
    it "combines all the different summaries into a single one" do
      messages = ["summary 1", "summary 2"].join("\n")

      stub_request(messages, "concatenated summary")

      expect(model.concatenate_summaries(["summary 1", "summary 2"])).to eq("concatenated summary")
    end
  end

  describe "#summarize_with_truncation" do
    let(:max_tokens) { 9 }

    it "truncates the context to meet the token limit" do
      opts = content.except(:contents)

      stub_request("( 1 asd said : this is", "truncated summary")

      expect(model.summarize_with_truncation(content[:contents], opts)).to eq("truncated summary")
    end
  end
end