2024-11-04 15:48:11 -05:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
RSpec.describe Jobs::SummariesBackfill do
|
|
|
|
fab!(:topic) { Fabricate(:topic, word_count: 200, highest_post_number: 2) }
|
|
|
|
let(:limit) { 24 } # guarantee two summaries per batch
|
2024-11-07 11:40:18 -05:00
|
|
|
let(:intervals) { 12 } # budget is split into intervals. Job runs every five minutes.
|
2024-11-04 15:48:11 -05:00
|
|
|
|
|
|
|
before do
|
|
|
|
assign_fake_provider_to(:ai_summarization_model)
|
|
|
|
SiteSetting.ai_summarization_enabled = true
|
|
|
|
SiteSetting.ai_summary_backfill_maximum_topics_per_hour = limit
|
2024-11-26 11:44:12 -05:00
|
|
|
SiteSetting.ai_summary_gists_enabled = true
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
describe "#current_budget" do
|
2024-11-07 11:40:18 -05:00
|
|
|
let(:type) { AiSummary.summary_types[:complete] }
|
|
|
|
|
2024-11-04 15:48:11 -05:00
|
|
|
context "when no summary has been backfilled yet" do
|
|
|
|
it "returns the full budget" do
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(subject.current_budget(type)).to eq(limit / intervals)
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
it "ignores summaries generated by users" do
|
|
|
|
Fabricate(:ai_summary, target: topic, origin: AiSummary.origins[:human])
|
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(subject.current_budget(type)).to eq(limit / intervals)
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
it "only accounts for summaries of the given type" do
|
2024-11-04 15:48:11 -05:00
|
|
|
Fabricate(:topic_ai_gist, target: topic, origin: AiSummary.origins[:human])
|
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(subject.current_budget(type)).to eq(limit / intervals)
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
describe "#backfill_candidates" do
|
2024-11-07 11:40:18 -05:00
|
|
|
let(:type) { AiSummary.summary_types[:complete] }
|
|
|
|
|
2024-11-04 15:48:11 -05:00
|
|
|
it "only selects posts with enough words" do
|
|
|
|
topic.update!(word_count: 100)
|
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(subject.backfill_candidates(type)).to be_empty
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
it "ignores up to date summaries" do
|
|
|
|
Fabricate(:ai_summary, target: topic, content_range: (1..2))
|
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(subject.backfill_candidates(type)).to be_empty
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
it "orders candidates by topic#last_posted_at" do
|
|
|
|
topic.update!(last_posted_at: 1.minute.ago)
|
|
|
|
topic_2 = Fabricate(:topic, word_count: 200, last_posted_at: 2.minutes.ago)
|
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(subject.backfill_candidates(type).map(&:id)).to contain_exactly(topic.id, topic_2.id)
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
|
|
|
|
it "prioritizes topics without summaries" do
|
|
|
|
topic_2 =
|
|
|
|
Fabricate(:topic, word_count: 200, last_posted_at: 2.minutes.ago, highest_post_number: 1)
|
|
|
|
topic.update!(last_posted_at: 1.minute.ago)
|
|
|
|
Fabricate(:ai_summary, target: topic, content_range: (1..1))
|
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(subject.backfill_candidates(type).map(&:id)).to contain_exactly(topic_2.id, topic.id)
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
describe "#execute" do
|
|
|
|
it "backfills a batch" do
|
|
|
|
topic_2 =
|
|
|
|
Fabricate(:topic, word_count: 200, last_posted_at: 2.minutes.ago, highest_post_number: 1)
|
|
|
|
topic.update!(last_posted_at: 1.minute.ago)
|
|
|
|
Fabricate(:ai_summary, target: topic, created_at: 3.hours.ago, content_range: (1..1))
|
2024-11-07 11:40:18 -05:00
|
|
|
Fabricate(:topic_ai_gist, target: topic, created_at: 3.hours.ago, content_range: (1..1))
|
2024-11-04 15:48:11 -05:00
|
|
|
|
|
|
|
summary_1 = "Summary of topic_2"
|
2024-11-07 11:40:18 -05:00
|
|
|
gist_1 = "Gist of topic_2"
|
2024-11-04 15:48:11 -05:00
|
|
|
summary_2 = "Summary of topic"
|
2024-11-07 11:40:18 -05:00
|
|
|
gist_2 = "Gist of topic"
|
2024-11-04 15:48:11 -05:00
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
DiscourseAi::Completions::Llm.with_prepared_responses(
|
|
|
|
[summary_1, summary_2, gist_1, gist_2],
|
|
|
|
) { subject.execute({}) }
|
2024-11-04 15:48:11 -05:00
|
|
|
|
2024-11-07 11:40:18 -05:00
|
|
|
expect(AiSummary.complete.find_by(target: topic_2).summarized_text).to eq(summary_1)
|
|
|
|
expect(AiSummary.gist.find_by(target: topic_2).summarized_text).to eq(gist_1)
|
|
|
|
expect(AiSummary.complete.find_by(target: topic).summarized_text).to eq(summary_2)
|
|
|
|
expect(AiSummary.gist.find_by(target: topic).summarized_text).to eq(gist_2)
|
2024-11-04 15:48:11 -05:00
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|