# frozen_string_literal: true

# Specs for DiscourseAi::Embeddings::SemanticSearch#search_for_topics.
#
# The examples stub the external completion and embedding calls, force the
# similarity search to return a fixed list of topic ids, and then check which
# posts are returned for the searching user.
RSpec.describe DiscourseAi::Embeddings::SemanticSearch do
  # Declared with `subject` (not `let(:subject)`) so RSpec's own helper is not
  # shadowed; bare `subject` still resolves to the same object.
  subject(:semantic_search) { described_class.new(Guardian.new(user)) }

  fab!(:post) { Fabricate(:post) }
  fab!(:user) { Fabricate(:user) }

  let(:query) { "test_query" }

  describe "#search_for_topics" do
    let(:hypothetical_post) { "This is an hypothetical post generated from the keyword test_query" }

    before do
      SiteSetting.ai_embeddings_discourse_service_api_endpoint = "http://test.com"

      # Canned completion for the HyDE prompt built from `query`.
      # NOTE(review): request-matching rules live in the stub helper, outside this file.
      prompt = DiscourseAi::Embeddings::HydeGenerators::OpenAi.new.prompt(query)
      OpenAiCompletionsInferenceStubs.stub_response(
        prompt,
        hypothetical_post,
        req_opts: {
          max_tokens: 400,
        },
      )

      # Canned embedding registered for the hypothetical post text.
      hyde_embedding = [0.049382, 0.9999]
      EmbeddingsGenerationStubs.discourse_service(
        SiteSetting.ai_embeddings_model,
        hypothetical_post,
        hyde_embedding,
      )
    end

    # Clear whatever was cached for `query` so examples do not see each other's results.
    after { described_class.clear_cache_for(query) }

    # Makes any AllMpnetBaseV2 instance answer the asymmetric similarity
    # search with the given ids.
    #
    # This is a Mocha expectation rather than a plain stub, so an example
    # using it also fails if the search is never invoked.
    #
    # @param candidate_ids [Array] ids the similarity search should return
    #   (the examples pass topic ids).
    def stub_candidate_ids(candidate_ids)
      DiscourseAi::Embeddings::VectorRepresentations::AllMpnetBaseV2
        .any_instance
        .expects(:asymmetric_topics_similarity_search)
        .returns(candidate_ids)
    end

    it "returns the first post of a topic included in the asymmetric search results" do
      stub_candidate_ids([post.topic_id])

      posts = semantic_search.search_for_topics(query)

      expect(posts).to contain_exactly(post)
    end

    describe "applies different scopes to the candidates" do
      context "when the topic is not visible" do
        it "returns an empty list" do
          post.topic.update!(visible: false)
          stub_candidate_ids([post.topic_id])

          posts = semantic_search.search_for_topics(query)

          expect(posts).to be_empty
        end
      end

      context "when the post is not public" do
        it "returns an empty list" do
          pm_post = Fabricate(:private_message_post)
          stub_candidate_ids([pm_post.topic_id])

          posts = semantic_search.search_for_topics(query)

          expect(posts).to be_empty
        end
      end

      context "when the post type is not visible" do
        it "returns an empty list" do
          post.update!(post_type: Post.types[:whisper])
          stub_candidate_ids([post.topic_id])

          posts = semantic_search.search_for_topics(query)

          expect(posts).to be_empty
        end
      end

      context "when the post is not the first post in the topic" do
        it "returns an empty list" do
          reply = Fabricate(:reply)
          # Trash the topic's first post so only the reply is left in the candidate topic.
          reply.topic.first_post.trash!
          stub_candidate_ids([reply.topic_id])

          posts = semantic_search.search_for_topics(query)

          expect(posts).to be_empty
        end
      end

      context "when the post is not a candidate" do
        it "doesn't include it in the results" do
          post_2 = Fabricate(:post)
          stub_candidate_ids([post.topic_id])

          posts = semantic_search.search_for_topics(query)

          expect(posts).not_to include(post_2)
        end
      end

      context "when the post belongs to a secured category" do
        fab!(:group) { Fabricate(:group) }
        fab!(:private_category) { Fabricate(:private_category, group: group) }

        before do
          post.topic.update!(category: private_category)
          stub_candidate_ids([post.topic_id])
        end

        it "returns an empty list" do
          posts = semantic_search.search_for_topics(query)

          expect(posts).to be_empty
        end

        it "returns the results if the user has access to the category" do
          group.add(user)

          posts = semantic_search.search_for_topics(query)

          expect(posts).to contain_exactly(post)
        end

        context "while searching as anon" do
          it "returns an empty list" do
            # Uses its own searcher built with a guardian for no user instead of the shared subject.
            posts = described_class.new(Guardian.new(nil)).search_for_topics(query)

            expect(posts).to be_empty
          end
        end
      end
    end
  end
end