| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  | # frozen_string_literal: true | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | require_relative "../../../../support/anthropic_completion_stubs" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | RSpec.describe DiscourseAi::Summarization::Models::Anthropic do | 
					
						
							| 
									
										
										
										
											2023-06-27 14:42:33 -03:00
										 |  |  |   subject(:model) { described_class.new(model_name, max_tokens: max_tokens) } | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-07-27 11:24:44 +10:00
										 |  |  |   let(:model_name) { "claude-2" } | 
					
						
							| 
									
										
										
										
											2023-06-27 14:42:33 -03:00
										 |  |  |   let(:max_tokens) { 720 } | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  | 
 | 
					
						
							|  |  |  |   let(:content) do | 
					
						
							|  |  |  |     { | 
					
						
							| 
									
										
										
										
											2023-09-04 12:04:47 -03:00
										 |  |  |       resource_path: "/t/-/1", | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  |       content_title: "This is a title", | 
					
						
							|  |  |  |       contents: [{ poster: "asd", id: 1, text: "This is a text" }], | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  |   end | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-07-13 17:05:41 -03:00
										 |  |  |   def as_chunk(item) | 
					
						
							|  |  |  |     { ids: [item[:id]], summary: "(#{item[:id]} #{item[:poster]} said: #{item[:text]} " } | 
					
						
							|  |  |  |   end | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  |   def expected_messages(contents, opts) | 
					
						
							|  |  |  |     base_prompt = <<~TEXT | 
					
						
							|  |  |  |       Human: Summarize the following forum discussion inside the given <input> tag. | 
					
						
							| 
									
										
										
										
											2023-09-04 12:04:47 -03:00
										 |  |  |       Try to keep the summary in the same language as the forum discussion. | 
					
						
							| 
									
										
										
										
											2023-08-16 15:09:52 -03:00
										 |  |  |       Format the response, including links, using markdown. | 
					
						
							| 
									
										
										
										
											2023-09-04 12:04:47 -03:00
										 |  |  |       Try generating links as well the format is #{opts[:resource_path]}/POST_ID | 
					
						
							|  |  |  |       For example, a link to the 3rd post in the topic would be [post 3](#{opts[:resource_path]}/3) | 
					
						
							|  |  |  |       Wrap the whole the summary inside <ai> tags. | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  |       The discussion title is: #{opts[:content_title]}. | 
					
						
							|  |  |  |       Don't use more than 400 words. | 
					
						
							|  |  |  |     TEXT | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     text = | 
					
						
							|  |  |  |       contents.reduce("") do |memo, item| | 
					
						
							|  |  |  |         memo += "(#{item[:id]} #{item[:poster]} said: #{item[:text]} " | 
					
						
							|  |  |  |       end | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     base_prompt += "<input>#{text}</input>\nAssistant:\n" | 
					
						
							|  |  |  |   end | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   describe "#summarize_in_chunks" do | 
					
						
							|  |  |  |     context "when the content fits in a single chunk" do | 
					
						
							|  |  |  |       it "performs a request to summarize" do | 
					
						
							|  |  |  |         opts = content.except(:contents) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         AnthropicCompletionStubs.stub_response( | 
					
						
							|  |  |  |           expected_messages(content[:contents], opts), | 
					
						
							|  |  |  |           "<ai>This is summary 1</ai>", | 
					
						
							|  |  |  |         ) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-07-13 17:05:41 -03:00
										 |  |  |         chunks = content[:contents].map { |c| as_chunk(c) } | 
					
						
							|  |  |  |         summarized_chunks = model.summarize_in_chunks(chunks, opts).map { |c| c[:summary] } | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  | 
 | 
					
						
							|  |  |  |         expect(summarized_chunks).to contain_exactly("This is summary 1") | 
					
						
							|  |  |  |       end | 
					
						
							|  |  |  |     end | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     context "when the content fits in multiple chunks" do | 
					
						
							|  |  |  |       it "performs a request for each one to summarize" do | 
					
						
							|  |  |  |         content[:contents] << { | 
					
						
							|  |  |  |           poster: "asd2", | 
					
						
							|  |  |  |           id: 2, | 
					
						
							|  |  |  |           text: "This is a different text to summarize", | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  |         opts = content.except(:contents) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         content[:contents].each_with_index do |item, idx| | 
					
						
							|  |  |  |           AnthropicCompletionStubs.stub_response( | 
					
						
							|  |  |  |             expected_messages([item], opts), | 
					
						
							|  |  |  |             "<ai>This is summary #{idx + 1}</ai>", | 
					
						
							|  |  |  |           ) | 
					
						
							|  |  |  |         end | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-07-13 17:05:41 -03:00
										 |  |  |         chunks = content[:contents].map { |c| as_chunk(c) } | 
					
						
							|  |  |  |         summarized_chunks = model.summarize_in_chunks(chunks, opts).map { |c| c[:summary] } | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  | 
 | 
					
						
							|  |  |  |         expect(summarized_chunks).to contain_exactly("This is summary 1", "This is summary 2") | 
					
						
							|  |  |  |       end | 
					
						
							|  |  |  |     end | 
					
						
							|  |  |  |   end | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   describe "#concatenate_summaries" do | 
					
						
							|  |  |  |     it "combines all the different summaries into a single one" do | 
					
						
							|  |  |  |       messages = <<~TEXT | 
					
						
							|  |  |  |         Human: Concatenate the following disjoint summaries inside the given input tags, creating a cohesive narrative. | 
					
						
							|  |  |  |         Include only the summary inside <ai> tags. | 
					
						
							|  |  |  |         <input>summary 1</input>
 | 
					
						
							|  |  |  |         <input>summary 2</input>
 | 
					
						
							|  |  |  |         Assistant: | 
					
						
							|  |  |  |       TEXT | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |       AnthropicCompletionStubs.stub_response(messages, "<ai>concatenated summary</ai>") | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-27 14:42:33 -03:00
										 |  |  |       expect(model.concatenate_summaries(["summary 1", "summary 2"])).to eq("concatenated summary") | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  |     end | 
					
						
							|  |  |  |   end | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   describe "#summarize_with_truncation" do | 
					
						
							|  |  |  |     let(:max_tokens) { 709 } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     it "truncates the context to meet the token limit" do | 
					
						
							|  |  |  |       opts = content.except(:contents) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |       instructions = <<~TEXT | 
					
						
							|  |  |  |         Human: Summarize the following forum discussion inside the given <input> tag. | 
					
						
							| 
									
										
										
										
											2023-09-04 12:04:47 -03:00
										 |  |  |         Try to keep the summary in the same language as the forum discussion. | 
					
						
							| 
									
										
										
										
											2023-08-16 15:09:52 -03:00
										 |  |  |         Format the response, including links, using markdown. | 
					
						
							| 
									
										
										
										
											2023-09-04 12:04:47 -03:00
										 |  |  |         Try generating links as well the format is #{opts[:resource_path]}/POST_ID | 
					
						
							|  |  |  |         For example, a link to the 3rd post in the topic would be [post 3](#{opts[:resource_path]}/3) | 
					
						
							|  |  |  |         Wrap the whole the summary inside <ai> tags. | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  |         The discussion title is: #{opts[:content_title]}. | 
					
						
							|  |  |  |         Don't use more than 400 words. | 
					
						
							|  |  |  |         <input>(1 asd said: This is a</input>
 | 
					
						
							|  |  |  |         Assistant: | 
					
						
							|  |  |  |       TEXT | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |       AnthropicCompletionStubs.stub_response(instructions, "<ai>truncated summary</ai>") | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-06-27 14:42:33 -03:00
										 |  |  |       expect(model.summarize_with_truncation(content[:contents], opts)).to eq("truncated summary") | 
					
						
							| 
									
										
										
										
											2023-06-27 12:26:33 -03:00
										 |  |  |     end | 
					
						
							|  |  |  |   end | 
					
						
							|  |  |  | end |