mirror of
				https://github.com/discourse/discourse-ai.git
				synced 2025-10-25 03:28:40 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			85 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			Ruby
		
	
	
	
	
	
			
		
		
	
	
			85 lines
		
	
	
		
			2.1 KiB
		
	
	
	
		
			Ruby
		
	
	
	
	
	
| # frozen_string_literal: true
 | |
| 
 | |
| class DiscourseAi::Evals::PromptEvaluator
 | |
|   def initialize(llm)
 | |
|     @llm = llm.llm_model.to_llm
 | |
|   end
 | |
| 
 | |
|   def prompt_call(args)
 | |
|     args = [args] if !args.is_a?(Array)
 | |
|     runner = DiscourseAi::Evals::PromptSingleTestRunner.new(@llm)
 | |
| 
 | |
|     with_tests_progress(total: args.size) do |bump_progress|
 | |
|       args.flat_map do |test|
 | |
|         bump_progress.call
 | |
| 
 | |
|         prompts, messages, followups, output_thinking, stream, temperature, tools =
 | |
|           symbolize_test_args(test)
 | |
| 
 | |
|         prompts.flat_map do |prompt|
 | |
|           messages.map do |message|
 | |
|             runner.run_single_test(
 | |
|               prompt,
 | |
|               message,
 | |
|               followups,
 | |
|               output_thinking,
 | |
|               stream,
 | |
|               temperature,
 | |
|               tools,
 | |
|             )
 | |
|           end
 | |
|         end
 | |
|       end
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   private
 | |
| 
 | |
|   def symbolize_test_args(args)
 | |
|     prompts = args[:prompts] || [args[:prompt]]
 | |
|     messages = args[:messages] || [args[:message]]
 | |
|     followups = symbolize_followups(args)
 | |
|     output_thinking = args[:output_thinking] || false
 | |
|     stream = args[:stream] || false
 | |
|     temperature = args[:temperature]
 | |
|     tools = symbolize_tools(args[:tools])
 | |
|     [prompts, messages, followups, output_thinking, stream, temperature, tools]
 | |
|   end
 | |
| 
 | |
|   def symbolize_followups(args)
 | |
|     return nil if args[:followups].nil? && args[:followup].nil?
 | |
|     followups = args[:followups] || [args[:followup]]
 | |
|     followups.map do |followup|
 | |
|       followup = followup.dup.symbolize_keys!
 | |
|       message = followup[:message].dup.symbolize_keys!
 | |
|       message[:type] = message[:type].to_sym if message[:type]
 | |
|       followup[:message] = message
 | |
|       followup
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   def symbolize_tools(tools)
 | |
|     return nil if tools.nil?
 | |
|     tools.map do |tool|
 | |
|       tool.symbolize_keys!
 | |
|       tool.merge(
 | |
|         parameters: tool[:parameters]&.map { |param| param.transform_keys(&:to_sym) },
 | |
|       ).compact
 | |
|     end
 | |
|   end
 | |
| 
 | |
|   def with_tests_progress(total:)
 | |
|     puts ""
 | |
|     count = 0
 | |
|     result =
 | |
|       yield(
 | |
|         -> do
 | |
|           count += 1
 | |
|           print "\rProcessing test #{count}/#{total}"
 | |
|         end
 | |
|       )
 | |
|     print "\r\033[K"
 | |
|     result
 | |
|   end
 | |
| end
 |