mirror of
https://github.com/discourse/discourse-ai.git
synced 2025-10-26 12:08:39 +00:00
This PR lets you associate uploads to an AI persona, which we'll split and generate embeddings from. When building the system prompt to get a bot reply, we'll do a similarity search followed by a re-ranking (if available). This will let us find the most relevant fragments from the body of knowledge you associated with the persona, resulting in better, more informed responses. For now, we'll only allow plain-text files, but this will change in the future. Commits: * FEATURE: RAG embeddings for the AI Bot This first commit introduces a UI where admins can upload text files, which we'll store, split into fragments, and generate embeddings of. In a next commit, we'll use those to give the bot additional information during conversations. * Basic asymmetric similarity search to provide guidance in system prompt * Fix tests and lint * Apply reranker to fragments * Uploads filter, css adjustments and file validations * Add placeholder for rag fragments * Update annotations
169 lines
4.7 KiB
Ruby
169 lines
4.7 KiB
Ruby
# frozen_string_literal: true
|
|
|
|
module DiscourseAi
|
|
module Admin
|
|
class AiPersonasController < ::Admin::AdminController
|
|
requires_plugin ::DiscourseAi::PLUGIN_NAME
|
|
|
|
before_action :find_ai_persona, only: %i[show update destroy create_user]
|
|
|
|
def index
|
|
ai_personas =
|
|
AiPersona.ordered.map do |persona|
|
|
# we use a special serializer here cause names and descriptions are
|
|
# localized for system personas
|
|
LocalizedAiPersonaSerializer.new(persona, root: false)
|
|
end
|
|
tools =
|
|
DiscourseAi::AiBot::Personas::Persona.all_available_tools.map do |tool|
|
|
AiToolSerializer.new(tool, root: false)
|
|
end
|
|
llms =
|
|
DiscourseAi::Configuration::LlmEnumerator.values.map do |hash|
|
|
{ id: hash[:value], name: hash[:name] }
|
|
end
|
|
render json: { ai_personas: ai_personas, meta: { commands: tools, llms: llms } }
|
|
end
|
|
|
|
def show
|
|
render json: LocalizedAiPersonaSerializer.new(@ai_persona)
|
|
end
|
|
|
|
def create
|
|
ai_persona = AiPersona.new(ai_persona_params.except(:rag_uploads))
|
|
if ai_persona.save
|
|
RagDocumentFragment.link_persona_and_uploads(ai_persona, attached_upload_ids)
|
|
|
|
render json: { ai_persona: ai_persona }, status: :created
|
|
else
|
|
render_json_error ai_persona
|
|
end
|
|
end
|
|
|
|
def create_user
|
|
user = @ai_persona.create_user!
|
|
render json: BasicUserSerializer.new(user, root: "user")
|
|
end
|
|
|
|
def update
|
|
if @ai_persona.update(ai_persona_params.except(:rag_uploads))
|
|
RagDocumentFragment.update_persona_uploads(@ai_persona, attached_upload_ids)
|
|
|
|
render json: @ai_persona
|
|
else
|
|
render_json_error @ai_persona
|
|
end
|
|
end
|
|
|
|
def destroy
|
|
if @ai_persona.destroy
|
|
head :no_content
|
|
else
|
|
render_json_error @ai_persona
|
|
end
|
|
end
|
|
|
|
def upload_file
|
|
file = params[:file] || params[:files].first
|
|
|
|
if !SiteSetting.ai_embeddings_enabled?
|
|
raise Discourse::InvalidAccess.new("Embeddings not enabled")
|
|
end
|
|
|
|
validate_extension!(file.original_filename)
|
|
validate_file_size!(file.tempfile.size)
|
|
|
|
hijack do
|
|
upload =
|
|
UploadCreator.new(
|
|
file.tempfile,
|
|
file.original_filename,
|
|
type: "discourse_ai_rag_upload",
|
|
skip_validations: true,
|
|
).create_for(current_user.id)
|
|
|
|
if upload.persisted?
|
|
render json: UploadSerializer.new(upload)
|
|
else
|
|
render json: failed_json.merge(errors: upload.errors.full_messages), status: 422
|
|
end
|
|
end
|
|
end
|
|
|
|
private
|
|
|
|
def find_ai_persona
|
|
@ai_persona = AiPersona.find(params[:id])
|
|
end
|
|
|
|
def attached_upload_ids
|
|
ai_persona_params[:rag_uploads].to_a.map { |h| h[:id] }
|
|
end
|
|
|
|
def ai_persona_params
|
|
permitted =
|
|
params.require(:ai_persona).permit(
|
|
:name,
|
|
:description,
|
|
:enabled,
|
|
:system_prompt,
|
|
:priority,
|
|
:top_p,
|
|
:temperature,
|
|
:default_llm,
|
|
:user_id,
|
|
:mentionable,
|
|
:max_context_posts,
|
|
:vision_enabled,
|
|
:vision_max_pixels,
|
|
allowed_group_ids: [],
|
|
rag_uploads: [:id],
|
|
)
|
|
|
|
if commands = params.dig(:ai_persona, :commands)
|
|
permitted[:commands] = permit_commands(commands)
|
|
end
|
|
|
|
permitted
|
|
end
|
|
|
|
def permit_commands(commands)
|
|
return [] if !commands.is_a?(Array)
|
|
|
|
commands.filter_map do |command, options|
|
|
break nil if !command.is_a?(String)
|
|
options&.permit! if options && options.is_a?(ActionController::Parameters)
|
|
|
|
if options
|
|
[command, options]
|
|
else
|
|
command
|
|
end
|
|
end
|
|
end
|
|
|
|
def validate_extension!(filename)
|
|
extension = File.extname(filename)[1..-1] || ""
|
|
authorized_extension = "txt"
|
|
if extension != authorized_extension
|
|
raise Discourse::InvalidParameters.new(
|
|
I18n.t("upload.unauthorized", authorized_extensions: authorized_extension),
|
|
)
|
|
end
|
|
end
|
|
|
|
def validate_file_size!(filesize)
|
|
max_size_bytes = 20.megabytes
|
|
if filesize > max_size_bytes
|
|
raise Discourse::InvalidParameters.new(
|
|
I18n.t(
|
|
"upload.attachments.too_large_humanized",
|
|
max_size: ActiveSupport::NumberHelper.number_to_human_size(max_size_bytes),
|
|
),
|
|
)
|
|
end
|
|
end
|
|
end
|
|
end
|
|
end
|