discourse-ai/app/controllers/discourse_ai/admin/rag_document_fragments_controller.rb

# frozen_string_literal: true

module DiscourseAi
  module Admin
    class RagDocumentFragmentsController < ::Admin::AdminController
      requires_plugin ::DiscourseAi::PLUGIN_NAME

      # Renders, as JSON, the RAG indexing status for the uploads attached to
      # the record named by params[:target_type] / params[:target_id].
      #
      # Only "AiPersona" and "AiTool" are accepted as target types; any other
      # value raises Discourse::InvalidParameters. The record is looked up
      # with the model's `find` and stored in @target.
      def indexing_status_check
        @target =
          case params[:target_type]
          when "AiPersona"
            AiPersona.find(params[:target_id])
          when "AiTool"
            AiTool.find(params[:target_id])
          else
            raise Discourse::InvalidParameters.new("Invalid target type")
          end

        status = RagDocumentFragment.indexing_status(@target, @target.uploads)
        render json: status
      end

      # Stores a single uploaded document so it can be used for RAG.
      #
      # The file is taken from params[:file], falling back to the first entry
      # of params[:files]. Its extension and size are checked with
      # validate_extension! / validate_file_size! before the upload is created
      # inside a hijack block on behalf of current_user.
      #
      # Renders the serialized upload on success, or failed_json merged with
      # the upload's error messages and status 422 when it was not persisted.
      #
      # Raises Discourse::InvalidAccess when embeddings are disabled, and
      # Discourse::InvalidParameters when no usable file was supplied or one
      # of the validations rejects it.
      def upload_file
        # Cheapest guard first: nothing else matters when the feature is off.
        if !DiscourseAi::Embeddings.enabled?
          raise Discourse::InvalidAccess.new("Embeddings not enabled")
        end

        file = params[:file]
        file ||= params[:files].first if params[:files].respond_to?(:first)

        # A missing or plain-string parameter would otherwise fail further down
        # with NoMethodError instead of being reported as bad input.
        if !file.respond_to?(:original_filename) || !file.respond_to?(:tempfile)
          raise Discourse::InvalidParameters.new("Missing file upload")
        end

        validate_extension!(file.original_filename)
        validate_file_size!(file.tempfile.size)

        hijack do
          upload =
            UploadCreator.new(
              file.tempfile,
              file.original_filename,
              type: "discourse_ai_rag_upload",
              skip_validations: true,
            ).create_for(current_user.id)

          if upload.persisted?
            render json: UploadSerializer.new(upload)
          else
            render json: failed_json.merge(errors: upload.errors.full_messages), status: 422
          end
        end
      end

      private

      # Checks that +filename+ ends in an extension accepted for RAG uploads.
      #
      # "txt" and "md" are always accepted; "pdf", "png", "jpg" and "jpeg" are
      # accepted only when SiteSetting.ai_rag_pdf_images_enabled is truthy.
      # Returns nil when the extension is accepted, otherwise raises
      # Discourse::InvalidParameters with the translated "upload.unauthorized"
      # message listing the accepted extensions.
      #
      # NOTE(review): the comparison is case-sensitive, so "notes.TXT" is
      # rejected — confirm this is intended.
      def validate_extension!(filename)
        # extname yields "" or ".ext"; drop the leading dot when present.
        ext = File.extname(filename).delete_prefix(".")

        allowed = %w[txt md]
        allowed += %w[pdf png jpg jpeg] if SiteSetting.ai_rag_pdf_images_enabled
        return if allowed.include?(ext)

        message = I18n.t("upload.unauthorized", authorized_extensions: allowed.join(" "))
        raise Discourse::InvalidParameters.new(message)
      end

      # Rejects uploads larger than 20 megabytes.
      #
      # Returns nil when +filesize+ (in bytes) does not exceed the limit,
      # otherwise raises Discourse::InvalidParameters with the translated
      # "upload.attachments.too_large_humanized" message, which receives the
      # limit formatted as a human-readable size.
      def validate_file_size!(filesize)
        limit = 20.megabytes
        return unless filesize > limit

        readable_limit = ActiveSupport::NumberHelper.number_to_human_size(limit)
        message = I18n.t("upload.attachments.too_large_humanized", max_size: readable_limit)
        raise Discourse::InvalidParameters.new(message)
      end
    end
  end
end
FEATURE: RAG search within tools (#802) This allows custom tools access to uploads and sophisticated searches using embedding. It introduces: - A shared front end for listing and uploading files (shared with personas) - Backend implementation of index.search function within a custom tool. Custom tools now may search through uploaded files function invoke(params) { return index.search(params.query) } This means that RAG implementers now may preload tools with knowledge and have high fidelity over the search. The search function support specifying max results specifying a subset of files to search (from uploads) Also - Improved documentation for tools (when creating a tool a preamble explains all the functionality) - uploads were a bit finicky, fixed an edge case where the UI would not show them as updated 2024-09-30 16:27:50 +09:00			`# frozen_string_literal: true`

			`module DiscourseAi`
			`module Admin`
			`class RagDocumentFragmentsController < ::Admin::AdminController`
			`requires_plugin ::DiscourseAi::PLUGIN_NAME`

			`def indexing_status_check`
			`if params[:target_type] == "AiPersona"`
			`@target = AiPersona.find(params[:target_id])`
			`elsif params[:target_type] == "AiTool"`
			`@target = AiTool.find(params[:target_id])`
			`else`
			`raise Discourse::InvalidParameters.new("Invalid target type")`
			`end`

			`render json: RagDocumentFragment.indexing_status(@target, @target.uploads)`
			`end`

			`def upload_file`
			`file = params[:file] \|\| params[:files].first`

DEV: Robust check for embeddings enabled (#1116) 2025-02-06 12:18:55 -03:00			`if !DiscourseAi::Embeddings.enabled?`
FEATURE: RAG search within tools (#802) This allows custom tools access to uploads and sophisticated searches using embedding. It introduces: - A shared front end for listing and uploading files (shared with personas) - Backend implementation of index.search function within a custom tool. Custom tools now may search through uploaded files function invoke(params) { return index.search(params.query) } This means that RAG implementers now may preload tools with knowledge and have high fidelity over the search. The search function support specifying max results specifying a subset of files to search (from uploads) Also - Improved documentation for tools (when creating a tool a preamble explains all the functionality) - uploads were a bit finicky, fixed an edge case where the UI would not show them as updated 2024-09-30 16:27:50 +09:00			`raise Discourse::InvalidAccess.new("Embeddings not enabled")`
			`end`

			`validate_extension!(file.original_filename)`
			`validate_file_size!(file.tempfile.size)`

			`hijack do`
			`upload =`
			`UploadCreator.new(`
			`file.tempfile,`
			`file.original_filename,`
			`type: "discourse_ai_rag_upload",`
			`skip_validations: true,`
			`).create_for(current_user.id)`

			`if upload.persisted?`
			`render json: UploadSerializer.new(upload)`
			`else`
			`render json: failed_json.merge(errors: upload.errors.full_messages), status: 422`
			`end`
			`end`
			`end`

			`private`

			`def validate_extension!(filename)`
			`extension = File.extname(filename)[1..-1] \|\| ""`
			`authorized_extensions = %w[txt md]`
FEATURE: PDF support for rag pipeline (#1118) This PR introduces several enhancements and refactorings to the AI Persona and RAG (Retrieval-Augmented Generation) functionalities within the discourse-ai plugin. Here's a breakdown of the changes: 1. LLM Model Association for RAG and Personas: - New Database Columns: Adds `rag_llm_model_id` to both `ai_personas` and `ai_tools` tables. This allows specifying a dedicated LLM for RAG indexing, separate from the persona's primary LLM. Adds `default_llm_id` and `question_consolidator_llm_id` to `ai_personas`. - Migration: Includes a migration (`20250210032345_migrate_persona_to_llm_model_id.rb`) to populate the new `default_llm_id` and `question_consolidator_llm_id` columns in `ai_personas` based on the existing `default_llm` and `question_consolidator_llm` string columns, and a post migration to remove the latter. - Model Changes: The `AiPersona` and `AiTool` models now `belong_to` an `LlmModel` via `rag_llm_model_id`. The `LlmModel.proxy` method now accepts an `LlmModel` instance instead of just an identifier. `AiPersona` now has `default_llm_id` and `question_consolidator_llm_id` attributes. - UI Updates: The AI Persona and AI Tool editors in the admin panel now allow selecting an LLM for RAG indexing (if PDF/image support is enabled). The RAG options component displays an LLM selector. - Serialization: The serializers (`AiCustomToolSerializer`, `AiCustomToolListSerializer`, `LocalizedAiPersonaSerializer`) have been updated to include the new `rag_llm_model_id`, `default_llm_id` and `question_consolidator_llm_id` attributes. 2. PDF and Image Support for RAG: - Site Setting: Introduces a new hidden site setting, `ai_rag_pdf_images_enabled`, to control whether PDF and image files can be indexed for RAG. This defaults to `false`. - File Upload Validation: The `RagDocumentFragmentsController` now checks the `ai_rag_pdf_images_enabled` setting and allows PDF, PNG, JPG, and JPEG files if enabled. 
Error handling is included for cases where PDF/image indexing is attempted with the setting disabled. - PDF Processing: Adds a new utility class, `DiscourseAi::Utils::PdfToImages`, which uses ImageMagick (`magick`) to convert PDF pages into individual PNG images. A maximum PDF size and conversion timeout are enforced. - Image Processing: A new utility class, `DiscourseAi::Utils::ImageToText`, is included to handle OCR for the images and PDFs. - RAG Digestion Job: The `DigestRagUpload` job now handles PDF and image uploads. It uses `PdfToImages` and `ImageToText` to extract text and create document fragments. - UI Updates: The RAG uploader component now accepts PDF and image file types if `ai_rag_pdf_images_enabled` is true. The UI text is adjusted to indicate supported file types. 3. Refactoring and Improvements: - LLM Enumeration: The `DiscourseAi::Configuration::LlmEnumerator` now provides a `values_for_serialization` method, which returns a simplified array of LLM data (id, name, vision_enabled) suitable for use in serializers. This avoids exposing unnecessary details to the frontend. - AI Helper: The `AiHelper::Assistant` now takes optional `helper_llm` and `image_caption_llm` parameters in its constructor, allowing for greater flexibility. - Bot and Persona Updates: Several updates were made across the codebase, changing the string based association to a LLM to the new model based. - Audit Logs: The `DiscourseAi::Completions::Endpoints::Base` now formats raw request payloads as pretty JSON for easier auditing. - Eval Script: An evaluation script is included. 4. Testing: - The PR introduces a new eval system for LLMs, this allows us to test how functionality works across various LLM providers. This lives in `/evals` 2025-02-14 12:15:07 +11:00			`authorized_extensions.concat(%w[pdf png jpg jpeg]) if SiteSetting.ai_rag_pdf_images_enabled`
FEATURE: RAG search within tools (#802) This allows custom tools access to uploads and sophisticated searches using embedding. It introduces: - A shared front end for listing and uploading files (shared with personas) - Backend implementation of index.search function within a custom tool. Custom tools now may search through uploaded files function invoke(params) { return index.search(params.query) } This means that RAG implementers now may preload tools with knowledge and have high fidelity over the search. The search function support specifying max results specifying a subset of files to search (from uploads) Also - Improved documentation for tools (when creating a tool a preamble explains all the functionality) - uploads were a bit finicky, fixed an edge case where the UI would not show them as updated 2024-09-30 16:27:50 +09:00			`if !authorized_extensions.include?(extension)`
			`raise Discourse::InvalidParameters.new(`
			`I18n.t(`
			`"upload.unauthorized",`
			`authorized_extensions: authorized_extensions.join(" "),`
			`),`
			`)`
			`end`
			`end`

			`def validate_file_size!(filesize)`
			`max_size_bytes = 20.megabytes`
			`if filesize > max_size_bytes`
			`raise Discourse::InvalidParameters.new(`
			`I18n.t(`
			`"upload.attachments.too_large_humanized",`
			`max_size: ActiveSupport::NumberHelper.number_to_human_size(max_size_bytes),`
			`),`
			`)`
			`end`
			`end`
			`end`
			`end`
			`end`