discourse-ai/lib/sentiment/sentiment_classification.rb

# frozen_string_literal: true

module DiscourseAi
  module Sentiment
    # Runs a target's text through every configured sentiment classifier and
    # collects the label/score pairs each one returns.
    #
    # NOTE(review): targets are presumably posts. The code only relies on them
    # responding to `post_number`, `raw` and `topic` - confirm against callers.
    class SentimentClassification
      # @return [Symbol] identifier of this classification; always `:sentiment`.
      def type
        :sentiment
      end

      # @return whatever `SentimentSiteSettingJsonSchema.values` yields. Every
      #   entry must respond to `model_name` and is handed as-is to the
      #   inference client.
      def available_classifiers
        DiscourseAi::Sentiment::SentimentSiteSettingJsonSchema.values
      end

      # @param target the object whose text would be classified.
      # @return [Boolean] true when the (truncated) content is not blank.
      def can_classify?(target)
        content_of(target).present?
      end

      # Sentiment never produces a positive verdict, so every classifier maps
      # to `false` regardless of the classification data passed in.
      #
      # @return [Hash] `model_name => false` for each available classifier.
      def get_verdicts(_)
        available_classifiers.to_h { |model| [model.model_name, false] }
      end

      def should_flag_based_on?(_verdicts)
        # We don't flag based on sentiment classification.
        false
      end

      # Classifies the target once per available classifier.
      #
      # @param target_to_classify the object to classify.
      # @return [Hash] `model_name => { label => score }`.
      def request(target_to_classify)
        # Extract (and truncate) the content once; it is shared by all models.
        target_content = content_of(target_to_classify)

        available_classifiers.to_h do |model|
          [model.model_name, request_with(target_content, model)]
        end
      end

      # Flattens a list of classifier results into a single lookup hash.
      #
      # @param result an enumerable whose entries are indexable by `:label`
      #   and `:score`.
      # @return [Hash] `label => score`; a repeated label keeps its last score.
      def transform_result(result)
        result.to_h { |entry| [entry[:label], entry[:score]] }
      end

      private

      # Sends the content to the inference backend for a single classifier and
      # normalizes the response with #transform_result.
      def request_with(content, model_config)
        result = ::DiscourseAi::Inference::HuggingFaceTextEmbeddings.classify(content, model_config)
        transform_result(result)
      end

      # Builds the text to classify: the raw body, prefixed with the topic
      # title when the target is the first post of its topic.
      #
      # A first post whose `topic` is nil is classified by its raw body alone
      # instead of raising NoMethodError on `nil.title`.
      # NOTE(review): presumably this happens when the topic is no longer
      # loadable (e.g. it was deleted) - confirm.
      def content_of(target_to_classify)
        raw = target_to_classify.raw
        # Only first posts need the topic, so it is not loaded for replies.
        topic = target_to_classify.topic if target_to_classify.post_number == 1
        content = topic ? "#{topic.title}\n#{raw}" : raw

        # NOTE(review): 512 is presumably the model's token limit - confirm.
        Tokenizer::BertTokenizer.truncate(content, 512)
      end
    end
  end
end
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`# frozen_string_literal: true`

DEV: DiscourseAI -> DiscourseAi rename to have consistent folders and files (#9) 2023-03-14 15:03:50 -04:00			`module DiscourseAi`
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`module Sentiment`
			`class SentimentClassification`
			`def type`
			`:sentiment`
			`end`

Migrate sentiment to a TEI backend (#886) 2024-11-04 07:14:34 -05:00			`def available_classifiers`
			`DiscourseAi::Sentiment::SentimentSiteSettingJsonSchema.values`
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`end`

			`def can_classify?(target)`
			`content_of(target).present?`
			`end`

FEATURE: Use dedicated reviewables for AI flags. (#4) This change adds two new reviewable types: ReviewableAIPost and ReviewableAIChatMessage. They have the same actions as their existing counterparts: ReviewableFlaggedPost and ReviewableChatMessage. We'll display the model used and their accuracy when showing these flags in the review queue and adjust the latter after staff performs an action, tracking a global accuracy per existing model in a separate table. * FEATURE: Dedicated reviewables for AI flags * Store and adjust model accuracy * Display accuracy in reviewable templates 2023-03-07 13:39:28 -05:00			`def get_verdicts(_)`
Migrate sentiment to a TEI backend (#886) 2024-11-04 07:14:34 -05:00			`available_classifiers.reduce({}) do \|memo, model\|`
			`memo[model.model_name] = false`
FEATURE: Use dedicated reviewables for AI flags. (#4) This change adds two new reviewable types: ReviewableAIPost and ReviewableAIChatMessage. They have the same actions as their existing counterparts: ReviewableFlaggedPost and ReviewableChatMessage. We'll display the model used and their accuracy when showing these flags in the review queue and adjust the latter after staff performs an action, tracking a global accuracy per existing model in a separate table. * FEATURE: Dedicated reviewables for AI flags * Store and adjust model accuracy * Display accuracy in reviewable templates 2023-03-07 13:39:28 -05:00			`memo`
			`end`
			`end`

			`def should_flag_based_on?(_verdicts)`
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`# We don't flag based on sentiment classification.`
			`false`
			`end`

			`def request(target_to_classify)`
Revert "FEATURE: User sentiment on profile summary page (#329)" (#383) This reverts commit 71c5077228c8caa98191ee590ec7a59f54ade893. 2023-12-27 19:01:57 -05:00			`target_content = content_of(target_to_classify)`
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00
Migrate sentiment to a TEI backend (#886) 2024-11-04 07:14:34 -05:00			`available_classifiers.reduce({}) do \|memo, model\|`
			`memo[model.model_name] = request_with(target_content, model)`
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`memo`
			`end`
			`end`

Migrate sentiment to a TEI backend (#886) 2024-11-04 07:14:34 -05:00			`def transform_result(result)`
			`hash_result = {}`
			`result.each { \|r\| hash_result[r[:label]] = r[:score] }`
			`hash_result`
			`end`

REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`private`

Migrate sentiment to a TEI backend (#886) 2024-11-04 07:14:34 -05:00			`def request_with(content, model_config)`
			`result = ::DiscourseAi::Inference::HuggingFaceTextEmbeddings.classify(content, model_config)`
			`transform_result(result)`
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`end`

			`def content_of(target_to_classify)`
FIX: Truncate content for sentiment/toxicity classification (#431) 2024-01-17 13:17:58 -05:00			`content =`
			`if target_to_classify.post_number == 1`
			`"#{target_to_classify.topic.title}\n#{target_to_classify.raw}"`
			`else`
			`target_to_classify.raw`
			`end`

			`Tokenizer::BertTokenizer.truncate(content, 512)`
REFACTOR: Streamline flag and classification process 2023-02-24 11:25:02 -05:00			`end`
			`end`
			`end`
			`end`