2023-06-13 13:21:46 -04:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
# Base class that defines the interface that every summarization
|
|
|
|
# strategy must implement.
|
|
|
|
# Above each method, you'll find an explanation of what
|
|
|
|
# it does and what it should return.
|
|
|
|
|
2023-06-13 13:21:46 -04:00
|
|
|
module Summarization
|
|
|
|
class Base
|
2023-06-27 10:44:34 -04:00
|
|
|
class << self
|
|
|
|
def available_strategies
|
|
|
|
DiscoursePluginRegistry.summarization_strategies
|
|
|
|
end
|
2023-06-13 13:21:46 -04:00
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
def find_strategy(strategy_model)
|
|
|
|
available_strategies.detect { |s| s.model == strategy_model }
|
|
|
|
end
|
2023-06-13 13:21:46 -04:00
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
def selected_strategy
|
|
|
|
return if SiteSetting.summarization_strategy.blank?
|
2023-06-13 13:21:46 -04:00
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
find_strategy(SiteSetting.summarization_strategy)
|
|
|
|
end
|
2023-06-13 13:21:46 -04:00
|
|
|
|
2023-07-12 10:21:51 -04:00
|
|
|
def can_see_summary?(target, user)
|
|
|
|
return false if SiteSetting.summarization_strategy.blank?
|
2024-04-05 11:12:59 -04:00
|
|
|
return false if target.class == Topic && target.private_message?
|
2023-07-12 10:21:51 -04:00
|
|
|
|
|
|
|
has_cached_summary = SummarySection.exists?(target: target, meta_section_id: nil)
|
|
|
|
return has_cached_summary if user.nil?
|
|
|
|
|
|
|
|
has_cached_summary || can_request_summary_for?(user)
|
|
|
|
end
|
|
|
|
|
|
|
|
def can_request_summary_for?(user)
|
|
|
|
return false unless user
|
|
|
|
|
|
|
|
user_group_ids = user.group_ids
|
2023-06-13 13:21:46 -04:00
|
|
|
|
2023-07-12 10:21:51 -04:00
|
|
|
SiteSetting.custom_summarization_allowed_groups_map.any? do |group_id|
|
|
|
|
user_group_ids.include?(group_id)
|
|
|
|
end
|
2023-06-13 13:21:46 -04:00
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
# Some strategies could require other conditions to work correctly,
|
|
|
|
# like site settings.
|
|
|
|
# This method gets called when admins attempt to select it,
|
|
|
|
# checking if we met those conditions.
|
2023-06-13 13:21:46 -04:00
|
|
|
def correctly_configured?
|
|
|
|
raise NotImplemented
|
|
|
|
end
|
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
# Strategy name to display to admins in the available strategies dropdown.
|
2023-06-13 13:21:46 -04:00
|
|
|
def display_name
|
|
|
|
raise NotImplemented
|
|
|
|
end
|
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
# If we don't meet the conditions to enable this strategy,
|
|
|
|
# we'll display this hint as an error to admins.
|
2023-06-13 13:21:46 -04:00
|
|
|
def configuration_hint
|
|
|
|
raise NotImplemented
|
|
|
|
end
|
|
|
|
|
2023-06-27 10:44:34 -04:00
|
|
|
# The idea behind this method is "give me a collection of texts,
|
|
|
|
# and I'll handle the summarization to the best of my capabilities.".
|
|
|
|
# It's important to emphasize the "collection of texts" part, which implies
|
|
|
|
# it's not tied to any model and expects the "content" to be a hash instead.
|
|
|
|
#
|
|
|
|
# @param content { Hash } - Includes the content to summarize, plus additional
|
|
|
|
# context to help the strategy produce a better result. Keys present in the content hash:
|
|
|
|
# - resource_path (optional): Helps the strategy build links to the content in the summary (e.g. "/t/-/:topic_id/POST_NUMBER")
|
|
|
|
# - content_title (optional): Provides guidance about what the content is about.
|
|
|
|
# - contents (required): Array of hashes with content to summarize (e.g. [{ poster: "asd", id: 1, text: "This is a text" }])
|
|
|
|
# All keys are required.
|
2023-08-11 14:08:49 -04:00
|
|
|
# @param &on_partial_blk { Block - Optional } - If the strategy supports it, the passed block
|
|
|
|
# will get called with partial summarized text as its generated.
|
2023-06-27 10:44:34 -04:00
|
|
|
#
|
2023-11-21 11:27:27 -05:00
|
|
|
# @param current_user { User } - User requesting the summary.
|
|
|
|
#
|
2023-06-27 10:44:34 -04:00
|
|
|
# @returns { Hash } - The summarized content, plus chunks if the content couldn't be summarized in one pass. Example:
|
|
|
|
# {
|
|
|
|
# summary: "This is the final summary",
|
|
|
|
# chunks: [
|
|
|
|
# { ids: [topic.first_post.post_number], summary: "this is the first chunk" },
|
|
|
|
# { ids: [post_1.post_number, post_2.post_number], summary: "this is the second chunk" },
|
|
|
|
# ],
|
|
|
|
# }
|
2023-11-21 11:27:27 -05:00
|
|
|
def summarize(content, current_user)
|
2023-06-13 13:21:46 -04:00
|
|
|
raise NotImplemented
|
|
|
|
end
|
2023-06-27 10:44:34 -04:00
|
|
|
|
|
|
|
# Returns the string we'll store in the selected strategy site setting.
|
|
|
|
def model
|
|
|
|
raise NotImplemented
|
|
|
|
end
|
2023-06-13 13:21:46 -04:00
|
|
|
end
|
|
|
|
end
|