123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259 |
- # frozen_string_literal: true
- class SearchQueryTransformer < Parslet::Transform
- SUPPORTED_PREFIXES = %w(
- has
- is
- language
- from
- before
- after
- during
- in
- ).freeze
- class Query
- def initialize(clauses, options = {})
- raise ArgumentError if options[:current_account].nil?
- @clauses = clauses
- @options = options
- flags_from_clauses!
- end
- def request
- search = Chewy::Search::Request.new(*indexes).filter(default_filter)
- must_clauses.each { |clause| search = search.query.must(clause.to_query) }
- must_not_clauses.each { |clause| search = search.query.must_not(clause.to_query) }
- filter_clauses.each { |clause| search = search.filter(**clause.to_query) }
- search
- end
- private
- def clauses_by_operator
- @clauses_by_operator ||= @clauses.compact.chunk(&:operator).to_h
- end
- def flags_from_clauses!
- @flags = clauses_by_operator.fetch(:flag, []).to_h { |clause| [clause.prefix, clause.term] }
- end
- def must_clauses
- clauses_by_operator.fetch(:must, [])
- end
- def must_not_clauses
- clauses_by_operator.fetch(:must_not, [])
- end
- def filter_clauses
- clauses_by_operator.fetch(:filter, [])
- end
- def indexes
- case @flags['in']
- when 'library'
- [StatusesIndex]
- when 'public'
- [PublicStatusesIndex]
- else
- [PublicStatusesIndex, StatusesIndex]
- end
- end
- def default_filter
- {
- bool: {
- should: [
- {
- term: {
- _index: PublicStatusesIndex.index_name,
- },
- },
- {
- bool: {
- must: [
- {
- term: {
- _index: StatusesIndex.index_name,
- },
- },
- {
- term: {
- searchable_by: @options[:current_account].id,
- },
- },
- ],
- },
- },
- ],
- minimum_should_match: 1,
- },
- }
- end
- end
- class Operator
- class << self
- def symbol(str)
- case str
- when '+', nil
- :must
- when '-'
- :must_not
- else
- raise "Unknown operator: #{str}"
- end
- end
- end
- end
- class TermClause
- attr_reader :operator, :term
- def initialize(operator, term)
- @operator = Operator.symbol(operator)
- @term = term
- end
- def to_query
- if @term.start_with?('#')
- { match: { tags: { query: @term, operator: 'and' } } }
- else
- { multi_match: { type: 'most_fields', query: @term, fields: ['text', 'text.stemmed'], operator: 'and' } }
- end
- end
- end
- class PhraseClause
- attr_reader :operator, :phrase
- def initialize(operator, phrase)
- @operator = Operator.symbol(operator)
- @phrase = phrase
- end
- def to_query
- { match_phrase: { text: { query: @phrase } } }
- end
- end
- class PrefixClause
- EPOCH_RE = /\A\d+\z/
- attr_reader :operator, :prefix, :term
- def initialize(prefix, operator, term, options = {})
- @prefix = prefix
- @negated = operator == '-'
- @options = options
- @operator = :filter
- case prefix
- when 'has', 'is'
- @filter = :properties
- @type = :term
- @term = term
- when 'language'
- @filter = :language
- @type = :term
- @term = language_code_from_term(term)
- when 'from'
- @filter = :account_id
- @type = :term
- @term = account_id_from_term(term)
- when 'before'
- @filter = :created_at
- @type = :range
- @term = { lt: date_from_term(term), time_zone: @options[:current_account]&.user_time_zone.presence || 'UTC' }
- when 'after'
- @filter = :created_at
- @type = :range
- @term = { gt: date_from_term(term), time_zone: @options[:current_account]&.user_time_zone.presence || 'UTC' }
- when 'during'
- @filter = :created_at
- @type = :range
- @term = { gte: date_from_term(term), lte: date_from_term(term), time_zone: @options[:current_account]&.user_time_zone.presence || 'UTC' }
- when 'in'
- @operator = :flag
- @term = term
- else
- raise "Unknown prefix: #{prefix}"
- end
- end
- def to_query
- if @negated
- { bool: { must_not: { @type => { @filter => @term } } } }
- else
- { @type => { @filter => @term } }
- end
- end
- private
- def account_id_from_term(term)
- return @options[:current_account]&.id || -1 if term == 'me'
- username, domain = term.gsub(/\A@/, '').split('@')
- domain = nil if TagManager.instance.local_domain?(domain)
- account = Account.find_remote(username, domain)
- # If the account is not found, we want to return empty results, so return
- # an ID that does not exist
- account&.id || -1
- end
- def language_code_from_term(term)
- language_code = term
- return language_code if LanguagesHelper::SUPPORTED_LOCALES.key?(language_code.to_sym)
- language_code = term.downcase
- return language_code if LanguagesHelper::SUPPORTED_LOCALES.key?(language_code.to_sym)
- language_code = term.split(/[_-]/).first.downcase
- return language_code if LanguagesHelper::SUPPORTED_LOCALES.key?(language_code.to_sym)
- term
- end
- def date_from_term(term)
- DateTime.iso8601(term) unless term.match?(EPOCH_RE) # This will raise Date::Error if the date is invalid
- term
- end
- end
- rule(clause: subtree(:clause)) do
- prefix = clause[:prefix][:term].to_s.downcase if clause[:prefix]
- operator = clause[:operator]&.to_s
- term = clause[:phrase] ? clause[:phrase].map { |term| term[:term].to_s }.join(' ') : clause[:term].to_s
- if clause[:prefix] && SUPPORTED_PREFIXES.include?(prefix)
- PrefixClause.new(prefix, operator, term, current_account: current_account)
- elsif clause[:prefix]
- TermClause.new(operator, "#{prefix} #{term}")
- elsif clause[:term]
- TermClause.new(operator, term)
- elsif clause[:phrase]
- PhraseClause.new(operator, term)
- else
- raise "Unexpected clause type: #{clause}"
- end
- end
- rule(junk: subtree(:junk)) do
- nil
- end
- rule(query: sequence(:clauses)) do
- Query.new(clauses, current_account: current_account)
- end
- end
|