2019-07-27 04:42:08 +02:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
class SearchQueryTransformer < Parslet::Transform
|
|
|
|
# Buckets the parsed clauses of a search query by operator and applies them
# to a search request object.
class Query
  attr_reader :should_clauses, :must_not_clauses, :must_clauses, :filter_clauses

  # @param clauses [Array] clause objects responding to +operator+, which is
  #   expected to be one of :should, :must, :must_not or :filter
  def initialize(clauses)
    # group_by (unlike chunk) collects every clause sharing an operator even
    # when they are not adjacent, e.g. `foo from:bar baz` keeps both terms.
    grouped = clauses.group_by(&:operator)

    @should_clauses = grouped.fetch(:should, [])
    @must_not_clauses = grouped.fetch(:must_not, [])
    @must_clauses = grouped.fetch(:must, [])
    @filter_clauses = grouped.fetch(:filter, [])
  end

  # Chains every clause onto +search+ and finally requires at least one
  # "should" match.
  #
  # @param search [Object] must respond to +query+ and +filter+
  #   (presumably a search index request; confirm against the caller)
  # @return the value of +search.query.minimum_should_match(1)+
  def apply(search)
    should_clauses.each { |clause| search = search.query.should(clause_to_query(clause)) }
    must_clauses.each { |clause| search = search.query.must(clause_to_query(clause)) }
    must_not_clauses.each { |clause| search = search.query.must_not(clause_to_query(clause)) }
    filter_clauses.each { |clause| search = search.filter(**clause_to_filter(clause)) }
    search.query.minimum_should_match(1)
  end

  private

  # Builds the full-text query hash for a term or phrase clause.
  #
  # @raise [RuntimeError] when the clause is neither a TermClause nor a PhraseClause
  def clause_to_query(clause)
    case clause
    when TermClause
      { multi_match: { type: 'most_fields', query: clause.term, fields: ['text', 'text.stemmed'] } }
    when PhraseClause
      { match_phrase: { text: { query: clause.phrase } } }
    else
      raise "Unexpected clause type: #{clause}"
    end
  end

  # Builds the filter hash for a prefix clause, wrapped in a +bool/must_not+
  # when the clause is negated.
  #
  # @raise [RuntimeError] when the clause is not a PrefixClause
  def clause_to_filter(clause)
    case clause
    when PrefixClause
      if clause.negated?
        { bool: { must_not: { clause.type => { clause.filter => clause.term } } } }
      else
        { clause.type => { clause.filter => clause.term } }
      end
    else
      raise "Unexpected clause type: #{clause}"
    end
  end
end
|
|
|
|
|
|
|
|
# Maps the optional operator character in front of a clause to the symbol
# stored on the clause as its operator.
class Operator
  # @param str [String, nil] '+', '-', or nil when no operator was written
  # @return [Symbol] :must for '+' or nil, :must_not for '-'
  # @raise [RuntimeError] for any other value
  def self.symbol(str)
    case str
    when nil, '+' then :must
    when '-' then :must_not
    else raise "Unknown operator: #{str}"
    end
  end
end
|
|
|
|
|
|
|
|
# A single search word together with its optional prefix and its operator.
class TermClause
  attr_reader :prefix, :operator, :term

  # @param prefix [String, nil] stored as given
  # @param operator [String, nil] raw operator, converted through Operator.symbol
  # @param term [String] the word to search for
  def initialize(prefix, operator, term)
    @operator = Operator.symbol(operator)
    @prefix = prefix
    @term = term
  end
end
|
|
|
|
|
|
|
|
# A quoted phrase together with its optional prefix and its operator.
class PhraseClause
  attr_reader :prefix, :operator, :phrase

  # @param prefix [String, nil] stored as given
  # @param operator [String, nil] raw operator, converted through Operator.symbol
  # @param phrase [String] the phrase to search for
  def initialize(prefix, operator, phrase)
    @operator = Operator.symbol(operator)
    @prefix = prefix
    @phrase = phrase
  end
end
|
|
|
|
|
2022-02-14 00:17:09 +01:00
|
|
|
# A +prefix:term+ clause. It always carries the :filter operator and exposes
# the filter type, the filtered field and the value to filter on.
class PrefixClause
  attr_reader :type, :filter, :operator, :term

  # @param prefix [String] 'has', 'is', 'language', 'from', 'before',
  #   'after' or 'during'
  # @param operator [String, nil] '-' marks the clause as negated
  # @param term [String] raw value written after the prefix
  # @param options [Hash] may contain :current_account, which is used to
  #   resolve +from:me+ and the time zone of date ranges
  # @raise [Mastodon::SyntaxError] when the prefix is not one of the above
  def initialize(prefix, operator, term, options = {})
    @negated = operator == '-'
    @options = options
    @operator = :filter

    case prefix
    when 'has', 'is'
      @filter = :properties
      @type = :term
      @term = term
    when 'language'
      @filter = :language
      @type = :term
      @term = language_code_from_term(term)
    when 'from'
      @filter = :account_id
      @type = :term
      @term = account_id_from_term(term)
    when 'before'
      @filter = :created_at
      @type = :range
      @term = { lt: term, time_zone: time_zone }
    when 'after'
      @filter = :created_at
      @type = :range
      @term = { gt: term, time_zone: time_zone }
    when 'during'
      @filter = :created_at
      @type = :range
      @term = { gte: term, lte: term, time_zone: time_zone }
    else
      raise Mastodon::SyntaxError
    end
  end

  # @return [Boolean] true when the clause was written with a '-' operator
  def negated?
    @negated
  end

  private

  # Time zone used for date range filters: the current account's
  # +user_time_zone+ when available, 'UTC' otherwise.
  def time_zone
    @options[:current_account]&.user_time_zone || 'UTC'
  end

  # Resolves the value of a +from:+ filter to an account ID.
  def account_id_from_term(term)
    return @options[:current_account]&.id || -1 if term == 'me'

    username, domain = term.gsub(/\A@/, '').split('@')
    domain = nil if TagManager.instance.local_domain?(domain)
    account = Account.find_remote(username, domain)

    # If the account is not found, we want to return empty results, so return
    # an ID that does not exist
    account&.id || -1
  end

  # Normalizes the value of a +language:+ filter. Tries the term as written,
  # then lowercased, then its lowercased first segment (before '_' or '-'),
  # and returns the first one found in LanguagesHelper::SUPPORTED_LOCALES.
  # Falls back to the term unchanged.
  def language_code_from_term(term)
    # split returns [] for an empty or separator-only term (e.g. "-"), so
    # the first segment may be missing.
    first_segment = term.split(/[_-]/).first
    candidates = [term, term.downcase, first_segment&.downcase].compact

    candidates.find { |code| LanguagesHelper::SUPPORTED_LOCALES.key?(code.to_sym) } || term
  end
end
|
|
|
|
|
2019-07-27 04:42:08 +02:00
|
|
|
# Converts one parsed +clause+ subtree into a PrefixClause, TermClause or
# PhraseClause. Raises when the subtree contains none of the known keys.
rule(clause: subtree(:clause)) do
  prefix = clause[:prefix][:term].to_s if clause[:prefix]
  operator = clause[:operator]&.to_s

  if clause[:prefix]
    PrefixClause.new(prefix, operator, clause[:term].to_s, current_account: current_account)
  elsif clause[:term]
    TermClause.new(prefix, operator, clause[:term].to_s)
  elsif clause[:shortcode]
    # clause[:term] is always falsy in this branch (the previous branch would
    # have matched otherwise), so the name must come from the shortcode node.
    # NOTE(review): assumes the parser nests the name as
    # clause[:shortcode][:term]; a bare value is used as is. Confirm against
    # the parser grammar.
    shortcode = clause[:shortcode]
    name = shortcode.is_a?(Hash) ? shortcode[:term] : shortcode
    TermClause.new(prefix, operator, ":#{name}:")
  elsif clause[:phrase]
    # A phrase is either a list of term nodes, joined with spaces, or a single value
    phrase = clause[:phrase]
    text = phrase.is_a?(Array) ? phrase.map { |p| p[:term].to_s }.join(' ') : phrase.to_s
    PhraseClause.new(prefix, operator, text)
  else
    raise "Unexpected clause type: #{clause}"
  end
end
|
|
|
|
|
|
|
|
# Wraps the sequence of transformed clauses in a Query object.
rule(query: sequence(:clauses)) do
  Query.new(clauses)
end
|
|
|
|
end
|