statuses_index.rb 1.9 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465
  1. # frozen_string_literal: true
  2. class StatusesIndex < Chewy::Index
  3. settings index: index_preset(refresh_interval: '30s', number_of_shards: 5), analysis: {
  4. filter: {
  5. english_stop: {
  6. type: 'stop',
  7. stopwords: '_english_',
  8. },
  9. english_stemmer: {
  10. type: 'stemmer',
  11. language: 'english',
  12. },
  13. english_possessive_stemmer: {
  14. type: 'stemmer',
  15. language: 'possessive_english',
  16. },
  17. },
  18. analyzer: {
  19. verbatim: {
  20. tokenizer: 'uax_url_email',
  21. filter: %w(lowercase),
  22. },
  23. content: {
  24. tokenizer: 'standard',
  25. filter: %w(
  26. lowercase
  27. asciifolding
  28. cjk_width
  29. elision
  30. english_possessive_stemmer
  31. english_stop
  32. english_stemmer
  33. ),
  34. },
  35. hashtag: {
  36. tokenizer: 'keyword',
  37. filter: %w(
  38. word_delimiter_graph
  39. lowercase
  40. asciifolding
  41. cjk_width
  42. ),
  43. },
  44. },
  45. }
  46. index_scope ::Status.unscoped.kept.without_reblogs.includes(:media_attachments, :preview_cards, :local_mentioned, :local_favorited, :local_reblogged, :local_bookmarked, :tags, preloadable_poll: :local_voters), delete_if: ->(status) { status.searchable_by.empty? }
  47. root date_detection: false do
  48. field(:id, type: 'long')
  49. field(:account_id, type: 'long')
  50. field(:text, type: 'text', analyzer: 'verbatim', value: ->(status) { status.searchable_text }) { field(:stemmed, type: 'text', analyzer: 'content') }
  51. field(:tags, type: 'text', analyzer: 'hashtag', value: ->(status) { status.tags.map(&:display_name) })
  52. field(:searchable_by, type: 'long', value: ->(status) { status.searchable_by })
  53. field(:language, type: 'keyword')
  54. field(:properties, type: 'keyword', value: ->(status) { status.searchable_properties })
  55. field(:created_at, type: 'date')
  56. end
  57. end