123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637 |
- # Copyright (C) 2012-2024 Zammad Foundation, https://zammad-foundation.org/
- require 'net/imap'
- class Channel::Driver::Imap < Channel::EmailParser
- FETCH_METADATA_TIMEOUT = 2.minutes
- FETCH_MSG_TIMEOUT = 4.minutes
- EXPUNGE_TIMEOUT = 16.minutes
- DEFAULT_TIMEOUT = 45.seconds
- CHECK_ONLY_TIMEOUT = 8.seconds
- def fetchable?(_channel)
- true
- end
- =begin
- fetch emails from IMAP account
- instance = Channel::Driver::Imap.new
- result = instance.fetch(params[:inbound][:options], channel, 'verify', subject_looking_for)
- returns
- {
- result: 'ok',
- fetched: 123,
- notice: 'e. g. message about to big emails in mailbox',
- }
- check if connect to IMAP account is possible, return count of mails in mailbox
- instance = Channel::Driver::Imap.new
- result = instance.fetch(params[:inbound][:options], channel, 'check')
- returns
- {
- result: 'ok',
- content_messages: 123,
- }
- verify IMAP account, check if search email is in there
- instance = Channel::Driver::Imap.new
- result = instance.fetch(params[:inbound][:options], channel, 'verify', subject_looking_for)
- returns
- {
- result: 'ok', # 'verify not ok'
- }
- example
- params = {
- host: 'outlook.office365.com',
- user: 'xxx@zammad.onmicrosoft.com',
- password: 'xxx',
- keep_on_server: true,
- }
- OR
- params = {
- host: 'imap.gmail.com',
- user: 'xxx@gmail.com',
- password: 'xxx',
- keep_on_server: true,
- auth_type: 'XOAUTH2'
- }
- channel = Channel.last
- instance = Channel::Driver::Imap.new
- result = instance.fetch(params, channel, 'verify')
- =end
- def fetch(options, channel, check_type = '', verify_string = '')
- ssl = true
- ssl_verify = options.fetch(:ssl_verify, true)
- starttls = false
- port = 993
- keep_on_server = false
- folder = 'INBOX'
- if options[:keep_on_server] == true || options[:keep_on_server] == 'true'
- keep_on_server = true
- end
- case options[:ssl]
- when 'off'
- ssl = false
- when 'starttls'
- ssl = false
- starttls = true
- end
- port = if options.key?(:port) && options[:port].present?
- options[:port].to_i
- elsif ssl == true
- 993
- else
- 143
- end
- if options[:folder].present?
- folder = options[:folder]
- end
- Rails.logger.info "fetching imap (#{options[:host]}/#{options[:user]} port=#{port},ssl=#{ssl},starttls=#{starttls},folder=#{folder},keep_on_server=#{keep_on_server},auth_type=#{options.fetch(:auth_type, 'LOGIN')})"
- # on check, reduce open_timeout to have faster probing
- check_type_timeout = check_type == 'check' ? CHECK_ONLY_TIMEOUT : DEFAULT_TIMEOUT
- Certificate::ApplySSLCertificates.ensure_fresh_ssl_context if ssl || starttls
- timeout(check_type_timeout) do
- ssl_settings = false
- ssl_settings = (ssl_verify ? true : { verify_mode: OpenSSL::SSL::VERIFY_NONE }) if ssl
- @imap = ::Net::IMAP.new(options[:host], port: port, ssl: ssl_settings)
- if starttls
- @imap.starttls(verify_mode: ssl_verify ? OpenSSL::SSL::VERIFY_PEER : OpenSSL::SSL::VERIFY_NONE)
- end
- end
- timeout(check_type_timeout) do
- if options[:auth_type].present?
- @imap.authenticate(options[:auth_type], options[:user], options[:password])
- else
- @imap.login(options[:user], options[:password].dup&.force_encoding('ascii-8bit'))
- end
- end
- timeout(check_type_timeout) do
- # select folder
- @imap.select(folder)
- end
- message_ids_result = timeout(6.minutes) do
- if keep_on_server && check_type != 'check' && check_type != 'verify'
- fetch_unread_message_ids
- else
- fetch_all_message_ids
- end
- end
- message_ids = message_ids_result[:result]
- # check mode only
- if check_type == 'check'
- Rails.logger.info 'check only mode, fetch no emails'
- content_max_check = 2
- content_messages = 0
- # check messages
- message_ids.each do |message_id|
- message_meta = nil
- timeout(1.minute) do
- message_meta = @imap.fetch(message_id, ['RFC822.HEADER'])[0]
- end
- # check how many content messages we have, for notice used
- headers = self.class.extract_rfc822_headers(message_meta)
- next if messages_is_verify_message?(headers)
- next if messages_is_ignore_message?(headers)
- content_messages += 1
- break if content_max_check < content_messages
- end
- if content_messages >= content_max_check
- content_messages = message_ids.count
- end
- archive_possible = false || message_ids_result[:is_fallback]
- archive_possible_is_fallback = false || message_ids_result[:is_fallback]
- archive_check = 0
- archive_max_check = 500
- archive_days_range = 14
- archive_week_range = archive_days_range / 7
- # use .each only if ordered response is ascending (from older to newer)
- message_ids_iterator = message_ids.each
- # since the correct loop order could improve performance, we should check even for less than 500 available messages
- # starting with 5 messages, since we need 2 additional fetch requests to find the used order and it would not make sense with less messages
- if !message_ids_result[:is_fallback] && content_messages > 4
- message_0_meta = nil
- message_1_meta = nil
- timeout(1.minute) do
- message_0_meta = @imap.fetch(message_ids[0], ['RFC822.HEADER'])[0]
- message_1_meta = @imap.fetch(message_ids[1], ['RFC822.HEADER'])[0]
- end
- headers0 = self.class.extract_rfc822_headers(message_0_meta)
- headers1 = self.class.extract_rfc822_headers(message_1_meta)
- if headers0['Date'].present? && headers1['Date'].present?
- begin
- date0 = Time.zone.parse(headers0['Date'])
- date1 = Time.zone.parse(headers1['Date'])
- # change iterator to .reverse_each if order of the 2 probe messages is descending (from newer to older)
- message_ids_iterator = message_ids.reverse_each if date0 > date1
- rescue => e # rubocop:disable Metrics/BlockNesting
- # no easy order decision possible due to a date parsing issue, continue with default iterator
- end
- end
- end
- message_ids_iterator.each do |message_id|
- message_meta = nil
- timeout(1.minute) do
- message_meta = @imap.fetch(message_id, ['RFC822.HEADER'])[0]
- end
- headers = self.class.extract_rfc822_headers(message_meta)
- next if messages_is_verify_message?(headers)
- next if messages_is_ignore_message?(headers)
- next if headers['Date'].blank?
- archive_check += 1
- break if archive_check >= archive_max_check
- begin
- date = Time.zone.parse(headers['Date'])
- rescue => e
- Rails.logger.error e
- next
- end
- break if date >= Time.zone.now - archive_days_range.days
- archive_possible = true
- # even if it was fallback before, we just found a real old mail, so it's not fallback anymore
- archive_possible_is_fallback = false
- break
- end
- disconnect
- return {
- result: 'ok',
- content_messages: content_messages,
- archive_possible: archive_possible,
- archive_possible_is_fallback: archive_possible_is_fallback,
- archive_week_range: archive_week_range,
- }
- end
- # reverse message order to increase performance
- if check_type == 'verify'
- Rails.logger.info "verify mode, fetch no emails #{verify_string}"
- # check for verify message
- message_ids.reverse_each do |message_id|
- message_meta = nil
- timeout(FETCH_METADATA_TIMEOUT) do
- message_meta = @imap.fetch(message_id, ['RFC822.HEADER'])[0]
- end
- # check if verify message exists
- headers = self.class.extract_rfc822_headers(message_meta)
- subject = headers['Subject']
- next if !subject
- next if !subject.match?(%r{#{verify_string}})
- Rails.logger.info " - verify email #{verify_string} found"
- timeout(600) do
- @imap.store(message_id, '+FLAGS', [:Deleted])
- @imap.expunge
- end
- disconnect
- return {
- result: 'ok',
- }
- end
- disconnect
- return {
- result: 'verify not ok',
- }
- end
- # fetch regular messages
- count_all = message_ids.count
- count = 0
- count_fetched = 0
- count_max = 5000
- too_large_messages = []
- active_check_interval = 20
- result = 'ok'
- notice = ''
- message_ids.each do |message_id|
- count += 1
- break if (count % active_check_interval).zero? && channel_has_changed?(channel)
- break if max_process_count_has_reached?(channel, count, count_max)
- Rails.logger.info " - message #{count}/#{count_all}"
- message_meta = nil
- timeout(FETCH_METADATA_TIMEOUT) do
- message_meta = @imap.fetch(message_id, ['RFC822.SIZE', 'FLAGS', 'INTERNALDATE', 'RFC822.HEADER'])[0]
- rescue Net::IMAP::ResponseParseError => e
- raise if e.message.exclude?('unknown token')
- result = 'error'
- notice += <<~NOTICE
- One of your incoming emails could not be imported (#{e.message}).
- Please remove it from your inbox directly
- to prevent Zammad from trying to import it again.
- NOTICE
- Rails.logger.error "Net::IMAP failed to parse message #{message_id}: #{e.message} (#{e.class})"
- Rails.logger.error '(See https://github.com/zammad/zammad/issues/2754 for more details)'
- end
- next if message_meta.nil?
- # ignore verify messages
- next if !messages_is_too_old_verify?(message_meta, count, count_all)
- # ignore deleted messages
- next if deleted?(message_meta, count, count_all)
- # ignore already imported
- next if already_imported?(message_id, message_meta, count, count_all, keep_on_server, channel)
- # delete email from server after article was created
- msg = nil
- begin
- timeout(FETCH_MSG_TIMEOUT) do
- key = fetch_message_body_key(options)
- msg = @imap.fetch(message_id, key)[0].attr[key]
- end
- rescue Timeout::Error => e
- Rails.logger.error "Unable to fetch email from #{count}/#{count_all} from server (#{options[:host]}/#{options[:user]}): #{e.inspect}"
- raise e
- end
- next if !msg
- # do not process too big messages, instead download & send postmaster reply
- too_large_info = too_large?(message_meta)
- if too_large_info
- if Setting.get('postmaster_send_reject_if_mail_too_large') == true
- info = " - download message #{count}/#{count_all} - ignore message because it's too large (is:#{too_large_info[0]} MB/max:#{too_large_info[1]} MB)"
- Rails.logger.info info
- notice += "#{info}\n"
- process_oversized_mail(channel, msg)
- else
- info = " - ignore message #{count}/#{count_all} - because message is too large (is:#{too_large_info[0]} MB/max:#{too_large_info[1]} MB)"
- Rails.logger.info info
- notice += "#{info}\n"
- too_large_messages.push info
- next
- end
- else
- process(channel, msg, false)
- end
- begin
- timeout(FETCH_MSG_TIMEOUT) do
- if keep_on_server
- @imap.store(message_id, '+FLAGS', [:Seen])
- else
- @imap.store(message_id, '+FLAGS', [:Deleted])
- end
- end
- rescue Timeout::Error => e
- Rails.logger.error "Unable to set +FLAGS for email #{count}/#{count_all} on server (#{options[:host]}/#{options[:user]}): #{e.inspect}"
- raise e
- end
- count_fetched += 1
- end
- if !keep_on_server
- begin
- timeout(EXPUNGE_TIMEOUT) do
- @imap.expunge
- end
- rescue Timeout::Error => e
- Rails.logger.error "Unable to expunge server (#{options[:host]}/#{options[:user]}): #{e.inspect}"
- raise e
- end
- end
- disconnect
- if count.zero?
- Rails.logger.info ' - no message'
- end
- if too_large_messages.present?
- raise too_large_messages.join("\n")
- end
- {
- result: result,
- fetched: count_fetched,
- notice: notice,
- }
- end
- def fetch_all_message_ids
- fetch_message_ids %w[ALL]
- end
- def fetch_unread_message_ids
- fetch_message_ids %w[NOT SEEN]
- rescue
- fetch_message_ids %w[UNSEEN]
- end
- def fetch_message_ids(filter)
- raise if @imap.capabilities.exclude?('SORT')
- {
- result: @imap.sort(['DATE'], filter, 'US-ASCII'),
- is_fallback: false
- }
- rescue
- {
- result: @imap.search(filter),
- is_fallback: true # indicates that we can not use a result ordered by date
- }
- end
- def fetch_message_body_key(options)
- # https://github.com/zammad/zammad/issues/4589
- options['host'] == 'imap.mail.me.com' ? 'BODY[]' : 'RFC822'
- end
- def disconnect
- return if !@imap
- timeout(1.minute) do
- @imap.disconnect
- end
- end
- =begin
- Channel::Driver::Imap.streamable?
- returns
- true|false
- =end
- def self.streamable?
- false
- end
- # Parses RFC822 header
- # @param [String] RFC822 header text blob
- # @return [Hash<String=>String>]
- def self.parse_rfc822_headers(string)
- array = string
- .gsub("\r\n\t", ' ') # Some servers (e.g. microsoft365) may put attribute value on a separate line and tab it
- .lines(chomp: true)
- .map { |line| line.split(%r{:\s*}, 2).map(&:strip) }
- array.each { |elem| elem.append(nil) if elem.one? }
- Hash[*array.flatten]
- end
- # Parses RFC822 header
- # @param [Net::IMAP::FetchData] fetched message
- # @return [Hash<String=>String>]
- def self.extract_rfc822_headers(message_meta)
- blob = message_meta&.attr&.dig 'RFC822.HEADER'
- return if !blob
- parse_rfc822_headers blob
- end
- private
- def messages_is_too_old_verify?(message_meta, count, count_all)
- headers = self.class.extract_rfc822_headers(message_meta)
- return true if !messages_is_verify_message?(headers)
- return true if headers['X-Zammad-Verify-Time'].blank?
- begin
- verify_time = Time.zone.parse(headers['X-Zammad-Verify-Time'])
- rescue => e
- Rails.logger.error e
- return true
- end
- return true if verify_time < 30.minutes.ago
- Rails.logger.info " - ignore message #{count}/#{count_all} - because message has a verify message"
- false
- end
- def messages_is_verify_message?(headers)
- return true if headers['X-Zammad-Verify'] == 'true'
- false
- end
- def messages_is_ignore_message?(headers)
- return true if headers['X-Zammad-Ignore'] == 'true'
- false
- end
- =begin
- check if email is already impoted
- Channel::Driver::IMAP.already_imported?(message_id, message_meta, count, count_all, keep_on_server, channel)
- returns
- true|false
- =end
- # rubocop:disable Metrics/ParameterLists
- def already_imported?(message_id, message_meta, count, count_all, keep_on_server, channel)
- # rubocop:enable Metrics/ParameterLists
- return false if !keep_on_server
- headers = self.class.extract_rfc822_headers(message_meta)
- retrurn false if !headers
- local_message_id = headers['Message-ID']
- return false if local_message_id.blank?
- local_message_id_md5 = Digest::MD5.hexdigest(local_message_id)
- article = Ticket::Article.where(message_id_md5: local_message_id_md5).reorder('created_at DESC, id DESC').limit(1).first
- return false if !article
- # verify if message is already imported via same channel, if not, import it again
- ticket = article.ticket
- return false if ticket&.preferences && ticket.preferences[:channel_id].present? && channel.present? && ticket.preferences[:channel_id] != channel[:id]
- timeout(1.minute) do
- @imap.store(message_id, '+FLAGS', [:Seen])
- end
- Rails.logger.info " - ignore message #{count}/#{count_all} - because message message id already imported"
- true
- end
- =begin
- check if email is already marked as deleted
- Channel::Driver::IMAP.deleted?(message_meta, count, count_all)
- returns
- true|false
- =end
- def deleted?(message_meta, count, count_all)
- return false if message_meta.attr['FLAGS'].exclude?(:Deleted)
- Rails.logger.info " - ignore message #{count}/#{count_all} - because message has already delete flag"
- true
- end
- =begin
- check if email is to big
- Channel::Driver::IMAP.too_large?(message_meta, count, count_all)
- returns
- true|false
- =end
- def too_large?(message_meta)
- max_message_size = Setting.get('postmaster_max_size').to_f
- real_message_size = message_meta.attr['RFC822.SIZE'].to_f / 1024 / 1024
- if real_message_size > max_message_size
- return [real_message_size, max_message_size]
- end
- false
- end
- =begin
- check if channel config has changed
- Channel::Driver::IMAP.channel_has_changed?(channel)
- returns
- true|false
- =end
- def channel_has_changed?(channel)
- current_channel = Channel.find_by(id: channel.id)
- if !current_channel
- Rails.logger.info "Channel with id #{channel.id} is deleted in the meantime. Stop fetching."
- return true
- end
- return false if channel.updated_at == current_channel.updated_at
- Rails.logger.info "Channel with id #{channel.id} has changed. Stop fetching."
- true
- end
- =begin
- check if maximal fetching email count has reached
- Channel::Driver::IMAP.max_process_count_has_reached?(channel, count, count_max)
- returns
- true|false
- =end
- def max_process_count_has_reached?(channel, count, count_max)
- return false if count < count_max
- Rails.logger.info "Maximal fetched emails (#{count_max}) reached for this interval for Channel with id #{channel.id}."
- true
- end
- def timeout(seconds, &)
- Timeout.timeout(seconds, &)
- end
- end
|