imap.rb 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637
  1. # Copyright (C) 2012-2024 Zammad Foundation, https://zammad-foundation.org/
  2. require 'net/imap'
  3. class Channel::Driver::Imap < Channel::EmailParser
  4. FETCH_METADATA_TIMEOUT = 2.minutes
  5. FETCH_MSG_TIMEOUT = 4.minutes
  6. EXPUNGE_TIMEOUT = 16.minutes
  7. DEFAULT_TIMEOUT = 45.seconds
  8. CHECK_ONLY_TIMEOUT = 8.seconds
  # This driver can always be polled for new mail.
  #
  # @param _channel [Object] ignored
  # @return [true]
  def fetchable?(_channel) = true
=begin

fetch emails from IMAP account

  instance = Channel::Driver::Imap.new
  result = instance.fetch(params[:inbound][:options], channel)

returns

  {
    result: 'ok',
    fetched: 123,
    notice: 'e. g. message about too big emails in mailbox',
  }

check if connect to IMAP account is possible, return count of mails in mailbox

  instance = Channel::Driver::Imap.new
  result = instance.fetch(params[:inbound][:options], channel, 'check')

returns

  {
    result: 'ok',
    content_messages: 123,
    archive_possible: true,
    archive_possible_is_fallback: false,
    archive_week_range: 2,
  }

verify IMAP account, check if search email is in there

  instance = Channel::Driver::Imap.new
  result = instance.fetch(params[:inbound][:options], channel, 'verify', subject_looking_for)

returns

  {
    result: 'ok', # 'verify not ok'
  }

example

  params = {
    host: 'outlook.office365.com',
    user: 'xxx@zammad.onmicrosoft.com',
    password: 'xxx',
    keep_on_server: true,
  }

  OR

  params = {
    host: 'imap.gmail.com',
    user: 'xxx@gmail.com',
    password: 'xxx',
    keep_on_server: true,
    auth_type: 'XOAUTH2'
  }

  channel = Channel.last
  instance = Channel::Driver::Imap.new
  result = instance.fetch(params, channel, 'verify')

=end
  # Connects to the IMAP server described by +options+ and, depending on
  # +check_type+, probes the mailbox, looks for a verification email or
  # imports the messages.
  #
  # @param options [Hash] connection settings read here: :host, :user, :password,
  #   :port, :ssl ('off' / 'starttls', anything else means implicit SSL),
  #   :ssl_verify, :folder, :keep_on_server and :auth_type
  # @param channel [Channel] channel the fetched messages are processed for
  # @param check_type [String] 'check' (probe only), 'verify' (look for the verify
  #   email) or anything else for a regular fetch
  # @param verify_string [String] literal text that has to occur in the subject of
  #   the verify email (only used in 'verify' mode)
  # @return [Hash]
  #   'check':  { result:, content_messages:, archive_possible:, archive_possible_is_fallback:, archive_week_range: }
  #   'verify': { result: 'ok' } or { result: 'verify not ok' }
  #   regular:  { result:, fetched:, notice: }
  # @raise [RuntimeError] after a regular fetch if oversized messages were skipped
  # @raise [Timeout::Error] if a server operation exceeds its time budget
  def fetch(options, channel, check_type = '', verify_string = '')
    ssl            = true
    ssl_verify     = options.fetch(:ssl_verify, true)
    starttls       = false
    keep_on_server = false
    folder         = 'INBOX'

    if options[:keep_on_server] == true || options[:keep_on_server] == 'true'
      keep_on_server = true
    end

    case options[:ssl]
    when 'off'
      ssl = false
    when 'starttls'
      ssl = false
      starttls = true
    end

    # an explicitly configured port wins, otherwise fall back to 993 (SSL) or 143
    port = if options.key?(:port) && options[:port].present?
             options[:port].to_i
           elsif ssl == true
             993
           else
             143
           end

    if options[:folder].present?
      folder = options[:folder]
    end

    Rails.logger.info "fetching imap (#{options[:host]}/#{options[:user]} port=#{port},ssl=#{ssl},starttls=#{starttls},folder=#{folder},keep_on_server=#{keep_on_server},auth_type=#{options.fetch(:auth_type, 'LOGIN')})"

    # on check, reduce open_timeout to have faster probing
    check_type_timeout = check_type == 'check' ? CHECK_ONLY_TIMEOUT : DEFAULT_TIMEOUT

    Certificate::ApplySSLCertificates.ensure_fresh_ssl_context if ssl || starttls

    timeout(check_type_timeout) do
      ssl_settings = false
      ssl_settings = (ssl_verify ? true : { verify_mode: OpenSSL::SSL::VERIFY_NONE }) if ssl

      @imap = ::Net::IMAP.new(options[:host], port: port, ssl: ssl_settings)

      if starttls
        @imap.starttls(verify_mode: ssl_verify ? OpenSSL::SSL::VERIFY_PEER : OpenSSL::SSL::VERIFY_NONE)
      end
    end

    timeout(check_type_timeout) do
      if options[:auth_type].present?
        @imap.authenticate(options[:auth_type], options[:user], options[:password])
      else
        @imap.login(options[:user], options[:password].dup&.force_encoding('ascii-8bit'))
      end
    end

    timeout(check_type_timeout) do
      # select folder
      @imap.select(folder)
    end

    # only a regular fetch with keep_on_server restricts itself to unread messages
    message_ids_result = timeout(6.minutes) do
      if keep_on_server && check_type != 'check' && check_type != 'verify'
        fetch_unread_message_ids
      else
        fetch_all_message_ids
      end
    end

    message_ids = message_ids_result[:result]

    # check mode only
    if check_type == 'check'
      Rails.logger.info 'check only mode, fetch no emails'
      content_max_check = 2
      content_messages  = 0

      # check messages
      message_ids.each do |message_id|
        message_meta = nil
        timeout(1.minute) do
          message_meta = @imap.fetch(message_id, ['RFC822.HEADER'])[0]
        end

        # check how many content messages we have, for notice used
        headers = self.class.extract_rfc822_headers(message_meta)
        next if headers.nil? # no header blob returned for this message
        next if messages_is_verify_message?(headers)
        next if messages_is_ignore_message?(headers)

        content_messages += 1
        break if content_max_check < content_messages
      end

      # enough content messages seen, report the size of the whole result instead
      if content_messages >= content_max_check
        content_messages = message_ids.count
      end

      archive_possible             = message_ids_result[:is_fallback]
      archive_possible_is_fallback = message_ids_result[:is_fallback]
      archive_check                = 0
      archive_max_check            = 500
      archive_days_range           = 14
      archive_week_range           = archive_days_range / 7

      # use .each only if ordered response is ascending (from older to newer)
      message_ids_iterator = message_ids.each

      # since the correct loop order could improve performance, we should check even for less than 500 available messages
      # starting with 5 messages, since we need 2 additional fetch requests to find the used order and it would not make sense with less messages
      if !message_ids_result[:is_fallback] && content_messages > 4
        message_0_meta = nil
        message_1_meta = nil

        timeout(1.minute) do
          message_0_meta = @imap.fetch(message_ids[0], ['RFC822.HEADER'])[0]
          message_1_meta = @imap.fetch(message_ids[1], ['RFC822.HEADER'])[0]
        end

        headers0 = self.class.extract_rfc822_headers(message_0_meta)
        headers1 = self.class.extract_rfc822_headers(message_1_meta)

        if headers0 && headers1 && headers0['Date'].present? && headers1['Date'].present?
          begin
            date0 = Time.zone.parse(headers0['Date'])
            date1 = Time.zone.parse(headers1['Date'])

            # change iterator to .reverse_each if order of the 2 probe messages is descending (from newer to older)
            message_ids_iterator = message_ids.reverse_each if date0 > date1
          rescue # rubocop:disable Metrics/BlockNesting
            # no easy order decision possible due to a date parsing issue, continue with default iterator
          end
        end
      end

      message_ids_iterator.each do |message_id|
        message_meta = nil
        timeout(1.minute) do
          message_meta = @imap.fetch(message_id, ['RFC822.HEADER'])[0]
        end

        headers = self.class.extract_rfc822_headers(message_meta)
        next if headers.nil? # no header blob returned for this message
        next if messages_is_verify_message?(headers)
        next if messages_is_ignore_message?(headers)
        next if headers['Date'].blank?

        archive_check += 1
        break if archive_check >= archive_max_check

        begin
          date = Time.zone.parse(headers['Date'])
        rescue => e
          Rails.logger.error e
          next
        end

        # the parser may hand back nil instead of raising for an unusable date
        next if date.nil?

        break if date >= Time.zone.now - archive_days_range.days

        archive_possible = true

        # even if it was fallback before, we just found a real old mail, so it's not fallback anymore
        archive_possible_is_fallback = false

        break
      end

      disconnect
      return {
        result:                       'ok',
        content_messages:             content_messages,
        archive_possible:             archive_possible,
        archive_possible_is_fallback: archive_possible_is_fallback,
        archive_week_range:           archive_week_range,
      }
    end

    if check_type == 'verify'
      Rails.logger.info "verify mode, fetch no emails #{verify_string}"

      # the verify string is literal text, so it must not be interpreted as a pattern
      verify_pattern = %r{#{Regexp.escape(verify_string.to_s)}}

      # check for verify message, reverse message order to increase performance
      message_ids.reverse_each do |message_id|
        message_meta = nil
        timeout(FETCH_METADATA_TIMEOUT) do
          message_meta = @imap.fetch(message_id, ['RFC822.HEADER'])[0]
        end

        # check if verify message exists
        headers = self.class.extract_rfc822_headers(message_meta)
        next if headers.nil? # no header blob returned for this message

        subject = headers['Subject']
        next if !subject
        next if !subject.match?(verify_pattern)

        Rails.logger.info " - verify email #{verify_string} found"

        # remove the verify email from the mailbox again
        timeout(600) do
          @imap.store(message_id, '+FLAGS', [:Deleted])
          @imap.expunge
        end
        disconnect
        return {
          result: 'ok',
        }
      end

      disconnect
      return {
        result: 'verify not ok',
      }
    end

    # fetch regular messages
    count_all             = message_ids.count
    count                 = 0
    count_fetched         = 0
    count_max             = 5000
    too_large_messages    = []
    active_check_interval = 20
    result                = 'ok'
    notice                = ''

    message_ids.each do |message_id|
      count += 1

      # stop early if the channel was changed/deleted meanwhile or the per-run limit is hit
      break if (count % active_check_interval).zero? && channel_has_changed?(channel)
      break if max_process_count_has_reached?(channel, count, count_max)

      Rails.logger.info " - message #{count}/#{count_all}"

      message_meta = nil
      timeout(FETCH_METADATA_TIMEOUT) do
        message_meta = @imap.fetch(message_id, ['RFC822.SIZE', 'FLAGS', 'INTERNALDATE', 'RFC822.HEADER'])[0]
      rescue Net::IMAP::ResponseParseError => e
        raise if e.message.exclude?('unknown token')

        result = 'error'
        notice += <<~NOTICE
          One of your incoming emails could not be imported (#{e.message}).
          Please remove it from your inbox directly
          to prevent Zammad from trying to import it again.
        NOTICE
        Rails.logger.error "Net::IMAP failed to parse message #{message_id}: #{e.message} (#{e.class})"
        Rails.logger.error '(See https://github.com/zammad/zammad/issues/2754 for more details)'
      end

      next if message_meta.nil?

      # ignore verify messages
      next if !messages_is_too_old_verify?(message_meta, count, count_all)

      # ignore deleted messages
      next if deleted?(message_meta, count, count_all)

      # ignore already imported
      next if already_imported?(message_id, message_meta, count, count_all, keep_on_server, channel)

      # download the full message
      msg = nil
      begin
        timeout(FETCH_MSG_TIMEOUT) do
          key = fetch_message_body_key(options)
          msg = @imap.fetch(message_id, key)[0].attr[key]
        end
      rescue Timeout::Error => e
        Rails.logger.error "Unable to fetch email from #{count}/#{count_all} from server (#{options[:host]}/#{options[:user]}): #{e.inspect}"
        raise e
      end
      next if !msg

      # do not process too big messages, instead download & send postmaster reply
      too_large_info = too_large?(message_meta)
      if too_large_info
        if Setting.get('postmaster_send_reject_if_mail_too_large') == true
          info = " - download message #{count}/#{count_all} - ignore message because it's too large (is:#{too_large_info[0]} MB/max:#{too_large_info[1]} MB)"
          Rails.logger.info info
          notice += "#{info}\n"
          process_oversized_mail(channel, msg)
        else
          info = " - ignore message #{count}/#{count_all} - because message is too large (is:#{too_large_info[0]} MB/max:#{too_large_info[1]} MB)"
          Rails.logger.info info
          notice += "#{info}\n"
          too_large_messages.push info
          next
        end
      else
        process(channel, msg, false)
      end

      # mark the message as handled: seen if it stays on the server, deleted otherwise
      begin
        timeout(FETCH_MSG_TIMEOUT) do
          if keep_on_server
            @imap.store(message_id, '+FLAGS', [:Seen])
          else
            @imap.store(message_id, '+FLAGS', [:Deleted])
          end
        end
      rescue Timeout::Error => e
        Rails.logger.error "Unable to set +FLAGS for email #{count}/#{count_all} on server (#{options[:host]}/#{options[:user]}): #{e.inspect}"
        raise e
      end
      count_fetched += 1
    end

    # physically remove the messages flagged as deleted above
    if !keep_on_server
      begin
        timeout(EXPUNGE_TIMEOUT) do
          @imap.expunge
        end
      rescue Timeout::Error => e
        Rails.logger.error "Unable to expunge server (#{options[:host]}/#{options[:user]}): #{e.inspect}"
        raise e
      end
    end

    disconnect

    if count.zero?
      Rails.logger.info ' - no message'
    end

    # skipped oversized messages are reported as an error of the whole run
    if too_large_messages.present?
      raise too_large_messages.join("\n")
    end

    {
      result:  result,
      fetched: count_fetched,
      notice:  notice,
    }
  end
  # Looks up the ids of every message in the selected folder.
  #
  # @return [Hash] whatever fetch_message_ids returns for the ALL filter
  def fetch_all_message_ids
    everything = ['ALL']
    fetch_message_ids(everything)
  end
  # Looks up the ids of all unread messages in the selected folder.
  # The lookup is tried with the NOT SEEN filter first; if that raises,
  # it is repeated once with UNSEEN.
  #
  # @return [Hash] whatever fetch_message_ids returns
  def fetch_unread_message_ids
    preferred_filter = %w[NOT SEEN]
    fetch_message_ids(preferred_filter)
  rescue StandardError
    fetch_message_ids(['UNSEEN'])
  end
  # Looks up message ids matching +filter+, sorted by date if possible.
  #
  # If the server does not advertise SORT, or anything goes wrong while
  # sorting, a plain search is used instead and flagged as fallback.
  #
  # @param filter [Array<String>] IMAP search keys
  # @return [Hash] { result: <ids>, is_fallback: <true if the ids are not ordered by date> }
  def fetch_message_ids(filter)
    sort_missing = @imap.capabilities.exclude?('SORT')
    raise if sort_missing # jump to the unsorted search below

    ids_by_date = @imap.sort(['DATE'], filter, 'US-ASCII')
    { result: ids_by_date, is_fallback: false }
  rescue StandardError
    unordered_ids = @imap.search(filter)

    # is_fallback indicates that we can not use a result ordered by date
    { result: unordered_ids, is_fallback: true }
  end
  # Picks the FETCH attribute used to download a complete message.
  #
  # The host is looked up under both the symbol and the string key, so plain
  # symbol-keyed option hashes (as used everywhere else in this driver) are
  # handled the same way as string-keyed ones.
  #
  # @param options [Hash] connection settings, only the host is read
  # @return [String] 'BODY[]' for imap.mail.me.com, 'RFC822' for every other host
  def fetch_message_body_key(options)
    # https://github.com/zammad/zammad/issues/4589
    host = options[:host] || options['host']

    host == 'imap.mail.me.com' ? 'BODY[]' : 'RFC822'
  end
  # Closes the IMAP connection, if one was opened, within one minute.
  #
  # @return [Object, nil] result of the disconnect call, nil without a connection
  def disconnect
    return unless @imap

    timeout(1.minute) { @imap.disconnect }
  end
  358. =begin
  359. Channel::Driver::Imap.streamable?
  360. returns
  361. true|false
  362. =end
  # This driver offers no streaming support.
  #
  # @return [false]
  def self.streamable? = false
  # Parses an RFC822 header blob into a name => value hash.
  #
  # Folded header values (continuation lines starting with a tab or a space)
  # are joined with a single space before parsing. Some servers
  # (e.g. microsoft365) put the attribute value on a separate, tabbed line.
  # Lines without a colon end up as a key with a nil value, empty lines are
  # dropped and for repeated header names the last occurrence wins.
  #
  # @param [String] RFC822 header text blob
  # @return [Hash<String=>String>]
  def self.parse_rfc822_headers(string)
    unfolded = string.gsub(%r{\r?\n[ \t]+}, ' ')

    pairs = unfolded.lines(chomp: true).filter_map do |line|
      name, value = line.split(%r{:\s*}, 2).map(&:strip)

      # an empty line yields no name at all
      [name, value] if name
    end

    pairs.to_h
  end
  # Reads the RFC822.HEADER attribute of a fetched message and parses it.
  #
  # @param [Net::IMAP::FetchData] fetched message
  # @return [Hash<String=>String>, nil] nil if there is no message or no header blob
  def self.extract_rfc822_headers(message_meta)
    raw_headers = message_meta&.attr&.dig('RFC822.HEADER')

    raw_headers ? parse_rfc822_headers(raw_headers) : nil
  end
  385. private
  # Decides whether a message should be processed although it might be a
  # Zammad verify email. Only verify emails whose X-Zammad-Verify-Time is
  # within the last 30 minutes are skipped.
  #
  # @param message_meta [Net::IMAP::FetchData] fetched message incl. RFC822.HEADER
  # @param count [Integer] position of the message, used for logging only
  # @param count_all [Integer] number of messages, used for logging only
  # @return [Boolean] false for a recent verify email, true in every other case
  #   (no headers, no verify email, no or unusable verify time, verify time too old)
  def messages_is_too_old_verify?(message_meta, count, count_all)
    headers = self.class.extract_rfc822_headers(message_meta)

    # without a header blob there is nothing that marks the message as verify email
    return true if headers.nil?
    return true if !messages_is_verify_message?(headers)
    return true if headers['X-Zammad-Verify-Time'].blank?

    begin
      verify_time = Time.zone.parse(headers['X-Zammad-Verify-Time'])
    rescue => e
      Rails.logger.error e
      return true
    end

    # the parser may hand back nil instead of raising for an unusable value
    return true if verify_time.nil?
    return true if verify_time < 30.minutes.ago

    Rails.logger.info " - ignore message #{count}/#{count_all} - because message has a verify message"

    false
  end
  # Tells whether the headers mark the message as a Zammad verify email.
  #
  # @param headers [Hash<String=>String>, nil] parsed headers, nil if none were available
  # @return [Boolean] true only if X-Zammad-Verify is 'true'
  def messages_is_verify_message?(headers)
    # header extraction yields nil when the server sent no header blob
    return false if headers.nil?

    headers['X-Zammad-Verify'] == 'true'
  end
  # Tells whether the headers mark the message as one Zammad should ignore.
  #
  # @param headers [Hash<String=>String>, nil] parsed headers, nil if none were available
  # @return [Boolean] true only if X-Zammad-Ignore is 'true'
  def messages_is_ignore_message?(headers)
    # header extraction yields nil when the server sent no header blob
    return false if headers.nil?

    headers['X-Zammad-Ignore'] == 'true'
  end
=begin

check if email is already imported

  already_imported?(message_id, message_meta, count, count_all, keep_on_server, channel)

returns

  true|false

=end
  # Tells whether a message kept on the server was imported before. If so,
  # the message is flagged as seen on the server so it is not offered again.
  #
  # A message counts as imported if an article with the same Message-ID
  # digest exists, unless the ticket of that article records a different
  # channel id than +channel+.
  #
  # @param message_id [Integer] id of the message on the server, used to set the flag
  # @param message_meta [Net::IMAP::FetchData] fetched message incl. RFC822.HEADER
  # @param count [Integer] position of the message, used for logging only
  # @param count_all [Integer] number of messages, used for logging only
  # @param keep_on_server [Boolean] without it the check is skipped
  # @param channel [Channel, nil] channel that is fetching
  # @return [Boolean]
  # rubocop:disable Metrics/ParameterLists
  def already_imported?(message_id, message_meta, count, count_all, keep_on_server, channel)
    # rubocop:enable Metrics/ParameterLists
    return false if !keep_on_server

    headers = self.class.extract_rfc822_headers(message_meta)

    # no header blob, so there is no Message-ID to compare
    return false if !headers

    local_message_id = headers['Message-ID']
    return false if local_message_id.blank?

    local_message_id_md5 = Digest::MD5.hexdigest(local_message_id)
    article = Ticket::Article.where(message_id_md5: local_message_id_md5).reorder('created_at DESC, id DESC').limit(1).first
    return false if !article

    # verify if message is already imported via same channel, if not, import it again
    ticket = article.ticket
    return false if ticket&.preferences && ticket.preferences[:channel_id].present? && channel.present? && ticket.preferences[:channel_id] != channel[:id]

    timeout(1.minute) do
      @imap.store(message_id, '+FLAGS', [:Seen])
    end
    Rails.logger.info " - ignore message #{count}/#{count_all} - because message message id already imported"

    true
  end
=begin

check if email is already marked as deleted

  deleted?(message_meta, count, count_all)

returns

  true|false

=end
  # Tells whether the message already carries the :Deleted flag on the server.
  #
  # @param message_meta [Net::IMAP::FetchData] fetched message incl. FLAGS
  # @param count [Integer] position of the message, used for logging only
  # @param count_all [Integer] number of messages, used for logging only
  # @return [Boolean]
  def deleted?(message_meta, count, count_all)
    flags = message_meta.attr['FLAGS']

    if flags.exclude?(:Deleted)
      false
    else
      Rails.logger.info " - ignore message #{count}/#{count_all} - because message has already delete flag"
      true
    end
  end
=begin

check if email is too big

  too_large?(message_meta)

returns

  [real_message_size, max_message_size] (both in MB) if the email is too big, otherwise false

=end
  # Compares the size reported by the server with the postmaster_max_size setting.
  #
  # @param message_meta [Net::IMAP::FetchData] fetched message incl. RFC822.SIZE
  # @return [Array(Float, Float), false] [actual size, allowed size] in MB if the
  #   message is larger than allowed, otherwise false
  def too_large?(message_meta)
    allowed_mb = Setting.get('postmaster_max_size').to_f

    # RFC822.SIZE is divided by 1024 twice to get MB
    actual_mb = message_meta.attr['RFC822.SIZE'].to_f / 1024 / 1024

    actual_mb > allowed_mb ? [actual_mb, allowed_mb] : false
  end
=begin

check if channel config has changed

  channel_has_changed?(channel)

returns

  true|false

=end
  # Tells whether the channel was deleted or updated since +channel+ was loaded,
  # by comparing it with the record currently stored under the same id.
  #
  # @param channel [Channel] channel instance the fetch was started with
  # @return [Boolean] true if fetching should stop
  def channel_has_changed?(channel)
    stored_channel = Channel.find_by(id: channel.id)

    unless stored_channel
      Rails.logger.info "Channel with id #{channel.id} is deleted in the meantime. Stop fetching."
      return true
    end

    modified = channel.updated_at != stored_channel.updated_at
    Rails.logger.info "Channel with id #{channel.id} has changed. Stop fetching." if modified

    modified
  end
=begin

check if the maximum number of emails to fetch has been reached

  max_process_count_has_reached?(channel, count, count_max)

returns

  true|false

=end
  # Tells whether the number of handled messages reached the per-run limit.
  #
  # @param channel [Channel] channel that is fetching, used for logging only
  # @param count [Integer] number of messages handled so far
  # @param count_max [Integer] limit for one run
  # @return [Boolean]
  def max_process_count_has_reached?(channel, count, count_max)
    limit_reached = count >= count_max

    if limit_reached
      Rails.logger.info "Maximal fetched emails (#{count_max}) reached for this interval for Channel with id #{channel.id}."
    end

    limit_reached
  end
  # Runs the given block, aborting it after +seconds+ via Timeout.timeout.
  #
  # @param seconds [Numeric] time budget
  # @return [Object] result of the block
  # @raise [Timeout::Error] if the block does not finish in time
  def timeout(seconds, &block)
    Timeout.timeout(seconds, &block)
  end
  489. end