require 'uri'
require 'net/imap'
require 'stringio'
+require 'time'
+require 'rmail'
+## fucking imap fucking sucks. what the FUCK kind of committee of
+## dunces designed this shit.
+##
+## imap talks about 'unique ids' for messages, to be used for
+## cross-session identification. great---just what sup needs! except
+## it turns out the uids can be invalidated every time the
+## 'uidvalidity' value changes on the server, and 'uidvalidity' can
+## change without restriction. it can change any time you log in. it
+## can change EVERY time you log in. of course the imap spec "strongly
+## recommends" that it never change, but there's nothing to stop
+## people from just setting it to the current timestamp, and in fact
+## that's exactly what the one imap server i have at my disposal
+## does. thus the so-called uids are absolutely useless and imap
+## provides no cross-session way of uniquely identifying a
+## message. but thanks for the "strong recommendation", guys!
+##
+## so right now i'm using the 'internal date' and the size of each
+## message to uniquely identify it, and i scan over the entire mailbox
+## each time i open it to map those things to message ids. that can be
+## slow for large mailboxes, and we'll just have to hope that there
+## are no collisions. ho ho! a perfectly reasonable solution!
+##
+## and here's another thing. check out RFC2060 2.2.2 paragraph 5:
+##
+## A client MUST be prepared to accept any server response at all times.
+## This includes server data that was not requested.
+##
+## yeah. that totally makes a lot of sense. and once again, the idiocy
+## of the spec actually happens in practice. you'll request flags for
+## one message, and get it interspersed with a random bunch of flags
+## for some other messages, including a different set of flags for the
+## same message! totally ok by the imap spec. totally retarded by any
+## other metric.
+##
+## fuck you, imap committee. you managed to design something nearly as
+## shitty as mbox but goddamn THIRTY YEARS LATER.
module Redwood
class IMAP < Source
- attr_reader :labels
-
- def initialize uri, username, password, uid_validity=nil, last_uid=nil, usual=true, archived=false, id=nil
+ SCAN_INTERVAL = 60 # seconds
+
+ ## upon these errors we'll try to rereconnect a few times
+ RECOVERABLE_ERRORS = [ Errno::EPIPE, Errno::ETIMEDOUT, OpenSSL::SSL::SSLError ]
+
+ attr_accessor :username, :password
+ yaml_properties :uri, :username, :password, :cur_offset, :usual,
+ :archived, :id, :labels
+
+ def initialize uri, username, password, last_idate=nil, usual=true, archived=false, id=nil, labels=[]
raise ArgumentError, "username and password must be specified" unless username && password
raise ArgumentError, "not an imap uri" unless uri =~ %r!imaps?://!
- super uri, last_uid, usual, archived, id
+ super uri, last_idate, usual, archived, id
@parsed_uri = URI(uri)
@username = username
@password = password
- @uid_validity = uid_validity
@imap = nil
- @labels = [:unread]
- @labels << :inbox unless archived?
- @labels << mailbox.intern unless mailbox =~ /inbox/i || mailbox.nil?
+ @imap_ids = {}
+ @ids = []
+ @last_scan = nil
+ @labels = (labels || []).freeze
+ @say_id = nil
+ @mutex = Mutex.new
end
- def connect
- return false if broken?
- return true if @imap
- Redwood::log "connecting to #{@parsed_uri.host} port #{ssl? ? 993 : 143}, ssl=#{ssl?} ..."
-
- ## ok, this is FUCKING ANNOYING.
- ##
- ## what imap.rb likes to do is, if an exception occurs, catch it
- ## and re-raise it on the calling thread. seems reasonable. but
- ## what that REALLY means is that the only way to reasonably
- ## initialize imap is in its own thread, because otherwise, you
- ## will never be able to catch the exception it raises on the
- ## calling thread, and the backtrace will not make any sense at
- ## all, and you will waste HOURS of your life on this fucking
- ## problem.
- ##
- ## FUCK!!!!!!!!!
-
- BufferManager.say "Connecting to IMAP server #{host}..." do
- ::Thread.new do
- begin
- #raise Net::IMAP::ByeResponseError, "simulated imap failure"
- @imap = Net::IMAP.new host, ssl? ? 993 : 143, ssl?
- @imap.authenticate 'LOGIN', @username, @password
- @imap.examine mailbox
- Redwood::log "successfully connected to #{@parsed_uri}, mailbox #{mailbox}"
- @uid_validity ||= @imap.responses["UIDVALIDITY"][-1]
- raise SourceError, "Your shitty IMAP server has kindly invalidated all 'unique' ids for the folder '#{mailbox}'. You will have to rescan this folder manually." if @imap.responses["UIDVALIDITY"][-1] != @uid_validity
- rescue Exception => e
- self.broken_msg = e.message.chomp # fucking chomp! fuck!!!
- @imap = nil
- Redwood::log "error connecting to IMAP server: #{self.broken_msg}"
- end
- end.join
+ def self.suggest_labels_for path
+ if path =~ /inbox/i
+ [path.intern]
+ else
+ []
end
-
- !!@imap
end
- private :connect
def host; @parsed_uri.host; end
- def mailbox; @parsed_uri.path[1..-1] end ##XXXX TODO handle nil
+ def port; @parsed_uri.port || (ssl? ? 993 : 143); end
+ def mailbox
+ x = @parsed_uri.path[1..-1]
+ x.nil? || x.empty? ? 'INBOX' : x
+ end
def ssl?; @parsed_uri.scheme == 'imaps' end
- def load_header uid=nil
- MBox::read_header StringIO.new(raw_header(uid))
+ def check
+ ids =
+ @mutex.synchronize do
+ unsynchronized_scan_mailbox
+ @ids
+ end
+
+ start = ids.index(cur_offset || start_offset) or raise OutOfSyncSourceError, "Unknown message id #{cur_offset || start_offset}."
end
- def load_message uid
- RMail::Parser.read raw_full_message(uid)
+ ## is this necessary? TODO: remove maybe
+ def == o; o.is_a?(IMAP) && o.uri == self.uri && o.username == self.username; end
+
+ def load_header id
+ MBox::read_header StringIO.new(raw_header(id))
end
- ## load the full header text
- def raw_header uid
- connect or raise SourceError, broken_msg
- get_imap_field(uid, 'RFC822.HEADER').gsub(/\r\n/, "\n")
+ def load_message id
+ RMail::Parser.read raw_full_message(id)
end
- def raw_full_message uid
- connect or raise SourceError, broken_msg
- get_imap_field(uid, 'RFC822').gsub(/\r\n/, "\n")
+ def raw_header id
+ unsynchronized_scan_mailbox
+ header, flags = get_imap_fields id, 'RFC822.HEADER', 'FLAGS'
+ ## very bad. this is very very bad. very bad bad bad.
+ header = header + "Status: RO\n" if flags.include? :Seen # fake an mbox-style read header # TODO: improve source-marked-as-read reporting system
+ header.gsub(/\r\n/, "\n")
end
+ synchronized :raw_header
- def get_imap_field uid, field
- f = @imap.uid_fetch uid, field
- raise SourceError, "null IMAP field '#{field}' for message with uid #{uid}" if f.nil?
- f[0].attr[field]
+ def raw_full_message id
+ unsynchronized_scan_mailbox
+ get_imap_fields(id, 'RFC822').first.gsub(/\r\n/, "\n")
end
- private :get_imap_field
-
+ synchronized :raw_full_message
+
+ def connect
+ return if @imap
+ safely { } # do nothing!
+ end
+ synchronized :connect
+
+ def scan_mailbox
+ return if @last_scan && (Time.now - @last_scan) < SCAN_INTERVAL
+ last_id = safely do
+ @imap.examine mailbox
+ @imap.responses["EXISTS"].last
+ end
+ @last_scan = Time.now
+
+ return if last_id == @ids.length
+
+ range = (@ids.length + 1) .. last_id
+ Redwood::log "fetching IMAP headers #{range}"
+ fetch(range, ['RFC822.SIZE', 'INTERNALDATE']).each do |v|
+ id = make_id v
+ @ids << id
+ @imap_ids[id] = v.seqno
+ end
+ end
+ synchronized :scan_mailbox
+
def each
- connect or raise SourceError, broken_msg
- uids = @imap.uid_search ['UID', "#{cur_offset}:#{end_offset}"]
- uids.each do |uid|
- @last_uid = uid
- @dirty = true
- self.cur_offset = uid
- yield uid, labels
+ ids =
+ @mutex.synchronize do
+ unsynchronized_scan_mailbox
+ @ids
+ end
+
+ start = ids.index(cur_offset || start_offset) or raise OutOfSyncSourceError, "Unknown message id #{cur_offset || start_offset}."
+
+ start.upto(ids.length - 1) do |i|
+ id = ids[i]
+ self.cur_offset = id
+ yield id, @labels
end
end
- def start_offset; 1; end
+ def start_offset
+ unsynchronized_scan_mailbox
+ @ids.first
+ end
+ synchronized :start_offset
+
def end_offset
- connect or return start_offset
- @imap.uid_search(['ALL']).last
+ unsynchronized_scan_mailbox
+ @ids.last
end
-end
+ synchronized :end_offset
+
+ def pct_done; 100.0 * (@ids.index(cur_offset) || 0).to_f / (@ids.length - 1).to_f; end
+
+private
+
+ def fetch ids, fields
+ results = safely { @imap.fetch ids, fields }
+ good_results =
+ if ids.respond_to? :member?
+ results.find_all { |r| ids.member?(r.seqno) && fields.all? { |f| r.attr.member?(f) } }
+ else
+ results.find_all { |r| ids == r.seqno && fields.all? { |f| r.attr.member?(f) } }
+ end
-Redwood::register_yaml(IMAP, %w(uri username password uid_validity cur_offset usual archived id))
+ if good_results.empty?
+ raise FatalSourceError, "no IMAP response for #{ids} containing all fields #{fields.join(', ')} (got #{results.size} results)"
+ elsif good_results.size < results.size
+ Redwood::log "Your IMAP server sucks. It sent #{results.size} results for a request for #{good_results.size} messages. What are you using, Binc?"
+ end
+
+ good_results
+ end
+
+ def unsafe_connect
+ say "Connecting to IMAP server #{host}:#{port}..."
+
+ ## apparently imap.rb does a lot of threaded stuff internally and
+ ## if an exception occurs, it will catch it and re-raise it on the
+ ## calling thread. but i can't seem to catch that exception, so
+ ## i've resorted to initializing it in its own thread. surely
+ ## there's a better way.
+ exception = nil
+ ::Thread.new do
+ begin
+ #raise Net::IMAP::ByeResponseError, "simulated imap failure"
+ @imap = Net::IMAP.new host, port, ssl?
+ say "Logging in..."
+
+ ## although RFC1730 claims that "If an AUTHENTICATE command
+ ## fails with a NO response, the client may try another", in
+ ## practice it seems like they can also send a BAD response.
+ begin
+ @imap.authenticate 'CRAM-MD5', @username, @password
+ rescue Net::IMAP::BadResponseError, Net::IMAP::NoResponseError => e
+ Redwood::log "CRAM-MD5 authentication failed: #{e.class}. Trying LOGIN auth..."
+ begin
+ @imap.authenticate 'LOGIN', @username, @password
+ rescue Net::IMAP::BadResponseError, Net::IMAP::NoResponseError => e
+ Redwood::log "LOGIN authentication failed: #{e.class}. Trying plain-text LOGIN..."
+ @imap.login @username, @password
+ end
+ end
+ say "Successfully connected to #{@parsed_uri}."
+ rescue Exception => e
+ exception = e
+ ensure
+ shutup
+ end
+ end.join
+
+ raise exception if exception
+ end
+
+ def say s
+ @say_id = BufferManager.say s, @say_id if BufferManager.instantiated?
+ Redwood::log s
+ end
+
+ def shutup
+ BufferManager.clear @say_id if BufferManager.instantiated?
+ @say_id = nil
+ end
+
+ def make_id imap_stuff
+ # use 7 digits for the size. why 7? seems nice.
+ %w(RFC822.SIZE INTERNALDATE).each do |w|
+ raise FatalSourceError, "requested data not in IMAP response: #{w}" unless imap_stuff.attr[w]
+ end
+
+ msize, mdate = imap_stuff.attr['RFC822.SIZE'] % 10000000, Time.parse(imap_stuff.attr["INTERNALDATE"])
+ sprintf("%d%07d", mdate.to_i, msize).to_i
+ end
+
+ def get_imap_fields id, *fields
+ imap_id = @imap_ids[id] or raise OutOfSyncSourceError, "Unknown message id #{id}"
+
+ retried = false
+ result = fetch(imap_id, (fields + ['RFC822.SIZE', 'INTERNALDATE']).uniq).first
+ got_id = make_id result
+ raise OutOfSyncSourceError, "IMAP message mismatch: requested #{id}, got #{got_id}." unless got_id == id
+
+ fields.map { |f| result.attr[f] or raise FatalSourceError, "empty response from IMAP server: #{f}" }
+ end
+
+ ## execute a block, connected if unconnected, re-connected up to 3
+ ## times if a recoverable error occurs, and properly dying if an
+ ## unrecoverable error occurs.
+ def safely
+ retries = 0
+ begin
+ begin
+ unsafe_connect unless @imap
+ yield
+ rescue *RECOVERABLE_ERRORS => e
+ if (retries += 1) <= 3
+ @imap = nil
+ Redwood::log "got #{e.class.name}: #{e.message.inspect}"
+ sleep 2
+ retry
+ end
+ raise
+ end
+ rescue SocketError, Net::IMAP::Error, SystemCallError, IOError, OpenSSL::SSL::SSLError => e
+ raise FatalSourceError, "While communicating with IMAP server (type #{e.class.name}): #{e.message.inspect}"
+ end
+ end
+
+end
end