8 yaml_properties :uri, :cur_offset, :usual, :archived, :id, :labels
9 def initialize uri_or_fp, start_offset=nil, usual=true, archived=false, id=nil, labels=[]
10 super uri_or_fp, start_offset, usual, archived, id
13 @labels = (labels || []).freeze
18 raise ArgumentError, "not an mbox uri" unless uri.scheme == "mbox"
19 raise ArgumentError, "mbox uri ('#{uri}') cannot have a host: #{uri.host}" if uri.host
20 @f = File.open uri.path
26 def self.suggest_labels_for path
27 ## heuristic: use the filename as a label, unless the file
28 ## has a path that probably represents an inbox.
29 if File.dirname(path) =~ /\b(var|usr|spool)\b/
32 [File.basename(path).intern]
37 if (cur_offset ||= start_offset) > end_offset
38 raise OutOfSyncSourceError, "mbox file is smaller than last recorded message offset. Messages have probably been deleted by another client."
42 def start_offset; 0; end ## first offset of this source: always 0
43 def end_offset; File.size @f; end ## last offset of this source: the current size in bytes of the open file @f
45 def load_header offset
51 raise OutOfSyncSourceError, "mismatch in mbox file offset #{offset.inspect}: #{l.inspect}."
53 header = MBox::read_header @f
58 def load_message offset
62 RMail::Mailbox::MBoxReader.new(@f).each_message do |input|
63 return RMail::Parser.read(input)
65 rescue RMail::Parser::Error => e
66 raise FatalSourceError, "error parsing mbox file: #{e.message}"
75 until @f.eof? || (l = @f.gets) =~ /^$/
82 def raw_full_message offset
84 each_raw_full_message_line(offset) { |l| ret += l }
88 ## apparently it's a million times faster to call this directly if
89 ## we're just moving messages around on disk, than reading things
90 ## into memory with raw_full_message.
92 ## I hoped never to have to move shit around on disk, but
93 ## sup-sync-back has to do it.
94 def each_raw_full_message_line offset
98 until @f.eof? || (l = @f.gets) =~ BREAK_RE
105 returned_offset = nil
106 next_offset = cur_offset
109 @mutex.synchronize do
112 ## cur_offset could be at one of two places here:
114 ## 1. before a \n and an mbox separator, if it was previously at
115 ## EOF and a new message was added; or,
116 ## 2. at the beginning of an mbox separator (in all other
119 l = @f.gets or raise "next while at EOF"
120 if l =~ /^\s*$/ # case 1
121 returned_offset = @f.tell
122 @f.gets # now we're at a BREAK_RE, so skip past it
124 returned_offset = cur_offset
125 ## we've already skipped past the BREAK_RE, so just go
128 while(line = @f.gets)
129 break if line =~ BREAK_RE
130 next_offset = @f.tell
133 rescue SystemCallError, IOError => e
134 raise FatalSourceError, "Error reading #{@f.path}: #{e.message}"
137 self.cur_offset = next_offset
138 [returned_offset, @labels]