trabajo-afectivo/app/models/channel/email_parser.rb

481 lines
15 KiB
Ruby
Raw Normal View History

2012-06-15 11:10:23 +00:00
# encoding: utf-8
require 'mail'
require 'iconv'
class Channel::EmailParser
def conv (charset, string)
2012-05-07 22:37:07 +00:00
if !charset || charset == 'US-ASCII' || charset == 'ASCII-8BIT'
charset = 'LATIN1'
end
2012-05-04 19:30:22 +00:00
return string if charset.downcase == 'utf8' || charset.downcase == 'utf-8'
# puts '-------' + charset
# puts string
# string.encode("UTF-8")
Iconv.conv( 'UTF8', charset, string )
end
=begin
mail = parse( msg_as_string )
mail = {
:from => 'Some Name <some@example.com>',
:from_email => 'some@example.com',
:from_local => 'some',
:from_domain => 'example.com',
:from_display_name => 'Some Name',
:message_id => 'some_message_id@example.com',
2012-10-04 07:09:27 +00:00
:to => 'Some System <system@example.com>',
:cc => 'Somebody <somebody@example.com>',
:subject => 'some message subject',
:body => 'some message body',
:attachments => [
2012-10-04 07:09:27 +00:00
{
:data => 'binary of attachment',
:filename => 'file_name_of_attachment.txt',
:preferences => {
:content-alternative => true,
:Mime-Type => 'text/plain',
:Charset => 'iso-8859-1',
},
},
],
2012-10-04 07:09:27 +00:00
# ignore email header
:x-zammad-ignore => 'false',
# customer headers
:x-zammad-customer-login => '',
:x-zammad-customer-email => '',
:x-zammad-customer-firstname => '',
:x-zammad-customer-lastname => '',
# ticket headers
:x-zammad-group => 'some_group',
:x-zammad-state => 'some_state',
:x-zammad-priority => 'some_priority',
:x-zammad-owner => 'some_owner_login',
# article headers
:x-zammad-article-visability => 'true',
:x-zammad-article-type => 'agent',
:x-zammad-article-sender => 'customer',
# all other email headers
:some-header => 'some_value',
}
=end
def parse (msg)
data = {}
mail = Mail.new( msg )
# set all headers
mail.header.fields.each { |field|
data[field.name.downcase.to_sym] = field.to_s
}
# set extra headers
data[:from_email] = Mail::Address.new( mail[:from].value ).address
data[:from_local] = Mail::Address.new( mail[:from].value ).local
data[:from_domain] = Mail::Address.new( mail[:from].value ).domain
2012-05-07 22:37:07 +00:00
data[:from_display_name] = Mail::Address.new( mail[:from].value ).display_name ||
( Mail::Address.new( mail[:from].value ).comments && Mail::Address.new( mail[:from].value ).comments[0] )
# do extra decoding because we needed to use field.value
data[:from_display_name] = Mail::Field.new( 'X-From', data[:from_display_name] ).to_s
# compat headers
data[:message_id] = data['message-id'.to_sym]
# body
2012-05-04 19:30:22 +00:00
# plain_part = mail.multipart? ? (mail.text_part ? mail.text_part.body.decoded : nil) : mail.body.decoded
# html_part = message.html_part ? message.html_part.body.decoded : nil
2012-05-07 22:37:07 +00:00
data[:attachments] = []
2012-07-02 18:52:27 +00:00
# multi part email
2012-05-04 19:30:22 +00:00
if mail.multipart?
2012-06-15 11:27:52 +00:00
2012-07-02 18:52:27 +00:00
# text attachment/body exists
2012-06-15 11:10:23 +00:00
if mail.text_part
data[:body] = mail.text_part.body.decoded
data[:body] = conv( mail.text_part.charset, data[:body] )
2012-06-15 11:27:52 +00:00
2012-07-02 18:52:27 +00:00
# html attachment/body may exists and will be converted to text
2012-06-15 11:10:23 +00:00
else
filename = '-no name-'
if mail.html_part.body
filename = 'html-email'
data[:body] = mail.html_part.body.to_s
data[:body] = conv( mail.html_part.charset.to_s, data[:body] )
data[:body] = html2ascii( data[:body] )
2012-06-15 11:10:23 +00:00
# any other attachments
else
data[:body] = 'no visible content'
2012-06-15 11:10:23 +00:00
end
2012-07-02 18:52:27 +00:00
end
2012-06-15 11:10:23 +00:00
2012-07-02 18:52:27 +00:00
# add html attachment/body as real attachment
if mail.html_part
filename = 'message.html'
headers_store = {
'content-alternative' => true,
}
2012-06-15 11:10:23 +00:00
if mail.mime_type
headers_store['Mime-Type'] = mail.html_part.mime_type
end
if mail.charset
headers_store['Charset'] = mail.html_part.charset
end
attachment = {
2012-06-15 11:27:52 +00:00
:data => mail.html_part.body.to_s,
2012-06-15 11:10:23 +00:00
:filename => mail.html_part.filename || filename,
:preferences => headers_store
2012-06-15 11:10:23 +00:00
}
data[:attachments].push attachment
end
2012-07-02 18:52:27 +00:00
# get attachments
if mail.has_attachments?
mail.attachments.each { |file|
# get file preferences
headers_store = {}
file.header.fields.each { |field|
headers_store[field.name.to_s] = field.value.to_s
}
filename = nil
if file.header[:content_disposition].filename
filename = file.header[:content_disposition].filename
end
if file.header[:content_type].string
headers_store['Mime-Type'] = file.header[:content_type].string
end
if file.header.charset
headers_store['Charset'] = file.header.charset
end
2012-07-02 18:52:27 +00:00
# remove not needed header
headers_store.delete('Content-Transfer-Encoding')
headers_store.delete('Content-Disposition')
attach = {
:data => file.body.to_s,
:filename => filename,
:preferences => headers_store,
2012-07-02 18:52:27 +00:00
}
data[:attachments].push attach
}
end
# not multipart email
2012-05-04 19:30:22 +00:00
else
2012-05-07 22:37:07 +00:00
# text part
if !mail.mime_type || mail.mime_type.to_s == '' || mail.mime_type.to_s.downcase == 'text/plain'
data[:body] = mail.body.decoded
data[:body] = conv( mail.charset, data[:body] )
2012-05-07 22:37:07 +00:00
2012-07-02 18:52:27 +00:00
# html part
else
2012-05-07 22:37:07 +00:00
filename = '-no name-'
if mail.mime_type.to_s.downcase == 'text/html'
filename = 'html-email'
data[:body] = mail.body.decoded
data[:body] = conv( mail.charset, data[:body] )
data[:body] = html2ascii( data[:body] )
2012-05-07 22:37:07 +00:00
# any other attachments
else
data[:body] = 'no visible content'
2012-05-07 22:37:07 +00:00
end
# add body as attachment
2012-07-02 18:52:27 +00:00
headers_store = {
'content-alternative' => true,
}
2012-05-07 22:37:07 +00:00
if mail.mime_type
headers_store['Mime-Type'] = mail.mime_type
end
if mail.charset
headers_store['Charset'] = mail.charset
end
attachment = {
:data => mail.body.decoded,
:filename => mail.filename || filename,
:preferences => headers_store
}
data[:attachments].push attachment
end
2012-05-04 19:30:22 +00:00
end
2012-07-02 18:52:27 +00:00
# strip not wanted chars
data[:body].gsub!( /\r\n/, "\n" )
data[:body].gsub!( /\r/, "\n" )
2012-07-02 18:52:27 +00:00
return data
end
def process(channel, msg)
mail = parse( msg )
2012-05-06 20:48:23 +00:00
# check if trust x-headers
if !channel[:trusted]
mail.each {|key, value|
if key =~ /^x-zammad/i
mail.delete(key)
end
}
end
2012-10-04 07:09:27 +00:00
# process postmaster filter
2012-05-06 20:48:23 +00:00
# check ignore header
return true if mail[ 'x-zammad-ignore'.to_sym ] == 'true' || mail[ 'x-zammad-ignore'.to_sym ] == true
ticket = nil
article = nil
user = nil
# use transaction
ActiveRecord::Base.transaction do
2012-05-06 20:48:23 +00:00
if mail[ 'x-zammad-customer-login'.to_sym ]
user = User.where( :login => mail[ 'x-zammad-customer-login'.to_sym ] ).first
end
if !user
user = User.where( :email => mail[ 'x-zammad-customer-email'.to_sym ] || mail[:from_email] ).first
end
if !user
puts 'create user...'
roles = Role.where( :name => 'Customer' )
user = User.create(
2012-05-06 20:48:23 +00:00
:login => mail[ 'x-zammad-customer-login'.to_sym ] || mail[ 'x-zammad-customer-email'.to_sym ] || mail[:from_email],
:firstname => mail[ 'x-zammad-customer-firstname'.to_sym ] || mail[:from_display_name],
:lastname => mail[ 'x-zammad-customer-lastname'.to_sym ],
:email => mail[ 'x-zammad-customer-email'.to_sym ] || mail[:from_email],
:password => '',
:active => true,
:roles => roles,
:created_by_id => 1
)
end
2012-10-04 07:09:27 +00:00
# set current user
UserInfo.current_user_id = user.id
2012-10-04 07:09:27 +00:00
# get ticket# from subject
ticket = Ticket.number_check( mail[:subject] )
# set ticket state to open if not new
if ticket
ticket_state = Ticket::State.find( ticket.ticket_state_id )
ticket_state_type = Ticket::StateType.find( ticket_state.ticket_state_type_id )
2012-08-28 05:21:45 +00:00
# if tickte is merged, find linked ticket
if ticket_state_type.name == 'merged'
end
if ticket_state_type.name != 'new'
ticket.ticket_state = Ticket::State.where( :name => 'open' ).first
ticket.save
end
end
# create new ticket
2012-05-06 20:48:23 +00:00
if !ticket
# set attributes
ticket_attributes = {
2012-05-04 19:30:22 +00:00
:group_id => channel[:group_id] || 1,
:customer_id => user.id,
2012-08-28 05:21:45 +00:00
:title => mail[:subject] || '',
2012-05-06 20:48:23 +00:00
:ticket_state_id => Ticket::State.where( :name => 'new' ).first.id,
:ticket_priority_id => Ticket::Priority.where( :name => '2 normal' ).first.id,
:created_by_id => user.id,
}
# x-headers lookup
map = [
[ 'x-zammad-group', Group, 'group_id', 'name' ],
[ 'x-zammad-state', Ticket::State, 'ticket_state_id', 'name' ],
[ 'x-zammad-priority', Ticket::Priority, 'ticket_priority_id', 'name' ],
[ 'x-zammad-owner', User, 'owner_id', 'login' ],
]
map.each { |item|
if mail[ item[0].to_sym ]
if item[1].where( item[3].to_sym => mail[ item[0].to_sym ] ).first
ticket_attributes[ item[2].to_sym ] = item[1].where( item[3].to_sym => mail[ item[0].to_sym ] ).first.id
end
end
}
# create ticket
ticket = Ticket.create( ticket_attributes )
end
# import mail
2012-05-06 20:48:23 +00:00
# set attributes
internal = false
if mail[ 'X-Zammad-Article-Visability'.to_sym ] && mail[ 'X-Zammad-Article-Visability'.to_sym ] == 'internal'
internal = true
end
article_attributes = {
:created_by_id => user.id,
:ticket_id => ticket.id,
2012-05-06 20:48:23 +00:00
:ticket_article_type_id => Ticket::Article::Type.where( :name => 'email' ).first.id,
:ticket_article_sender_id => Ticket::Article::Sender.where( :name => 'Customer' ).first.id,
:body => mail[:body],
:from => mail[:from],
:to => mail[:to],
:cc => mail[:cc],
:subject => mail[:subject],
:message_id => mail[:message_id],
2012-05-06 20:48:23 +00:00
:internal => internal,
}
# x-headers lookup
map = [
[ 'x-zammad-article-type', Ticket::Article::Type, 'ticket_article_type_id', 'name' ],
[ 'x-zammad-article-sender', Ticket::Article::Sender, 'ticket_article_sender_id', 'name' ],
]
map.each { |item|
if mail[ item[0].to_sym ]
if item[1].where( item[3].to_sym => mail[ item[0].to_sym ] ).first
article_attributes[ item[2].to_sym ] = item[1].where( item[3].to_sym => mail[ item[0].to_sym ] ).first.id
end
end
}
# create article
article = Ticket::Article.create(article_attributes)
# store mail plain
Store.add(
:object => 'Ticket::Article::Mail',
:o_id => article.id,
:data => msg,
2012-07-02 12:47:09 +00:00
:filename => "ticket-#{ticket.number}-#{article.id}.eml",
:preferences => {}
)
# store attachments
if mail[:attachments]
mail[:attachments].each do |attachment|
Store.add(
:object => 'Ticket::Article',
:o_id => article.id,
:data => attachment[:data],
:filename => attachment[:filename],
:preferences => attachment[:preferences]
)
end
end
end
# execute ticket events
Ticket::Observer::Notification.transaction
2012-05-06 20:48:23 +00:00
# return new objects
return ticket, article, user
end
2012-05-07 22:37:07 +00:00
def html2ascii(string)
# find <a href=....> and replace it with [x]
link_list = ''
counter = 0
string.gsub!( /<a\s.*?href=("|')(.+?)("|').*?>/ix ) { |item|
link = $2
counter = counter + 1
link_list += "[#{counter}] #{link}\n"
"[#{counter}]"
}
# remove empty lines
string.gsub!( /^\s*/m, '' )
# fix some bad stuff from opera and others
2012-06-15 11:10:23 +00:00
string.gsub!( /(\n\r|\r\r\n|\r\n)/, "\n" )
# strip all other tags
string.gsub!( /\<(br|br\/|br\s\/)\>/, "\n" )
2012-05-07 22:37:07 +00:00
# strip all other tags
2012-06-15 11:10:23 +00:00
string.gsub!( /\<.+?\>/, '' )
2012-05-07 22:37:07 +00:00
# encode html entities like "&#8211;"
string.gsub!( /(&\#(\d+);?)/x ) { |item|
$2.chr
}
# encode html entities like "&#3d;"
string.gsub!( /(&\#[xX]([0-9a-fA-F]+);?)/x ) { |item|
chr_orig = $1
hex = $2.hex
if hex
chr = hex.chr
if chr
chr
else
chr_orig
end
else
chr_orig
end
}
# remove empty lines
string.gsub!( /^\s*\n\s*\n/m, "\n" )
# add extracted links
if link_list
string += "\n\n" + link_list
end
return string
end
end
# workaround to parse subjects with 2 different encodings correctly (e. g. quoted-printable see test/fixtures/mail9.box)
module Mail
module Encodings
def Encodings.value_decode(str)
# Optimization: If there's no encoded-words in the string, just return it
return str unless str.index("=?")
str = str.gsub(/\?=(\s*)=\?/, '?==?') # Remove whitespaces between 'encoded-word's
# Split on white-space boundaries with capture, so we capture the white-space as well
str.split(/([ \t])/).map do |text|
if text.index('=?') .nil?
text
else
# Join QP encoded-words that are adjacent to avoid decoding partial chars
# text.gsub!(/\?\=\=\?.+?\?[Qq]\?/m, '') if text =~ /\?==\?/
# Search for occurences of quoted strings or plain strings
text.scan(/( # Group around entire regex to include it in matches
\=\?[^?]+\?([QB])\?[^?]+?\?\= # Quoted String with subgroup for encoding method
| # or
.+?(?=\=\?|$) # Plain String
)/xmi).map do |matches|
string, method = *matches
if method == 'b' || method == 'B'
b_value_decode(string)
elsif method == 'q' || method == 'Q'
q_value_decode(string)
else
string
end
end
end
end.join("")
end
end
end