2013-09-20 06:29:09 +00:00
|
|
|
class String
|
|
|
|
def message_quote
|
2015-05-07 12:10:38 +00:00
|
|
|
quote = split("\n")
|
2013-09-20 06:29:09 +00:00
|
|
|
body_quote = ''
|
|
|
|
quote.each do |line|
|
|
|
|
body_quote = body_quote + '> ' + line + "\n"
|
|
|
|
end
|
|
|
|
body_quote
|
|
|
|
end
|
2015-05-07 10:27:12 +00:00
|
|
|
|
2013-09-20 06:29:09 +00:00
|
|
|
def word_wrap(*args)
|
|
|
|
options = args.extract_options!
|
|
|
|
unless args.blank?
|
|
|
|
options[:line_width] = args[0] || 82
|
|
|
|
end
|
2015-04-27 13:42:53 +00:00
|
|
|
options.reverse_merge!(line_width: 82)
|
2013-09-20 06:29:09 +00:00
|
|
|
|
|
|
|
lines = self
|
|
|
|
lines.split("\n").collect do |line|
|
|
|
|
line.length > options[:line_width] ? line.gsub(/(.{1,#{options[:line_width]}})(\s+|$)/, "\\1\n").strip : line
|
|
|
|
end * "\n"
|
|
|
|
end
|
2015-01-09 13:17:34 +00:00
|
|
|
|
|
|
|
=begin
|
|
|
|
|
|
|
|
filename = 'Some::Module'.to_filename
|
|
|
|
|
|
|
|
returns
|
|
|
|
'some/module'
|
|
|
|
|
|
|
|
=end
|
|
|
|
|
2013-10-07 07:00:26 +00:00
|
|
|
def to_filename
|
2015-01-09 13:17:34 +00:00
|
|
|
camel_cased_word = "#{self}"
|
2013-10-07 07:00:26 +00:00
|
|
|
camel_cased_word.gsub(/::/, '/').downcase
|
|
|
|
end
|
2014-06-01 08:29:58 +00:00
|
|
|
|
2015-06-30 14:45:03 +00:00
|
|
|
=begin
|
|
|
|
|
|
|
|
filename = 'some/module.rb'.to_classname
|
|
|
|
|
|
|
|
returns
|
|
|
|
'Some::Module'
|
|
|
|
|
|
|
|
=end
|
|
|
|
|
|
|
|
def to_classname
|
|
|
|
camel_cased_word = "#{self}"
|
|
|
|
camel_cased_word.gsub!(/\.rb$/, '')
|
|
|
|
camel_cased_word.split('/').map(&:camelize).join('::')
|
|
|
|
end
|
|
|
|
|
2014-06-01 08:29:58 +00:00
|
|
|
# because of mysql inno_db limitations, strip 4 bytes utf8 chars (e. g. emojis)
|
|
|
|
# unfortunaly UTF8mb4 will raise other limitaions of max varchar and lower index sizes
|
|
|
|
# More details: http://pjambet.github.io/blog/emojis-and-mysql/
|
|
|
|
def utf8_to_3bytesutf8
|
|
|
|
return if ActiveRecord::Base.connection_config[:adapter] != 'mysql2'
|
2015-05-07 12:10:38 +00:00
|
|
|
each_char.select {|c|
|
2014-06-01 08:29:58 +00:00
|
|
|
if c.bytes.count > 3
|
2015-07-03 15:18:01 +00:00
|
|
|
Rails.logger.warn "strip out 4 bytes utf8 chars '#{c}' of '#{self}'"
|
2014-06-01 08:29:58 +00:00
|
|
|
next
|
|
|
|
end
|
|
|
|
c
|
|
|
|
}
|
2015-05-05 13:23:45 +00:00
|
|
|
.join('') # rubocop:disable Style/MultilineOperationIndentation
|
2014-06-01 08:29:58 +00:00
|
|
|
end
|
2014-12-27 15:25:58 +00:00
|
|
|
|
|
|
|
=begin
|
|
|
|
|
|
|
|
text = html_string.html2text
|
|
|
|
|
2015-01-09 13:17:34 +00:00
|
|
|
returns
|
|
|
|
|
2015-09-02 07:14:48 +00:00
|
|
|
'string with text only'
|
2015-01-09 13:17:34 +00:00
|
|
|
|
2014-12-27 15:25:58 +00:00
|
|
|
=end
|
|
|
|
|
2015-09-02 07:14:48 +00:00
|
|
|
def html2text(string_only = false)
|
2015-01-09 13:17:34 +00:00
|
|
|
string = "#{self}"
|
2015-01-08 14:27:44 +00:00
|
|
|
|
|
|
|
# in case of invalid encodeing, strip invalid chars
|
|
|
|
# see also test/fixtures/mail21.box
|
|
|
|
# note: string.encode!('UTF-8', 'UTF-8', :invalid => :replace, :replace => '?') was not detecting invalid chars
|
|
|
|
if !string.valid_encoding?
|
2015-05-07 10:25:16 +00:00
|
|
|
string = string.chars.select(&:valid_encoding?).join
|
2014-12-27 15:25:58 +00:00
|
|
|
end
|
|
|
|
|
2015-01-08 14:27:44 +00:00
|
|
|
# find <a href=....> and replace it with [x]
|
|
|
|
link_list = ''
|
|
|
|
counter = 0
|
2015-09-02 07:14:48 +00:00
|
|
|
if !string_only
|
|
|
|
string.gsub!( /<a\s.*?href=("|')(.+?)("|').*?>/ix ) {
|
|
|
|
link = $2
|
|
|
|
counter = counter + 1
|
|
|
|
link_list += "[#{counter}] #{link}\n"
|
|
|
|
"[#{counter}] "
|
|
|
|
}
|
|
|
|
end
|
|
|
|
|
|
|
|
# remove style tags with content
|
2015-09-02 07:26:40 +00:00
|
|
|
string.gsub!( %r{<style(|\s.+?)>(.+?)</style>}im, '')
|
2015-01-08 14:27:44 +00:00
|
|
|
|
|
|
|
# remove empty lines
|
|
|
|
string.gsub!( /^\s*/m, '' )
|
|
|
|
|
|
|
|
# pre/code handling 1/2
|
2015-05-01 12:12:37 +00:00
|
|
|
string.gsub!( %r{<pre>(.+?)</pre>}m ) { |placeholder|
|
2015-04-27 13:20:16 +00:00
|
|
|
placeholder = placeholder.gsub(/\n/, '###BR###')
|
2015-01-08 14:27:44 +00:00
|
|
|
}
|
2015-05-01 13:17:17 +00:00
|
|
|
string.gsub!( %r{<code>(.+?)</code>}m ) { |placeholder|
|
2015-04-27 13:20:16 +00:00
|
|
|
placeholder = placeholder.gsub(/\n/, '###BR###')
|
2015-01-08 14:27:44 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
# remove all new lines
|
2015-09-02 07:14:48 +00:00
|
|
|
string.gsub!(/(\n\r|\r\r\n|\r\n|\n)/, '')
|
|
|
|
|
|
|
|
# blockquote handling
|
2015-09-02 07:26:40 +00:00
|
|
|
string.gsub!( %r{<blockquote(| [^>]*)>(.+?)</blockquote>}m ) {
|
|
|
|
"\n" + $2.html2text(true).gsub(/^(.*)$/, '> \1') + "\n"
|
2015-09-02 07:14:48 +00:00
|
|
|
}
|
2015-01-08 14:27:44 +00:00
|
|
|
|
|
|
|
# pre/code handling 2/2
|
2015-09-02 07:14:48 +00:00
|
|
|
string.gsub!(/###BR###/, "\n" )
|
2015-01-08 14:27:44 +00:00
|
|
|
|
|
|
|
# add counting
|
|
|
|
string.gsub!(/<li(| [^>]*)>/i, "\n* ")
|
|
|
|
|
|
|
|
# add hr
|
2015-09-02 07:14:48 +00:00
|
|
|
string.gsub!(%r{<hr(|/| [^>]*)>}i, "\n___\n")
|
|
|
|
|
|
|
|
# add h\d
|
|
|
|
string.gsub!(%r{</h\d>}i, "\n")
|
2015-01-08 14:27:44 +00:00
|
|
|
|
|
|
|
# add new lines
|
2015-09-02 07:14:48 +00:00
|
|
|
string.gsub!( %r{</div><div(|\s.+?)>}im, "\n" )
|
|
|
|
string.gsub!( %r{</p><p(|\s.+?)>}im, "\n" )
|
|
|
|
string.gsub!( %r{<(div|p|pre|br|table|h)(|/| [^>]*)>}i, "\n" )
|
|
|
|
string.gsub!( %r{</(tr|p|br|div)(|\s.+?)>}i, "\n" )
|
2015-05-01 13:17:17 +00:00
|
|
|
string.gsub!( %r{</td>}i, ' ' )
|
2015-01-08 14:27:44 +00:00
|
|
|
|
|
|
|
# strip all other tags
|
|
|
|
string.gsub!( /\<.+?\>/, '' )
|
|
|
|
|
2015-09-02 07:14:48 +00:00
|
|
|
# replace multible spaces with one
|
|
|
|
string.gsub!(/ /, ' ')
|
|
|
|
|
2015-01-08 14:27:44 +00:00
|
|
|
# strip all & < > "
|
|
|
|
string.gsub!( '&', '&' )
|
|
|
|
string.gsub!( '<', '<' )
|
|
|
|
string.gsub!( '>', '>' )
|
|
|
|
string.gsub!( '"', '"' )
|
|
|
|
string.gsub!( ' ', ' ' )
|
|
|
|
|
|
|
|
# encode html entities like "–"
|
2015-05-07 09:49:46 +00:00
|
|
|
string.gsub!( /(&\#(\d+);?)/x ) {
|
2015-01-08 14:27:44 +00:00
|
|
|
$2.chr
|
|
|
|
}
|
|
|
|
|
|
|
|
# encode html entities like "d;"
|
2015-05-07 09:49:46 +00:00
|
|
|
string.gsub!( /(&\#[xX]([0-9a-fA-F]+);?)/x ) {
|
2015-01-08 14:27:44 +00:00
|
|
|
chr_orig = $1
|
|
|
|
hex = $2.hex
|
|
|
|
if hex
|
|
|
|
chr = hex.chr
|
|
|
|
if chr
|
|
|
|
chr_orig = chr
|
|
|
|
else
|
|
|
|
chr_orig
|
|
|
|
end
|
|
|
|
else
|
|
|
|
chr_orig
|
|
|
|
end
|
|
|
|
|
|
|
|
# check valid encoding
|
|
|
|
begin
|
|
|
|
if !chr_orig.encode('UTF-8').valid_encoding?
|
|
|
|
chr_orig = '?'
|
|
|
|
end
|
|
|
|
rescue
|
|
|
|
chr_orig = '?'
|
|
|
|
end
|
|
|
|
chr_orig
|
|
|
|
}
|
|
|
|
|
|
|
|
# remove tailing empty spaces
|
|
|
|
string.gsub!(/\s+\n$/, "\n")
|
|
|
|
|
|
|
|
# remove multible empty lines
|
|
|
|
string.gsub!(/\n\n\n/, "\n\n")
|
|
|
|
|
2015-09-02 07:14:48 +00:00
|
|
|
string.strip!
|
|
|
|
|
2015-01-08 14:27:44 +00:00
|
|
|
# add extracted links
|
|
|
|
if link_list != ''
|
2015-09-02 07:14:48 +00:00
|
|
|
string += "\n\n\n" + link_list
|
2014-12-27 15:25:58 +00:00
|
|
|
end
|
2015-01-08 14:27:44 +00:00
|
|
|
|
|
|
|
string.strip
|
2014-12-27 15:25:58 +00:00
|
|
|
end
|
2015-01-03 22:53:07 +00:00
|
|
|
|
|
|
|
=begin
|
|
|
|
|
|
|
|
html = text_string.text2html
|
|
|
|
|
|
|
|
=end
|
|
|
|
|
|
|
|
def text2html
|
|
|
|
text = CGI.escapeHTML( self )
|
|
|
|
text.gsub!(/\n/, '<br>')
|
|
|
|
text.chomp
|
|
|
|
end
|
|
|
|
|
2015-04-27 14:15:29 +00:00
|
|
|
end
|