trabajo-afectivo/lib/core_ext/string.rb

class String
  # Quotes the string e-mail style: every line is prefixed with "> " and
  # terminated with "\n". Lines are obtained with split("\n"), so trailing
  # empty lines of the receiver do not appear in the result.
  # Returns a new String; the receiver is not modified.
  def message_quote
    split("\n").each_with_object(''.dup) do |line, quoted|
      quoted << '> ' << line << "\n"
    end
  end

  # Wraps each line that is longer than the configured width at whitespace.
  #
  # The width comes from the first positional argument or from the
  # :line_width option and defaults to 82; a positional argument takes
  # precedence over the option. Lines not exceeding the width are kept
  # unchanged. Returns the resulting lines joined with "\n".
  #
  # Relies on ActiveSupport's Array#extract_options!, Object#blank? and
  # Hash#reverse_merge!.
  def word_wrap(*args)
    options = args.extract_options!
    options[:line_width] = args[0] || 82 unless args.blank?
    options.reverse_merge!(line_width: 82)
    width = options[:line_width]

    wrapped = split("\n").map do |line|
      next line unless line.length > width

      # break after at most `width` characters, but only at whitespace or line end
      line.gsub(/(.{1,#{width}})(\s+|$)/, "\\1\n").strip
    end
    wrapped.join("\n")
  end

=begin

  filename = 'Some::Module'.to_filename

  returns
    'some/module'

=end

  # Builds a lower-case, slash-separated name from a namespaced constant
  # name by replacing every "::" with "/" and downcasing the result,
  # e.g. 'Some::Module' => 'some/module'. The receiver is not modified.
  def to_filename
    to_s.gsub('::', '/').downcase
  end

  # Because of MySQL InnoDB limitations, strip 4-byte UTF-8 chars (e. g. emojis).
  # Unfortunately utf8mb4 would bring other limitations (max varchar length and
  # smaller index sizes).
  # More details: http://pjambet.github.io/blog/emojis-and-mysql/
  #
  # Returns the receiver itself when the configured ActiveRecord adapter is not
  # 'mysql2' (nothing has to be stripped), otherwise a new String without the
  # characters that need more than 3 bytes. Every stripped character is logged
  # as a warning.
  def utf8_to_3bytesutf8
    # hand back the unchanged string instead of nil, so callers can always
    # use the return value
    return self if ActiveRecord::Base.connection_config[:adapter] != 'mysql2'

    each_char.reject do |char|
      four_bytes = char.bytesize > 3
      Rails.logger.warn "strip out 4 bytes utf8 chars '#{char}' of '#{self}'" if four_bytes
      four_bytes
    end.join
  end

=begin

  text = html_string.html2text

  returns

    'string with text'

=end

  # Converts an HTML fragment into plain text.
  #
  # Steps, in order: characters with invalid encoding are dropped, <a href>
  # tags are replaced by "[n] " markers (the link targets are appended as a
  # numbered list at the end), line breaks outside <pre>/<code> are removed,
  # list/quote/hr/br/closing block tags are turned into text markers or new
  # lines, all remaining tags are stripped and HTML entities are decoded.
  #
  # Returns a new, stripped String; the receiver is not modified.
  def html2text
    # work on a copy, all following gsub! calls mutate it
    string = "#{self}"

    # in case of invalid encoding, strip invalid chars
    # see also test/fixtures/mail21.box
    # note: string.encode!('UTF-8', 'UTF-8', :invalid => :replace, :replace => '?') was not detecting invalid chars
    if !string.valid_encoding?
      string = string.chars.select(&:valid_encoding?).join
    end

    # find <a href=....> and replace it with [x]
    link_list = ''
    counter   = 0
    string.gsub!( /<a\s.*?href=("|')(.+?)("|').*?>/ix ) {
      link = Regexp.last_match(2)
      counter += 1
      link_list += "[#{counter}] #{link}\n"
      "[#{counter}] "
    }

    # remove empty lines (and leading whitespace of every line)
    string.gsub!( /^\s*/m, '' )

    # pre/code handling 1/2: protect new lines inside <pre>/<code>
    string.gsub!( %r{<pre>(.+?)</pre>}m ) { |block|
      block.gsub(/\n/, '###BR###')
    }
    string.gsub!( %r{<code>(.+?)</code>}m ) { |block|
      block.gsub(/\n/, '###BR###')
    }

    # remove all new lines
    string.gsub!( /(\n\r|\r\r\n|\r\n|\n)/, '' )

    # pre/code handling 2/2: restore the protected new lines
    string.gsub!( /###BR###/, "\n" )

    # add counting
    string.gsub!(/<li(| [^>]*)>/i, "\n* ")

    # add quoting
    string.gsub!(/<blockquote(| [^>]*)>/i, '> ')

    # add hr
    string.gsub!(%r{<hr(|/| [^>]*)>}i, "___\n")

    # add new lines
    string.gsub!( %r{<(br|table)(|/| [^>]*)>}i, "\n" )
    string.gsub!( %r{</(div|p|pre|blockquote|table|tr)(|\s.+?)>}i, "\n" )
    string.gsub!( %r{</td>}i, ' '  )

    # strip all other tags
    string.gsub!( /\<.+?\>/, '' )

    # decode &amp; &lt; &gt; &quot; &nbsp; and numeric entities like
    # "&#8211;" or "&#x3d;" in ONE pass, so that already decoded text is never
    # decoded a second time (e. g. "&amp;lt;" has to become "&lt;", not "<")
    named_entities  = { 'amp' => '&', 'lt' => '<', 'gt' => '>', 'quot' => '"', 'nbsp' => ' ' }
    target_encoding = string.encoding
    string.gsub!( /&(?:(amp|lt|gt|quot|nbsp);|\#(\d+);?|\#[xX]([0-9a-fA-F]+);?)/ ) {
      match = Regexp.last_match
      if match[1]
        named_entities[ match[1] ]
      else
        codepoint = match[2] ? match[2].to_i : match[3].hex
        begin
          # Integer#chr raises RangeError for code points which are not valid
          char = codepoint.chr(Encoding::UTF_8)

          # non ascii chars have to fit into the encoding of the text
          char.ascii_only? ? char : char.encode(target_encoding)
        rescue RangeError, EncodingError
          '?'
        end
      end
    }

    # remove trailing empty spaces
    string.gsub!(/\s+\n$/, "\n")

    # remove multiple empty lines
    string.gsub!(/\n\n\n/, "\n\n")

    # add extracted links
    if link_list != ''
      string += "\n\n" + link_list
    end

    string.strip
  end

=begin

  html = text_string.text2html

=end

  # Escapes the string with CGI.escapeHTML, replaces every "\n" with '<br>'
  # and chomps the result. Returns a new String; the receiver is not modified.
  def text2html
    CGI.escapeHTML(self).gsub("\n", '<br>').chomp
  end

end
Moved to extra directory to extend ruby core. 2013-09-20 06:29:09 +00:00			`class String`
			`def message_quote`
Corrected with rubocop cop 'Style/RedundantSelf'. 2015-05-07 12:10:38 +00:00			`quote = split("\n")`
Moved to extra directory to extend ruby core. 2013-09-20 06:29:09 +00:00			`body_quote = ''`
			`quote.each do \|line\|`
			`body_quote = body_quote + '> ' + line + "\n"`
			`end`
			`body_quote`
			`end`
Corrected with rubocop cop 'Style/EmptyLineBetweenDefs'. 2015-05-07 10:27:12 +00:00
Moved to extra directory to extend ruby core. 2013-09-20 06:29:09 +00:00			`def word_wrap(*args)`
			`options = args.extract_options!`
			`unless args.blank?`
			`options[:line_width] = args[0] \|\| 82`
			`end`
Corrected with rubocop cop 'Style/HashSyntax'. 2015-04-27 13:42:53 +00:00			`options.reverse_merge!(line_width: 82)`
Moved to extra directory to extend ruby core. 2013-09-20 06:29:09 +00:00
			`lines = self`
			`lines.split("\n").collect do \|line\|`
			`line.length > options[:line_width] ? line.gsub(/(.{1,#{options[:line_width]}})(\s+\|$)/, "\\1\n").strip : line`
			`end * "\n"`
			`end`
Fixed manipulation of string in html2text. Added unit tests. 2015-01-09 13:17:34 +00:00
			`=begin`

			`filename = 'Some::Module'.to_filename`

			`returns`
			`'some/module'`

			`=end`

Improved object lookup for activity stream. 2013-10-07 07:00:26 +00:00			`def to_filename`
Fixed manipulation of string in html2text. Added unit tests. 2015-01-09 13:17:34 +00:00			`camel_cased_word = "#{self}"`
Improved object lookup for activity stream. 2013-10-07 07:00:26 +00:00			`camel_cased_word.gsub(/::/, '/').downcase`
			`end`
Because of mysql inno_db limitations, strip 4 bytes utf8 chars (e. g. emojis). Unfortunaly UTF8mb4 will raise other limitaions of max varchar and lower index sizes. More details: http://pjambet.github.io/blog/emojis-and-mysql/ 2014-06-01 08:29:58 +00:00
			`# because of mysql inno_db limitations, strip 4 bytes utf8 chars (e. g. emojis)`
			`# unfortunaly UTF8mb4 will raise other limitaions of max varchar and lower index sizes`
			`# More details: http://pjambet.github.io/blog/emojis-and-mysql/`
			`def utf8_to_3bytesutf8`
			`return if ActiveRecord::Base.connection_config[:adapter] != 'mysql2'`
Corrected with rubocop cop 'Style/RedundantSelf'. 2015-05-07 12:10:38 +00:00			`each_char.select {\|c\|`
Because of mysql inno_db limitations, strip 4 bytes utf8 chars (e. g. emojis). Unfortunaly UTF8mb4 will raise other limitaions of max varchar and lower index sizes. More details: http://pjambet.github.io/blog/emojis-and-mysql/ 2014-06-01 08:29:58 +00:00			`if c.bytes.count > 3`
Improved logging. 2015-05-05 08:26:53 +00:00			`Rails.logger.warn "strip out 4 bytes utf8 chars '#{c}' of '#{ self }'"`
Because of mysql inno_db limitations, strip 4 bytes utf8 chars (e. g. emojis). Unfortunaly UTF8mb4 will raise other limitaions of max varchar and lower index sizes. More details: http://pjambet.github.io/blog/emojis-and-mysql/ 2014-06-01 08:29:58 +00:00			`next`
			`end`
			`c`
			`}`
Corrected with rubocop cop 'Style/MultilineOperationIndentation'. 2015-05-05 13:23:45 +00:00			`.join('') # rubocop:disable Style/MultilineOperationIndentation`
Because of mysql inno_db limitations, strip 4 bytes utf8 chars (e. g. emojis). Unfortunaly UTF8mb4 will raise other limitaions of max varchar and lower index sizes. More details: http://pjambet.github.io/blog/emojis-and-mysql/ 2014-06-01 08:29:58 +00:00			`end`
Improved sending emails. 2014-12-27 15:25:58 +00:00
			`=begin`

			`text = html_string.html2text`

Fixed manipulation of string in html2text. Added unit tests. 2015-01-09 13:17:34 +00:00			`returns`

			`'string with text'`

Improved sending emails. 2014-12-27 15:25:58 +00:00			`=end`

			`def html2text`
Fixed manipulation of string in html2text. Added unit tests. 2015-01-09 13:17:34 +00:00			`string = "#{self}"`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00
			`# in case of invalid encodeing, strip invalid chars`
			`# see also test/fixtures/mail21.box`
			`# note: string.encode!('UTF-8', 'UTF-8', :invalid => :replace, :replace => '?') was not detecting invalid chars`
			`if !string.valid_encoding?`
Corrected with rubocop cop 'Style/SymbolProc'. 2015-05-07 10:25:16 +00:00			`string = string.chars.select(&:valid_encoding?).join`
Improved sending emails. 2014-12-27 15:25:58 +00:00			`end`

Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00			`# find <a href=....> and replace it with [x]`
			`link_list = ''`
			`counter = 0`
Corrected with rubocop cop 'Lint/UnusedBlockArgument'. 2015-05-07 09:49:46 +00:00			`string.gsub!( /<a\s.?href=("\|')(.+?)("\|').?>/ix ) {`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00			`link = $2`
			`counter = counter + 1`
			`link_list += "[#{counter}] #{link}\n"`
			`"[#{counter}] "`
			`}`

			`# remove empty lines`
			`string.gsub!( /^\s*/m, '' )`

			`# pre/code handling 1/2`
Corrected with rubocop cop 'Style/RegexpLiteral'. 2015-05-01 12:12:37 +00:00			`string.gsub!( %r{<pre>(.+?)</pre>}m ) { \|placeholder\|`
Corrected with rubocop cop 'Style/StringLiterals'. 2015-04-27 13:20:16 +00:00			`placeholder = placeholder.gsub(/\n/, '###BR###')`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00			`}`
Reworked regex r%{} 2015-05-01 13:17:17 +00:00			`string.gsub!( %r{<code>(.+?)</code>}m ) { \|placeholder\|`
Corrected with rubocop cop 'Style/StringLiterals'. 2015-04-27 13:20:16 +00:00			`placeholder = placeholder.gsub(/\n/, '###BR###')`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00			`}`

			`# remove all new lines`
			`string.gsub!( /(\n\r\|\r\r\n\|\r\n\|\n)/, '' )`

			`# pre/code handling 2/2`
			`string.gsub!( /###BR###/, "\n" )`

			`# add counting`
			`string.gsub!(/<li(\| [^>])>/i, "\n ")`

			`# add quoting`
			`string.gsub!(/<blockquote(\| [^>]*)>/i, '> ')`

			`# add hr`
Corrected with rubocop cop 'Style/RegexpLiteral'. 2015-05-01 12:12:37 +00:00			`string.gsub!(%r{<hr(\|/\| [^>]*)>}i, "___\n")`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00
			`# add new lines`
Reworked regex r%{} 2015-05-01 13:17:17 +00:00			`string.gsub!( %r{<(br\|table)(\|/\| [^>]*)>}i, "\n" )`
			`string.gsub!( %r{</(div\|p\|pre\|blockquote\|table\|tr)(\|\s.+?)>}i, "\n" )`
			`string.gsub!( %r{</td>}i, ' ' )`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00
			`# strip all other tags`
			`string.gsub!( /\<.+?\>/, '' )`

			`# strip all & < > "`
			`string.gsub!( '&', '&' )`
			`string.gsub!( '<', '<' )`
			`string.gsub!( '>', '>' )`
			`string.gsub!( '"', '"' )`
			`string.gsub!( ' ', ' ' )`

			`# encode html entities like "–"`
Corrected with rubocop cop 'Lint/UnusedBlockArgument'. 2015-05-07 09:49:46 +00:00			`string.gsub!( /(&\#(\d+);?)/x ) {`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00			`$2.chr`
			`}`

			`# encode html entities like "&#3d;"`
Corrected with rubocop cop 'Lint/UnusedBlockArgument'. 2015-05-07 09:49:46 +00:00			`string.gsub!( /(&\#[xX]([0-9a-fA-F]+);?)/x ) {`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00			`chr_orig = $1`
			`hex = $2.hex`
			`if hex`
			`chr = hex.chr`
			`if chr`
			`chr_orig = chr`
			`else`
			`chr_orig`
			`end`
			`else`
			`chr_orig`
			`end`

			`# check valid encoding`
			`begin`
			`if !chr_orig.encode('UTF-8').valid_encoding?`
			`chr_orig = '?'`
			`end`
			`rescue`
			`chr_orig = '?'`
			`end`
			`chr_orig`
			`}`

			`# remove tailing empty spaces`
			`string.gsub!(/\s+\n$/, "\n")`

			`# remove multible empty lines`
			`string.gsub!(/\n\n\n/, "\n\n")`

			`# add extracted links`
			`if link_list != ''`
			`string += "\n\n" + link_list`
Improved sending emails. 2014-12-27 15:25:58 +00:00			`end`
Improved unit tests, merged html2ascii to html2text. 2015-01-08 14:27:44 +00:00
			`string.strip`
Improved sending emails. 2014-12-27 15:25:58 +00:00			`end`
Moved to html notifications. 2015-01-03 22:53:07 +00:00
			`=begin`

			`html = text_string.text2html`

			`=end`

			`def text2html`
			`text = CGI.escapeHTML( self )`
			`text.gsub!(/\n/, '<br>')`
			`text.chomp`
			`end`

Applied rubocop Style/TrailingBlankLines. 2015-04-27 14:15:29 +00:00			`end`