rex-text/lib/rex/text/hex.rb

201 lines
6.8 KiB
Ruby

module Rex
module Text
# We are re-opening the module to add these module methods.
# Breaking them up this way allows us to maintain a little higher
# degree of organisation and make it easier to find what you're looking for
# without hanging the underlying calls that we historically rely upon.
#
# Returns the escaped hex version of the supplied string
#
# @example
# Rex::Text.to_hex("asdf") # => "\\x61\\x73\\x64\\x66"
#
# @param str (see to_octal)
# @param prefix (see to_octal)
# @param count [Integer] Number of bytes to put in each escape chunk
# @return [String] The escaped hex version of +str+
def self.to_hex(str, prefix = "\\x", count = 1)
raise ::RuntimeError, "unable to chunk into #{count} byte chunks" if ((str.length % count) > 0)
# XXX: Regexp.new is used here since using /.{#{count}}/o would compile
# the regex the first time it is used and never check again. Since we
# want to know how many to capture on every instance, we do it this
# way.
return str.unpack('H*')[0].gsub(Regexp.new(".{#{count * 2}}", Regexp::NOENCODING)) { |s| prefix + s }
end
#
# Returns the string with nonprintable hex characters sanitized to ascii.
# Similiar to {.to_hex}, but regular ASCII is not translated if +count+ is 1.
#
# @example
# Rex::Text.to_hex_ascii("\x7fABC\0") # => "\\x7fABC\\x00"
#
# @param str (see to_hex)
# @param prefix (see to_hex)
# @param count (see to_hex)
# @param suffix [String,nil] A string to append to the converted bytes
# @return [String] The original string with non-printables converted to
# their escaped hex representation
def self.to_hex_ascii(str, prefix = "\\x", count = 1, suffix=nil)
raise ::RuntimeError, "unable to chunk into #{count} byte chunks" if ((str.length % count) > 0)
return str.unpack('H*')[0].gsub(Regexp.new(".{#{count * 2}}", Regexp::NOENCODING)) { |s|
(0x20..0x7e) === s.to_i(16) ? s.to_i(16).chr : prefix + s + suffix.to_s
}
end
#
# Converts a string to a nicely formatted hex dump
#
# @param str [String] The string to convert
# @param width [Integer] Number of bytes to convert before adding a newline
# @param base [Integer] The base address of the dump
def self.to_hex_dump(str, width=16, base=nil)
buf = ''
idx = 0
cnt = 0
snl = false
lst = 0
lft_col_len = (base.to_i+str.length).to_s(16).length
lft_col_len = 8 if lft_col_len < 8
while (idx < str.length)
chunk = str[idx, width]
addr = base ? "%0#{lft_col_len}x " %(base.to_i + idx) : ''
line = chunk.unpack("H*")[0].scan(/../).join(" ")
buf << addr + line
if (lst == 0)
lst = line.length
buf << " " * 4
else
buf << " " * ((lst - line.length) + 4).abs
end
buf << "|"
chunk.unpack("C*").each do |c|
if (c > 0x1f and c < 0x7f)
buf << c.chr
else
buf << "."
end
end
buf << "|\n"
idx += width
end
buf << "\n"
end
#
# Converts a hex string to a raw string
#
# @example
# Rex::Text.hex_to_raw("\\x41\\x7f\\x42") # => "A\x7fB"
#
def self.hex_to_raw(str)
[ str.downcase.gsub(/'/,'').gsub(/\\?x([a-f0-9][a-f0-9])/, '\1') ].pack("H*")
end
#
# Turn non-printable chars into hex representations, leaving others alone
#
# If +whitespace+ is true, converts whitespace (0x20, 0x09, etc) to hex as
# well.
#
# @see hexify
# @see to_hex Converts all the chars
#
def self.ascii_safe_hex(str, whitespace=false)
# This sanitization is terrible and breaks everything if it finds unicode.
# ~4 Billion can't be wrong; long-term, this should be removed.
if str.encoding == (::Encoding::UTF_8)
return str
end
if whitespace
str.gsub(/([\x00-\x20\x80-\xFF])/n){ |x| "\\x%.2x" % x.unpack("C*")[0] }
else
str.gsub(/([\x00-\x08\x0b\x0c\x0e-\x1f\x80-\xFF])/n){ |x| "\\x%.2x" % x.unpack("C*")[0]}
end
end
#
# Converts a string to a hex version with wrapping support
#
def self.hexify(str, col = DefaultWrap, line_start = '', line_end = '', buf_start = '', buf_end = '')
self.hexify_general(str, "\\x", col, line_start, line_end, buf_start, buf_end)
end
#
# Converts a string to hex, with each character prefixed with 0x; with wrapping support
def self.numhexify(str, col = DefaultWrap, line_start = '', line_end = '', buf_start = '', buf_end = '', between = '')
self.hexify_general(str, "0x", col, line_start, line_end, buf_start, buf_end, between)
end
#
# Convert hex-encoded characters to literals.
#
# @example
# Rex::Text.dehex("AA\\x42CC") # => "AABCC"
#
# @see hex_to_raw
# @param str [String]
def self.dehex(str)
return str unless str.respond_to? :match
return str unless str.respond_to? :gsub
regex = /\x5cx[0-9a-f]{2}/nmi
if str.match(regex)
str.gsub(regex) { |x| x[2,2].to_i(16).chr }
else
str
end
end
#
# Convert and replace hex-encoded characters to literals.
#
# @param (see dehex)
def self.dehex!(str)
return str unless str.respond_to? :match
return str unless str.respond_to? :gsub
regex = /\x5cx[0-9a-f]{2}/nmi
str.gsub!(regex) { |x| x[2,2].to_i(16).chr }
end
private
#
# General-case method to handle both "\xAA\xBB\xCC" format and 0xAA,0xBB,0xCC format
#
def self.hexify_general(str, char_prefix, col = DefaultWrap, line_start = '', line_end = '', buf_start = '', buf_end = '', between='', char_suffix: '')
encoded_char_length = 2 + char_prefix.length + char_suffix.length + between.length
if col < line_start.length + encoded_char_length + line_end.length
# raise an exception
raise ArgumentError.new('insufficient column width')
end
ret = buf_start.dup
ret << line_start if ret.end_with?("\n")
last_newline = ret.rindex("\n") || -1
last_line_length = ret.length - last_newline - 1
str.each_char do |char|
# Check if we're going over the wrap boundary
if last_line_length + encoded_char_length + line_end.length > col
ret << "#{line_end}\n#{line_start}"
last_line_length = line_start.length
end
ret << char_prefix << char.unpack('H*')[0] << char_suffix << between
last_line_length += encoded_char_length
end
# Remove the last in-between characters, if required
ret = ret[0..ret.length - 1 - between.length] unless str.empty?
ret << "\n" if last_line_length + buf_end.length > col
ret << "#{buf_end}\n"
end
end
end