##
# = Manipulates strings like the UNIX Bourne shell
#
# This module manipulates strings according to the word parsing rules
# of the UNIX Bourne shell.
#
# The shellwords() function was originally a port of shellwords.pl,
# but modified to conform to POSIX / SUSv3 (IEEE Std 1003.1-2001).
#
# == Example
#
#   argv = Shellwords.split('here are "two words"') # or String#shellsplit
#   argv #=> ["here", "are", "two words"]
#
#   argv = Shellwords.escape("special's.txt") # or String#shellescape
#   system("cat " + argv)
#
# == Authors:
#   * Wakou Aoyama
#   * Akinori MUSHA <knu@iDaemons.org>
#
# == Contact:
#   * Akinori MUSHA <knu@iDaemons.org> (current maintainer)
|
|
|
|
|
1998-01-16 15:19:09 +03:00
|
|
|
module Shellwords
  # Splits a string into an array of tokens in the same way the UNIX
  # Bourne shell does.
  #
  #   argv = Shellwords.split('here are "two words"')
  #   argv #=> ["here", "are", "two words"]
  #
  # Quoting rules:
  #
  # * Text in single quotes is taken literally.
  # * Inside double quotes a backslash is only meaningful in front of
  #   <tt>$</tt>, <tt>`</tt>, <tt>"</tt>, <tt>\\</tt> or a newline (POSIX
  #   Shell Command Language, 2.2.3 Double-Quotes); any other backslash
  #   is kept as is.
  # * Outside quotes a backslash escapes the character that follows it.
  #
  # +line+ is the command line string to split.  Returns an Array of
  # Strings.  Raises ArgumentError when +line+ contains an unmatched
  # single or double quote.
  #
  # String#shellsplit is a shorthand for this function.
  #
  #   argv = 'here are "two words"'.shellsplit
  #   argv #=> ["here", "are", "two words"]
  def shellsplit(line)
    words = []
    # Start from a mutable copy so this also works when string literals
    # are frozen.
    field = ''.dup
    line.scan(/\G\s*(?>([^\s\\\'\"]+)|'([^\']*)'|"((?:[^\"\\]|\\.)*)"|(\\.?)|(\S))(\s|\z)?/m) do
      |word, sq, dq, esc, garbage, sep|
      # The only way to reach the catch-all (\S) group is a quote
      # character that has no closing partner.
      raise ArgumentError, "Unmatched quote: #{line.inspect}" if garbage

      # An empty quoted string ('' or "") yields "", which is truthy in
      # Ruby, so the || chain still picks the right capture.
      field << (word || sq || (dq && dq.gsub(/\\([$`"\\\n])/, '\\1')) || esc.gsub(/\\(.)/, '\\1'))

      # A token ends only where whitespace or the end of input follows;
      # adjacent pieces such as foo"bar" are concatenated into one word.
      if sep
        words << field
        field = ''.dup
      end
    end
    words
  end

  alias shellwords shellsplit

  module_function :shellsplit, :shellwords

  class << self
    alias split shellsplit
  end

  # Escapes a string so that it can be safely used in a Bourne shell
  # command line.  +str+ can be a non-string object that responds to
  # +to_s+.
  #
  # Note that a resulted string should be used unquoted and is not
  # intended for use in double quotes nor in single quotes.
  #
  #   open("| grep #{Shellwords.escape(pattern)} file") { |pipe|
  #     # ...
  #   }
  #
  # String#shellescape is a shorthand for this function.
  #
  #   open("| grep #{pattern.shellescape} file") { |pipe|
  #     # ...
  #   }
  #
  # It is caller's responsibility to encode the string in the right
  # encoding for the shell environment where this string is used.
  # Multibyte characters are treated as multibyte characters, not
  # bytes.
  #
  # Always returns a new String; the argument is never modified.
  def shellescape(str)
    str = str.to_s

    # An empty argument will be skipped, so return empty quotes.
    return "''" if str.empty?

    # Backslash-escape every character outside the known-safe set.
    # Multibyte characters are escaped as whole characters.
    escaped = str.gsub(/([^A-Za-z0-9_\-.,:\/@\n])/, "\\\\\\1")

    # A LF cannot be escaped with a backslash because a backslash + LF
    # combo is regarded as line continuation and simply ignored.
    escaped.gsub(/\n/, "'\n'")
  end

  module_function :shellescape

  class << self
    alias escape shellescape
  end

  # Builds a command line string from an argument list +array+ joining
  # all elements escaped for Bourne shell into a single string with
  # fields separated by a space, where each element is stringified
  # using +to_s+.
  #
  #   open('|' + Shellwords.join(['grep', pattern, *files])) { |pipe|
  #     # ...
  #   }
  #
  # Array#shelljoin is a shorthand for this function.
  #
  #   open('|' + ['grep', pattern, *files].shelljoin) { |pipe|
  #     # ...
  #   }
  #
  # It is allowed to mix non-string objects in the elements as allowed
  # in Array#join.
  #
  #   output = `#{['ps', '-p', $$].shelljoin}`
  #
  def shelljoin(array)
    array.map { |arg| shellescape(arg) }.join(' ')
  end

  module_function :shelljoin

  class << self
    alias join shelljoin
  end
end
|
|
|
|
|
|
|
|
class String
  # call-seq:
  #   str.shellsplit => array
  #
  # Splits +str+ into an array of tokens in the same way the UNIX
  # Bourne shell does.  Delegates to Shellwords.shellsplit, passing the
  # receiver as the line to split; see that method for details.
  def shellsplit
    Shellwords.shellsplit(self)
  end

  # call-seq:
  #   str.shellescape => string
  #
  # Escapes +str+ so that it can be safely used in a Bourne shell
  # command line.  Delegates to Shellwords.shellescape, passing the
  # receiver as the string to escape; see that method for details.
  def shellescape
    Shellwords.shellescape(self)
  end
end
|
|
|
|
|
|
|
|
class Array
  # call-seq:
  #   array.shelljoin => string
  #
  # Builds a command line string from an argument list +array+ joining
  # all elements escaped for Bourne shell and separated by a space.
  # Delegates to Shellwords.shelljoin, passing the receiver as the
  # argument list; see that method for details.
  def shelljoin
    Shellwords.shelljoin(self)
  end
end
|