From 8c72fc9bf09071300b6283411b4481456aac7e34 Mon Sep 17 00:00:00 2001 From: knu Date: Thu, 12 Jan 2012 18:42:03 +0000 Subject: * lib/shellwords.rb (Shellwords#shellsplit): Fix a bug where consecutive backslashes in double quotes are all removed except the one at the tail. git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@34285 b2dd03c8-39d4-4d8f-98ff-823fe69b080e --- ChangeLog | 6 ++++++ lib/shellwords.rb | 2 +- test/test_shellwords.rb | 9 +++++++++ 3 files changed, 16 insertions(+), 1 deletion(-) diff --git a/ChangeLog b/ChangeLog index 6685cbdb34..b88e7959bd 100644 --- a/ChangeLog +++ b/ChangeLog @@ -1,3 +1,9 @@ +Fri Jan 13 03:38:36 2012 Akinori MUSHA + + * lib/shellwords.rb (Shellwords#shellsplit): Fix a bug where + consecutive backslashes in double quotes are all removed except + the one at the tail. + Fri Jan 13 03:28:00 2012 Luis Lavena * ext/socket/extconf.rb (if ipv6): only define _WIN32_WINNT if was not diff --git a/lib/shellwords.rb b/lib/shellwords.rb index a83d1f1c86..20ddfe2646 100644 --- a/lib/shellwords.rb +++ b/lib/shellwords.rb @@ -41,7 +41,7 @@ module Shellwords line.scan(/\G\s*(?>([^\s\\\'\"]+)|'([^\']*)'|"((?:[^\"\\]|\\.)*)"|(\\.?)|(\S))(\s|\z)?/m) do |word, sq, dq, esc, garbage, sep| raise ArgumentError, "Unmatched double quote: #{line.inspect}" if garbage - field << (word || sq || (dq || esc).gsub(/\\(?=.)/, '')) + field << (word || sq || (dq || esc).gsub(/\\(.)/, '\\1')) if sep words << field field = '' diff --git a/test/test_shellwords.rb b/test/test_shellwords.rb index 593f0e0aea..bd44aec1af 100644 --- a/test/test_shellwords.rb +++ b/test/test_shellwords.rb @@ -38,6 +38,15 @@ class TestShellwords < Test::Unit::TestCase end end + def test_backslashes + cmdline, expected = [ + %q{/a//b///c////d/////e/ "/a//b///c////d/////e/ "'/a//b///c////d/////e/ '/a//b///c////d/////e/ }, + %q{a/b/c//d//e a/b/c//d//e /a//b///c////d/////e/ a/b/c//d//e } + ].map { |str| str.tr("/", "\\\\") } + + assert_equal [expected], shellwords(cmdline) + end + def test_multibyte_characters # This is not a spec. It describes the current behavior which may # be changed in future. There would be no multibyte character -- cgit v1.2.3