* lib/find.rb (Find.find): respect the encodings of arguments.

[ruby-dev:47530] [Feature #8657]

* test/test_find.rb: add tests.

git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@42866 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
This commit is contained in:
ktsj 2013-09-07 04:34:27 +00:00
parent dd946739dd
commit 0a4801e768
3 changed files with 64 additions and 17 deletions

View File

@ -1,3 +1,10 @@
Sat Sep 7 13:29:22 2013 Kazuki Tsujimoto <kazuki@callcc.net>
* lib/find.rb (Find.find): respect the encodings of arguments.
[ruby-dev:47530] [Feature #8657]
* test/test_find.rb: add tests.
Sat Sep 7 10:40:32 2013 Tanaka Akira <akr@fsij.org> Sat Sep 7 10:40:32 2013 Tanaka Akira <akr@fsij.org>
* ext/socket/mkconstants.rb (TCP_FASTOPEN): Defined for TCP fast open. * ext/socket/mkconstants.rb (TCP_FASTOPEN): Defined for TCP fast open.

View File

@ -37,30 +37,36 @@ module Find
def find(*paths) # :yield: path def find(*paths) # :yield: path
block_given? or return enum_for(__method__, *paths) block_given? or return enum_for(__method__, *paths)
paths.collect!{|d| raise Errno::ENOENT unless File.exist?(d); d.dup} fs_encoding = Encoding.find("filesystem")
while file = paths.shift
catch(:prune) do paths.collect!{|d| raise Errno::ENOENT unless File.exist?(d); d.dup}.each do |path|
yield file.dup.taint enc = path.encoding == Encoding::US_ASCII ? fs_encoding : path.encoding
begin ps = [path]
s = File.lstat(file) while file = ps.shift
rescue Errno::ENOENT, Errno::EACCES, Errno::ENOTDIR, Errno::ELOOP, Errno::ENAMETOOLONG catch(:prune) do
next yield file.dup.taint
end
if s.directory? then
begin begin
fs = Dir.entries(file) s = File.lstat(file)
rescue Errno::ENOENT, Errno::EACCES, Errno::ENOTDIR, Errno::ELOOP, Errno::ENAMETOOLONG rescue Errno::ENOENT, Errno::EACCES, Errno::ENOTDIR, Errno::ELOOP, Errno::ENAMETOOLONG
next next
end end
fs.sort! if s.directory? then
fs.reverse_each {|f| begin
next if f == "." or f == ".." fs = Dir.entries(file, encoding: enc)
f = File.join(file, f) rescue Errno::ENOENT, Errno::EACCES, Errno::ENOTDIR, Errno::ELOOP, Errno::ENAMETOOLONG
paths.unshift f.untaint next
} end
fs.sort!
fs.reverse_each {|f|
next if f == "." or f == ".."
f = File.join(file, f)
ps.unshift f.untaint
}
end
end end
end end
end end
nil
end end
# #

View File

@ -210,6 +210,40 @@ class TestFind < Test::Unit::TestCase
} }
end end
# Walks a temporary tree whose root path is passed to Find.find encoded as
# US-ASCII, and checks that every path handed to the block is
# encoding-compatible with the root re-encoded in the filesystem encoding.
def test_encoding_ascii
  Dir.mktmpdir do |d|
    # Fixture: one empty file and one empty sub-directory under the root.
    File.write("#{d}/a", "")
    Dir.mkdir("#{d}/b")

    ascii_root = d.encode(Encoding::US_ASCII)
    found = []
    Find.find(ascii_root) { |path| found << path }

    found.each do |path|
      assert(Encoding.compatible?(d.encode(Encoding.find('filesystem')), path))
    end
  end
end
# Passes the same temporary root to Find.find three times, encoded as EUC-JP,
# Windows-31J and UTF-8, and checks that each yielded path carries the
# encoding of the root argument it was discovered under.
def test_encoding_non_ascii
  Dir.mktmpdir do |d|
    # Fixture: one empty file and one empty sub-directory under the root.
    File.write("#{d}/a", "")
    Dir.mkdir("#{d}/b")

    encodings = [Encoding::EUC_JP, Encoding::Windows_31J, Encoding::UTF_8]
    roots = encodings.map { |enc| d.encode(enc) }

    visited = []
    Find.find(*roots) { |f| visited << [f, f.encoding] }

    # Each root contributes its own full walk (root, a, b), in argument order.
    tree = [d, "#{d}/a", "#{d}/b"]
    expected = encodings.flat_map { |enc| tree.map { |path| [path, enc] } }
    assert_equal(expected, visited)

    # Only on mswin/mingw platforms: add an entry with a non-ASCII name and
    # walk the tree again from a UTF-8 root.
    if /mswin|mingw/ =~ RUBY_PLATFORM
      utf_8 = Encoding::UTF_8
      visited = []
      Dir.mkdir("#{d}/\u{2660}")
      Find.find("#{d}".encode(utf_8)) { |f| visited << [f, f.encoding] }
      expected = [d, "#{d}/a", "#{d}/b", "#{d}/\u{2660}"].map { |path| [path, utf_8] }
      assert_equal(expected, visited)
    end
  end
end
class TestInclude < Test::Unit::TestCase class TestInclude < Test::Unit::TestCase
include Find include Find