Author: labath Date: Mon Oct 31 11:22:07 2016 New Revision: 285593 URL: http://llvm.org/viewvc/llvm-project?rev=285593&view=rev Log: Improve ".." handling in FileSpec normalization
Summary: .. handling for windows path was completely broken because the function was expecting \ as path separators, but we were passing it normalized file paths, where these have been replaced by forward slashes. Apart from this, the function was incorrect for posix paths as well in some corner cases, as well as being generally hard to follow. The corner cases were: - /../bar -> should be same as /bar - /bar/.. -> should be same as / (slightly dodgy as the former depends on /bar actually existing, but since we're doing it in an abstract way, I think the transformation is reasonable) I rewrite the function to fix these corner cases and handle windows paths more correctly. The function should now handle the posix paths (modulo symlinks, but we cannot really do anything about that without a real filesystem). For windows paths, there are a couple of corner cases left, mostly to do with drive letter handling, which cannot be fixed until the rest of the class understands drive letters better. Reviewers: clayborg, zturner Subscribers: lldb-commits Differential Revision: https://reviews.llvm.org/D26081 Modified: lldb/trunk/include/lldb/Host/FileSpec.h lldb/trunk/source/Host/common/FileSpec.cpp lldb/trunk/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp lldb/trunk/unittests/Host/FileSpecTest.cpp Modified: lldb/trunk/include/lldb/Host/FileSpec.h URL: http://llvm.org/viewvc/llvm-project/lldb/trunk/include/lldb/Host/FileSpec.h?rev=285593&r1=285592&r2=285593&view=diff ============================================================================== --- lldb/trunk/include/lldb/Host/FileSpec.h (original) +++ lldb/trunk/include/lldb/Host/FileSpec.h Mon Oct 31 11:22:07 2016 @@ -620,22 +620,7 @@ public: /// Normalize a pathname by collapsing redundant separators and /// up-level references. //------------------------------------------------------------------ - void NormalizePath(); - - //------------------------------------------------------------------ - /// Run through the input string, replaying the effect of any ".." and produce - /// the resultant path. The input path is not required to be in the host file - /// system - /// format, but it is required to be normalized to that system. - /// - /// @param[in] input - /// The input path to analyze. - /// - /// @param[out] result - /// The backup-resolved path will be written here. - //------------------------------------------------------------------ - static void RemoveBackupDots(const ConstString &input_const_str, - ConstString &result_const_str); + FileSpec GetNormalizedPath() const; //------------------------------------------------------------------ /// Change the file specified with a new path. Modified: lldb/trunk/source/Host/common/FileSpec.cpp URL: http://llvm.org/viewvc/llvm-project/lldb/trunk/source/Host/common/FileSpec.cpp?rev=285593&r1=285592&r2=285593&view=diff ============================================================================== --- lldb/trunk/source/Host/common/FileSpec.cpp (original) +++ lldb/trunk/source/Host/common/FileSpec.cpp Mon Oct 31 11:22:07 2016 @@ -533,120 +533,73 @@ bool FileSpec::Equal(const FileSpec &a, if (!full && (a.GetDirectory().IsEmpty() || b.GetDirectory().IsEmpty())) return ConstString::Equals(a.m_filename, b.m_filename, case_sensitive); - else if (remove_backups == false) + + if (remove_backups == false) return a == b; - else { - if (!ConstString::Equals(a.m_filename, b.m_filename, case_sensitive)) - return false; - if (ConstString::Equals(a.m_directory, b.m_directory, case_sensitive)) - return true; - ConstString a_without_dots; - ConstString b_without_dots; - - RemoveBackupDots(a.m_directory, a_without_dots); - RemoveBackupDots(b.m_directory, b_without_dots); - return ConstString::Equals(a_without_dots, b_without_dots, case_sensitive); - } -} -void FileSpec::NormalizePath() { - ConstString normalized_directory; - FileSpec::RemoveBackupDots(m_directory, normalized_directory); - m_directory = normalized_directory; -} + if (a == b) + return true; -void FileSpec::RemoveBackupDots(const ConstString &input_const_str, - ConstString &result_const_str) { - const char *input = input_const_str.GetCString(); - result_const_str.Clear(); - if (!input || input[0] == '\0') - return; - - const char win_sep = '\\'; - const char unix_sep = '/'; - char found_sep; - const char *win_backup = "\\.."; - const char *unix_backup = "/.."; - - bool is_win = false; - - // Determine the platform for the path (win or unix): - - if (input[0] == win_sep) - is_win = true; - else if (input[0] == unix_sep) - is_win = false; - else if (input[1] == ':') - is_win = true; - else if (strchr(input, unix_sep) != nullptr) - is_win = false; - else if (strchr(input, win_sep) != nullptr) - is_win = true; - else { - // No separators at all, no reason to do any work here. - result_const_str = input_const_str; - return; - } + return Equal(a.GetNormalizedPath(), b.GetNormalizedPath(), full, false); +} - llvm::StringRef backup_sep; - if (is_win) { - found_sep = win_sep; - backup_sep = win_backup; +FileSpec FileSpec::GetNormalizedPath() const { + // Fast path. Do nothing if the path is not interesting. + if (!m_directory.GetStringRef().contains(".") && + (m_filename.GetStringRef() != ".." && m_filename.GetStringRef() != ".")) + return *this; + + llvm::SmallString<64> path, result; + const bool normalize = false; + GetPath(path, normalize); + llvm::StringRef rest(path); + + // We will not go below root dir. + size_t root_dir_start = RootDirStart(path, m_syntax); + const bool absolute = root_dir_start != llvm::StringRef::npos; + if (absolute) { + result += rest.take_front(root_dir_start + 1); + rest = rest.drop_front(root_dir_start + 1); } else { - found_sep = unix_sep; - backup_sep = unix_backup; + if (m_syntax == ePathSyntaxWindows && path.size() > 2 && path[1] == ':') { + result += rest.take_front(2); + rest = rest.drop_front(2); + } } - llvm::StringRef input_ref(input); - llvm::StringRef curpos(input); - - bool had_dots = false; - std::string result; - - while (1) { - // Start of loop - llvm::StringRef before_sep; - std::pair<llvm::StringRef, llvm::StringRef> around_sep = - curpos.split(backup_sep); - - before_sep = around_sep.first; - curpos = around_sep.second; - - if (curpos.empty()) { - if (had_dots) { - while (before_sep.startswith("//")) - before_sep = before_sep.substr(1); - if (!before_sep.empty()) { - result.append(before_sep.data(), before_sep.size()); - } - } - break; + bool anything_added = false; + llvm::SmallVector<llvm::StringRef, 0> components, processed; + rest.split(components, '/', -1, false); + processed.reserve(components.size()); + for (auto component : components) { + if (component == ".") + continue; // Skip these. + if (component != "..") { + processed.push_back(component); + continue; // Regular file name. } - had_dots = true; - - unsigned num_backups = 1; - while (curpos.startswith(backup_sep)) { - num_backups++; - curpos = curpos.slice(backup_sep.size(), curpos.size()); + if (!processed.empty()) { + processed.pop_back(); + continue; // Dots. Go one level up if we can. } + if (absolute) + continue; // We're at the top level. Cannot go higher than that. Skip. - size_t end_pos = before_sep.size(); - while (num_backups-- > 0) { - end_pos = before_sep.rfind(found_sep, end_pos); - if (end_pos == llvm::StringRef::npos) { - result_const_str = input_const_str; - return; - } - } - result.append(before_sep.data(), end_pos); + result += component; // We're a relative path. We need to keep these. + result += '/'; + anything_added = true; } + for (auto component : processed) { + result += component; + result += '/'; + anything_added = true; + } + if (anything_added) + result.pop_back(); // Pop last '/'. + else if (result.empty()) + result = "."; - if (had_dots) - result_const_str.SetCString(result.c_str()); - else - result_const_str = input_const_str; - - return; + return FileSpec(result, false, m_syntax); } //------------------------------------------------------------------ Modified: lldb/trunk/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp URL: http://llvm.org/viewvc/llvm-project/lldb/trunk/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp?rev=285593&r1=285592&r2=285593&view=diff ============================================================================== --- lldb/trunk/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp (original) +++ lldb/trunk/source/Plugins/ObjectFile/Mach-O/ObjectFileMachO.cpp Mon Oct 31 11:22:07 2016 @@ -5095,7 +5095,7 @@ uint32_t ObjectFileMachO::GetDependentMo FileSpec file_spec(path, true); // Remove any redundant parts of the path (like "../foo") since // LC_RPATH values often contain "..". - file_spec.NormalizePath(); + file_spec = file_spec.GetNormalizedPath(); if (file_spec.Exists() && files.AppendIfUnique(file_spec)) { count++; break; Modified: lldb/trunk/unittests/Host/FileSpecTest.cpp URL: http://llvm.org/viewvc/llvm-project/lldb/trunk/unittests/Host/FileSpecTest.cpp?rev=285593&r1=285592&r2=285593&view=diff ============================================================================== --- lldb/trunk/unittests/Host/FileSpecTest.cpp (original) +++ lldb/trunk/unittests/Host/FileSpecTest.cpp Mon Oct 31 11:22:07 2016 @@ -131,7 +131,6 @@ TEST(FileSpecTest, EqualSeparator) { Compare(forward, backward, !full_match, !remove_backup_dots, match); } -#if 0 TEST(FileSpecTest, EqualDotsWindows) { const bool full_match = true; const bool remove_backup_dots = true; @@ -142,6 +141,7 @@ TEST(FileSpecTest, EqualDotsWindows) { {R"(C:\bar\baz)", R"(C:/foo/../bar/baz)"}, {R"(C:/bar/baz)", R"(C:\foo\..\bar\baz)"}, {R"(C:\bar)", R"(C:\foo\..\bar)"}, + {R"(C:\foo\bar)", R"(C:\foo\.\bar)"}, }; for(const auto &test: tests) { @@ -151,11 +151,10 @@ TEST(FileSpecTest, EqualDotsWindows) { Compare(one, two, full_match, remove_backup_dots, match); Compare(one, two, full_match, !remove_backup_dots, !match); Compare(one, two, !full_match, remove_backup_dots, match); - Compare(one, two, !full_match, !remove_backup_dots, match); + Compare(one, two, !full_match, !remove_backup_dots, !match); } } -#endif TEST(FileSpecTest, EqualDotsPosix) { const bool full_match = true; @@ -164,7 +163,8 @@ TEST(FileSpecTest, EqualDotsPosix) { std::pair<const char *, const char *> tests[] = { {R"(/foo/bar/baz)", R"(/foo/foo/../bar/baz)"}, {R"(/bar/baz)", R"(/foo/../bar/baz)"}, -// {R"(/bar)", R"(/foo/../bar)"}, + {R"(/bar)", R"(/foo/../bar)"}, + {R"(/foo/bar)", R"(/foo/./bar)"}, }; for(const auto &test: tests) { @@ -174,19 +174,17 @@ TEST(FileSpecTest, EqualDotsPosix) { Compare(one, two, full_match, remove_backup_dots, match); Compare(one, two, full_match, !remove_backup_dots, !match); Compare(one, two, !full_match, remove_backup_dots, match); -// Compare(one, two, !full_match, !remove_backup_dots, match); + Compare(one, two, !full_match, !remove_backup_dots, !match); } } -#if 0 TEST(FileSpecTest, EqualDotsPosixRoot) { const bool full_match = true; const bool remove_backup_dots = true; const bool match = true; std::pair<const char *, const char *> tests[] = { - {R"(/)", R"(/..)"}, - {R"(/)", R"(/foo/..)"}, + {R"(/)", R"(/..)"}, {R"(/)", R"(/.)"}, {R"(/)", R"(/foo/..)"}, }; for(const auto &test: tests) { @@ -194,7 +192,66 @@ TEST(FileSpecTest, EqualDotsPosixRoot) { FileSpec two(test.second, false, FileSpec::ePathSyntaxPosix); EXPECT_NE(one, two); Compare(one, two, full_match, remove_backup_dots, match); - Compare(one, two, !full_match, remove_backup_dots, match); + Compare(one, two, full_match, !remove_backup_dots, !match); + Compare(one, two, !full_match, remove_backup_dots, !match); + Compare(one, two, !full_match, !remove_backup_dots, !match); + } +} + +TEST(FileSpecTest, GetNormalizedPath) { + std::pair<const char *, const char *> posix_tests[] = { + {"/foo/../bar", "/bar"}, + {"/foo/./bar", "/foo/bar"}, + {"/foo/..", "/"}, + {"/foo/.", "/foo"}, + {"/./foo", "/foo"}, + {"/", "/"}, + {"//", "//"}, + {"//net", "//net"}, + {"/..", "/"}, + {"/.", "/"}, + {"..", ".."}, + {".", "."}, + {"../..", "../.."}, + {"foo/..", "."}, + {"foo/../bar", "bar"}, + {"../foo/..", ".."}, + {"./foo", "foo"}, + }; + for (auto test : posix_tests) { + EXPECT_EQ(test.second, + FileSpec(test.first, false, FileSpec::ePathSyntaxPosix) + .GetNormalizedPath() + .GetPath()); + } + + std::pair<const char *, const char *> windows_tests[] = { + {R"(c:\bar\..\bar)", R"(c:\bar)"}, + {R"(c:\bar\.\bar)", R"(c:\bar\bar)"}, + {R"(c:\bar\..)", R"(c:\)"}, + {R"(c:\bar\.)", R"(c:\bar)"}, + {R"(c:\.\bar)", R"(c:\bar)"}, + {R"(\)", R"(\)"}, + // {R"(\\)", R"(\\)"}, + // {R"(\\net)", R"(\\net)"}, + {R"(c:\..)", R"(c:\)"}, + {R"(c:\.)", R"(c:\)"}, + {R"(\..)", R"(\)"}, + // {R"(c:..)", R"(c:..)"}, + {R"(..)", R"(..)"}, + {R"(.)", R"(.)"}, + {R"(c:..\..)", R"(c:..\..)"}, + {R"(..\..)", R"(..\..)"}, + {R"(foo\..)", R"(.)"}, + {R"(foo\..\bar)", R"(bar)"}, + {R"(..\foo\..)", R"(..)"}, + {R"(.\foo)", R"(foo)"}, + }; + for (auto test : windows_tests) { + EXPECT_EQ(test.second, + FileSpec(test.first, false, FileSpec::ePathSyntaxWindows) + .GetNormalizedPath() + .GetPath()) + << "Original path: " << test.first; } } -#endif _______________________________________________ lldb-commits mailing list lldb-commits@lists.llvm.org http://lists.llvm.org/cgi-bin/mailman/listinfo/lldb-commits