1 // Copyright (c) 2013 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 #include "tools/gn/filesystem_utils.h"
9 #include "base/file_util.h"
10 #include "base/logging.h"
11 #include "base/strings/string_util.h"
12 #include "base/strings/utf_string_conversions.h"
13 #include "build/build_config.h"
14 #include "tools/gn/location.h"
15 #include "tools/gn/settings.h"
16 #include "tools/gn/source_dir.h"
21 // The given dot is just part of a filename and is not special.
24 // The given dot is the current directory.
27 // The given dot is the first of a double dot that should take us up one.
31 // When we find a dot, this function is called with the character following
32 // that dot to see what it is. The return value indicates what type this dot is
33 // (see above). This code handles the case where the dot is at the end of the
// input.
36 // |*consumed_len| will contain the number of characters in the input that
37 // express what we found.
//
// |after_dot| is used as the index into |path| of the character right after
// the dot being classified. The visible checks run in this order: end of
// input, a slash, then a second dot that is itself at the end of the input or
// followed by a slash. Anything else yields NOT_A_DIRECTORY.
38 DotDisposition ClassifyAfterDot(const std::string& path,
40 size_t* consumed_len) {
41 if (after_dot == path.size()) {
42 // Single dot at the end.
46 if (IsSlash(path[after_dot])) {
47 // Single dot followed by a slash.
48 *consumed_len = 2; // Consume the slash
52 if (path[after_dot] == '.') {
// Look one character further to see what follows the second dot.
54 if (after_dot + 1 == path.size()) {
55 // Double dot at the end.
59 if (IsSlash(path[after_dot + 1])) {
60 // Double dot followed by a slash.
66 // The dots are followed by something else, not a directory.
68 return NOT_A_DIRECTORY;
// Maps one character to the form used when comparing Windows paths (see
// AreAbsoluteWindowsPathsEqual). The visible return lowercases ASCII letters
// via base::ToLowerASCII.
72 inline char NormalizeWindowsPathChar(char c) {
75 return base::ToLowerASCII(c);
78 // Attempts to do a case and slash-insensitive comparison of two 8-bit Windows
// paths. Both inputs are compared character by character after each character
// has been passed through NormalizeWindowsPathChar.
80 bool AreAbsoluteWindowsPathsEqual(const base::StringPiece& a,
81 const base::StringPiece& b) {
// The lengths are compared before any character is examined.
82 if (a.size() != b.size())
85 // For now, just do a case-insensitive ASCII comparison. We could convert to
86 // UTF-16 and use ICU if necessary. Or maybe base::strcasecmp is good enough?
87 for (size_t i = 0; i < a.size(); i++) {
// A mismatch after normalization means the two paths differ.
88 if (NormalizeWindowsPathChar(a[i]) != NormalizeWindowsPathChar(b[i]))
// Tests whether |path| starts like a Windows drive specification. The visible
// checks require an ASCII letter at index 0 and a slash at index 2; per the
// comment below, the colon (presumably at index 1) is tested first.
94 bool DoesBeginWindowsDriveLetter(const base::StringPiece& path) {
98 // Check colon first, this will generally fail fastest.
102 // Check drive letter
// NOTE(review): the lowercase range test is not wrapped in its own
// parentheses. The result is still correct because && binds tighter than ||,
// but compilers may warn about it; consider adding the parentheses.
103 if (!((path[0] >= 'A' && path[0] <= 'Z') ||
104 path[0] >= 'a' && path[0] <= 'z'))
// The character after the colon must be a path separator.
107 if (!IsSlash(path[2]))
113 // A wrapper around FilePath.GetComponents that works the way we need. This is
114 // not super efficient since it does some O(n) transformations on the path. If
115 // this is called a lot, we might want to optimize.
//
// The visible adjustments to the GetComponents() output are: a leading
// component that is exactly "/" or "\" is erased, and a one-character slash
// component in the second position is erased.
116 std::vector<base::FilePath::StringType> GetPathComponents(
117 const base::FilePath& path) {
118 std::vector<base::FilePath::StringType> result;
119 path.GetComponents(&result);
124 // GetComponents will preserve the "/" at the beginning, which confuses us.
125 // We don't expect to have relative paths in this function.
126 // Don't use IsSeparator since we always want to allow backslashes.
// NOTE(review): result[0] requires a non-empty vector; confirm an emptiness
// check precedes this statement.
127 if (result[0] == FILE_PATH_LITERAL("/") ||
128 result[0] == FILE_PATH_LITERAL("\\"))
129 result.erase(result.begin());
132 // On Windows, GetComponents will give us [ "C:", "/", "foo" ], and we
133 // don't want the slash in there. This doesn't support input like "C:foo"
134 // which means foo relative to the current directory of the C drive but
135 // that's basically legacy DOS behavior we don't need to support.
136 if (result.size() >= 2 && result[1].size() == 1 && IsSlash(result[1][0]))
137 result.erase(result.begin() + 1);
143 // Provides the equivalent of == for filesystem strings, trying to do
144 // approximately the right thing with case.
145 bool FilesystemStringsEqual(const base::FilePath::StringType& a,
146 const base::FilePath::StringType& b) {
148 // Assume case-insensitive filesystems on Windows. We use the CompareString
149 // function to do a case-insensitive comparison based on the current locale
150 // (we don't want GN to depend on ICU which is large and requires data
151 // files). This isn't perfect, but getting this perfectly right is very
152 // difficult and requires I/O, and this comparison should cover 99.9999% of
// cases.
155 // Note: The documentation for CompareString says it runs fastest on
156 // null-terminated strings with -1 passed for the length, so we do that here.
157 // There should not be embedded nulls in filesystem strings.
// The strings are considered equal only when CompareString reports
// CSTR_EQUAL.
158 return ::CompareString(LOCALE_USER_DEFAULT, LINGUISTIC_IGNORECASE,
159 a.c_str(), -1, b.c_str(), -1) == CSTR_EQUAL;
161 // Assume case-sensitive filesystems on non-Windows.
// Classifies |file| by its extension, as returned by FindExtension() on the
// file's value. Extensions are matched with exact string comparisons, and
// SOURCE_UNKNOWN is returned when nothing matches. The "S" extension is only
// considered when |os| is not Settings::WIN.
168 SourceFileType GetSourceFileType(const SourceFile& file,
169 Settings::TargetOS os) {
170 base::StringPiece extension = FindExtension(&file.value());
// C++ sources: three spellings are accepted.
171 if (extension == "cc" || extension == "cpp" || extension == "cxx")
173 if (extension == "h")
175 if (extension == "c")
180 if (extension == "m")
182 if (extension == "mm")
187 if (extension == "rc")
189 // TODO(brettw) asm files.
196 if (os != Settings::WIN) {
197 if (extension == "S")
201 return SOURCE_UNKNOWN;
// Returns the file extension string for the output of a target of |type| when
// building for |os|. The visible structure is a group of per-output-type
// cases for each OS; Settings::LINUX is the only OS label visible here.
204 const char* GetExtensionForOutputType(Target::OutputType type,
205 Settings::TargetOS os) {
209 case Target::EXECUTABLE:
211 case Target::SHARED_LIBRARY:
213 case Target::STATIC_LIBRARY:
222 case Target::EXECUTABLE:
224 case Target::SHARED_LIBRARY:
// For this OS a shared library reports the extension of its import library
// rather than of the library itself.
225 return "dll.lib"; // Extension of import library.
226 case Target::STATIC_LIBRARY:
233 case Settings::LINUX:
235 case Target::EXECUTABLE:
237 case Target::SHARED_LIBRARY:
239 case Target::STATIC_LIBRARY:
// Converts a base::FilePath string to UTF-8. The visible return converts from
// a wide string with base::WideToUTF8.
// NOTE(review): presumably this is the branch for platforms whose
// FilePath::StringType is wide (Windows) -- confirm.
252 std::string FilePathToUTF8(const base::FilePath::StringType& str) {
254 return base::WideToUTF8(str);
// Builds a base::FilePath from the UTF-8 text in |sp|. Two construction paths
// are visible: one converts through base::UTF8ToWide, the other copies the
// bytes unchanged via as_string().
// NOTE(review): presumably the choice between them is made per platform --
// confirm.
260 base::FilePath UTF8ToFilePath(const base::StringPiece& sp) {
262 return base::FilePath(base::UTF8ToWide(sp));
264 return base::FilePath(sp.as_string());
// Scans |path| from the end towards the beginning looking for the extension
// and returns std::string::npos when the scan finds none.
268 size_t FindExtensionOffset(const std::string& path) {
// The scan starts at index path.size(), one past the last character; on a
// const std::string that position reads as '\0'. The index is a signed int so
// that the i >= 0 condition can terminate the loop.
269 for (int i = static_cast<int>(path.size()); i >= 0; i--) {
// Each position is tested for a path separator.
270 if (IsSlash(path[i]))
275 return std::string::npos;
// Returns a view of the extension of |*path|, located with
// FindExtensionOffset(). The view is empty when that lookup returns
// std::string::npos; otherwise it runs from the offset to the end of the
// string and points into |*path|'s own storage.
278 base::StringPiece FindExtension(const std::string* path) {
279 size_t extension_offset = FindExtensionOffset(*path);
280 if (extension_offset == std::string::npos)
281 return base::StringPiece();
282 return base::StringPiece(&path->data()[extension_offset],
283 path->size() - extension_offset);
// Scans |path| backwards from its last character looking for a path
// separator, and returns 0 when the scan finds none, meaning the whole string
// is the file name.
286 size_t FindFilenameOffset(const std::string& path) {
// The index is a signed int so that the i >= 0 condition can terminate the
// loop; an empty |path| skips the loop entirely.
287 for (int i = static_cast<int>(path.size()) - 1; i >= 0; i--) {
288 if (IsSlash(path[i]))
291 return 0; // No filename found means everything was the filename.
// Returns a view of the file-name part of |*path|: everything from
// FindFilenameOffset() to the end of the string. The view points into
// |*path|'s own storage.
294 base::StringPiece FindFilename(const std::string* path) {
295 size_t filename_offset = FindFilenameOffset(*path);
296 if (filename_offset == 0)
297 return base::StringPiece(*path); // Everything is the file name.
298 return base::StringPiece(&(*path).data()[filename_offset],
299 path->size() - filename_offset);
// Returns a view of the file name in |*path| without its extension. The view
// starts at FindFilenameOffset() and points into |*path|'s own storage.
302 base::StringPiece FindFilenameNoExtension(const std::string* path) {
304 return base::StringPiece();
305 size_t filename_offset = FindFilenameOffset(*path);
306 size_t extension_offset = FindExtensionOffset(*path);
// With no extension the name runs to the end of the string.
309 if (extension_offset == std::string::npos)
310 name_len = path->size() - filename_offset;
// This length stops one character before the extension offset, which leaves
// out the character immediately preceding the extension (the dot).
312 name_len = extension_offset - filename_offset - 1;
314 return base::StringPiece(&(*path).data()[filename_offset], name_len);
// Truncates |*path| in place to the length given by FindFilenameOffset(),
// which removes the file-name part. When that offset is 0 the string becomes
// empty.
317 void RemoveFilename(std::string* path) {
318 path->resize(FindFilenameOffset(*path));
// Returns true when |s| is non-empty and its last character satisfies
// IsSlash(). An empty string yields false.
321 bool EndsWithSlash(const std::string& s) {
322 return !s.empty() && IsSlash(s[s.size() - 1]);
// Returns a view of the directory part of |*path|: the first
// FindFilenameOffset() characters. The view is empty when that offset is 0,
// and otherwise points into |*path|'s own storage.
325 base::StringPiece FindDir(const std::string* path) {
326 size_t filename_offset = FindFilenameOffset(*path);
327 if (filename_offset == 0u)
328 return base::StringPiece();
329 return base::StringPiece(path->data(), filename_offset);
// Sanity-checks that |str| begins with the value of |dir| (ignoring |dir|'s
// final character). On the failure path visible here, |*err| is set to an
// error attributed to |originating|.
332 bool EnsureStringIsInOutputDir(const SourceDir& dir,
333 const std::string& str,
334 const Value& originating,
336 // The last char of the dir will be a slash. We don't care if the input ends
337 // in a slash or not, so just compare up until there.
339 // This check will be wrong for all proper prefixes (e.g. "/output" will
340 // match "/out") but we don't really care since this is just a sanity check.
341 const std::string& dir_str = dir.value();
// NOTE(review): dir_str.length() - 1 wraps around if |dir| has an empty
// value; confirm callers never pass an empty SourceDir.
342 if (str.compare(0, dir_str.length() - 1, dir_str, 0, dir_str.length() - 1)
344 *err = Err(originating, "File is not inside output directory.",
345 "The given file should be in the output directory. Normally you would "
346 "specify\n\"$target_out_dir/foo\" or "
347 "\"$target_gen_dir/foo\". I interpreted this as\n\""
// Decides whether |path| is a system-absolute path. A path that does not
// start with a slash is relative unless it matches the Windows "C:\foo" form
// checked below. The last visible check singles out a leading "//", which the
// comment identifies as source-relative.
354 bool IsPathAbsolute(const base::StringPiece& path) {
358 if (!IsSlash(path[0])) {
360 // Check for Windows system paths like "C:\foo".
361 if (path.size() > 2 && path[1] == ':' && IsSlash(path[2]))
364 return false; // Doesn't begin with a slash, is relative.
367 // Double forward slash at the beginning means source-relative (we don't
368 // allow backslashes for denoting this).
369 if (path.size() > 1 && path[1] == '/')
// When the absolute |path| begins with the absolute |source_root|, writes the
// source-root-relative form to |*dest|: "//" followed by the rest of |path|
// with any slashes right after the matched prefix skipped. Both inputs are
// DCHECKed to be absolute. A source root longer than the path returns false.
// NOTE(review): presumably true is returned after |*dest| is written --
// confirm.
375 bool MakeAbsolutePathRelativeIfPossible(const base::StringPiece& source_root,
376 const base::StringPiece& path,
378 DCHECK(IsPathAbsolute(source_root));
379 DCHECK(IsPathAbsolute(path));
383 if (source_root.size() > path.size())
384 return false; // The source root is longer: the path can never be inside.
387 // Source root should be canonical on Windows. Note that the initial slash
388 // must be forward slash, but that the other ones can be either forward or
// backward.
390 DCHECK(source_root.size() > 2 && source_root[0] != '/' &&
391 source_root[1] == ':' && IsSlash(source_root[2]));
// after_common_index stays npos until one of the two prefix forms below
// matches.
393 size_t after_common_index = std::string::npos;
// Form 1: |path| itself starts with a drive letter ("C:/...").
394 if (DoesBeginWindowsDriveLetter(path)) {
396 if (AreAbsoluteWindowsPathsEqual(source_root,
397 path.substr(0, source_root.size())))
398 after_common_index = source_root.size();
// Form 2: |path| has one extra leading slash before the drive letter
// ("/C:/..."), so the comparison and the resulting index are shifted by one.
401 } else if (path[0] == '/' && source_root.size() <= path.size() - 1 &&
402 DoesBeginWindowsDriveLetter(path.substr(1))) {
404 if (AreAbsoluteWindowsPathsEqual(source_root,
405 path.substr(1, source_root.size())))
406 after_common_index = source_root.size() + 1;
413 // If we get here, there's a match and after_common_index identifies the
// part of |path| that follows the matched prefix.
416 // The base may or may not have a trailing slash, so skip all slashes from
417 // the path after our prefix match.
418 size_t first_after_slash = after_common_index;
419 while (first_after_slash < path.size() && IsSlash(path[first_after_slash]))
422 dest->assign("//"); // Result is source root relative.
423 dest->append(&path.data()[first_after_slash],
424 path.size() - first_after_slash);
429 // On non-Windows this is easy. Since we know both are absolute, just do a
// prefix comparison.
// NOTE(review): the comparison is purely textual and does not require the
// match to end on a component boundary, so a root of "/a/b" also matches
// "/a/bc/x" (producing "//c/x"). Confirm whether callers rely on a trailing
// slash in |source_root| to avoid this.
431 if (path.substr(0, source_root.size()) == source_root) {
432 // The base may or may not have a trailing slash, so skip all slashes from
433 // the path after our prefix match.
434 size_t first_after_slash = source_root.size();
435 while (first_after_slash < path.size() && IsSlash(path[first_after_slash]))
438 dest->assign("//"); // Result is source root relative.
439 dest->append(&path.data()[first_after_slash],
440 path.size() - first_after_slash);
// Produces the inverse of the directory |path|. The visible code walks the
// directory's value after its leading slash (or leading two slashes) and
// tests each character for a path separator. One visible path returns an
// empty string.
447 std::string InvertDir(const SourceDir& path) {
// NOTE(review): this copies the string; other functions in this file bind
// the result of value() to a const reference instead.
448 const std::string value = path.value();
450 return std::string();
452 DCHECK(value[0] == '/');
453 size_t begin_index = 1;
455 // If the input begins with two slashes, skip over both (this is a
456 // source-relative dir). These must be forward slashes only.
457 if (value.size() > 1 && value[1] == '/')
// Scan the remainder of the value for separators.
461 for (size_t i = begin_index; i < value.size(); i++) {
462 if (IsSlash(value[i]))
// Normalizes |*path| in place. The string's own buffer is both read (src_i)
// and written (dest_i), and the string is truncated to the written length at
// the end. The visible handling covers "." and ".." components (classified by
// ClassifyAfterDot), runs of consecutive slashes, and rewriting a single
// slash as '/'.
468 void NormalizePath(std::string* path) {
// An empty string has no buffer to point at; every later access to pathbuf
// is guarded by a non-empty or in-range check.
469 char* pathbuf = path->empty() ? NULL : &(*path)[0];
471 // top_index is the first character we can modify in the path. Anything
472 // before this indicates where the path is relative to.
473 size_t top_index = 0;
474 bool is_relative = true;
475 if (!path->empty() && pathbuf[0] == '/') {
478 if (path->size() > 1 && pathbuf[1] == '/') {
479 // Two leading slashes, this is a path into the source dir.
482 // One leading slash, this is a system-absolute path.
// The loop header has no increment: each branch advances src_i itself.
487 size_t dest_i = top_index;
488 for (size_t src_i = top_index; src_i < path->size(); /* nothing */) {
489 if (pathbuf[src_i] == '.') {
// A dot can only be special at the start of a component.
490 if (src_i == 0 || IsSlash(pathbuf[src_i - 1])) {
491 // Slash followed by a dot, see if it's something special.
493 switch (ClassifyAfterDot(*path, src_i + 1, &consumed_len)) {
494 case NOT_A_DIRECTORY:
495 // Copy the dot to the output, it means nothing special.
496 pathbuf[dest_i++] = pathbuf[src_i++];
499 // Current directory, just skip the input.
500 src_i += consumed_len;
503 // Back up over previous directory component. If we're already
504 // at the top, preserve the "..".
505 if (dest_i > top_index) {
506 // The previous char was a slash, remove it.
510 if (dest_i == top_index) {
512 // We're already at the beginning of a relative input, copy the
513 // ".." and continue. We need the trailing slash if there was
514 // one before (otherwise we're at the end of the input).
515 pathbuf[dest_i++] = '.';
516 pathbuf[dest_i++] = '.';
517 if (consumed_len == 3)
518 pathbuf[dest_i++] = '/';
520 // This also makes a new "root" that we can't delete by going
521 // up more levels. Otherwise "../.." would collapse to
// nothing.
525 // Otherwise we're at the beginning of an absolute path. Don't
526 // allow ".." to go up another level and just eat it.
528 // Just find the previous slash or the beginning of input.
529 while (dest_i > 0 && !IsSlash(pathbuf[dest_i - 1]))
532 src_i += consumed_len;
535 // Dot not preceded by a slash, copy it literally.
536 pathbuf[dest_i++] = pathbuf[src_i++];
538 } else if (IsSlash(pathbuf[src_i])) {
539 if (src_i > 0 && IsSlash(pathbuf[src_i - 1])) {
540 // Two slashes in a row, skip over it.
543 // Just one slash, copy it, normalizing to forward slash.
544 pathbuf[dest_i] = '/';
549 // Input nothing special, just copy it.
550 pathbuf[dest_i++] = pathbuf[src_i++];
// Drop whatever is left past the last written character.
553 path->resize(dest_i);
// Walks |*path| in place and acts on every forward slash it finds.
// NOTE(review): presumably each '/' is replaced with the platform separator
// -- confirm.
556 void ConvertPathToSystem(std::string* path) {
558 for (size_t i = 0; i < path->size(); i++) {
559 if ((*path)[i] == '/')
// Copying counterpart of ConvertPathToSystem(): makes a copy of |path| and
// converts the copy in place, leaving the argument untouched.
565 std::string PathToSystem(const std::string& path) {
566 std::string ret(path);
567 ConvertPathToSystem(&ret);
// Rewrites the source-absolute |input| (which must start with "//") so that
// it is expressed relative to the source-absolute directory |dest_dir|. Both
// preconditions are enforced with CHECK. The visible steps are: find the
// longest common prefix that ends on a slash, walk the rest of the
// destination looking at its slashes, then append the part of |input| that
// follows the common prefix.
571 std::string RebaseSourceAbsolutePath(const std::string& input,
572 const SourceDir& dest_dir) {
573 CHECK(input.size() >= 2 && input[0] == '/' && input[1] == '/')
574 << "Input to rebase isn't source-absolute: " << input;
575 CHECK(dest_dir.is_source_absolute())
576 << "Dir to rebase to isn't source-absolute: " << dest_dir.value();
578 const std::string& dest = dest_dir.value();
580 // Skip the common prefixes of the source and dest as long as they end in
// a slash.
582 size_t common_prefix_len = 2; // The beginning two "//" are always the same.
583 size_t max_common_length = std::min(input.size(), dest.size());
584 for (size_t i = common_prefix_len; i < max_common_length; i++) {
// The prefix length only advances when both strings have a slash at the
// same position, so a partially matching component is never counted.
585 if (IsSlash(input[i]) && IsSlash(dest[i]))
586 common_prefix_len = i + 1;
587 else if (input[i] != dest[i])
591 // Invert the dest dir starting from the end of the common prefix.
593 for (size_t i = common_prefix_len; i < dest.size(); i++) {
594 if (IsSlash(dest[i]))
598 // Append any remaining unique input.
599 ret.append(&input[common_prefix_len], input.size() - common_prefix_len);
601 // If the result is still empty, the paths are the same.
// Returns the value of |dir| without its final character. The empty value,
// "/" and "//" are each handled by their own branch; every other value is
// copied and shortened by one character.
608 std::string DirectoryWithNoLastSlash(const SourceDir& dir) {
611 if (dir.value().empty()) {
612 // Just keep input the same.
613 } else if (dir.value() == "/") {
615 } else if (dir.value() == "//") {
// General case: copy the value and drop its last character.
618 ret.assign(dir.value());
619 ret.resize(ret.size() - 1);
// Converts the filesystem |path| into a SourceDir. Both |source_root| and
// |path| are split with GetPathComponents(). When every component of the
// source root matches the start of |path| (per FilesystemStringsEqual), only
// the components after the root are used; otherwise all of them are. Each
// used component is converted to UTF-8 and followed by a '/'.
624 SourceDir SourceDirForPath(const base::FilePath& source_root,
625 const base::FilePath& path) {
626 std::vector<base::FilePath::StringType> source_comp =
627 GetPathComponents(source_root);
628 std::vector<base::FilePath::StringType> path_comp =
629 GetPathComponents(path);
631 // See if path is inside the source root by looking for each of source root's
632 // components at the beginning of path.
633 bool is_inside_source;
// A path with fewer components than the root cannot be inside it.
634 if (path_comp.size() < source_comp.size()) {
636 is_inside_source = false;
638 is_inside_source = true;
639 for (size_t i = 0; i < source_comp.size(); i++) {
640 if (!FilesystemStringsEqual(source_comp[i], path_comp[i])) {
641 is_inside_source = false;
647 std::string result_str;
648 size_t initial_path_comp_to_use;
649 if (is_inside_source) {
650 // Construct a source-relative path beginning in // and skip all of the
651 // shared directories.
653 initial_path_comp_to_use = source_comp.size();
655 // Not inside source code, construct a system-absolute path.
657 initial_path_comp_to_use = 0;
// Every emitted component gets a trailing slash, so the result always ends
// in '/' when at least one component is appended.
660 for (size_t i = initial_path_comp_to_use; i < path_comp.size(); i++) {
661 result_str.append(FilePathToUTF8(path_comp[i]));
662 result_str.push_back('/');
664 return SourceDir(result_str);
// Returns the SourceDir for the process's current working directory, obtained
// from base::GetCurrentDirectory() and converted with SourceDirForPath()
// against |source_root|.
// NOTE(review): the result of GetCurrentDirectory() is not checked in the
// visible code -- confirm that ignoring a failure is intended.
667 SourceDir SourceDirForCurrentDirectory(const base::FilePath& source_root) {
669 base::GetCurrentDirectory(&cd);
670 return SourceDirForPath(source_root, cd);
// Returns the output directory for the toolchain of |settings|: the build
// directory's value with the toolchain output subdirectory appended when that
// subdirectory is non-empty.
673 SourceDir GetToolchainOutputDir(const Settings* settings) {
674 const OutputFile& toolchain_subdir = settings->toolchain_output_subdir();
676 std::string result = settings->build_settings()->build_dir().value();
677 if (!toolchain_subdir.value().empty())
678 result.append(toolchain_subdir.value());
// SWAP_IN hands the string to the SourceDir by pointer rather than by value.
680 return SourceDir(SourceDir::SWAP_IN, &result);
// Returns the generated-file directory for the toolchain of |settings|: the
// build directory's value, plus the toolchain output subdirectory when it is
// non-empty, plus "gen/".
683 SourceDir GetToolchainGenDir(const Settings* settings) {
684 const OutputFile& toolchain_subdir = settings->toolchain_output_subdir();
686 std::string result = settings->build_settings()->build_dir().value();
687 if (!toolchain_subdir.value().empty())
688 result.append(toolchain_subdir.value());
690 result.append("gen/");
// SWAP_IN hands the string to the SourceDir by pointer rather than by value.
691 return SourceDir(SourceDir::SWAP_IN, &result);
// Returns the output directory that corresponds to |source_dir|: the
// toolchain output directory (GetToolchainOutputDir) followed by
// |source_dir|'s value with its first two characters removed.
694 SourceDir GetOutputDirForSourceDir(const Settings* settings,
695 const SourceDir& source_dir) {
696 SourceDir toolchain = GetToolchainOutputDir(settings);
// Move the toolchain directory's string into |ret| so it can be extended.
699 toolchain.SwapValue(&ret);
702 // The source dir should be source-absolute, so we trim off the two leading
703 // slashes to append to the toolchain object directory.
// NOTE(review): size() - 2 wraps around for a value shorter than two
// characters, and the only guard is a DCHECK -- confirm callers always pass
// source-absolute dirs.
704 DCHECK(source_dir.is_source_absolute());
705 ret.append(&source_dir.value()[2], source_dir.value().size() - 2);
707 return SourceDir(SourceDir::SWAP_IN, &ret);
// Returns the generated-file directory that corresponds to |source_dir|: the
// toolchain gen directory (GetToolchainGenDir) followed by |source_dir|'s
// value with its first two characters removed.
710 SourceDir GetGenDirForSourceDir(const Settings* settings,
711 const SourceDir& source_dir) {
712 SourceDir toolchain = GetToolchainGenDir(settings);
// Move the toolchain directory's string into |ret| so it can be extended.
715 toolchain.SwapValue(&ret);
717 // The source dir should be source-absolute, so we trim off the two leading
718 // slashes to append to the toolchain object directory.
// NOTE(review): size() - 2 wraps around for a value shorter than two
// characters, and the only guard is a DCHECK -- confirm callers always pass
// source-absolute dirs.
719 DCHECK(source_dir.is_source_absolute());
720 ret.append(&source_dir.value()[2], source_dir.value().size() - 2);
722 return SourceDir(SourceDir::SWAP_IN, &ret);
// Returns the output directory for |target|, computed by
// GetOutputDirForSourceDir() from the target's settings and the directory of
// its label.
725 SourceDir GetTargetOutputDir(const Target* target) {
726 return GetOutputDirForSourceDir(target->settings(), target->label().dir());
// Returns the generated-file directory for |target|, computed by
// GetGenDirForSourceDir() from the target's settings and the directory of its
// label.
729 SourceDir GetTargetGenDir(const Target* target) {
730 return GetGenDirForSourceDir(target->settings(), target->label().dir());
// Returns the output directory for the source directory of |scope|, computed
// by GetOutputDirForSourceDir() from the scope's settings.
733 SourceDir GetCurrentOutputDir(const Scope* scope) {
734 return GetOutputDirForSourceDir(scope->settings(), scope->GetSourceDir());
// Returns the generated-file directory for the source directory of |scope|,
// computed by GetGenDirForSourceDir() from the scope's settings.
737 SourceDir GetCurrentGenDir(const Scope* scope) {
738 return GetGenDirForSourceDir(scope->settings(), scope->GetSourceDir());