1 //===-- FileSpec.cpp ------------------------------------------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "lldb/Utility/FileSpec.h"
10 #include "lldb/Utility/RegularExpression.h"
11 #include "lldb/Utility/Stream.h"
13 #include "llvm/ADT/SmallString.h"
14 #include "llvm/ADT/SmallVector.h"
15 #include "llvm/ADT/StringExtras.h"
16 #include "llvm/ADT/StringRef.h"
17 #include "llvm/ADT/Twine.h"
18 #include "llvm/Support/ErrorOr.h"
19 #include "llvm/Support/FileSystem.h"
20 #include "llvm/Support/Program.h"
21 #include "llvm/Support/raw_ostream.h"
22 #include "llvm/TargetParser/Triple.h"
26 #include <system_error>
35 using namespace lldb_private
;
39 static constexpr FileSpec::Style
GetNativeStyle() {
41 return FileSpec::Style::windows
;
43 return FileSpec::Style::posix
;
47 bool PathStyleIsPosix(FileSpec::Style style
) {
48 return llvm::sys::path::is_style_posix(style
);
51 const char *GetPathSeparators(FileSpec::Style style
) {
52 return llvm::sys::path::get_separator(style
).data();
55 char GetPreferredPathSeparator(FileSpec::Style style
) {
56 return GetPathSeparators(style
)[0];
59 void Denormalize(llvm::SmallVectorImpl
<char> &path
, FileSpec::Style style
) {
60 if (PathStyleIsPosix(style
))
63 std::replace(path
.begin(), path
.end(), '/', '\\');
66 } // end anonymous namespace
68 FileSpec::FileSpec() : m_style(GetNativeStyle()) {}
70 // Default constructor that can take an optional full path to a file on disk.
71 FileSpec::FileSpec(llvm::StringRef path
, Style style
) : m_style(style
) {
75 FileSpec::FileSpec(llvm::StringRef path
, const llvm::Triple
&triple
)
76 : FileSpec
{path
, triple
.isOSWindows() ? Style::windows
: Style::posix
} {}
/// Safely get a character at the specified index.
///
/// \param[in] path
///     A full, partial, or relative path to a file.
///
/// \param[in] i
///     An index into path which may or may not be valid.
///
/// \return
///     The character at index \a i if the index is valid, or 0 if
///     the index is not valid.
90 inline char safeCharAtIndex(const llvm::StringRef
&path
, size_t i
) {
/// Check if a path needs to be normalized.
///
/// We currently consider a path to need normalization if any of the
/// following are true:
///  - path contains "/./"
///  - path contains "/../"
///  - path contains "//"
///  - path ends with "/"
/// Paths that start with "./" or with "../" are not considered to
/// need normalization since we aren't trying to resolve the path,
/// we are just trying to remove redundant things from the path.
///
/// \param[in] path
///     A full, partial, or relative path to a file.
///
/// \return
///     Returns \b true if the path needs to be normalized.
113 bool needsNormalization(const llvm::StringRef
&path
) {
116 // We strip off leading "." values so these paths need to be normalized
119 for (auto i
= path
.find_first_of("\\/"); i
!= llvm::StringRef::npos
;
120 i
= path
.find_first_of("\\/", i
+ 1)) {
121 const auto next
= safeCharAtIndex(path
, i
+1);
124 // path separator char at the end of the string which should be
125 // stripped unless it is the one and only character
129 // two path separator chars in the middle of a path needs to be
137 const auto next_next
= safeCharAtIndex(path
, i
+2);
140 case 0: return true; // ends with "/."
143 return true; // contains "/./"
145 const auto next_next_next
= safeCharAtIndex(path
, i
+3);
146 switch (next_next_next
) {
148 case 0: return true; // ends with "/.."
151 return true; // contains "/../"
169 void FileSpec::SetFile(llvm::StringRef pathname
) { SetFile(pathname
, m_style
); }
171 // Update the contents of this object with a new path. The path will be split
172 // up into a directory and filename and stored as uniqued string values for
173 // quick comparison and efficient memory usage.
174 void FileSpec::SetFile(llvm::StringRef pathname
, Style style
) {
176 m_style
= (style
== Style::native
) ? GetNativeStyle() : style
;
178 if (pathname
.empty())
181 llvm::SmallString
<128> resolved(pathname
);
183 // Normalize the path by removing ".", ".." and other redundant components.
184 if (needsNormalization(resolved
))
185 llvm::sys::path::remove_dots(resolved
, true, m_style
);
187 // Normalize back slashes to forward slashes
188 if (m_style
== Style::windows
)
189 std::replace(resolved
.begin(), resolved
.end(), '\\', '/');
191 if (resolved
.empty()) {
192 // If we have no path after normalization set the path to the current
193 // directory. This matches what python does and also a few other path
195 m_filename
.SetString(".");
199 // Split path into filename and directory. We rely on the underlying char
200 // pointer to be nullptr when the components are empty.
201 llvm::StringRef filename
= llvm::sys::path::filename(resolved
, m_style
);
202 if(!filename
.empty())
203 m_filename
.SetString(filename
);
205 llvm::StringRef directory
= llvm::sys::path::parent_path(resolved
, m_style
);
206 if(!directory
.empty())
207 m_directory
.SetString(directory
);
210 void FileSpec::SetFile(llvm::StringRef path
, const llvm::Triple
&triple
) {
211 return SetFile(path
, triple
.isOSWindows() ? Style::windows
: Style::posix
);
214 // Convert to pointer operator. This allows code to check any FileSpec objects
215 // to see if they contain anything valid using code such as:
219 FileSpec::operator bool() const { return m_filename
|| m_directory
; }
221 // Logical NOT operator. This allows code to check any FileSpec objects to see
222 // if they are invalid using code such as:
226 bool FileSpec::operator!() const { return !m_directory
&& !m_filename
; }
228 bool FileSpec::DirectoryEquals(const FileSpec
&rhs
) const {
229 const bool case_sensitive
= IsCaseSensitive() || rhs
.IsCaseSensitive();
230 return ConstString::Equals(m_directory
, rhs
.m_directory
, case_sensitive
);
233 bool FileSpec::FileEquals(const FileSpec
&rhs
) const {
234 const bool case_sensitive
= IsCaseSensitive() || rhs
.IsCaseSensitive();
235 return ConstString::Equals(m_filename
, rhs
.m_filename
, case_sensitive
);
239 bool FileSpec::operator==(const FileSpec
&rhs
) const {
240 return FileEquals(rhs
) && DirectoryEquals(rhs
);
243 // Not equal to operator
244 bool FileSpec::operator!=(const FileSpec
&rhs
) const { return !(*this == rhs
); }
246 // Less than operator
247 bool FileSpec::operator<(const FileSpec
&rhs
) const {
248 return FileSpec::Compare(*this, rhs
, true) < 0;
251 // Dump a FileSpec object to a stream
252 Stream
&lldb_private::operator<<(Stream
&s
, const FileSpec
&f
) {
253 f
.Dump(s
.AsRawOstream());
257 // Clear this object by releasing both the directory and filename string values
258 // and making them both the empty string.
259 void FileSpec::Clear() {
265 // Compare two FileSpec objects. If "full" is true, then both the directory and
266 // the filename must match. If "full" is false, then the directory names for
267 // "a" and "b" are only compared if they are both non-empty. This allows a
268 // FileSpec object to only contain a filename and it can match FileSpec objects
269 // that have matching filenames with different paths.
271 // Return -1 if the "a" is less than "b", 0 if "a" is equal to "b" and "1" if
272 // "a" is greater than "b".
273 int FileSpec::Compare(const FileSpec
&a
, const FileSpec
&b
, bool full
) {
276 // case sensitivity of compare
277 const bool case_sensitive
= a
.IsCaseSensitive() || b
.IsCaseSensitive();
279 // If full is true, then we must compare both the directory and filename.
281 // If full is false, then if either directory is empty, then we match on the
282 // basename only, and if both directories have valid values, we still do a
283 // full compare. This allows for matching when we just have a filename in one
284 // of the FileSpec objects.
286 if (full
|| (a
.m_directory
&& b
.m_directory
)) {
287 result
= ConstString::Compare(a
.m_directory
, b
.m_directory
, case_sensitive
);
291 return ConstString::Compare(a
.m_filename
, b
.m_filename
, case_sensitive
);
294 bool FileSpec::Equal(const FileSpec
&a
, const FileSpec
&b
, bool full
) {
295 if (full
|| (a
.GetDirectory() && b
.GetDirectory()))
298 return a
.FileEquals(b
);
301 bool FileSpec::Match(const FileSpec
&pattern
, const FileSpec
&file
) {
302 if (pattern
.GetDirectory())
303 return pattern
== file
;
304 if (pattern
.GetFilename())
305 return pattern
.FileEquals(file
);
309 std::optional
<FileSpec::Style
>
310 FileSpec::GuessPathStyle(llvm::StringRef absolute_path
) {
311 if (absolute_path
.startswith("/"))
313 if (absolute_path
.startswith(R
"(\\)"))
314 return Style::windows
;
315 if (absolute_path
.size() >= 3 && llvm::isAlpha(absolute_path
[0]) &&
316 (absolute_path
.substr(1, 2) == R
"(:\)" ||
317 absolute_path
.substr(1, 2) == R
"(:/)"))
318 return Style::windows
;
322 // Dump the object to the supplied stream. If the object contains a valid
323 // directory name, it will be displayed followed by a directory delimiter, and
325 void FileSpec::Dump(llvm::raw_ostream
&s
) const {
326 std::string path
{GetPath(true)};
328 char path_separator
= GetPreferredPathSeparator(m_style
);
329 if (!m_filename
&& !path
.empty() && path
.back() != path_separator
)
333 FileSpec::Style
FileSpec::GetPathStyle() const { return m_style
; }
335 void FileSpec::SetDirectory(ConstString directory
) {
336 m_directory
= directory
;
340 void FileSpec::SetDirectory(llvm::StringRef directory
) {
341 m_directory
= ConstString(directory
);
345 void FileSpec::SetFilename(ConstString filename
) {
346 m_filename
= filename
;
350 void FileSpec::SetFilename(llvm::StringRef filename
) {
351 m_filename
= ConstString(filename
);
355 void FileSpec::ClearFilename() {
360 void FileSpec::ClearDirectory() {
365 // Extract the directory and path into a fixed buffer. This is needed as the
366 // directory and path are stored in separate string values.
367 size_t FileSpec::GetPath(char *path
, size_t path_max_len
,
368 bool denormalize
) const {
372 std::string result
= GetPath(denormalize
);
373 ::snprintf(path
, path_max_len
, "%s", result
.c_str());
374 return std::min(path_max_len
- 1, result
.length());
377 std::string
FileSpec::GetPath(bool denormalize
) const {
378 llvm::SmallString
<64> result
;
379 GetPath(result
, denormalize
);
380 return static_cast<std::string
>(result
);
383 ConstString
FileSpec::GetPathAsConstString(bool denormalize
) const {
384 return ConstString
{GetPath(denormalize
)};
387 void FileSpec::GetPath(llvm::SmallVectorImpl
<char> &path
,
388 bool denormalize
) const {
389 path
.append(m_directory
.GetStringRef().begin(),
390 m_directory
.GetStringRef().end());
391 // Since the path was normalized and all paths use '/' when stored in these
392 // objects, we don't need to look for the actual syntax specific path
393 // separator, we just look for and insert '/'.
394 if (m_directory
&& m_filename
&& m_directory
.GetStringRef().back() != '/' &&
395 m_filename
.GetStringRef().back() != '/')
396 path
.insert(path
.end(), '/');
397 path
.append(m_filename
.GetStringRef().begin(),
398 m_filename
.GetStringRef().end());
399 if (denormalize
&& !path
.empty())
400 Denormalize(path
, m_style
);
403 llvm::StringRef
FileSpec::GetFileNameExtension() const {
404 return llvm::sys::path::extension(m_filename
.GetStringRef(), m_style
);
407 ConstString
FileSpec::GetFileNameStrippingExtension() const {
408 return ConstString(llvm::sys::path::stem(m_filename
.GetStringRef(), m_style
));
411 // Return the size in bytes that this object takes in memory. This returns the
412 // size in bytes of this object, not any shared string values it may refer to.
413 size_t FileSpec::MemorySize() const {
414 return m_filename
.MemorySize() + m_directory
.MemorySize();
418 FileSpec::CopyByAppendingPathComponent(llvm::StringRef component
) const {
419 FileSpec ret
= *this;
420 ret
.AppendPathComponent(component
);
424 FileSpec
FileSpec::CopyByRemovingLastPathComponent() const {
425 llvm::SmallString
<64> current_path
;
426 GetPath(current_path
, false);
427 if (llvm::sys::path::has_parent_path(current_path
, m_style
))
428 return FileSpec(llvm::sys::path::parent_path(current_path
, m_style
),
433 void FileSpec::PrependPathComponent(llvm::StringRef component
) {
434 llvm::SmallString
<64> new_path(component
);
435 llvm::SmallString
<64> current_path
;
436 GetPath(current_path
, false);
437 llvm::sys::path::append(new_path
,
438 llvm::sys::path::begin(current_path
, m_style
),
439 llvm::sys::path::end(current_path
), m_style
);
440 SetFile(new_path
, m_style
);
443 void FileSpec::PrependPathComponent(const FileSpec
&new_path
) {
444 return PrependPathComponent(new_path
.GetPath(false));
447 void FileSpec::AppendPathComponent(llvm::StringRef component
) {
448 llvm::SmallString
<64> current_path
;
449 GetPath(current_path
, false);
450 llvm::sys::path::append(current_path
, m_style
, component
);
451 SetFile(current_path
, m_style
);
454 void FileSpec::AppendPathComponent(const FileSpec
&new_path
) {
455 return AppendPathComponent(new_path
.GetPath(false));
458 bool FileSpec::RemoveLastPathComponent() {
459 llvm::SmallString
<64> current_path
;
460 GetPath(current_path
, false);
461 if (llvm::sys::path::has_parent_path(current_path
, m_style
)) {
462 SetFile(llvm::sys::path::parent_path(current_path
, m_style
));
468 std::vector
<llvm::StringRef
> FileSpec::GetComponents() const {
469 std::vector
<llvm::StringRef
> components
;
471 auto dir_begin
= llvm::sys::path::begin(m_directory
.GetStringRef(), m_style
);
472 auto dir_end
= llvm::sys::path::end(m_directory
.GetStringRef());
474 for (auto iter
= dir_begin
; iter
!= dir_end
; ++iter
) {
475 if (*iter
== "/" || *iter
== ".")
478 components
.push_back(*iter
);
481 if (!m_filename
.IsEmpty() && m_filename
!= "/" && m_filename
!= ".")
482 components
.push_back(m_filename
.GetStringRef());
487 /// Returns true if the filespec represents an implementation source
488 /// file (files with a ".c", ".cpp", ".m", ".mm" (many more)
492 /// \b true if the filespec represents an implementation source
493 /// file, \b false otherwise.
494 bool FileSpec::IsSourceImplementationFile() const {
495 llvm::StringRef extension
= GetFileNameExtension();
496 if (extension
.empty())
499 static RegularExpression
g_source_file_regex(llvm::StringRef(
500 "^.([cC]|[mM]|[mM][mM]|[cC][pP][pP]|[cC]\\+\\+|[cC][xX][xX]|[cC][cC]|["
501 "cC][pP]|[sS]|[aA][sS][mM]|[fF]|[fF]77|[fF]90|[fF]95|[fF]03|[fF][oO]["
502 "rR]|[fF][tT][nN]|[fF][pP][pP]|[aA][dD][aA]|[aA][dD][bB]|[aA][dD][sS])"
504 return g_source_file_regex
.Execute(extension
);
507 bool FileSpec::IsRelative() const {
508 return !IsAbsolute();
511 bool FileSpec::IsAbsolute() const {
512 // Check if we have cached if this path is absolute to avoid recalculating.
513 if (m_absolute
!= Absolute::Calculate
)
514 return m_absolute
== Absolute::Yes
;
516 m_absolute
= Absolute::No
;
518 llvm::SmallString
<64> path
;
519 GetPath(path
, false);
522 // We consider paths starting with ~ to be absolute.
523 if (path
[0] == '~' || llvm::sys::path::is_absolute(path
, m_style
))
524 m_absolute
= Absolute::Yes
;
527 return m_absolute
== Absolute::Yes
;
530 void FileSpec::MakeAbsolute(const FileSpec
&dir
) {
532 PrependPathComponent(dir
);
535 void llvm::format_provider
<FileSpec
>::format(const FileSpec
&F
,
538 assert((Style
.empty() || Style
.equals_insensitive("F") ||
539 Style
.equals_insensitive("D")) &&
540 "Invalid FileSpec style!");
542 StringRef dir
= F
.GetDirectory().GetStringRef();
543 StringRef file
= F
.GetFilename().GetStringRef();
545 if (dir
.empty() && file
.empty()) {
550 if (Style
.equals_insensitive("F")) {
551 Stream
<< (file
.empty() ? "(empty)" : file
);
555 // Style is either D or empty, either way we need to print the directory.
557 // Directory is stored in normalized form, which might be different than
558 // preferred form. In order to handle this, we need to cut off the
559 // filename, then denormalize, then write the entire denorm'ed directory.
560 llvm::SmallString
<64> denormalized_dir
= dir
;
561 Denormalize(denormalized_dir
, F
.GetPathStyle());
562 Stream
<< denormalized_dir
;
563 Stream
<< GetPreferredPathSeparator(F
.GetPathStyle());
566 if (Style
.equals_insensitive("D")) {
567 // We only want to print the directory, so now just exit.