1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4 
5 // This file contains utility functions for dealing with the local
6 // filesystem.
7 
8 #ifndef BASE_FILES_FILE_UTIL_H_
9 #define BASE_FILES_FILE_UTIL_H_
10 
11 #include <stddef.h>
12 #include <stdint.h>
13 #include <stdio.h>
14 
15 #include <set>
16 #include <string>
17 #include <vector>
18 
19 #if defined(OS_POSIX) || defined(OS_FUCHSIA)
20 #include <sys/stat.h>
21 #include <unistd.h>
22 #endif
23 
24 #include "base/base_export.h"
25 #include "base/files/file.h"
26 #include "base/files/file_path.h"
27 #include "base/strings/string16.h"
28 #include "build/build_config.h"
29 
30 #if defined(OS_WIN)
31 #include "base/win/windows_types.h"
32 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
33 #include "base/file_descriptor_posix.h"
34 #include "base/logging.h"
35 #include "base/posix/eintr_wrapper.h"
36 #endif
37 
38 namespace base {
39 
40 class Environment;
41 class Time;
42 
43 //-----------------------------------------------------------------------------
44 // Functions that involve filesystem access or modification:
45 
46 // Returns an absolute version of a relative path. Returns an empty path on
47 // error. On POSIX, this function fails if the path does not exist. This
48 // function can result in I/O so it can be slow.
49 BASE_EXPORT FilePath MakeAbsoluteFilePath(const FilePath& input);
50 
51 // Returns the total number of bytes used by all the files under |root_path|.
52 // If the path does not exist the function returns 0.
53 //
54 // This function is implemented using the FileEnumerator class so it is not
55 // particularly speedy in any platform.
56 BASE_EXPORT int64_t ComputeDirectorySize(const FilePath& root_path);
57 
58 // Deletes the given path, whether it's a file or a directory.
59 // If it's a directory, it's perfectly happy to delete all of the
60 // directory's contents.  Passing true to recursive deletes
61 // subdirectories and their contents as well.
62 // Returns true if successful, false otherwise. It is considered successful
63 // to attempt to delete a file that does not exist.
64 //
65 // In posix environment and if |path| is a symbolic link, this deletes only
66 // the symlink. (even if the symlink points to a non-existent file)
67 //
68 // WARNING: USING THIS WITH recursive==true IS EQUIVALENT
69 //          TO "rm -rf", SO USE WITH CAUTION.
70 BASE_EXPORT bool DeleteFile(const FilePath& path, bool recursive);
71 
72 #if defined(OS_WIN)
73 // Schedules to delete the given path, whether it's a file or a directory, until
74 // the operating system is restarted.
75 // Note:
76 // 1) The file/directory to be deleted should exist in a temp folder.
77 // 2) The directory to be deleted must be empty.
78 BASE_EXPORT bool DeleteFileAfterReboot(const FilePath& path);
79 #endif
80 
81 // Moves the given path, whether it's a file or a directory.
82 // If a simple rename is not possible, such as in the case where the paths are
83 // on different volumes, this will attempt to copy and delete. Returns
84 // true for success.
85 // This function fails if either path contains traversal components ('..').
86 BASE_EXPORT bool Move(const FilePath& from_path, const FilePath& to_path);
87 
88 // Renames file |from_path| to |to_path|. Both paths must be on the same
89 // volume, or the function will fail. Destination file will be created
90 // if it doesn't exist. Prefer this function over Move when dealing with
91 // temporary files. On Windows it preserves attributes of the target file.
92 // Returns true on success, leaving *error unchanged.
93 // Returns false on failure and sets *error appropriately, if it is non-NULL.
94 BASE_EXPORT bool ReplaceFile(const FilePath& from_path,
95                              const FilePath& to_path,
96                              File::Error* error);
97 
98 // Copies a single file. Use CopyDirectory() to copy directories.
99 // This function fails if either path contains traversal components ('..').
100 // This function also fails if |to_path| is a directory.
101 //
102 // On POSIX, if |to_path| is a symlink, CopyFile() will follow the symlink. This
103 // may have security implications. Use with care.
104 //
105 // If |to_path| already exists and is a regular file, it will be overwritten,
106 // though its permissions will stay the same.
107 //
108 // If |to_path| does not exist, it will be created. The new file's permissions
109 // varies per platform:
110 //
111 // - This function keeps the metadata on Windows. The read only bit is not kept.
112 // - On Mac and iOS, |to_path| retains |from_path|'s permissions, except user
113 //   read/write permissions are always set.
114 // - On Linux and Android, |to_path| has user read/write permissions only. i.e.
115 //   Always 0600.
116 // - On ChromeOS, |to_path| has user read/write permissions and group/others
117 //   read permissions. i.e. Always 0644.
118 BASE_EXPORT bool CopyFile(const FilePath& from_path, const FilePath& to_path);
119 
120 // Copies the given path, and optionally all subdirectories and their contents
121 // as well.
122 //
123 // If there are files existing under to_path, always overwrite. Returns true
124 // if successful, false otherwise. Wildcards on the names are not supported.
125 //
126 // This function has the same metadata behavior as CopyFile().
127 //
128 // If you only need to copy a file use CopyFile, it's faster.
129 BASE_EXPORT bool CopyDirectory(const FilePath& from_path,
130                                const FilePath& to_path,
131                                bool recursive);
132 
133 // Like CopyDirectory() except trying to overwrite an existing file will not
134 // work and will return false.
135 BASE_EXPORT bool CopyDirectoryExcl(const FilePath& from_path,
136                                    const FilePath& to_path,
137                                    bool recursive);
138 
139 // Returns true if the given path exists on the local filesystem,
140 // false otherwise.
141 BASE_EXPORT bool PathExists(const FilePath& path);
142 
143 // Returns true if the given path is writable by the user, false otherwise.
144 BASE_EXPORT bool PathIsWritable(const FilePath& path);
145 
146 // Returns true if the given path exists and is a directory, false otherwise.
147 BASE_EXPORT bool DirectoryExists(const FilePath& path);
148 
149 // Returns true if the contents of the two files given are equal, false
150 // otherwise.  If either file can't be read, returns false.
151 BASE_EXPORT bool ContentsEqual(const FilePath& filename1,
152                                const FilePath& filename2);
153 
154 // Returns true if the contents of the two text files given are equal, false
155 // otherwise.  This routine treats "\r\n" and "\n" as equivalent.
156 BASE_EXPORT bool TextContentsEqual(const FilePath& filename1,
157                                    const FilePath& filename2);
158 
159 // Reads the file at |path| into |contents| and returns true on success and
160 // false on error.  For security reasons, a |path| containing path traversal
161 // components ('..') is treated as a read error and |contents| is set to empty.
162 // In case of I/O error, |contents| holds the data that could be read from the
163 // file before the error occurred.
164 // |contents| may be NULL, in which case this function is useful for its side
165 // effect of priming the disk cache (could be used for unit tests).
166 BASE_EXPORT bool ReadFileToString(const FilePath& path, std::string* contents);
167 
168 // Reads the file at |path| into |contents| and returns true on success and
169 // false on error.  For security reasons, a |path| containing path traversal
170 // components ('..') is treated as a read error and |contents| is set to empty.
171 // In case of I/O error, |contents| holds the data that could be read from the
172 // file before the error occurred.  When the file size exceeds |max_size|, the
173 // function returns false with |contents| holding the file truncated to
174 // |max_size|.
175 // |contents| may be NULL, in which case this function is useful for its side
176 // effect of priming the disk cache (could be used for unit tests).
177 BASE_EXPORT bool ReadFileToStringWithMaxSize(const FilePath& path,
178                                              std::string* contents,
179                                              size_t max_size);
180 
181 #if defined(OS_POSIX) || defined(OS_FUCHSIA)
182 
183 // Read exactly |bytes| bytes from file descriptor |fd|, storing the result
184 // in |buffer|. This function is protected against EINTR and partial reads.
185 // Returns true iff |bytes| bytes have been successfully read from |fd|.
186 BASE_EXPORT bool ReadFromFD(int fd, char* buffer, size_t bytes);
187 
188 // Performs the same function as CreateAndOpenTemporaryFileInDir(), but returns
189 // the file-descriptor directly, rather than wrapping it into a FILE. Returns
190 // -1 on failure.
191 BASE_EXPORT int CreateAndOpenFdForTemporaryFileInDir(const FilePath& dir,
192                                                      FilePath* path);
193 
194 #endif  // OS_POSIX || OS_FUCHSIA
195 
196 #if defined(OS_POSIX)
197 
198 // Creates a symbolic link at |symlink| pointing to |target|.  Returns
199 // false on failure.
200 BASE_EXPORT bool CreateSymbolicLink(const FilePath& target,
201                                     const FilePath& symlink);
202 
203 // Reads the given |symlink| and returns where it points to in |target|.
204 // Returns false upon failure.
205 BASE_EXPORT bool ReadSymbolicLink(const FilePath& symlink, FilePath* target);
206 
207 // Bits and masks of the file permission.
208 enum FilePermissionBits {
209   FILE_PERMISSION_MASK              = S_IRWXU | S_IRWXG | S_IRWXO,
210   FILE_PERMISSION_USER_MASK         = S_IRWXU,
211   FILE_PERMISSION_GROUP_MASK        = S_IRWXG,
212   FILE_PERMISSION_OTHERS_MASK       = S_IRWXO,
213 
214   FILE_PERMISSION_READ_BY_USER      = S_IRUSR,
215   FILE_PERMISSION_WRITE_BY_USER     = S_IWUSR,
216   FILE_PERMISSION_EXECUTE_BY_USER   = S_IXUSR,
217   FILE_PERMISSION_READ_BY_GROUP     = S_IRGRP,
218   FILE_PERMISSION_WRITE_BY_GROUP    = S_IWGRP,
219   FILE_PERMISSION_EXECUTE_BY_GROUP  = S_IXGRP,
220   FILE_PERMISSION_READ_BY_OTHERS    = S_IROTH,
221   FILE_PERMISSION_WRITE_BY_OTHERS   = S_IWOTH,
222   FILE_PERMISSION_EXECUTE_BY_OTHERS = S_IXOTH,
223 };
224 
225 // Reads the permission of the given |path|, storing the file permission
226 // bits in |mode|. If |path| is symbolic link, |mode| is the permission of
227 // a file which the symlink points to.
228 BASE_EXPORT bool GetPosixFilePermissions(const FilePath& path, int* mode);
229 // Sets the permission of the given |path|. If |path| is symbolic link, sets
230 // the permission of a file which the symlink points to.
231 BASE_EXPORT bool SetPosixFilePermissions(const FilePath& path, int mode);
232 
233 // Returns true iff |executable| can be found in any directory specified by the
234 // environment variable in |env|.
235 BASE_EXPORT bool ExecutableExistsInPath(Environment* env,
236                                         const FilePath::StringType& executable);
237 
238 #if defined(OS_LINUX) || defined(OS_AIX)
239 // Determine if files under a given |path| can be mapped and then mprotect'd
240 // PROT_EXEC. This depends on the mount options used for |path|, which vary
241 // among different Linux distributions and possibly local configuration. It also
242 // depends on details of kernel--ChromeOS uses the noexec option for /dev/shm
243 // but its kernel allows mprotect with PROT_EXEC anyway.
244 BASE_EXPORT bool IsPathExecutable(const FilePath& path);
245 #endif  // OS_LINUX || OS_AIX
246 
247 #endif  // OS_POSIX
248 
249 // Returns true if the given directory is empty
250 BASE_EXPORT bool IsDirectoryEmpty(const FilePath& dir_path);
251 
252 // Get the temporary directory provided by the system.
253 //
254 // WARNING: In general, you should use CreateTemporaryFile variants below
255 // instead of this function. Those variants will ensure that the proper
256 // permissions are set so that other users on the system can't edit them while
257 // they're open (which can lead to security issues).
258 BASE_EXPORT bool GetTempDir(FilePath* path);
259 
260 // Get the home directory. This is more complicated than just getenv("HOME")
261 // as it knows to fall back on getpwent() etc.
262 //
263 // You should not generally call this directly. Instead use DIR_HOME with the
264 // path service which will use this function but cache the value.
265 // Path service may also override DIR_HOME.
266 BASE_EXPORT FilePath GetHomeDir();
267 
268 // Creates a temporary file. The full path is placed in |path|, and the
269 // function returns true if was successful in creating the file. The file will
270 // be empty and all handles closed after this function returns.
271 BASE_EXPORT bool CreateTemporaryFile(FilePath* path);
272 
273 // Same as CreateTemporaryFile but the file is created in |dir|.
274 BASE_EXPORT bool CreateTemporaryFileInDir(const FilePath& dir,
275                                           FilePath* temp_file);
276 
277 // Create and open a temporary file.  File is opened for read/write.
278 // The full path is placed in |path|.
279 // Returns a handle to the opened file or NULL if an error occurred.
280 BASE_EXPORT FILE* CreateAndOpenTemporaryFile(FilePath* path);
281 
282 // Similar to CreateAndOpenTemporaryFile, but the file is created in |dir|.
283 BASE_EXPORT FILE* CreateAndOpenTemporaryFileInDir(const FilePath& dir,
284                                                   FilePath* path);
285 
286 // Create a new directory. If prefix is provided, the new directory name is in
287 // the format of prefixyyyy.
288 // NOTE: prefix is ignored in the POSIX implementation.
289 // If success, return true and output the full path of the directory created.
290 BASE_EXPORT bool CreateNewTempDirectory(const FilePath::StringType& prefix,
291                                         FilePath* new_temp_path);
292 
293 // Create a directory within another directory.
294 // Extra characters will be appended to |prefix| to ensure that the
295 // new directory does not have the same name as an existing directory.
296 BASE_EXPORT bool CreateTemporaryDirInDir(const FilePath& base_dir,
297                                          const FilePath::StringType& prefix,
298                                          FilePath* new_dir);
299 
300 // Creates a directory, as well as creating any parent directories, if they
301 // don't exist. Returns 'true' on successful creation, or if the directory
302 // already exists.  The directory is only readable by the current user.
303 // Returns true on success, leaving *error unchanged.
304 // Returns false on failure and sets *error appropriately, if it is non-NULL.
305 BASE_EXPORT bool CreateDirectoryAndGetError(const FilePath& full_path,
306                                             File::Error* error);
307 
308 // Backward-compatible convenience method for the above.
309 BASE_EXPORT bool CreateDirectory(const FilePath& full_path);
310 
311 // Returns the file size. Returns true on success.
312 BASE_EXPORT bool GetFileSize(const FilePath& file_path, int64_t* file_size);
313 
314 // Sets |real_path| to |path| with symbolic links and junctions expanded.
315 // On windows, make sure the path starts with a lettered drive.
316 // |path| must reference a file.  Function will fail if |path| points to
317 // a directory or to a nonexistent path.  On windows, this function will
318 // fail if |path| is a junction or symlink that points to an empty file,
319 // or if |real_path| would be longer than MAX_PATH characters.
320 BASE_EXPORT bool NormalizeFilePath(const FilePath& path, FilePath* real_path);
321 
322 #if defined(OS_WIN)
323 
324 // Given a path in NT native form ("\Device\HarddiskVolumeXX\..."),
325 // return in |drive_letter_path| the equivalent path that starts with
326 // a drive letter ("C:\...").  Return false if no such path exists.
327 BASE_EXPORT bool DevicePathToDriveLetterPath(const FilePath& device_path,
328                                              FilePath* drive_letter_path);
329 
330 // Given an existing file in |path|, set |real_path| to the path
331 // in native NT format, of the form "\Device\HarddiskVolumeXX\..".
332 // Returns false if the path can not be found. Empty files cannot
333 // be resolved with this function.
334 BASE_EXPORT bool NormalizeToNativeFilePath(const FilePath& path,
335                                            FilePath* nt_path);
336 #endif
337 
338 // This function will return if the given file is a symlink or not.
339 BASE_EXPORT bool IsLink(const FilePath& file_path);
340 
341 // Returns information about the given file path.
342 BASE_EXPORT bool GetFileInfo(const FilePath& file_path, File::Info* info);
343 
344 // Sets the time of the last access and the time of the last modification.
345 BASE_EXPORT bool TouchFile(const FilePath& path,
346                            const Time& last_accessed,
347                            const Time& last_modified);
348 
349 // Wrapper for fopen-like calls. Returns non-NULL FILE* on success. The
350 // underlying file descriptor (POSIX) or handle (Windows) is unconditionally
351 // configured to not be propagated to child processes.
352 BASE_EXPORT FILE* OpenFile(const FilePath& filename, const char* mode);
353 
354 // Closes file opened by OpenFile. Returns true on success.
355 BASE_EXPORT bool CloseFile(FILE* file);
356 
357 // Associates a standard FILE stream with an existing File. Note that this
358 // functions take ownership of the existing File.
359 BASE_EXPORT FILE* FileToFILE(File file, const char* mode);
360 
361 // Truncates an open file to end at the location of the current file pointer.
362 // This is a cross-platform analog to Windows' SetEndOfFile() function.
363 BASE_EXPORT bool TruncateFile(FILE* file);
364 
365 // Reads at most the given number of bytes from the file into the buffer.
366 // Returns the number of read bytes, or -1 on error.
367 BASE_EXPORT int ReadFile(const FilePath& filename, char* data, int max_size);
368 
369 // Writes the given buffer into the file, overwriting any data that was
370 // previously there.  Returns the number of bytes written, or -1 on error.
371 BASE_EXPORT int WriteFile(const FilePath& filename, const char* data,
372                           int size);
373 
374 #if defined(OS_POSIX) || defined(OS_FUCHSIA)
375 // Appends |data| to |fd|. Does not close |fd| when done.  Returns true iff
376 // |size| bytes of |data| were written to |fd|.
377 BASE_EXPORT bool WriteFileDescriptor(const int fd, const char* data, int size);
378 #endif
379 
380 // Appends |data| to |filename|.  Returns true iff |size| bytes of |data| were
381 // written to |filename|.
382 BASE_EXPORT bool AppendToFile(const FilePath& filename,
383                               const char* data,
384                               int size);
385 
386 // Gets the current working directory for the process.
387 BASE_EXPORT bool GetCurrentDirectory(FilePath* path);
388 
389 // Sets the current working directory for the process.
390 BASE_EXPORT bool SetCurrentDirectory(const FilePath& path);
391 
392 // Attempts to find a number that can be appended to the |path| to make it
393 // unique. If |path| does not exist, 0 is returned.  If it fails to find such
394 // a number, -1 is returned. If |suffix| is not empty, also checks the
395 // existence of it with the given suffix.
396 BASE_EXPORT int GetUniquePathNumber(const FilePath& path,
397                                     const FilePath::StringType& suffix);
398 
399 // Sets the given |fd| to non-blocking mode.
400 // Returns true if it was able to set it in the non-blocking mode, otherwise
401 // false.
402 BASE_EXPORT bool SetNonBlocking(int fd);
403 
404 #if defined(OS_POSIX) || defined(OS_FUCHSIA)
405 // Creates a non-blocking, close-on-exec pipe.
406 // This creates a non-blocking pipe that is not intended to be shared with any
407 // child process. This will be done atomically if the operating system supports
408 // it. Returns true if it was able to create the pipe, otherwise false.
409 BASE_EXPORT bool CreateLocalNonBlockingPipe(int fds[2]);
410 
411 // Sets the given |fd| to close-on-exec mode.
412 // Returns true if it was able to set it in the close-on-exec mode, otherwise
413 // false.
414 BASE_EXPORT bool SetCloseOnExec(int fd);
415 
416 // Test that |path| can only be changed by a given user and members of
417 // a given set of groups.
418 // Specifically, test that all parts of |path| under (and including) |base|:
419 // * Exist.
420 // * Are owned by a specific user.
421 // * Are not writable by all users.
422 // * Are owned by a member of a given set of groups, or are not writable by
423 //   their group.
424 // * Are not symbolic links.
425 // This is useful for checking that a config file is administrator-controlled.
426 // |base| must contain |path|.
427 BASE_EXPORT bool VerifyPathControlledByUser(const base::FilePath& base,
428                                             const base::FilePath& path,
429                                             uid_t owner_uid,
430                                             const std::set<gid_t>& group_gids);
431 #endif  // defined(OS_POSIX) || defined(OS_FUCHSIA)
432 
433 #if defined(OS_MACOSX) && !defined(OS_IOS)
434 // Is |path| writable only by a user with administrator privileges?
435 // This function uses Mac OS conventions.  The super user is assumed to have
436 // uid 0, and the administrator group is assumed to be named "admin".
437 // Testing that |path|, and every parent directory including the root of
438 // the filesystem, are owned by the superuser, controlled by the group
439 // "admin", are not writable by all users, and contain no symbolic links.
440 // Will return false if |path| does not exist.
441 BASE_EXPORT bool VerifyPathControlledByAdmin(const base::FilePath& path);
442 #endif  // defined(OS_MACOSX) && !defined(OS_IOS)
443 
444 // Returns the maximum length of path component on the volume containing
445 // the directory |path|, in the number of FilePath::CharType, or -1 on failure.
446 BASE_EXPORT int GetMaximumPathComponentLength(const base::FilePath& path);
447 
448 #if defined(OS_LINUX) || defined(OS_AIX)
449 // Broad categories of file systems as returned by statfs() on Linux.
450 enum FileSystemType {
451   FILE_SYSTEM_UNKNOWN,  // statfs failed.
452   FILE_SYSTEM_0,        // statfs.f_type == 0 means unknown, may indicate AFS.
453   FILE_SYSTEM_ORDINARY,       // on-disk filesystem like ext2
454   FILE_SYSTEM_NFS,
455   FILE_SYSTEM_SMB,
456   FILE_SYSTEM_CODA,
457   FILE_SYSTEM_MEMORY,         // in-memory file system
458   FILE_SYSTEM_CGROUP,         // cgroup control.
459   FILE_SYSTEM_OTHER,          // any other value.
460   FILE_SYSTEM_TYPE_COUNT
461 };
462 
463 // Attempts determine the FileSystemType for |path|.
464 // Returns false if |path| doesn't exist.
465 BASE_EXPORT bool GetFileSystemType(const FilePath& path, FileSystemType* type);
466 #endif
467 
468 #if defined(OS_POSIX) || defined(OS_FUCHSIA)
469 // Get a temporary directory for shared memory files. The directory may depend
470 // on whether the destination is intended for executable files, which in turn
471 // depends on how /dev/shmem was mounted. As a result, you must supply whether
472 // you intend to create executable shmem segments so this function can find
473 // an appropriate location.
474 BASE_EXPORT bool GetShmemTempDir(bool executable, FilePath* path);
475 #endif
476 
477 // Internal --------------------------------------------------------------------
478 
479 namespace internal {
480 
481 // Same as Move but allows paths with traversal components.
482 // Use only with extreme care.
483 BASE_EXPORT bool MoveUnsafe(const FilePath& from_path,
484                             const FilePath& to_path);
485 
486 #if defined(OS_WIN)
487 // Copy from_path to to_path recursively and then delete from_path recursively.
488 // Returns true if all operations succeed.
489 // This function simulates Move(), but unlike Move() it works across volumes.
490 // This function is not transactional.
491 BASE_EXPORT bool CopyAndDeleteDirectory(const FilePath& from_path,
492                                         const FilePath& to_path);
493 #endif  // defined(OS_WIN)
494 
495 }  // namespace internal
496 }  // namespace base
497 
498 #endif  // BASE_FILES_FILE_UTIL_H_
499