2 * Utility routines used in rsync.
4 * Copyright (C) 1996-2000 Andrew Tridgell
5 * Copyright (C) 1996 Paul Mackerras
6 * Copyright (C) 2001, 2002 Martin Pool <mbp@samba.org>
7 * Copyright (C) 2003-2020 Wayne Davison
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 3 of the License, or
12 * (at your option) any later version.
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
19 * You should have received a copy of the GNU General Public License along
20 * with this program; if not, visit the http://fsf.org website.
30 extern int protect_args
;
31 extern int modify_window
;
32 extern int relative_paths
;
33 extern int preserve_times
;
34 extern int preserve_xattrs
;
35 extern int preallocate_files
;
36 extern char *module_dir
;
37 extern unsigned int module_dirlen
;
38 extern char *partial_dir
;
39 extern filter_rule_list daemon_filter_list
;
41 int sanitize_paths
= 0;
43 char curr_dir
[MAXPATHLEN
];
44 unsigned int curr_dir_len
;
45 int curr_dir_depth
; /* This is only set for a sanitizing daemon. */
47 /* Set a fd into nonblocking mode. */
48 void set_nonblocking(int fd
)
52 if ((val
= fcntl(fd
, F_GETFL
)) == -1)
54 if (!(val
& NONBLOCK_FLAG
)) {
56 fcntl(fd
, F_SETFL
, val
);
60 /* Set a fd into blocking mode. */
61 void set_blocking(int fd
)
65 if ((val
= fcntl(fd
, F_GETFL
)) == -1)
67 if (val
& NONBLOCK_FLAG
) {
68 val
&= ~NONBLOCK_FLAG
;
69 fcntl(fd
, F_SETFL
, val
);
74 * Create a file descriptor pair - like pipe() but use socketpair if
75 * possible (because of blocking issues on pipes).
77 * Always set non-blocking.
79 int fd_pair(int fd
[2])
83 #ifdef HAVE_SOCKETPAIR
84 ret
= socketpair(AF_UNIX
, SOCK_STREAM
, 0, fd
);
90 set_nonblocking(fd
[0]);
91 set_nonblocking(fd
[1]);
97 void print_child_argv(const char *prefix
, char **cmd
)
100 rprintf(FCLIENT
, "%s ", prefix
);
101 for (; *cmd
; cmd
++) {
102 /* Look for characters that ought to be quoted. This
103 * is not a great quoting algorithm, but it's
104 * sufficient for a log message. */
105 if (strspn(*cmd
, "abcdefghijklmnopqrstuvwxyz"
106 "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
108 ",.-_=+@/") != strlen(*cmd
)) {
109 rprintf(FCLIENT
, "\"%s\" ", *cmd
);
111 rprintf(FCLIENT
, "%s ", *cmd
);
115 rprintf(FCLIENT
, " (%d args)\n", cnt
);
118 /* This returns 0 for success, 1 for a symlink if symlink time-setting
119 * is not possible, or -1 for any other error. */
120 int set_times(const char *fname
, STRUCT_STAT
*stp
)
122 static int switch_step
= 0;
124 if (DEBUG_GTE(TIME
, 1)) {
126 "set modtime, atime of %s to (%ld) %s, (%ld) %s\n",
127 fname
, (long)stp
->st_mtime
,
128 timestring(stp
->st_mtime
), (long)stp
->st_atime
, timestring(stp
->st_atime
));
131 switch (switch_step
) {
132 #ifdef HAVE_SETATTRLIST
134 if (do_setattrlist_times(fname
, stp
) == 0)
141 #ifdef HAVE_UTIMENSAT
143 if (do_utimensat(fname
, stp
) == 0)
152 if (do_lutimes(fname
, stp
) == 0)
161 if (preserve_times
& PRESERVE_LINK_TIMES
) {
162 preserve_times
&= ~PRESERVE_LINK_TIMES
;
163 if (S_ISLNK(stp
->st_mode
))
169 if (do_utimes(fname
, stp
) == 0)
172 if (do_utime(fname
, stp
) == 0)
182 /* Create any necessary directories in fname. Any missing directories are
183 * created with default permissions. Returns < 0 on error, or the number
184 * of directories created. */
185 int make_path(char *fname
, int flags
)
190 if (flags
& MKP_SKIP_SLASH
) {
191 while (*fname
== '/')
195 while (*fname
== '.' && fname
[1] == '/')
198 if (flags
& MKP_DROP_NAME
) {
199 end
= strrchr(fname
, '/');
200 if (!end
|| end
== fname
)
204 end
= fname
+ strlen(fname
);
206 /* Try to find an existing dir, starting from the deepest dir. */
210 if (do_stat(fname
, &st
) == 0) {
211 if (S_ISDIR(st
.st_mode
))
216 } else if (do_mkdir(fname
, ACCESSPERMS
) == 0) {
221 if (errno
!= ENOENT
) {
223 if (errno
!= EEXIST
|| (do_stat(fname
, &st
) == 0 && !S_ISDIR(st
.st_mode
)))
229 /* We got a relative path that doesn't exist, so assume that '.'
230 * is there and just break out and create the whole thing. */
236 /* We reached the "/" dir, which we assume is there. */
246 /* Make all the dirs that we didn't find on the way here. */
253 if (ret
< 0) /* Skip mkdir on error, but keep restoring the path. */
255 if (do_mkdir(fname
, ACCESSPERMS
) < 0)
261 if (flags
& MKP_DROP_NAME
)
268 * Write @p len bytes at @p ptr to descriptor @p desc, retrying if
271 * @retval len upon success
273 * @retval <0 write's (negative) error code
275 * Derived from GNU C's cccp.c.
277 int full_write(int desc
, const char *ptr
, size_t len
)
283 int written
= write(desc
, ptr
, len
);
289 total_written
+= written
;
293 return total_written
;
297 * Read @p len bytes at @p ptr from descriptor @p desc, retrying if
300 * @retval >0 the actual number of bytes read
304 * @retval <0 for an error.
306 * Derived from GNU C's cccp.c. */
307 static int safe_read(int desc
, char *ptr
, size_t len
)
315 n_chars
= read(desc
, ptr
, len
);
316 } while (n_chars
< 0 && errno
== EINTR
);
321 /* Copy a file. If ofd < 0, copy_file unlinks and opens the "dest" file.
322 * Otherwise, it just writes to and closes the provided file descriptor.
323 * In either case, if --xattrs are being preserved, the dest file will
324 * have its xattrs set from the source file.
326 * This is used in conjunction with the --temp-dir, --backup, and
327 * --copy-dest options. */
328 int copy_file(const char *source
, const char *dest
, int ofd
, mode_t mode
)
332 int len
; /* Number of bytes read into `buf'. */
333 OFF_T prealloc_len
= 0, offset
= 0;
335 if ((ifd
= do_open(source
, O_RDONLY
, 0)) < 0) {
336 int save_errno
= errno
;
337 rsyserr(FERROR_XFER
, errno
, "open %s", full_fname(source
));
343 if (robust_unlink(dest
) && errno
!= ENOENT
) {
344 int save_errno
= errno
;
345 rsyserr(FERROR_XFER
, errno
, "unlink %s", full_fname(dest
));
351 #ifdef SUPPORT_XATTRS
355 mode
&= INITACCESSPERMS
;
356 if ((ofd
= do_open(dest
, O_WRONLY
| O_CREAT
| O_TRUNC
| O_EXCL
, mode
)) < 0) {
357 int save_errno
= errno
;
358 rsyserr(FERROR_XFER
, save_errno
, "open %s", full_fname(dest
));
365 #ifdef SUPPORT_PREALLOCATION
366 if (preallocate_files
) {
369 /* Try to preallocate enough space for file's eventual length. Can
370 * reduce fragmentation on filesystems like ext4, xfs, and NTFS. */
371 if (do_fstat(ifd
, &srcst
) < 0)
372 rsyserr(FWARNING
, errno
, "fstat %s", full_fname(source
));
373 else if (srcst
.st_size
> 0) {
374 prealloc_len
= do_fallocate(ofd
, 0, srcst
.st_size
);
375 if (prealloc_len
< 0)
376 rsyserr(FWARNING
, errno
, "do_fallocate %s", full_fname(dest
));
381 while ((len
= safe_read(ifd
, buf
, sizeof buf
)) > 0) {
382 if (full_write(ofd
, buf
, len
) < 0) {
383 int save_errno
= errno
;
384 rsyserr(FERROR_XFER
, errno
, "write %s", full_fname(dest
));
394 int save_errno
= errno
;
395 rsyserr(FERROR_XFER
, errno
, "read %s", full_fname(source
));
402 if (close(ifd
) < 0) {
403 rsyserr(FWARNING
, errno
, "close failed on %s",
407 /* Source file might have shrunk since we fstatted it.
408 * Cut off any extra preallocated zeros from dest file. */
409 if (offset
< prealloc_len
&& do_ftruncate(ofd
, offset
) < 0) {
410 /* If we fail to truncate, the dest file may be wrong, so we
411 * must trigger the "partial transfer" error. */
412 rsyserr(FERROR_XFER
, errno
, "ftruncate %s", full_fname(dest
));
415 if (close(ofd
) < 0) {
416 int save_errno
= errno
;
417 rsyserr(FERROR_XFER
, errno
, "close failed on %s",
423 #ifdef SUPPORT_XATTRS
425 copy_xattrs(source
, dest
);
431 /* MAX_RENAMES should be 10**MAX_RENAMES_DIGITS */
432 #define MAX_RENAMES_DIGITS 3
433 #define MAX_RENAMES 1000
436 * Robust unlink: some OSes (HPUX) refuse to unlink busy files, so
437 * rename to <path>/.rsyncNNN instead.
439 * Note that successive rsync runs will shuffle the filenames around a
440 * bit as long as the file is still busy; this is because this function
441 * does not know if the unlink call is due to a new file coming in, or
442 * --delete trying to remove old .rsyncNNN files, hence it renames it
445 int robust_unlink(const char *fname
)
448 return do_unlink(fname
);
450 static int counter
= 1;
452 char path
[MAXPATHLEN
];
454 rc
= do_unlink(fname
);
455 if (rc
== 0 || errno
!= ETXTBSY
)
458 if ((pos
= strlcpy(path
, fname
, MAXPATHLEN
)) >= MAXPATHLEN
)
459 pos
= MAXPATHLEN
- 1;
461 while (pos
> 0 && path
[pos
-1] != '/')
463 pos
+= strlcpy(path
+pos
, ".rsync", MAXPATHLEN
-pos
);
465 if (pos
> (MAXPATHLEN
-MAX_RENAMES_DIGITS
-1)) {
470 /* start where the last one left off to reduce chance of clashes */
473 snprintf(&path
[pos
], MAX_RENAMES_DIGITS
+1, "%03d", counter
);
474 if (++counter
>= MAX_RENAMES
)
476 } while ((rc
= access(path
, 0)) == 0 && counter
!= start
);
478 if (INFO_GTE(MISC
, 1)) {
479 rprintf(FWARNING
, "renaming %s to %s because of text busy\n",
483 /* maybe we should return rename()'s exit status? Nah. */
484 if (do_rename(fname
, path
) != 0) {
492 /* Returns 0 on successful rename, 1 if we successfully copied the file
493 * across filesystems, -2 if copy_file() failed, and -1 on other errors.
494 * If partialptr is not NULL and we need to do a copy, copy the file into
495 * the active partial-dir instead of over the destination file. */
496 int robust_rename(const char *from
, const char *to
, const char *partialptr
,
501 /* A resumed in-place partial-dir transfer might call us with from and
502 * to pointing to the same buf if the transfer failed yet again. */
507 if (do_rename(from
, to
) == 0)
513 if (robust_unlink(to
) != 0) {
522 if (!handle_partial_dir(partialptr
,PDIR_CREATE
))
526 if (copy_file(from
, to
, -1, mode
) != 0)
537 static pid_t all_pids
[10];
540 /** Fork and record the pid of the child. **/
543 pid_t newpid
= fork();
545 if (newpid
!= 0 && newpid
!= -1) {
546 all_pids
[num_pids
++] = newpid
;
554 * @todo It would be kind of nice to make sure that they are actually
555 * all our children before we kill them, because their pids may have
556 * been recycled by some other process. Perhaps when we wait for a
557 * child, we should remove it from this array. Alternatively we could
558 * perhaps use process groups, but I think that would not work on
559 * ancient Unix versions that don't support them.
561 void kill_all(int sig
)
565 for (i
= 0; i
< num_pids
; i
++) {
566 /* Let's just be a little careful where we
567 * point that gun, hey? See kill(2) for the
568 * magic caused by negative values. */
569 pid_t p
= all_pids
[i
];
580 /** Lock a byte range in an open file */
581 int lock_range(int fd
, int offset
, int len
)
585 lock
.l_type
= F_WRLCK
;
586 lock
.l_whence
= SEEK_SET
;
587 lock
.l_start
= offset
;
591 return fcntl(fd
,F_SETLK
,&lock
) == 0;
594 #define ENSURE_MEMSPACE(buf, type, sz, req) \
595 if ((req) > sz && !(buf = realloc_array(buf, type, sz = MAX(sz * 2, req)))) \
596 out_of_memory("glob_expand")
598 static inline void call_glob_match(const char *name
, int len
, int from_glob
,
599 char *arg
, int abpos
, int fbpos
);
601 static struct glob_data
{
602 char *arg_buf
, *filt_buf
, **argv
;
603 int absize
, fbsize
, maxargs
, argc
;
606 static void glob_match(char *arg
, int abpos
, int fbpos
)
611 while (*arg
== '.' && arg
[1] == '/') {
613 ENSURE_MEMSPACE(glob
.filt_buf
, char, glob
.fbsize
, glob
.absize
);
614 memcpy(glob
.filt_buf
, glob
.arg_buf
, abpos
+ 1);
617 ENSURE_MEMSPACE(glob
.arg_buf
, char, glob
.absize
, abpos
+ 3);
618 glob
.arg_buf
[abpos
++] = *arg
++;
619 glob
.arg_buf
[abpos
++] = *arg
++;
620 glob
.arg_buf
[abpos
] = '\0';
622 if ((slash
= strchr(arg
, '/')) != NULL
) {
627 if (strpbrk(arg
, "*?[")) {
631 if (!(d
= opendir(abpos
? glob
.arg_buf
: ".")))
633 while ((di
= readdir(d
)) != NULL
) {
634 char *dname
= d_name(di
);
635 if (dname
[0] == '.' && (dname
[1] == '\0'
636 || (dname
[1] == '.' && dname
[2] == '\0')))
638 if (!wildmatch(arg
, dname
))
640 call_glob_match(dname
, strlen(dname
), 1,
641 slash
? arg
+ len
+ 1 : NULL
,
646 call_glob_match(arg
, len
, 0,
647 slash
? arg
+ len
+ 1 : NULL
,
654 static inline void call_glob_match(const char *name
, int len
, int from_glob
,
655 char *arg
, int abpos
, int fbpos
)
659 ENSURE_MEMSPACE(glob
.arg_buf
, char, glob
.absize
, abpos
+ len
+ 2);
660 memcpy(glob
.arg_buf
+ abpos
, name
, len
);
662 glob
.arg_buf
[abpos
] = '\0';
665 ENSURE_MEMSPACE(glob
.filt_buf
, char, glob
.fbsize
, fbpos
+ len
+ 2);
666 memcpy(glob
.filt_buf
+ fbpos
, name
, len
);
668 glob
.filt_buf
[fbpos
] = '\0';
669 use_buf
= glob
.filt_buf
;
671 use_buf
= glob
.arg_buf
;
673 if (from_glob
|| (arg
&& len
)) {
677 if (do_stat(glob
.arg_buf
, &st
) != 0)
679 is_dir
= S_ISDIR(st
.st_mode
) != 0;
683 if (daemon_filter_list
.head
684 && check_filter(&daemon_filter_list
, FLOG
, use_buf
, is_dir
) < 0)
689 glob
.arg_buf
[abpos
++] = '/';
690 glob
.arg_buf
[abpos
] = '\0';
692 glob
.filt_buf
[fbpos
++] = '/';
693 glob
.filt_buf
[fbpos
] = '\0';
695 glob_match(arg
, abpos
, fbpos
);
697 ENSURE_MEMSPACE(glob
.argv
, char *, glob
.maxargs
, glob
.argc
+ 1);
698 if (!(glob
.argv
[glob
.argc
++] = strdup(glob
.arg_buf
)))
699 out_of_memory("glob_match");
703 /* This routine performs wild-card expansion of the pathname in "arg". Any
704 * daemon-excluded files/dirs will not be matched by the wildcards. Returns 0
705 * if a wild-card string is the only returned item (due to matching nothing). */
706 int glob_expand(const char *arg
, char ***argv_p
, int *argc_p
, int *maxargs_p
)
715 memset(&glob
, 0, sizeof glob
);
720 s
= sanitize_path(NULL
, arg
, "", 0, SP_KEEP_DOT_DIRS
);
724 out_of_memory("glob_expand");
725 clean_fname(s
, CFN_KEEP_DOT_DIRS
726 | CFN_KEEP_TRAILING_SLASH
727 | CFN_COLLAPSE_DOT_DOT_DIRS
);
730 ENSURE_MEMSPACE(glob
.arg_buf
, char, glob
.absize
, MAXPATHLEN
);
731 *glob
.arg_buf
= '\0';
733 glob
.argc
= save_argc
= *argc_p
;
735 glob
.maxargs
= *maxargs_p
;
737 ENSURE_MEMSPACE(glob
.argv
, char *, glob
.maxargs
, 100);
739 glob_match(s
, 0, -1);
741 /* The arg didn't match anything, so add the failed arg to the list. */
742 if (glob
.argc
== save_argc
) {
743 ENSURE_MEMSPACE(glob
.argv
, char *, glob
.maxargs
, glob
.argc
+ 1);
744 glob
.argv
[glob
.argc
++] = s
;
751 *maxargs_p
= glob
.maxargs
;
758 /* This routine is only used in daemon mode. */
759 void glob_expand_module(char *base1
, char *arg
, char ***argv_p
, int *argc_p
, int *maxargs_p
)
763 int base_len
= strlen(base
);
768 if (strncmp(arg
, base
, base_len
) == 0)
772 glob_expand(arg
, argv_p
, argc_p
, maxargs_p
);
776 if (!(arg
= strdup(arg
)))
777 out_of_memory("glob_expand_module");
779 if (asprintf(&base
," %s/", base1
) < 0)
780 out_of_memory("glob_expand_module");
783 for (s
= arg
; *s
; s
= p
+ base_len
) {
784 if ((p
= strstr(s
, base
)) != NULL
)
785 *p
= '\0'; /* split it at this point */
786 glob_expand(s
, argv_p
, argc_p
, maxargs_p
);
796 * Convert a string to lower case
798 void strlower(char *s
)
808 * Split a string into tokens based (usually) on whitespace & commas. If the
809 * string starts with a comma (after skipping any leading whitespace), then
810 * splitting is done only on commas. No empty tokens are ever returned. */
811 char *conf_strtok(char *str
)
813 static int commas_only
= 0;
816 while (isSpace(str
)) str
++;
824 while (commas_only
) {
825 char *end
, *tok
= strtok(str
, ",");
828 /* Trim just leading and trailing whitespace. */
831 end
= tok
+ strlen(tok
);
832 while (end
> tok
&& isSpace(end
-1))
839 return strtok(str
, " ,\t\r\n");
842 /* Join strings p1 & p2 into "dest" with a guaranteed '/' between them. (If
843 * p1 ends with a '/', no extra '/' is inserted.) Returns the length of both
844 * strings + 1 (if '/' was inserted), regardless of whether the null-terminated
845 * string fits into destsize. */
846 size_t pathjoin(char *dest
, size_t destsize
, const char *p1
, const char *p2
)
848 size_t len
= strlcpy(dest
, p1
, destsize
);
849 if (len
< destsize
- 1) {
850 if (!len
|| dest
[len
-1] != '/')
852 if (len
< destsize
- 1)
853 len
+= strlcpy(dest
+ len
, p2
, destsize
- len
);
860 len
+= strlen(p2
) + 1; /* Assume we'd insert a '/'. */
864 /* Join any number of strings together, putting them in "dest". The return
865 * value is the length of all the strings, regardless of whether the null-
866 * terminated whole fits in destsize. Your list of string pointers must end
867 * with a NULL to indicate the end of the list. */
868 size_t stringjoin(char *dest
, size_t destsize
, ...)
874 va_start(ap
, destsize
);
876 if (!(src
= va_arg(ap
, const char *)))
883 memcpy(dest
, src
, len
);
894 int count_dir_elements(const char *p
)
896 int cnt
= 0, new_component
= 1;
899 new_component
= (*p
!= '.' || (p
[1] != '/' && p
[1] != '\0'));
900 else if (new_component
) {
908 /* Turns multiple adjacent slashes into a single slash (possible exception:
909 * the preserving of two leading slashes at the start), drops all leading or
910 * interior "." elements unless CFN_KEEP_DOT_DIRS is flagged. Will also drop
911 * a trailing '.' after a '/' if CFN_DROP_TRAILING_DOT_DIR is flagged, removes
912 * a trailing slash (perhaps after removing the aforementioned dot) unless
913 * CFN_KEEP_TRAILING_SLASH is flagged, and will also collapse ".." elements
914 * (except at the start) if CFN_COLLAPSE_DOT_DOT_DIRS is flagged. If the
915 * resulting name would be empty, returns ".". */
916 int clean_fname(char *name
, int flags
)
918 char *limit
= name
- 1, *t
= name
, *f
= name
;
924 #define DOT_IS_DOT_DOT_DIR(bp) (bp[1] == '.' && (bp[2] == '/' || !bp[2]))
926 if ((anchored
= *f
== '/') != 0) {
929 /* If there are exactly 2 slashes at the start, preserve
930 * them. Would break daemon excludes unless the paths are
931 * really treated differently, so use this sparingly. */
932 if (*f
== '/' && f
[1] != '/')
935 } else if (flags
& CFN_KEEP_DOT_DIRS
&& *f
== '.' && f
[1] == '/') {
938 } else if (flags
& CFN_REFUSE_DOT_DOT_DIRS
&& *f
== '.' && DOT_IS_DOT_DOT_DIR(f
))
941 /* discard extra slashes */
947 /* discard interior "." dirs */
948 if (f
[1] == '/' && !(flags
& CFN_KEEP_DOT_DIRS
)) {
952 if (f
[1] == '\0' && flags
& CFN_DROP_TRAILING_DOT_DIR
)
954 /* collapse ".." dirs */
955 if (flags
& (CFN_COLLAPSE_DOT_DOT_DIRS
|CFN_REFUSE_DOT_DOT_DIRS
) && DOT_IS_DOT_DOT_DIR(f
)) {
957 if (flags
& CFN_REFUSE_DOT_DOT_DIRS
)
959 if (s
== name
&& anchored
) {
963 while (s
> limit
&& *--s
!= '/') {}
964 if (s
!= t
- 1 && (s
< name
|| *s
== '/')) {
972 while (*f
&& (*t
++ = *f
++) != '/') {}
975 if (t
> name
+anchored
&& t
[-1] == '/' && !(flags
& CFN_KEEP_TRAILING_SLASH
))
981 #undef DOT_IS_DOT_DOT_DIR
986 /* Make path appear as if a chroot had occurred. This handles a leading
987 * "/" (either removing it or expanding it) and any leading or embedded
988 * ".." components that attempt to escape past the module's top dir.
990 * If dest is NULL, a buffer is allocated to hold the result. It is legal
991 * to call with the dest and the path (p) pointing to the same buffer, but
992 * rootdir will be ignored to avoid expansion of the string.
994 * The rootdir string contains a value to use in place of a leading slash.
995 * Specify NULL to get the default of "module_dir".
997 * The depth var is a count of how many '..'s to allow at the start of the
1000 * We also clean the path in a manner similar to clean_fname() but with a
1003 * Turns multiple adjacent slashes into a single slash, gets rid of "." dir
1004 * elements (INCLUDING a trailing dot dir), PRESERVES a trailing slash, and
1005 * ALWAYS collapses ".." elements (except for those at the start of the
1006 * string up to "depth" deep). If the resulting name would be empty,
1007 * change it into a ".". */
1008 char *sanitize_path(char *dest
, const char *p
, const char *rootdir
, int depth
,
1012 int rlen
= 0, drop_dot_dirs
= !relative_paths
|| !(flags
& SP_KEEP_DOT_DIRS
);
1015 int plen
= strlen(p
); /* the path len INCLUDING any separating slash */
1018 rootdir
= module_dir
;
1019 rlen
= strlen(rootdir
);
1024 if (rlen
+ plen
+ 1 >= MAXPATHLEN
)
1026 } else if (!(dest
= new_array(char, MAX(rlen
+ plen
+ 1, 2))))
1027 out_of_memory("sanitize_path");
1028 if (rlen
) { /* only true if p previously started with a slash */
1029 memcpy(dest
, rootdir
, rlen
);
1030 if (rlen
> 1) /* a rootdir of len 1 is "/", so this avoids a 2nd slash */
1035 if (drop_dot_dirs
) {
1036 while (*p
== '.' && p
[1] == '/')
1040 start
= sanp
= dest
+ rlen
;
1041 /* This loop iterates once per filename component in p, pointing at
1042 * the start of the name (past any prior slash) for each iteration. */
1044 /* discard leading or extra slashes */
1049 if (drop_dot_dirs
) {
1050 if (*p
== '.' && (p
[1] == '/' || p
[1] == '\0')) {
1051 /* skip "." component */
1056 if (*p
== '.' && p
[1] == '.' && (p
[2] == '/' || p
[2] == '\0')) {
1057 /* ".." component followed by slash or end */
1058 if (depth
<= 0 || sanp
!= start
) {
1060 if (sanp
!= start
) {
1061 /* back up sanp one level */
1062 --sanp
; /* now pointing at slash */
1063 while (sanp
> start
&& sanp
[-1] != '/')
1068 /* allow depth levels of .. at the beginning */
1070 /* move the virtual beginning to leave the .. alone */
1073 /* copy one component through next slash */
1074 while (*p
&& (*sanp
++ = *p
++) != '/') {}
1077 /* ended up with nothing, so put in "." component */
1085 /* Like chdir(), but it keeps track of the current directory (in the
1086 * global "curr_dir"), and ensures that the path size doesn't overflow.
1087 * Also cleans the path using the clean_fname() function. */
1088 int change_dir(const char *dir
, int set_path_only
)
1090 static int initialised
, skipped_chdir
;
1095 if (getcwd(curr_dir
, sizeof curr_dir
- 1) == NULL
) {
1096 rsyserr(FERROR
, errno
, "getcwd()");
1097 exit_cleanup(RERR_FILESELECT
);
1099 curr_dir_len
= strlen(curr_dir
);
1102 if (!dir
) /* this call was probably just to initialize */
1106 if (len
== 1 && *dir
== '.' && (!skipped_chdir
|| set_path_only
))
1110 if (len
>= sizeof curr_dir
) {
1111 errno
= ENAMETOOLONG
;
1114 if (!set_path_only
&& chdir(dir
))
1116 skipped_chdir
= set_path_only
;
1117 memcpy(curr_dir
, dir
, len
+ 1);
1119 unsigned int save_dir_len
= curr_dir_len
;
1120 if (curr_dir_len
+ 1 + len
>= sizeof curr_dir
) {
1121 errno
= ENAMETOOLONG
;
1124 if (!(curr_dir_len
&& curr_dir
[curr_dir_len
-1] == '/'))
1125 curr_dir
[curr_dir_len
++] = '/';
1126 memcpy(curr_dir
+ curr_dir_len
, dir
, len
+ 1);
1128 if (!set_path_only
&& chdir(curr_dir
)) {
1129 curr_dir_len
= save_dir_len
;
1130 curr_dir
[curr_dir_len
] = '\0';
1133 skipped_chdir
= set_path_only
;
1136 curr_dir_len
= clean_fname(curr_dir
, CFN_COLLAPSE_DOT_DOT_DIRS
| CFN_DROP_TRAILING_DOT_DIR
);
1137 if (sanitize_paths
) {
1138 if (module_dirlen
> curr_dir_len
)
1139 module_dirlen
= curr_dir_len
;
1140 curr_dir_depth
= count_dir_elements(curr_dir
+ module_dirlen
);
1143 if (DEBUG_GTE(CHDIR
, 1) && !set_path_only
)
1144 rprintf(FINFO
, "[%s] change_dir(%s)\n", who_am_i(), curr_dir
);
1149 /* This will make a relative path absolute and clean it up via clean_fname().
1150 * Returns the string, which might be newly allocated, or NULL on error. */
1151 char *normalize_path(char *path
, BOOL force_newbuf
, unsigned int *len_ptr
)
1155 if (*path
!= '/') { /* Make path absolute. */
1156 int len
= strlen(path
);
1157 if (curr_dir_len
+ 1 + len
>= sizeof curr_dir
)
1159 curr_dir
[curr_dir_len
] = '/';
1160 memcpy(curr_dir
+ curr_dir_len
+ 1, path
, len
+ 1);
1161 if (!(path
= strdup(curr_dir
)))
1162 out_of_memory("normalize_path");
1163 curr_dir
[curr_dir_len
] = '\0';
1164 } else if (force_newbuf
) {
1165 if (!(path
= strdup(path
)))
1166 out_of_memory("normalize_path");
1169 len
= clean_fname(path
, CFN_COLLAPSE_DOT_DOT_DIRS
| CFN_DROP_TRAILING_DOT_DIR
);
1178 * Return a quoted string with the full pathname of the indicated filename.
1179 * The string " (in MODNAME)" may also be appended. The returned pointer
1180 * remains valid until the next time full_fname() is called.
1182 char *full_fname(const char *fn
)
1184 static char *result
= NULL
;
1194 p1
= curr_dir
+ module_dirlen
;
1195 for (p2
= p1
; *p2
== '/'; p2
++) {}
1199 if (module_id
>= 0) {
1201 m2
= lp_name(module_id
);
1206 if (asprintf(&result
, "\"%s%s%s\"%s%s%s", p1
, p2
, fn
, m1
, m2
, m3
) < 0)
1207 out_of_memory("full_fname");
1212 static char partial_fname
[MAXPATHLEN
];
1214 char *partial_dir_fname(const char *fname
)
1216 char *t
= partial_fname
;
1217 int sz
= sizeof partial_fname
;
1220 if ((fn
= strrchr(fname
, '/')) != NULL
) {
1222 if (*partial_dir
!= '/') {
1223 int len
= fn
- fname
;
1224 strncpy(t
, fname
, len
); /* safe */
1230 if ((int)pathjoin(t
, sz
, partial_dir
, fn
) >= sz
)
1232 if (daemon_filter_list
.head
) {
1233 t
= strrchr(partial_fname
, '/');
1235 if (check_filter(&daemon_filter_list
, FLOG
, partial_fname
, 1) < 0)
1238 if (check_filter(&daemon_filter_list
, FLOG
, partial_fname
, 0) < 0)
1242 return partial_fname
;
1245 /* If no --partial-dir option was specified, we don't need to do anything
1246 * (the partial-dir is essentially '.'), so just return success. */
1247 int handle_partial_dir(const char *fname
, int create
)
1251 if (fname
!= partial_fname
)
1253 if (!create
&& *partial_dir
== '/')
1255 if (!(fn
= strrchr(partial_fname
, '/')))
1259 dir
= partial_fname
;
1262 int statret
= do_lstat(dir
, &st
);
1263 if (statret
== 0 && !S_ISDIR(st
.st_mode
)) {
1264 if (do_unlink(dir
) < 0) {
1270 if (statret
< 0 && do_mkdir(dir
, 0700) < 0) {
1281 /* Determine if a symlink points outside the current directory tree.
1282 * This is considered "unsafe" because e.g. when mirroring somebody
1283 * else's machine it might allow them to establish a symlink to
1284 * /etc/passwd, and then read it through a web server.
1286 * Returns 1 if unsafe, 0 if safe.
1288 * Null symlinks and absolute symlinks are always unsafe.
1290 * Basically here we are concerned with symlinks whose target contains
1291 * "..", because this might cause us to walk back up out of the
1292 * transferred directory. We are not allowed to go back up and
1295 * "dest" is the target of the symlink in question.
1297 * "src" is the top source directory currently applicable at the level
1298 * of the referenced symlink. This is usually the symlink's full path
1299 * (including its name), as referenced from the root of the transfer. */
1300 int unsafe_symlink(const char *dest
, const char *src
)
1302 const char *name
, *slash
;
1305 /* all absolute and null symlinks are unsafe */
1306 if (!dest
|| !*dest
|| *dest
== '/')
1309 /* find out what our safety margin is */
1310 for (name
= src
; (slash
= strchr(name
, '/')) != 0; name
= slash
+1) {
1311 /* ".." segment starts the count over. "." segment is ignored. */
1312 if (*name
== '.' && (name
[1] == '/' || (name
[1] == '.' && name
[2] == '/'))) {
1317 while (slash
[1] == '/') slash
++; /* just in case src isn't clean */
1319 if (*name
== '.' && name
[1] == '.' && name
[2] == '\0')
1322 for (name
= dest
; (slash
= strchr(name
, '/')) != 0; name
= slash
+1) {
1323 if (*name
== '.' && (name
[1] == '/' || (name
[1] == '.' && name
[2] == '/'))) {
1324 if (name
[1] == '.') {
1325 /* if at any point we go outside the current directory
1326 then stop - it is unsafe */
1332 while (slash
[1] == '/') slash
++;
1334 if (*name
== '.' && name
[1] == '.' && name
[2] == '\0')
1340 /* Return the date and time as a string. Some callers tweak returned buf. */
1341 char *timestring(time_t t
)
1344 static char buffers
[4][20]; /* We support 4 simultaneous timestring results. */
1345 char *TimeBuf
= buffers
[ndx
= (ndx
+ 1) % 4];
1346 struct tm
*tm
= localtime(&t
);
1347 int len
= snprintf(TimeBuf
, sizeof buffers
[0], "%4d/%02d/%02d %02d:%02d:%02d",
1348 (int)tm
->tm_year
+ 1900, (int)tm
->tm_mon
+ 1, (int)tm
->tm_mday
,
1349 (int)tm
->tm_hour
, (int)tm
->tm_min
, (int)tm
->tm_sec
);
1350 assert(len
> 0); /* Silence gcc warning */
1355 /* Determine if two time_t values are equivalent (either exact, or in
1356 * the modification timestamp window established by --modify-window).
1358 * @retval 0 if the times should be treated as the same
1360 * @retval +1 if the first is later
1362 * @retval -1 if the 2nd is later
1364 int cmp_time(time_t f1_sec
, unsigned long f1_nsec
, time_t f2_sec
, unsigned long f2_nsec
)
1366 if (f2_sec
> f1_sec
) {
1367 /* The final comparison makes sure that modify_window doesn't overflow a
1368 * time_t, which would mean that f2_sec must be in the equality window. */
1369 if (modify_window
<= 0 || (f2_sec
> f1_sec
+ modify_window
&& f1_sec
+ modify_window
> f1_sec
))
1371 } else if (f1_sec
> f2_sec
) {
1372 if (modify_window
<= 0 || (f1_sec
> f2_sec
+ modify_window
&& f2_sec
+ modify_window
> f2_sec
))
1374 } else if (modify_window
< 0) {
1375 if (f2_nsec
> f1_nsec
)
1377 else if (f1_nsec
> f2_nsec
)
1387 This routine is a trick to immediately catch errors when debugging
1388 with insure. An xterm with gdb is popped up when insure catches
1389 an error. It is Linux specific.
1391 int _Insure_trap_error(int a1
, int a2
, int a3
, int a4
, int a5
, int a6
)
1394 int ret
, pid_int
= getpid();
1398 "/usr/X11R6/bin/xterm -display :0 -T Panic -n Panic -e /bin/sh -c 'cat /tmp/ierrs.*.%d ; "
1399 "gdb /proc/%d/exe %d'", pid_int
, pid_int
, pid_int
) < 0)
1404 h
= dlopen("/usr/local/parasoft/insure++lite/lib.linux2/libinsure.so", RTLD_LAZY
);
1405 fn
= dlsym(h
, "_Insure_trap_error");
1408 ret
= fn(a1
, a2
, a3
, a4
, a5
, a6
);
1418 /* Take a filename and filename length and return the most significant
1419 * filename suffix we can find. This ignores suffixes such as "~",
1420 * ".bak", ".orig", ".~1~", etc. */
1421 const char *find_filename_suffix(const char *fn
, int fn_len
, int *len_ptr
)
1423 const char *suf
, *s
;
1427 /* One or more dots at the start aren't a suffix. */
1428 while (fn_len
&& *fn
== '.') fn
++, fn_len
--;
1430 /* Ignore the ~ in a "foo~" filename. */
1431 if (fn_len
> 1 && fn
[fn_len
-1] == '~')
1432 fn_len
--, had_tilde
= True
;
1436 /* Assume we don't find a suffix. */
1440 /* Find the last significant suffix. */
1441 for (s
= fn
+ fn_len
; fn_len
> 1; ) {
1442 while (*--s
!= '.' && s
!= fn
) {}
1445 s_len
= fn_len
- (s
- fn
);
1448 if (strcmp(s
+1, "bak") == 0
1449 || strcmp(s
+1, "old") == 0)
1451 } else if (s_len
== 5) {
1452 if (strcmp(s
+1, "orig") == 0)
1454 } else if (s_len
> 2 && had_tilde
1455 && s
[1] == '~' && isDigit(s
+ 2))
1461 /* Determine if the suffix is all digits. */
1462 for (s
++, s_len
--; s_len
> 0; s
++, s_len
--) {
1466 /* An all-digit suffix may not be that significant. */
1473 /* This is an implementation of the Levenshtein distance algorithm. It
1474 * was implemented to avoid needing a two-dimensional matrix (to save
1475 * memory). It was also tweaked to try to factor in the ASCII distance
1476 * between changed characters as a minor distance quantity. The normal
1477 * Levenshtein units of distance (each signifying a single change between
1478 * the two strings) are defined as a "UNIT". */
1480 #define UNIT (1 << 16)
1482 uint32
fuzzy_distance(const char *s1
, unsigned len1
, const char *s2
, unsigned len2
)
1484 uint32 a
[MAXPATHLEN
], diag
, above
, left
, diag_inc
, above_inc
, left_inc
;
1488 if (!len1
|| !len2
) {
1493 for (i1
= 0, cost
= 0; i1
< len1
; i1
++)
1495 return (int32
)len1
* UNIT
+ cost
;
1498 for (i2
= 0; i2
< len2
; i2
++)
1499 a
[i2
] = (i2
+1) * UNIT
;
1501 for (i1
= 0; i1
< len1
; i1
++) {
1503 above
= (i1
+1) * UNIT
;
1504 for (i2
= 0; i2
< len2
; i2
++) {
1506 if ((cost
= *((uchar
*)s1
+i1
) - *((uchar
*)s2
+i2
)) != 0) {
1512 diag_inc
= diag
+ cost
;
1513 left_inc
= left
+ UNIT
+ *((uchar
*)s1
+i1
);
1514 above_inc
= above
+ UNIT
+ *((uchar
*)s2
+i2
);
1515 a
[i2
] = above
= left
< above
1516 ? (left_inc
< diag_inc
? left_inc
: diag_inc
)
1517 : (above_inc
< diag_inc
? above_inc
: diag_inc
);
1525 #define BB_SLOT_SIZE (16*1024) /* Desired size in bytes */
1526 #define BB_PER_SLOT_BITS (BB_SLOT_SIZE * 8) /* Number of bits per slot */
1527 #define BB_PER_SLOT_INTS (BB_SLOT_SIZE / 4) /* Number of int32s per slot */
1534 struct bitbag
*bitbag_create(int max_ndx
)
1536 struct bitbag
*bb
= new(struct bitbag
);
1537 bb
->slot_cnt
= (max_ndx
+ BB_PER_SLOT_BITS
- 1) / BB_PER_SLOT_BITS
;
1539 if (!(bb
->bits
= (uint32
**)calloc(bb
->slot_cnt
, sizeof (uint32
*))))
1540 out_of_memory("bitbag_create");
1545 void bitbag_set_bit(struct bitbag
*bb
, int ndx
)
1547 int slot
= ndx
/ BB_PER_SLOT_BITS
;
1548 ndx
%= BB_PER_SLOT_BITS
;
1550 if (!bb
->bits
[slot
]) {
1551 if (!(bb
->bits
[slot
] = (uint32
*)calloc(BB_PER_SLOT_INTS
, 4)))
1552 out_of_memory("bitbag_set_bit");
1555 bb
->bits
[slot
][ndx
/32] |= 1u << (ndx
% 32);
#if 0 /* not needed yet */
/* Turn off bit number "ndx".  A slot that was never allocated has no bits
 * set, so there is nothing to do for it. */
void bitbag_clear_bit(struct bitbag *bb, int ndx)
{
	const int slot = ndx / BB_PER_SLOT_BITS;
	const int bit = ndx % BB_PER_SLOT_BITS;
	uint32 *words = bb->bits[slot];

	if (words)
		words[bit / 32] &= ~(1u << (bit % 32));
}

/* Return 1 if bit number "ndx" is set, otherwise 0.  An unallocated slot
 * reads as all zeros. */
int bitbag_check_bit(struct bitbag *bb, int ndx)
{
	const int slot = ndx / BB_PER_SLOT_BITS;
	const int bit = ndx % BB_PER_SLOT_BITS;
	uint32 *words = bb->bits[slot];

	if (!words)
		return 0;

	return (words[bit / 32] & (1u << (bit % 32))) != 0;
}
#endif
1582 /* Call this with -1 to start checking from 0. Returns -1 at the end. */
1583 int bitbag_next_bit(struct bitbag
*bb
, int after
)
1586 int i
, ndx
= after
+ 1;
1587 int slot
= ndx
/ BB_PER_SLOT_BITS
;
1588 ndx
%= BB_PER_SLOT_BITS
;
1590 mask
= (1u << (ndx
% 32)) - 1;
1591 for (i
= ndx
/ 32; slot
< bb
->slot_cnt
; slot
++, i
= mask
= 0) {
1592 if (!bb
->bits
[slot
])
1594 for ( ; i
< BB_PER_SLOT_INTS
; i
++, mask
= 0) {
1595 if (!(bits
= bb
->bits
[slot
][i
] & ~mask
))
1597 /* The xor magic figures out the lowest enabled bit in
1598 * bits, and the switch quickly computes log2(bit). */
1599 switch (bits
^ (bits
& (bits
-1))) {
1600 #define LOG2(n) case 1u << n: return slot*BB_PER_SLOT_BITS + i*32 + n
1601 LOG2(0); LOG2(1); LOG2(2); LOG2(3);
1602 LOG2(4); LOG2(5); LOG2(6); LOG2(7);
1603 LOG2(8); LOG2(9); LOG2(10); LOG2(11);
1604 LOG2(12); LOG2(13); LOG2(14); LOG2(15);
1605 LOG2(16); LOG2(17); LOG2(18); LOG2(19);
1606 LOG2(20); LOG2(21); LOG2(22); LOG2(23);
1607 LOG2(24); LOG2(25); LOG2(26); LOG2(27);
1608 LOG2(28); LOG2(29); LOG2(30); LOG2(31);
1610 return -1; /* impossible... */
1617 void flist_ndx_push(flist_ndx_list
*lp
, int ndx
)
1619 struct flist_ndx_item
*item
;
1621 if (!(item
= new(struct flist_ndx_item
)))
1622 out_of_memory("flist_ndx_push");
1626 lp
->tail
->next
= item
;
1632 int flist_ndx_pop(flist_ndx_list
*lp
)
1634 struct flist_ndx_item
*next
;
1640 ndx
= lp
->head
->ndx
;
1641 next
= lp
->head
->next
;
1650 /* Make sure there is room for one more item in the item list. If there
1651 * is not, expand the list as indicated by the value of "incr":
1652 * - if incr < 0 then increase the malloced size by -1 * incr
1653 * - if incr >= 0 then either make the malloced size equal to "incr"
1654 * or (if that's not large enough) double the malloced size
1655 * After the size check, the list's count is incremented by 1 and a pointer
1656 * to the "new" list item is returned.
1658 void *expand_item_list(item_list
*lp
, size_t item_size
,
1659 const char *desc
, int incr
)
1661 /* First time through, 0 <= 0, so list is expanded. */
1662 if (lp
->malloced
<= lp
->count
) {
1664 size_t new_size
= lp
->malloced
;
1666 new_size
+= -incr
; /* increase slowly */
1667 else if (new_size
< (size_t)incr
)
1673 if (new_size
<= lp
->malloced
)
1674 overflow_exit("expand_item_list");
1675 /* Using _realloc_array() lets us pass the size, not a type. */
1676 new_ptr
= _realloc_array(lp
->items
, item_size
, new_size
);
1677 if (DEBUG_GTE(FLIST
, 3)) {
1678 rprintf(FINFO
, "[%s] expand %s to %s bytes, did%s move\n",
1679 who_am_i(), desc
, big_num(new_size
* item_size
),
1680 new_ptr
== lp
->items
? " not" : "");
1683 out_of_memory("expand_item_list");
1685 lp
->items
= new_ptr
;
1686 lp
->malloced
= new_size
;
1688 return (char*)lp
->items
+ (lp
->count
++ * item_size
);
1691 /* This zeroing of memory won't be optimized away by the compiler. */
1692 void force_memzero(void *buf
, size_t len
)
1694 volatile uchar
*z
= buf
;