rm_/lib/backupfile.c

394 lines
12 KiB
C
Raw Permalink Normal View History

/* backupfile.c -- make Emacs style backup file names

   Copyright (C) 1990-2006, 2009-2022 Free Software Foundation, Inc.

   This program is free software: you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation, either version 3 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <https://www.gnu.org/licenses/>.  */

/* Written by Paul Eggert and David MacKenzie.
   Some algorithms adapted from GNU Emacs.  */
#include <config.h>
#include "backup-internal.h"
2022-07-28 14:16:50 +08:00
#include <dirent.h>
2020-09-02 16:47:03 +08:00
#include <errno.h>
#include <fcntl.h>
#include <stdbool.h>
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
2022-07-28 14:16:50 +08:00
#include "attribute.h"
#include "basename-lgpl.h"
#include "ialloc.h"
#include "intprops.h"
#include "opendirat.h"
#include "renameatu.h"
2020-09-02 16:47:03 +08:00
/* Length of a directory entry's name, for hosts whose <dirent.h>
   does not already supply _D_EXACT_NAMLEN.  */
#ifndef _D_EXACT_NAMLEN
# define _D_EXACT_NAMLEN(dp) strlen ((dp)->d_name)
#endif

/* Without a usable pathconf/_PC_NAME_MAX, replace both queries with
   an expression that evaluates to -1 and leaves errno set to -1, so
   that callers see a failed lookup.  */
#if ! (HAVE_PATHCONF && defined _PC_NAME_MAX)
# define pathconf(file, option) (errno = -1)
# define fpathconf(fd, option) (errno = -1)
#endif

/* NAME_MAX_MINIMUM is the base name length that is assumed to work
   without asking the file system: _XOPEN_NAME_MAX when the host
   defines it, otherwise _POSIX_NAME_MAX (defaulting to 14).  */
#ifndef _POSIX_NAME_MAX
# define _POSIX_NAME_MAX 14
#endif
#if defined _XOPEN_NAME_MAX
# define NAME_MAX_MINIMUM _XOPEN_NAME_MAX
#else
# define NAME_MAX_MINIMUM _POSIX_NAME_MAX
#endif

/* Configuration switches default to "off" when the build system did
   not define them.  */
#ifndef HAVE_DOS_FILE_NAMES
# define HAVE_DOS_FILE_NAMES 0
#endif
#ifndef HAVE_LONG_FILE_NAMES
# define HAVE_LONG_FILE_NAMES 0
#endif
/* ISDIGIT differs from isdigit, as follows:
   - Its arg may be any int or unsigned int; it need not be an unsigned char
     or EOF.
   - It's typically faster.
   POSIX says that only '0' through '9' are digits.  Prefer ISDIGIT to
   isdigit unless it's important to use the locale's definition
   of "digit" even when the host does not conform to POSIX.

   The subtraction is done in unsigned arithmetic, so any value below
   '0' wraps to a large number and a single comparison suffices.  */
#define ISDIGIT(c) ((unsigned int) (c) - '0' <= 9)
/* The extension added to file names to produce a simple (as opposed
   to numbered) backup file name.  It starts out null;
   set_simple_backup_suffix assigns it, and backupfile_internal calls
   that function itself if the suffix is still null.  */
char const *simple_backup_suffix = NULL;
/* Install S as the simple backup suffix.  A null S means "consult
   the SIMPLE_BACKUP_SUFFIX environment variable instead".  The
   candidate is accepted only if it is nonempty and is its own last
   file name component; otherwise the suffix becomes "~".  */
void
set_simple_backup_suffix (char const *s)
{
  char const *candidate = s ? s : getenv ("SIMPLE_BACKUP_SUFFIX");
  bool usable = (candidate
                 && *candidate
                 && candidate == last_component (candidate));

  simple_backup_suffix = usable ? candidate : "~";
}
/* If FILE (which was of length FILELEN before an extension was
appended to it) is too long, replace the extension with the single
char E. If the result is still too long, remove the char just
2022-07-28 14:16:50 +08:00
before E. Return true if the extension was OK already, false
if it needed replacement.
2020-09-02 16:47:03 +08:00
If DIR_FD is nonnegative, it is a file descriptor for FILE's parent.
2022-07-28 14:16:50 +08:00
*BASE_MAX is either 0, or the cached result of a previous call for
2020-09-02 16:47:03 +08:00
FILE's parent's _PC_NAME_MAX. */
2022-07-28 14:16:50 +08:00
static bool
check_extension (char *file, idx_t filelen, char e,
int dir_fd, idx_t *base_max)
2020-09-02 16:47:03 +08:00
{
char *base = last_component (file);
2022-07-28 14:16:50 +08:00
idx_t baselen = base_len (base);
idx_t baselen_max = HAVE_LONG_FILE_NAMES ? 255 : NAME_MAX_MINIMUM;
2020-09-02 16:47:03 +08:00
if (HAVE_DOS_FILE_NAMES || NAME_MAX_MINIMUM < baselen)
{
/* The new base name is long enough to require a pathconf check. */
if (*base_max == 0)
{
long name_max;
if (dir_fd < 0)
{
/* Temporarily modify the buffer into its parent
directory name, invoke pathconf on the directory, and
then restore the buffer. */
char tmp[sizeof "."];
memcpy (tmp, base, sizeof ".");
strcpy (base, ".");
errno = 0;
name_max = pathconf (file, _PC_NAME_MAX);
name_max -= !errno;
memcpy (base, tmp, sizeof ".");
}
else
{
errno = 0;
name_max = fpathconf (dir_fd, _PC_NAME_MAX);
name_max -= !errno;
}
*base_max = (0 <= name_max && name_max <= SIZE_MAX ? name_max
: name_max < -1 ? NAME_MAX_MINIMUM : SIZE_MAX);
}
baselen_max = *base_max;
}
if (HAVE_DOS_FILE_NAMES && baselen_max <= 12)
{
/* Live within DOS's 8.3 limit. */
char *dot = strchr (base, '.');
if (!dot)
baselen_max = 8;
else
{
char const *second_dot = strchr (dot + 1, '.');
baselen_max = (second_dot
? second_dot - base
: dot + 1 - base + 3);
}
}
2022-07-28 14:16:50 +08:00
if (baselen <= baselen_max)
return true;
else
2020-09-02 16:47:03 +08:00
{
baselen = file + filelen - base;
if (baselen_max <= baselen)
baselen = baselen_max - 1;
base[baselen] = e;
base[baselen + 1] = '\0';
2022-07-28 14:16:50 +08:00
return false;
2020-09-02 16:47:03 +08:00
}
}
/* Outcomes reported by numbered_backup.  */
enum numbered_backup_result
  {
    /* The generated name is exactly as long as a backup name that
       already exists, so the directory is known to accept it.  */
    BACKUP_IS_SAME_LENGTH,

    /* Backups exist, but the generated name is longer than every
       one of them; its length still needs to be checked.  */
    BACKUP_IS_LONGER,

    /* No backups exist yet; the length of the generated name still
       needs to be checked.  */
    BACKUP_IS_NEW,

    /* Memory could not be allocated.  */
    BACKUP_NOMEM
  };
/* Relative to DIR_FD, *BUFFER contains a file name.
Store into *BUFFER the next backup name for the named file,
with a version number greater than all the
existing numbered backups. Reallocate *BUFFER as necessary; its
2022-07-28 14:16:50 +08:00
initial allocated size is BUFFER_SIZE, which must be at least 5
2020-09-02 16:47:03 +08:00
bytes longer than the file name to make room for the initially
2022-07-28 14:16:50 +08:00
appended ".~1~". FILELEN is the length of the original file name.
(The original file name is not necessarily null-terminated;
FILELEN does not count trailing slashes after a non-slash.)
2020-09-02 16:47:03 +08:00
BASE_OFFSET is the offset of the basename in *BUFFER.
The returned value indicates what kind of backup was found. If an
I/O or other read error occurs, use the highest backup number that
was found.
*DIRPP is the destination directory. If *DIRPP is null, open the
destination directory and store the resulting stream into *DIRPP
and its file descriptor into *PNEW_FD without closing the stream. */
static enum numbered_backup_result
2022-07-28 14:16:50 +08:00
numbered_backup (int dir_fd, char **buffer, idx_t buffer_size, idx_t filelen,
idx_t base_offset, DIR **dirpp, int *pnew_fd)
2020-09-02 16:47:03 +08:00
{
enum numbered_backup_result result = BACKUP_IS_NEW;
DIR *dirp = *dirpp;
char *buf = *buffer;
2022-07-28 14:16:50 +08:00
idx_t versionlenmax = 1;
idx_t baselen = filelen - base_offset;
2020-09-02 16:47:03 +08:00
if (dirp)
rewinddir (dirp);
else
{
/* Temporarily modify the buffer into its parent directory name,
open the directory, and then restore the buffer. */
char tmp[sizeof "."];
2022-07-28 14:16:50 +08:00
char *base = buf + base_offset;
2020-09-02 16:47:03 +08:00
memcpy (tmp, base, sizeof ".");
strcpy (base, ".");
dirp = opendirat (dir_fd, buf, 0, pnew_fd);
if (!dirp && errno == ENOMEM)
result = BACKUP_NOMEM;
memcpy (base, tmp, sizeof ".");
strcpy (base + baselen, ".~1~");
if (!dirp)
return result;
*dirpp = dirp;
}
2022-07-28 14:16:50 +08:00
for (struct dirent *dp; (dp = readdir (dirp)) != NULL; )
2020-09-02 16:47:03 +08:00
{
if (_D_EXACT_NAMLEN (dp) < baselen + 4)
continue;
if (memcmp (buf + base_offset, dp->d_name, baselen + 2) != 0)
continue;
2022-07-28 14:16:50 +08:00
char const *p = dp->d_name + baselen + 2;
2020-09-02 16:47:03 +08:00
/* Check whether this file has a version number and if so,
whether it is larger. Use string operations rather than
integer arithmetic, to avoid problems with integer overflow. */
if (! ('1' <= *p && *p <= '9'))
continue;
2022-07-28 14:16:50 +08:00
bool all_9s = (*p == '9');
idx_t versionlen;
2020-09-02 16:47:03 +08:00
for (versionlen = 1; ISDIGIT (p[versionlen]); versionlen++)
all_9s &= (p[versionlen] == '9');
if (! (p[versionlen] == '~' && !p[versionlen + 1]
&& (versionlenmax < versionlen
|| (versionlenmax == versionlen
&& memcmp (buf + filelen + 2, p, versionlen) <= 0))))
continue;
/* This entry has the largest version number seen so far.
Append this highest numbered extension to the file name,
prepending '0' to the number if it is all 9s. */
versionlenmax = all_9s + versionlen;
result = (all_9s ? BACKUP_IS_LONGER : BACKUP_IS_SAME_LENGTH);
2022-07-28 14:16:50 +08:00
idx_t new_buffer_size = filelen + 2 + versionlenmax + 2;
2020-09-02 16:47:03 +08:00
if (buffer_size < new_buffer_size)
{
2022-07-28 14:16:50 +08:00
idx_t grown;
if (! INT_ADD_WRAPV (new_buffer_size, new_buffer_size >> 1, &grown))
new_buffer_size = grown;
char *new_buf = irealloc (buf, new_buffer_size);
2020-09-02 16:47:03 +08:00
if (!new_buf)
{
*buffer = buf;
return BACKUP_NOMEM;
}
buf = new_buf;
buffer_size = new_buffer_size;
}
2022-07-28 14:16:50 +08:00
char *q = buf + filelen;
2020-09-02 16:47:03 +08:00
*q++ = '.';
*q++ = '~';
*q = '0';
q += all_9s;
memcpy (q, p, versionlen + 2);
/* Add 1 to the version number. */
q += versionlen;
while (*--q == '9')
*q = '0';
++*q;
}
*buffer = buf;
return result;
}
/* Relative to DIR_FD, return the name of the new backup file for the
existing file FILE, allocated with malloc.
If RENAME, also rename FILE to the new name.
On failure, return NULL and set errno.
Do not call this function if backup_type == no_backups. */
char *
backupfile_internal (int dir_fd, char const *file,
enum backup_type backup_type, bool rename)
{
2022-07-28 14:16:50 +08:00
idx_t base_offset = last_component (file) - file;
idx_t filelen = base_offset + base_len (file + base_offset);
2020-09-02 16:47:03 +08:00
if (! simple_backup_suffix)
set_simple_backup_suffix (NULL);
/* Allow room for simple or ".~N~" backups. The guess must be at
least sizeof ".~1~", but otherwise will be adjusted as needed. */
2022-07-28 14:16:50 +08:00
idx_t simple_backup_suffix_size = strlen (simple_backup_suffix) + 1;
idx_t backup_suffix_size_guess = simple_backup_suffix_size;
2020-09-02 16:47:03 +08:00
enum { GUESS = sizeof ".~12345~" };
if (backup_suffix_size_guess < GUESS)
backup_suffix_size_guess = GUESS;
2022-07-28 14:16:50 +08:00
idx_t ssize = filelen + backup_suffix_size_guess + 1;
char *s = imalloc (ssize);
2020-09-02 16:47:03 +08:00
if (!s)
return s;
DIR *dirp = NULL;
2022-07-28 14:16:50 +08:00
int sdir = AT_FDCWD;
idx_t base_max = 0;
2020-09-02 16:47:03 +08:00
while (true)
{
2022-07-28 14:16:50 +08:00
bool extended = true;
memcpy (s, file, filelen);
2020-09-02 16:47:03 +08:00
if (backup_type == simple_backups)
memcpy (s + filelen, simple_backup_suffix, simple_backup_suffix_size);
else
switch (numbered_backup (dir_fd, &s, ssize, filelen, base_offset,
&dirp, &sdir))
{
case BACKUP_IS_SAME_LENGTH:
break;
case BACKUP_IS_NEW:
if (backup_type == numbered_existing_backups)
{
backup_type = simple_backups;
memcpy (s + filelen, simple_backup_suffix,
simple_backup_suffix_size);
}
FALLTHROUGH;
case BACKUP_IS_LONGER:
2022-07-28 14:16:50 +08:00
extended = check_extension (s, filelen, '~', sdir, &base_max);
2020-09-02 16:47:03 +08:00
break;
case BACKUP_NOMEM:
if (dirp)
closedir (dirp);
free (s);
errno = ENOMEM;
return NULL;
}
if (! rename)
break;
2022-07-28 14:16:50 +08:00
int olddirfd = sdir < 0 ? dir_fd : sdir;
idx_t offset = sdir < 0 ? 0 : base_offset;
2020-09-02 16:47:03 +08:00
unsigned flags = backup_type == simple_backups ? 0 : RENAME_NOREPLACE;
2022-07-28 14:16:50 +08:00
if (renameatu (olddirfd, file + offset, sdir, s + offset, flags) == 0)
2020-09-02 16:47:03 +08:00
break;
int e = errno;
2022-07-28 14:16:50 +08:00
if (! (e == EEXIST && extended))
2020-09-02 16:47:03 +08:00
{
if (dirp)
closedir (dirp);
free (s);
errno = e;
return NULL;
}
}
if (dirp)
closedir (dirp);
return s;
}