-/* FDUPES Copyright (c) 1999-2002 Adrian Lopez
+/* FDUPES Copyright (c) 1999-2022 Adrian Lopez
Permission is hereby granted, free of charge, to any person
obtaining a copy of this software and associated documentation files
TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */
+#include "config.h"
#include <stdio.h>
#include <stdarg.h>
#include <string.h>
+#include <strings.h>
#include <sys/stat.h>
#include <dirent.h>
#include <unistd.h>
#include <stdlib.h>
-#ifndef OMIT_GETOPT_LONG
+#include <time.h>
+#ifdef HAVE_GETOPT_H
#include <getopt.h>
#endif
-#include <string.h>
#include <errno.h>
#include <libgen.h>
+#include <locale.h>
+#ifndef NO_NCURSES
+#ifdef HAVE_NCURSESW_CURSES_H
+ #include <ncursesw/curses.h>
+#else
+ #include <curses.h>
+#endif
+#include "ncurses-interface.h"
+#endif
+#include "fdupes.h"
+#include "confirmmatch.h"
+#include "errormsg.h"
+#include "log.h"
+#include "sigint.h"
+#include "flags.h"
+#include "removeifnotchanged.h"
-#include "md5/md5.h"
-
-#define ISFLAG(a,b) ((a & b) == b)
-#define SETFLAG(a,b) (a |= b)
-
-#define F_RECURSE 0x0001
-#define F_HIDEPROGRESS 0x0002
-#define F_DSAMELINE 0x0004
-#define F_FOLLOWLINKS 0x0008
-#define F_DELETEFILES 0x0010
-#define F_EXCLUDEEMPTY 0x0020
-#define F_CONSIDERHARDLINKS 0x0040
-#define F_SHOWSIZE 0x0080
-#define F_OMITFIRST 0x0100
-#define F_RECURSEAFTER 0x0200
-#define F_NOPROMPT 0x0400
-#define F_SUMMARIZEMATCHES 0x0800
-#define F_EXCLUDEHIDDEN 0x1000
-#define F_PERMISSIONS 0x2000
-#define F_REVERSE 0x4000
-#define F_IMMEDIATE 0x8000
+long long minsize = -1;
+long long maxsize = -1;
typedef enum {
- ORDER_TIME = 0,
+ ORDER_MTIME = 0,
+ ORDER_CTIME,
ORDER_NAME
} ordertype_t;
char *program_name;
-unsigned long flags = 0;
-
-#define CHUNK_SIZE 8192
-
-#define INPUT_SIZE 256
-
-#define PARTIAL_MD5_SIZE 4096
+ordertype_t ordertype = ORDER_MTIME;
#define MD5_DIGEST_LENGTH 16
-/*
-
-TODO: Partial sums (for working with very large files).
-
-typedef struct _signature
-{
- md5_state_t state;
- md5_byte_t digest[16];
-} signature_t;
-
-typedef struct _signatures
-{
- int num_signatures;
- signature_t *signatures;
-} signatures_t;
-
-*/
-
-typedef struct _file {
- char *d_name;
- off_t size;
- md5_byte_t *crcpartial;
- md5_byte_t *crcsignature;
- dev_t device;
- ino_t inode;
- time_t mtime;
- int hasdupes; /* true only if file is first on duplicate chain */
- struct _file *duplicates;
- struct _file *next;
-} file_t;
-
typedef struct _filetree {
file_t *file;
struct _filetree *left;
struct _filetree *right;
} filetree_t;
-void errormsg(char *message, ...)
-{
- va_list ap;
-
- va_start(ap, message);
-
- fprintf(stderr, "\r%40s\r%s: ", "", program_name);
- vfprintf(stderr, message, ap);
-}
-
void escapefilename(char *escape_list, char **filename_ptr)
{
int x;
}
}
-off_t filesize(char *filename) {
- struct stat s;
-
- if (stat(filename, &s) != 0) return -1;
-
- return s.st_size;
-}
-
dev_t getdevice(char *filename) {
struct stat s;
return s.st_ino;
}
-time_t getmtime(char *filename) {
- struct stat s;
+char *fmttime(time_t t) {
+ static char buf[64];
- if (stat(filename, &s) != 0) return 0;
+ strftime(buf, sizeof(buf), "%Y-%m-%d %H:%M", localtime(&t));
- return s.st_mtime;
+ return buf;
}
char **cloneargs(int argc, char **argv)
return x;
}
-int grokdir(char *dir, file_t **filelistp)
+/* Copy the size, inode, device, status-change time, and modification time
+   from a previously filled struct stat into the given file entry.
+
+   file  - entry whose size/inode/device/ctime/mtime fields are overwritten
+   info  - stat information the values are read from
+   linfo - accepted for interface compatibility; not consulted here */
+void getfilestats(file_t *file, struct stat *info, struct stat *linfo)
+{
+  (void) linfo; /* intentionally unused */
+
+  file->size = info->st_size;
+  file->inode = info->st_ino;
+  file->device = info->st_dev;
+  file->ctime = info->st_ctime;
+  file->mtime = info->st_mtime;
+}
+
+int grokdir(char *dir, file_t **filelistp, struct stat *logfile_status)
{
DIR *cd;
file_t *newfile;
if (ISFLAG(flags, F_EXCLUDEHIDDEN)) {
fullname = strdup(newfile->d_name);
+ if (fullname == 0)
+ {
+ errormsg("out of memory!\n");
+ free(newfile);
+ closedir(cd);
+ exit(1);
+ }
name = basename(fullname);
if (name[0] == '.' && strcmp(name, ".") && strcmp(name, "..") ) {
free(newfile->d_name);
free(newfile);
+ free(fullname);
continue;
}
free(fullname);
}
- if (filesize(newfile->d_name) == 0 && ISFLAG(flags, F_EXCLUDEEMPTY)) {
- free(newfile->d_name);
- free(newfile);
- continue;
+ if (stat(newfile->d_name, &info) == -1) {
+ free(newfile->d_name);
+ free(newfile);
+ continue;
+ }
+
+ if (!S_ISDIR(info.st_mode) && (((info.st_size == 0 && ISFLAG(flags, F_EXCLUDEEMPTY)) || info.st_size < minsize || (info.st_size > maxsize && maxsize != -1)))) {
+ free(newfile->d_name);
+ free(newfile);
+ continue;
}
- if (stat(newfile->d_name, &info) == -1) {
- free(newfile->d_name);
- free(newfile);
- continue;
+ /* ignore logfile */
+ if (logfile_status != 0 && info.st_dev == logfile_status->st_dev && info.st_ino == logfile_status->st_ino)
+ {
+ free(newfile->d_name);
+ free(newfile);
+ continue;
}
if (lstat(newfile->d_name, &linfo) == -1) {
if (S_ISDIR(info.st_mode)) {
if (ISFLAG(flags, F_RECURSE) && (ISFLAG(flags, F_FOLLOWLINKS) || !S_ISLNK(linfo.st_mode)))
- filecount += grokdir(newfile->d_name, filelistp);
+ filecount += grokdir(newfile->d_name, filelistp, logfile_status);
free(newfile->d_name);
free(newfile);
} else {
if (S_ISREG(linfo.st_mode) || (S_ISLNK(linfo.st_mode) && ISFLAG(flags, F_FOLLOWLINKS))) {
+ getfilestats(newfile, &info, &linfo);
*filelistp = newfile;
filecount++;
} else {
return filecount;
}
-md5_byte_t *getcrcsignatureuntil(char *filename, off_t max_read)
+md5_byte_t *getcrcsignatureuntil(char *filename, off_t fsize, off_t max_read)
{
- off_t fsize;
off_t toread;
md5_state_t state;
static md5_byte_t digest[MD5_DIGEST_LENGTH];
FILE *file;
md5_init(&state);
-
-
- fsize = filesize(filename);
if (max_read != 0 && fsize > max_read)
fsize = max_read;
return digest;
}
-md5_byte_t *getcrcsignature(char *filename)
+md5_byte_t *getcrcsignature(char *filename, off_t fsize)
{
- return getcrcsignatureuntil(filename, 0);
+ return getcrcsignatureuntil(filename, fsize, 0);
}
-md5_byte_t *getcrcpartialsignature(char *filename)
+md5_byte_t *getcrcpartialsignature(char *filename, off_t fsize)
{
- return getcrcsignatureuntil(filename, PARTIAL_MD5_SIZE);
+ return getcrcsignatureuntil(filename, fsize, PARTIAL_MD5_SIZE);
}
int md5cmp(const md5_byte_t *a, const md5_byte_t *b)
free(checktree);
}
-void getfilestats(file_t *file)
-{
- file->size = filesize(file->d_name);
- file->inode = getinode(file->d_name);
- file->device = getdevice(file->d_name);
- file->mtime = getmtime(file->d_name);
-}
-
int registerfile(filetree_t **branch, file_t *file)
{
- getfilestats(file);
-
*branch = (filetree_t*) malloc(sizeof(filetree_t));
if (*branch == NULL) {
errormsg("out of memory!\n");
int is_hardlink(filetree_t *checktree, file_t *file)
{
file_t *dupe;
- ino_t inode;
- dev_t device;
-
- inode = getinode(file->d_name);
- device = getdevice(file->d_name);
- if ((inode == checktree->file->inode) &&
- (device == checktree->file->device))
+ if ((file->inode == checktree->file->inode) &&
+ (file->device == checktree->file->device))
return 1;
if (checktree->file->hasdupes)
dupe = checktree->file->duplicates;
do {
- if ((inode == dupe->inode) &&
- (device == dupe->device))
+ if ((file->inode == dupe->inode) &&
+ (file->device == dupe->device))
return 1;
dupe = dupe->duplicates;
return 0;
}
+/* Check whether two paths represent the same file (deleting one would
+   delete the other).
+
+   Returns 1 when both entries share device, inode, file name, and
+   containing directory; 0 when they differ in any of those; -1 when a
+   working copy of a path could not be allocated or a containing directory
+   could not be stat()ed. */
+int is_same_file(file_t *file_a, file_t *file_b)
+{
+  char *filename_a;
+  char *filename_b;
+  char *dirname_a;
+  char *dirname_b;
+  char *basename_a;
+  char *basename_b;
+  struct stat dirstat_a;
+  struct stat dirstat_b;
+
+  /* if files on different devices and/or different inodes, they are not the same file */
+  if (file_a->device != file_b->device || file_a->inode != file_b->inode)
+    return 0;
+
+  /* copy filenames (basename and dirname may modify these) */
+  filename_a = strdup(file_a->d_name);
+  if (filename_a == 0)
+    return -1;
+
+  filename_b = strdup(file_b->d_name);
+  if (filename_b == 0)
+  {
+    /* release the first copy so this error path does not leak it */
+    free(filename_a);
+    return -1;
+  }
+
+  /* get file basenames; memmove is used because the result of basename
+     may point inside the very buffer being overwritten */
+  basename_a = basename(filename_a);
+  memmove(filename_a, basename_a, strlen(basename_a) + 1);
+
+  basename_b = basename(filename_b);
+  memmove(filename_b, basename_b, strlen(basename_b) + 1);
+
+  /* if files have different names, they are not the same file */
+  if (strcmp(filename_a, filename_b) != 0)
+  {
+    free(filename_b);
+    free(filename_a);
+    return 0;
+  }
+
+  /* restore paths (the buffers were sized for the full paths by strdup) */
+  strcpy(filename_a, file_a->d_name);
+  strcpy(filename_b, file_b->d_name);
+
+  /* get directory names */
+  dirname_a = dirname(filename_a);
+  if (stat(dirname_a, &dirstat_a) != 0)
+  {
+    free(filename_b);
+    free(filename_a);
+    return -1;
+  }
+
+  dirname_b = dirname(filename_b);
+  if (stat(dirname_b, &dirstat_b) != 0)
+  {
+    free(filename_b);
+    free(filename_a);
+    return -1;
+  }
+
+  free(filename_b);
+  free(filename_a);
+
+  /* if directories on which files reside are different, they are not the same file */
+  if (dirstat_a.st_dev != dirstat_b.st_dev || dirstat_a.st_ino != dirstat_b.st_ino)
+    return 0;
+
+  /* same device, inode, filename, and directory; therefore, same file */
+  return 1;
+}
+
+/* Report whether the given tree node, or any entry on its duplicate
+   chain, refers to the same file as the one supplied.
+
+   Returns 1 as soon as is_same_file() yields a non-zero result for any
+   entry (so its -1 error result also counts as a hit), 0 otherwise. */
+int has_same_file(filetree_t *checktree, file_t *file)
+{
+  file_t *head = checktree->file;
+  file_t *cursor;
+
+  if (is_same_file(head, file) != 0)
+    return 1;
+
+  /* nothing further to inspect when the node carries no duplicate chain */
+  if (!head->hasdupes)
+    return 0;
+
+  cursor = head->duplicates;
+
+  do {
+    if (is_same_file(cursor, file) != 0)
+      return 1;
+
+    cursor = cursor->duplicates;
+  } while (cursor != NULL);
+
+  return 0;
+}
+
file_t **checkmatch(filetree_t **root, filetree_t *checktree, file_t *file)
{
int cmpresult;
md5_byte_t *crcsignature;
- off_t fsize;
-
- /* If device and inode fields are equal one of the files is a
- hard link to the other or the files have been listed twice
- unintentionally. We don't want to flag these files as
- duplicates unless the user specifies otherwise.
- */
-
- if (!ISFLAG(flags, F_CONSIDERHARDLINKS) && is_hardlink(checktree, file))
- return NULL;
- fsize = filesize(file->d_name);
+ if (ISFLAG(flags, F_CONSIDERHARDLINKS))
+ {
+ /* If node already contains file, we don't want to add it again.
+ */
+ if (has_same_file(checktree, file))
+ return NULL;
+ }
+ else
+ {
+ /* If device and inode fields are equal one of the files is a
+ hard link to the other or the files have been listed twice
+ unintentionally. We don't want to flag these files as
+ duplicates unless the user specifies otherwise.
+ */
+ if (is_hardlink(checktree, file))
+ return NULL;
+ }
- if (fsize < checktree->file->size)
+ if (file->size < checktree->file->size)
cmpresult = -1;
else
- if (fsize > checktree->file->size) cmpresult = 1;
+ if (file->size > checktree->file->size) cmpresult = 1;
else
if (ISFLAG(flags, F_PERMISSIONS) &&
!same_permissions(file->d_name, checktree->file->d_name))
cmpresult = -1;
else {
if (checktree->file->crcpartial == NULL) {
- crcsignature = getcrcpartialsignature(checktree->file->d_name);
+ crcsignature = getcrcpartialsignature(checktree->file->d_name, checktree->file->size);
if (crcsignature == NULL) {
errormsg ("cannot read file %s\n", checktree->file->d_name);
return NULL;
}
if (file->crcpartial == NULL) {
- crcsignature = getcrcpartialsignature(file->d_name);
+ crcsignature = getcrcpartialsignature(file->d_name, file->size);
if (crcsignature == NULL) {
errormsg ("cannot read file %s\n", file->d_name);
return NULL;
}
cmpresult = md5cmp(file->crcpartial, checktree->file->crcpartial);
- /*if (cmpresult != 0) errormsg(" on %s vs %s\n", file->d_name, checktree->file->d_name);*/
if (cmpresult == 0) {
if (checktree->file->crcsignature == NULL) {
- crcsignature = getcrcsignature(checktree->file->d_name);
+ crcsignature = getcrcsignature(checktree->file->d_name, checktree->file->size);
if (crcsignature == NULL) return NULL;
checktree->file->crcsignature = (md5_byte_t*) malloc(MD5_DIGEST_LENGTH * sizeof(md5_byte_t));
}
if (file->crcsignature == NULL) {
- crcsignature = getcrcsignature(file->d_name);
+ crcsignature = getcrcsignature(file->d_name, file->size);
if (crcsignature == NULL) return NULL;
file->crcsignature = (md5_byte_t*) malloc(MD5_DIGEST_LENGTH * sizeof(md5_byte_t));
}
cmpresult = md5cmp(file->crcsignature, checktree->file->crcsignature);
- /*if (cmpresult != 0) errormsg("P on %s vs %s\n",
- file->d_name, checktree->file->d_name);
- else errormsg("P F on %s vs %s\n", file->d_name,
- checktree->file->d_name);
- printf("%s matches %s\n", file->d_name, checktree->file->d_name);*/
}
}
}
} else
{
- getfilestats(file);
return &checktree->file;
}
}
-/* Do a bit-for-bit comparison in case two different files produce the
- same signature. Unlikely, but better safe than sorry. */
-
-int confirmmatch(FILE *file1, FILE *file2)
-{
- unsigned char c1[CHUNK_SIZE];
- unsigned char c2[CHUNK_SIZE];
- size_t r1;
- size_t r2;
-
- fseek(file1, 0, SEEK_SET);
- fseek(file2, 0, SEEK_SET);
-
- do {
- r1 = fread(c1, sizeof(unsigned char), sizeof(c1), file1);
- r2 = fread(c2, sizeof(unsigned char), sizeof(c2), file2);
-
- if (r1 != r2) return 0; /* file lengths are different */
- if (memcmp (c1, c2, r1)) return 0; /* file contents are different */
- } while (r2);
-
- return 1;
-}
-
void summarizematches(file_t *files)
{
int numsets = 0;
if (!ISFLAG(flags, F_OMITFIRST)) {
if (ISFLAG(flags, F_SHOWSIZE)) printf("%lld byte%seach:\n", (long long int)files->size,
(files->size != 1) ? "s " : " ");
+ if (ISFLAG(flags, F_SHOWTIME))
+ printf("%s ", fmttime(files->mtime));
if (ISFLAG(flags, F_DSAMELINE)) escapefilename("\\ ", &files->d_name);
printf("%s%c", files->d_name, ISFLAG(flags, F_DSAMELINE)?' ':'\n');
}
tmpfile = files->duplicates;
while (tmpfile != NULL) {
+ if (ISFLAG(flags, F_SHOWTIME))
+ printf("%s ", fmttime(tmpfile->mtime));
if (ISFLAG(flags, F_DSAMELINE)) escapefilename("\\ ", &tmpfile->d_name);
printf("%s%c", tmpfile->d_name, ISFLAG(flags, F_DSAMELINE)?' ':'\n');
tmpfile = tmpfile->duplicates;
return 1;
}
-void deletefiles(file_t *files, int prompt, FILE *tty)
+void deletefiles(file_t *files, int prompt, FILE *tty, char *logfile)
{
int counter;
int groups = 0;
file_t *curfile;
file_t **dupelist;
int *preserve;
+ int firstpreserved;
char *preservestr;
char *token;
char *tstr;
int max = 0;
int x;
int i;
+ struct log_info *loginfo;
+ int log_error;
+ FILE *file1;
+ FILE *file2;
+ int ismatch;
+ char *errorstring;
curfile = files;
exit(1);
}
+ loginfo = 0;
+ if (logfile != 0)
+ loginfo = log_open(logfile, &log_error);
+
+ register_sigint_handler();
+
while (files) {
if (files->hasdupes) {
curgroup++;
counter = 1;
dupelist[counter] = files;
- if (prompt) printf("[%d] %s\n", counter, files->d_name);
+ if (prompt)
+ {
+ if (ISFLAG(flags, F_SHOWTIME))
+ printf("[%d] [%s] %s\n", counter, fmttime(files->mtime), files->d_name);
+ else
+ printf("[%d] %s\n", counter, files->d_name);
+ }
tmpfile = files->duplicates;
while (tmpfile) {
dupelist[++counter] = tmpfile;
- if (prompt) printf("[%d] %s\n", counter, tmpfile->d_name);
+ if (prompt)
+ {
+ if (ISFLAG(flags, F_SHOWTIME))
+ printf("[%d] [%s] %s\n", counter, fmttime(tmpfile->mtime), tmpfile->d_name);
+ else
+ printf("[%d] %s\n", counter, tmpfile->d_name);
+ }
tmpfile = tmpfile->duplicates;
}
else /* prompt for files to preserve */
do {
- printf("Set %d of %d, preserve files [1 - %d, all]",
+ printf("Set %d of %d, preserve files [1 - %d, all, quit]",
curgroup, groups, counter);
if (ISFLAG(flags, F_SHOWSIZE)) printf(" (%lld byte%seach)", (long long int)files->size,
(files->size != 1) ? "s " : " ");
fflush(stdout);
if (!fgets(preservestr, INPUT_SIZE, tty))
+ {
preservestr[0] = '\n'; /* treat fgets() failure as if nothing was entered */
+ preservestr[1] = '\0';
+
+ if (got_sigint)
+ {
+ if (loginfo)
+ log_close(loginfo);
+
+ free(dupelist);
+ free(preserve);
+ free(preservestr);
+
+ printf("\n");
+
+ exit(0);
+ }
+ }
i = strlen(preservestr) - 1;
if (!fgets(preservestr + i + 1, INPUT_SIZE, tty))
{
preservestr[0] = '\n'; /* treat fgets() failure as if nothing was entered */
+ preservestr[1] = '\0';
break;
}
i = strlen(preservestr)-1;
}
+ if (strcmp(preservestr, "q\n") == 0 || strcmp(preservestr, "quit\n") == 0)
+ {
+ if (loginfo)
+ log_close(loginfo);
+
+ free(dupelist);
+ free(preserve);
+ free(preservestr);
+
+ printf("\n");
+
+ exit(0);
+ }
+
for (x = 1; x <= counter; x++) preserve[x] = 0;
token = strtok(preservestr, " ,\n");
while (token != NULL) {
- if (strcasecmp(token, "all") == 0)
+ if (strcasecmp(token, "all") == 0 || strcasecmp(token, "a") == 0)
for (x = 0; x <= counter; x++) preserve[x] = 1;
number = 0;
printf("\n");
+ if (loginfo)
+ log_begin_set(loginfo);
+
for (x = 1; x <= counter; x++) {
if (preserve[x])
+ {
printf(" [+] %s\n", dupelist[x]->d_name);
+
+ if (loginfo)
+ log_file_remaining(loginfo, dupelist[x]->d_name);
+ }
else {
- if (remove(dupelist[x]->d_name) == 0) {
- printf(" [-] %s\n", dupelist[x]->d_name);
- } else {
- printf(" [!] %s ", dupelist[x]->d_name);
- printf("-- unable to delete file!\n");
- }
+ if (ISFLAG(flags, F_DEFERCONFIRMATION))
+ {
+ firstpreserved = 0;
+ for (i = 1; i <= counter; ++i)
+ {
+ if (preserve[i])
+ {
+ firstpreserved = i;
+ break;
+ }
+ }
+
+ file1 = fopen(dupelist[x]->d_name, "rb");
+ file2 = fopen(dupelist[firstpreserved]->d_name, "rb");
+
+ if (file1 && file2)
+ ismatch = confirmmatch(file1, file2);
+ else
+ ismatch = 0;
+
+ if (file2)
+ fclose(file2);
+
+ if (file1)
+ fclose(file1);
+ }
+ else
+ {
+ ismatch = 1;
+ }
+
+ if (ismatch) {
+ if (removeifnotchanged(dupelist[x], &errorstring) == 0) {
+ printf(" [-] %s\n", dupelist[x]->d_name);
+
+ if (loginfo)
+ log_file_deleted(loginfo, dupelist[x]->d_name);
+ }
+ else {
+ printf(" [!] %s ", dupelist[x]->d_name);
+ printf("-- unable to delete file: %s!\n", errorstring);
+
+ if (loginfo)
+ log_file_remaining(loginfo, dupelist[x]->d_name);
+ }
+ }
+ else {
+ printf(" [!] %s\n", dupelist[x]->d_name);
+ printf(" -- unable to confirm match; file not deleted!\n");
+
+ if (loginfo)
+ log_file_remaining(loginfo, dupelist[x]->d_name);
+ }
}
}
printf("\n");
+
+ if (loginfo)
+ log_end_set(loginfo);
}
files = files->next;
}
+ if (loginfo)
+ log_close(loginfo);
+
free(dupelist);
free(preserve);
free(preservestr);
return !ISFLAG(flags, F_REVERSE) ? -1 : 1;
}
+/* Comparison callback ordering two files by status-change time.
+
+   Returns 0 when the ctimes are equal. Otherwise returns -1 if f1 is older
+   than f2 and 1 if it is newer, with the sign flipped when F_REVERSE is
+   set in flags. */
+int sort_pairs_by_ctime(file_t *f1, file_t *f2)
+{
+  int direction;
+
+  if (f1->ctime == f2->ctime)
+    return 0;
+
+  direction = (f1->ctime < f2->ctime) ? -1 : 1;
+
+  return ISFLAG(flags, F_REVERSE) ? -direction : direction;
+}
+
int sort_pairs_by_mtime(file_t *f1, file_t *f2)
{
if (f1->mtime < f2->mtime)
return !ISFLAG(flags, F_REVERSE) ? -1 : 1;
else if (f1->mtime > f2->mtime)
return !ISFLAG(flags, F_REVERSE) ? 1 : -1;
-
- return 0;
+ else
+ return sort_pairs_by_ctime(f1, f2);
}
int sort_pairs_by_filename(file_t *f1, file_t *f2)
{
- return strcmp(f1->d_name, f2->d_name);
+ int strvalue = strcmp(f1->d_name, f2->d_name);
+ return !ISFLAG(flags, F_REVERSE) ? strvalue : -strvalue;
}
void registerpair(file_t **matchlist, file_t *newmatch,
}
}
-void deletesuccessor(file_t **existing, file_t *duplicate,
- int (*comparef)(file_t *f1, file_t *f2))
+void deletesuccessor(file_t **existing, file_t *duplicate, int matchconfirmed,
+ int (*comparef)(file_t *f1, file_t *f2), struct log_info *loginfo)
{
file_t *to_keep;
file_t *to_delete;
+ char *errorstring;
if (comparef(duplicate, *existing) >= 0)
{
if (!ISFLAG(flags, F_HIDEPROGRESS)) fprintf(stderr, "\r%40s\r", " ");
+ if (loginfo)
+ log_begin_set(loginfo);
+
printf(" [+] %s\n", to_keep->d_name);
- if (remove(to_delete->d_name) == 0) {
- printf(" [-] %s\n", to_delete->d_name);
- } else {
- printf(" [!] %s ", to_delete->d_name);
- printf("-- unable to delete file!\n");
+
+ if (loginfo)
+ log_file_remaining(loginfo, to_keep->d_name);
+
+ if (matchconfirmed)
+ {
+ if (removeifnotchanged(to_delete, &errorstring) == 0) {
+ printf(" [-] %s\n", to_delete->d_name);
+
+ if (loginfo)
+ log_file_deleted(loginfo, to_delete->d_name);
+ } else {
+ printf(" [!] %s ", to_delete->d_name);
+ printf("-- unable to delete file: %s!\n", errorstring);
+
+ if (loginfo)
+ log_file_remaining(loginfo, to_delete->d_name);
+ }
+ }
+ else
+ {
+ printf(" [!] %s\n", to_delete->d_name);
+ printf(" -- unable to confirm match; file not deleted!\n");
+
+ if (loginfo)
+ log_file_remaining(loginfo, to_delete->d_name);
}
+ if (loginfo)
+ log_end_set(loginfo);
+
printf("\n");
}
{
printf("Usage: fdupes [options] DIRECTORY...\n\n");
- printf(" -r --recurse \tfor every directory given follow subdirectories\n");
- printf(" \tencountered within\n");
- printf(" -R --recurse: \tfor each directory given after this option follow\n");
- printf(" \tsubdirectories encountered within (note the ':' at\n");
- printf(" \tthe end of the option, manpage for more details)\n");
- printf(" -s --symlinks \tfollow symlinks\n");
- printf(" -H --hardlinks \tnormally, when two or more files point to the same\n");
- printf(" \tdisk area they are treated as non-duplicates; this\n");
- printf(" \toption will change this behavior\n");
- printf(" -n --noempty \texclude zero-length files from consideration\n");
- printf(" -A --nohidden \texclude hidden files from consideration\n");
- printf(" -f --omitfirst \tomit the first file in each set of matches\n");
- printf(" -1 --sameline \tlist each set of matches on a single line\n");
- printf(" -S --size \tshow size of duplicate files\n");
- printf(" -m --summarize \tsummarize dupe information\n");
- printf(" -q --quiet \thide progress indicator\n");
- printf(" -d --delete \tprompt user for files to preserve and delete all\n");
- printf(" \tothers; important: under particular circumstances,\n");
- printf(" \tdata may be lost when using this option together\n");
- printf(" \twith -s or --symlinks, or when specifying a\n");
- printf(" \tparticular directory more than once; refer to the\n");
- printf(" \tfdupes documentation for additional information\n");
- /*printf(" -l --relink \t(description)\n");*/
- printf(" -N --noprompt \ttogether with --delete, preserve the first file in\n");
- printf(" \teach set of duplicates and delete the rest without\n");
- printf(" \tprompting the user\n");
- printf(" -I --immediate \tdelete duplicates as they are encountered, without\n");
- printf(" \tgrouping into sets; implies --noprompt\n");
- printf(" -p --permissions \tdon't consider files with different owner/group or\n");
- printf(" \tpermission bits as duplicates\n");
- printf(" -o --order=BY \tselect sort order for output, linking and deleting; by\n");
- printf(" \tmtime (BY='time'; default) or filename (BY='name')\n");
- printf(" -i --reverse \treverse order while sorting\n");
- printf(" -v --version \tdisplay fdupes version\n");
- printf(" -h --help \tdisplay this help message\n\n");
-#ifdef OMIT_GETOPT_LONG
+ /* 0 1 0 2 0 3 0 4 0 5 0 6 0 7 0 8 0
+ -------"---------|---------|---------|---------|---------|---------|---------|---------|"
+ */
+ printf(" -r --recurse for every directory given follow subdirectories\n");
+ printf(" encountered within\n");
+ printf(" -R --recurse: for each directory given after this option follow\n");
+ printf(" subdirectories encountered within (note the ':' at the\n");
+ printf(" end of the option, manpage for more details)\n");
+ printf(" -s --symlinks follow symlinks\n");
+ printf(" -H --hardlinks normally, when two or more files point to the same\n");
+ printf(" disk area they are treated as non-duplicates; this\n");
+ printf(" option will change this behavior\n");
+ printf(" -G --minsize=SIZE consider only files greater than or equal to SIZE bytes\n");
+ printf(" -L --maxsize=SIZE consider only files less than or equal to SIZE bytes\n");
+ printf(" -n --noempty exclude zero-length files from consideration\n");
+ printf(" -A --nohidden exclude hidden files from consideration\n");
+ printf(" -f --omitfirst omit the first file in each set of matches\n");
+ printf(" -1 --sameline list each set of matches on a single line\n");
+ printf(" -S --size show size of duplicate files\n");
+ printf(" -t --time show modification time of duplicate files\n");
+ printf(" -m --summarize summarize dupe information\n");
+ printf(" -q --quiet hide progress indicator\n");
+ printf(" -d --delete prompt user for files to preserve and delete all\n");
+ printf(" others; important: under particular circumstances,\n");
+ printf(" data may be lost when using this option together\n");
+ printf(" with -s or --symlinks, or when specifying a\n");
+ printf(" particular directory more than once; refer to the\n");
+ printf(" fdupes documentation for additional information\n");
+ printf(" -D --deferconfirmation in interactive mode, defer byte-for-byte confirmation\n");
+ printf(" of duplicates until just before file deletion\n");
+#ifndef NO_NCURSES
+ printf(" -P --plain with --delete, use line-based prompt (as with older\n");
+ printf(" versions of fdupes) instead of screen-mode interface\n");
+#endif
+ printf(" -N --noprompt together with --delete, preserve the first file in\n");
+ printf(" each set of duplicates and delete the rest without\n");
+ printf(" prompting the user\n");
+ printf(" -I --immediate delete duplicates as they are encountered, without\n");
+ printf(" grouping into sets; implies --noprompt\n");
+ printf(" -p --permissions don't consider files with different owner/group or\n");
+ printf(" permission bits as duplicates\n");
+ printf(" -o --order=BY select sort order for output and deleting; by file\n");
+ printf(" modification time (BY='time'; default), status\n");
+ printf(" change time (BY='ctime'), or filename (BY='name')\n");
+ printf(" -i --reverse reverse order while sorting\n");
+ printf(" -l --log=LOGFILE log file deletion choices to LOGFILE\n");
+ printf(" -v --version display fdupes version\n");
+ printf(" -h --help display this help message\n\n");
+#ifndef HAVE_GETOPT_H
printf("Note: Long options are not supported in this fdupes build.\n\n");
#endif
}
int progress = 0;
char **oldargv;
int firstrecurse;
- ordertype_t ordertype = ORDER_TIME;
+ char *logfile = 0;
+ struct log_info *loginfo = NULL;
+ int log_error;
+ struct stat logfile_status;
+ char *endptr;
-#ifndef OMIT_GETOPT_LONG
+#ifdef HAVE_GETOPT_H
static struct option long_options[] =
{
{ "omitfirst", 0, 0, 'f' },
{ "recurse", 0, 0, 'r' },
- { "recursive", 0, 0, 'r' },
{ "recurse:", 0, 0, 'R' },
- { "recursive:", 0, 0, 'R' },
{ "quiet", 0, 0, 'q' },
{ "sameline", 0, 0, '1' },
{ "size", 0, 0, 'S' },
+ { "time", 0, 0, 't' },
{ "symlinks", 0, 0, 's' },
{ "hardlinks", 0, 0, 'H' },
- { "relink", 0, 0, 'l' },
+ { "minsize", 1, 0, 'G' },
+ { "maxsize", 1, 0, 'L' },
{ "noempty", 0, 0, 'n' },
{ "nohidden", 0, 0, 'A' },
{ "delete", 0, 0, 'd' },
+ { "plain", 0, 0, 'P' },
{ "version", 0, 0, 'v' },
{ "help", 0, 0, 'h' },
{ "noprompt", 0, 0, 'N' },
{ "permissions", 0, 0, 'p' },
{ "order", 1, 0, 'o' },
{ "reverse", 0, 0, 'i' },
+ { "log", 1, 0, 'l' },
+ { "deferconfirmation", 0, 0, 'D' },
{ 0, 0, 0, 0 }
};
#define GETOPT getopt_long
program_name = argv[0];
+ setlocale(LC_CTYPE, "");
+
oldargv = cloneargs(argc, argv);
- while ((opt = GETOPT(argc, argv, "frRq1SsHlnAdvhNmpo:i"
-#ifndef OMIT_GETOPT_LONG
+ while ((opt = GETOPT(argc, argv, "frRq1StsHG:L:nAdPvhNImpo:il:D"
+#ifdef HAVE_GETOPT_H
, long_options, NULL
#endif
)) != EOF) {
case 'S':
SETFLAG(flags, F_SHOWSIZE);
break;
+ case 't':
+ SETFLAG(flags, F_SHOWTIME);
+ break;
case 's':
SETFLAG(flags, F_FOLLOWLINKS);
break;
case 'H':
SETFLAG(flags, F_CONSIDERHARDLINKS);
break;
+ case 'G':
+ minsize = strtoll(optarg, &endptr, 10);
+ if (optarg[0] == '\0' || *endptr != '\0' || minsize < 0)
+ {
+ errormsg("invalid value for --minsize: '%s'\n", optarg);
+ exit(1);
+ }
+ break;
+ case 'L':
+ maxsize = strtoll(optarg, &endptr, 10);
+ if (optarg[0] == '\0' || *endptr != '\0' || maxsize < 0)
+ {
+ errormsg("invalid value for --maxsize: '%s'\n", optarg);
+ exit(1);
+ }
+ break;
case 'n':
SETFLAG(flags, F_EXCLUDEEMPTY);
break;
case 'd':
SETFLAG(flags, F_DELETEFILES);
break;
+ case 'P':
+ SETFLAG(flags, F_PLAINPROMPT);
+ break;
case 'v':
printf("fdupes %s\n", VERSION);
exit(0);
if (!strcasecmp("name", optarg)) {
ordertype = ORDER_NAME;
} else if (!strcasecmp("time", optarg)) {
- ordertype = ORDER_TIME;
+ ordertype = ORDER_MTIME;
+ } else if (!strcasecmp("ctime", optarg)) {
+ ordertype = ORDER_CTIME;
} else {
errormsg("invalid value for --order: '%s'\n", optarg);
exit(1);
case 'i':
SETFLAG(flags, F_REVERSE);
break;
-
+ case 'l':
+ logfile = optarg;
+ break;
+ case 'D':
+ SETFLAG(flags, F_DEFERCONFIRMATION);
+ break;
default:
fprintf(stderr, "Try `fdupes --help' for more information.\n");
exit(1);
exit(1);
}
+ if (ISFLAG(flags, F_DEFERCONFIRMATION) && (!ISFLAG(flags, F_DELETEFILES) || ISFLAG(flags, F_NOPROMPT)))
+ {
+ errormsg("--deferconfirmation only works with interactive deletion modes\n");
+ exit(1);
+ }
+
+ if (!ISFLAG(flags, F_DELETEFILES))
+ logfile = 0;
+
+ if (logfile != 0)
+ {
+ loginfo = log_open(logfile, &log_error);
+ if (loginfo == 0)
+ {
+ if (log_error == LOG_ERROR_NOT_A_LOG_FILE)
+ errormsg("%s: doesn't look like an fdupes log file\n", logfile);
+ else
+ errormsg("%s: could not open log file\n", logfile);
+
+ exit(1);
+ }
+
+ if (stat(logfile, &logfile_status) != 0)
+ {
+ errormsg("could not read log file status\n");
+ exit(1);
+ }
+ }
+
if (ISFLAG(flags, F_RECURSEAFTER)) {
firstrecurse = nonoptafter("--recurse:", argc, oldargv, argv, optind);
/* F_RECURSE is not set for directories before --recurse: */
for (x = optind; x < firstrecurse; x++)
- filecount += grokdir(argv[x], &files);
+ filecount += grokdir(argv[x], &files, logfile ? &logfile_status : 0);
/* Set F_RECURSE for directories after --recurse: */
SETFLAG(flags, F_RECURSE);
for (x = firstrecurse; x < argc; x++)
- filecount += grokdir(argv[x], &files);
+ filecount += grokdir(argv[x], &files, logfile ? &logfile_status : 0);
} else {
for (x = optind; x < argc; x++)
- filecount += grokdir(argv[x], &files);
+ filecount += grokdir(argv[x], &files, logfile ? &logfile_status : 0);
}
if (!files) {
continue;
}
- if (confirmmatch(file1, file2)) {
- if (ISFLAG(flags, F_DELETEFILES) && ISFLAG(flags, F_IMMEDIATE))
- deletesuccessor(match, curfile,
- (ordertype == ORDER_TIME) ? sort_pairs_by_mtime : sort_pairs_by_filename );
- else
- registerpair(match, curfile,
- (ordertype == ORDER_TIME) ? sort_pairs_by_mtime : sort_pairs_by_filename );
+ if (ISFLAG(flags, F_DELETEFILES) && ISFLAG(flags, F_IMMEDIATE))
+ {
+ deletesuccessor(match, curfile, confirmmatch(file1, file2),
+ ordertype == ORDER_MTIME ? sort_pairs_by_mtime :
+ ordertype == ORDER_CTIME ? sort_pairs_by_ctime :
+ sort_pairs_by_filename, loginfo );
}
-
+ else if (ISFLAG(flags, F_DEFERCONFIRMATION) || confirmmatch(file1, file2))
+ registerpair(match, curfile,
+ ordertype == ORDER_MTIME ? sort_pairs_by_mtime :
+ ordertype == ORDER_CTIME ? sort_pairs_by_ctime :
+ sort_pairs_by_filename );
+
fclose(file1);
fclose(file2);
}
if (!ISFLAG(flags, F_HIDEPROGRESS)) fprintf(stderr, "\r%40s\r", " ");
+ if (loginfo != 0)
+ {
+ log_close(loginfo);
+ loginfo = 0;
+ }
+
if (ISFLAG(flags, F_DELETEFILES))
{
- if (ISFLAG(flags, F_NOPROMPT))
+ if (ISFLAG(flags, F_NOPROMPT) || ISFLAG(flags, F_IMMEDIATE))
{
- deletefiles(files, 0, 0);
+ deletefiles(files, 0, 0, logfile);
}
else
{
- if (freopen("/dev/tty", "r", stdin) == 0)
+#ifndef NO_NCURSES
+ if (!ISFLAG(flags, F_PLAINPROMPT))
+ {
+ if (newterm(getenv("TERM"), stdout, stdin) != 0)
+ {
+ deletefiles_ncurses(files, logfile);
+ }
+ else
+ {
+ errormsg("could not enter screen mode; falling back to plain mode\n\n");
+ SETFLAG(flags, F_PLAINPROMPT);
+ }
+ }
+
+ if (ISFLAG(flags, F_PLAINPROMPT))
+ {
+ if (freopen("/dev/tty", "r", stdin) == NULL)
+ {
+ errormsg("could not open terminal for input\n");
+ exit(1);
+ }
+
+ deletefiles(files, 1, stdin, logfile);
+ }
+#else
+ if (freopen("/dev/tty", "r", stdin) == NULL)
{
errormsg("could not open terminal for input\n");
exit(1);
}
- deletefiles(files, 1, stdin);
+ deletefiles(files, 1, stdin, logfile);
+#endif
}
}