2004-04-05 21:32:18 +00:00
|
|
|
/*-
|
2007-01-09 08:12:17 +00:00
|
|
|
* Copyright (c) 2003-2007 Tim Kientzle
|
2004-04-05 21:32:18 +00:00
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
|
|
|
* 1. Redistributions of source code must retain the above copyright
|
2007-01-09 08:12:17 +00:00
|
|
|
* notice, this list of conditions and the following disclaimer.
|
2004-04-05 21:32:18 +00:00
|
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
|
|
* documentation and/or other materials provided with the distribution.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
|
|
|
|
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
|
|
|
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
|
|
|
* IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
|
|
|
|
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
|
|
|
|
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
|
|
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
|
|
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
|
|
|
|
* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "bsdtar_platform.h"
|
|
|
|
__FBSDID("$FreeBSD$");
|
|
|
|
|
2007-03-11 10:36:42 +00:00
|
|
|
#ifdef HAVE_ERRNO_H
|
2004-04-05 21:32:18 +00:00
|
|
|
#include <errno.h>
|
2007-03-11 10:36:42 +00:00
|
|
|
#endif
|
|
|
|
#ifdef HAVE_STDLIB_H
|
2004-04-05 21:32:18 +00:00
|
|
|
#include <stdlib.h>
|
2007-03-11 10:36:42 +00:00
|
|
|
#endif
|
|
|
|
#ifdef HAVE_STRING_H
|
2004-04-05 21:32:18 +00:00
|
|
|
#include <string.h>
|
2007-03-11 10:36:42 +00:00
|
|
|
#endif
|
2004-04-05 21:32:18 +00:00
|
|
|
|
2010-02-06 19:44:37 +00:00
|
|
|
#include "err.h"
|
2010-02-07 02:00:26 +00:00
|
|
|
#include "line_reader.h"
|
|
|
|
#include "matching.h"
|
|
|
|
#include "pathmatch.h"
|
2004-04-05 21:32:18 +00:00
|
|
|
|
|
|
|
/*
 * One pattern on a singly linked inclusion or exclusion list.
 *
 * add_pattern() allocates each node with extra room after the
 * structure so that the whole pattern string fits in 'pattern'.
 */
struct match {
	struct match	 *next;		/* Next node on the list, or NULL. */
	int		  matches;	/* Bumped by lafe_excluded() on a match. */
	char		  pattern[1];	/* NUL-terminated pattern text. */
};
|
|
|
|
|
2010-02-07 02:00:26 +00:00
|
|
|
/*
 * Complete matching state: the exclusion list, the inclusion list,
 * and the counters kept alongside them.
 */
struct lafe_matching {
	/* Patterns added through lafe_exclude(), newest first. */
	struct match	 *exclusions;
	int		  exclusions_count;

	/* Patterns added through lafe_include(), newest first. */
	struct match	 *inclusions;
	int		  inclusions_count;

	/* Inclusion patterns that have not matched any pathname so far. */
	int		  inclusions_unmatched_count;
};
|
|
|
|
|
2010-02-07 02:00:26 +00:00
|
|
|
/* Forward declarations of the file-local helpers. */
static void	add_pattern(struct match **list, const char *pattern);
static void	initialize_matching(struct lafe_matching **matching);
static int	match_exclusion(struct match *match, const char *pathname);
static int	match_inclusion(struct match *match, const char *pathname);
|
|
|
|
|
|
|
|
/*
 * The matching logic here needs to be re-thought.  I started out to
 * try to mimic gtar's matching logic, but it's not entirely
 * consistent.  In particular 'tar -t' and 'tar -x' interpret patterns
 * on the command line as anchored, but --exclude doesn't.
 */
|
|
|
|
|
|
|
|
/*
 * Utility functions to manage exclusion/inclusion patterns
 */
|
|
|
|
|
2004-06-27 06:29:03 +00:00
|
|
|
int
|
2010-02-07 02:00:26 +00:00
|
|
|
lafe_exclude(struct lafe_matching **matching, const char *pattern)
|
2004-04-05 21:32:18 +00:00
|
|
|
{
|
|
|
|
|
2010-02-07 02:00:26 +00:00
|
|
|
if (*matching == NULL)
|
|
|
|
initialize_matching(matching);
|
|
|
|
add_pattern(&((*matching)->exclusions), pattern);
|
|
|
|
(*matching)->exclusions_count++;
|
2004-06-27 06:29:03 +00:00
|
|
|
return (0);
|
2004-04-05 21:32:18 +00:00
|
|
|
}
|
|
|
|
|
2004-06-27 06:29:03 +00:00
|
|
|
/*
 * Register every line delivered by the line reader for 'pathname' as
 * an exclusion pattern.
 *
 * The reader is opened with 0 as its second argument (the slot that
 * lafe_include_from_file() fills with its nullSeparator flag).
 *
 * Returns 0, or -1 if lafe_exclude() reported a failure for any line;
 * remaining lines are still processed after such a failure.
 */
int
lafe_exclude_from_file(struct lafe_matching **matching, const char *pathname)
{
	struct lafe_line_reader *reader;
	const char *line;
	int status = 0;

	reader = lafe_line_reader(pathname, 0);
	for (;;) {
		line = lafe_line_reader_next(reader);
		if (line == NULL)
			break;
		if (lafe_exclude(matching, line) != 0)
			status = -1;
	}
	lafe_line_reader_free(reader);

	return (status);
}
|
|
|
|
|
2004-06-27 06:29:03 +00:00
|
|
|
int
|
2010-02-07 02:00:26 +00:00
|
|
|
lafe_include(struct lafe_matching **matching, const char *pattern)
|
2004-04-05 21:32:18 +00:00
|
|
|
{
|
2010-02-07 02:00:26 +00:00
|
|
|
|
|
|
|
if (*matching == NULL)
|
|
|
|
initialize_matching(matching);
|
|
|
|
add_pattern(&((*matching)->inclusions), pattern);
|
|
|
|
(*matching)->inclusions_count++;
|
|
|
|
(*matching)->inclusions_unmatched_count++;
|
2004-06-27 06:29:03 +00:00
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Register every line delivered by the line reader for 'pathname' as
 * an inclusion pattern.
 *
 * 'nullSeparator' is handed unchanged to lafe_line_reader().
 *
 * Returns 0, or -1 if lafe_include() reported a failure for any line;
 * remaining lines are still processed after such a failure.
 */
int
lafe_include_from_file(struct lafe_matching **matching, const char *pathname,
    int nullSeparator)
{
	struct lafe_line_reader *reader;
	const char *line;
	int status = 0;

	reader = lafe_line_reader(pathname, nullSeparator);
	for (;;) {
		line = lafe_line_reader_next(reader);
		if (line == NULL)
			break;
		if (lafe_include(matching, line) != 0)
			status = -1;
	}
	lafe_line_reader_free(reader);

	return (status);
}
|
|
|
|
|
|
|
|
static void
|
2010-02-06 19:44:37 +00:00
|
|
|
add_pattern(struct match **list, const char *pattern)
|
2004-04-05 21:32:18 +00:00
|
|
|
{
|
|
|
|
struct match *match;
|
2010-02-07 02:00:26 +00:00
|
|
|
size_t len;
|
2004-04-05 21:32:18 +00:00
|
|
|
|
2010-02-07 02:00:26 +00:00
|
|
|
len = strlen(pattern);
|
|
|
|
match = malloc(sizeof(*match) + len + 1);
|
2004-04-05 21:32:18 +00:00
|
|
|
if (match == NULL)
|
2010-02-06 19:44:37 +00:00
|
|
|
bsdtar_errc(1, errno, "Out of memory");
|
2004-04-05 21:32:18 +00:00
|
|
|
strcpy(match->pattern, pattern);
|
2004-06-02 07:23:54 +00:00
|
|
|
/* Both "foo/" and "foo" should match "foo/bar". */
|
2010-02-07 02:00:26 +00:00
|
|
|
if (len && match->pattern[len - 1] == '/')
|
2004-06-02 07:23:54 +00:00
|
|
|
match->pattern[strlen(match->pattern)-1] = '\0';
|
2004-04-05 21:32:18 +00:00
|
|
|
match->next = *list;
|
|
|
|
*list = match;
|
|
|
|
match->matches = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
int
|
2010-02-07 02:00:26 +00:00
|
|
|
lafe_excluded(struct lafe_matching *matching, const char *pathname)
|
2004-04-05 21:32:18 +00:00
|
|
|
{
|
|
|
|
struct match *match;
|
|
|
|
struct match *matched;
|
|
|
|
|
|
|
|
if (matching == NULL)
|
|
|
|
return (0);
|
|
|
|
|
2010-04-11 18:44:42 +00:00
|
|
|
/* Mark off any unmatched inclusions. */
|
|
|
|
/* In particular, if a filename does appear in the archive and
|
|
|
|
* is explicitly included and excluded, then we don't report
|
|
|
|
* it as missing even though we don't extract it.
|
|
|
|
*/
|
|
|
|
matched = NULL;
|
|
|
|
for (match = matching->inclusions; match != NULL; match = match->next){
|
|
|
|
if (match->matches == 0
|
|
|
|
&& match_inclusion(match, pathname)) {
|
|
|
|
matching->inclusions_unmatched_count--;
|
|
|
|
match->matches++;
|
|
|
|
matched = match;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2004-04-05 21:32:18 +00:00
|
|
|
/* Exclusions take priority */
|
|
|
|
for (match = matching->exclusions; match != NULL; match = match->next){
|
|
|
|
if (match_exclusion(match, pathname))
|
|
|
|
return (1);
|
|
|
|
}
|
|
|
|
|
2010-04-11 18:44:42 +00:00
|
|
|
/* It's not excluded and we found an inclusion above, so it's included. */
|
|
|
|
if (matched != NULL)
|
|
|
|
return (0);
|
|
|
|
|
|
|
|
|
|
|
|
/* We didn't find an unmatched inclusion, check the remaining ones. */
|
2004-04-05 21:32:18 +00:00
|
|
|
for (match = matching->inclusions; match != NULL; match = match->next){
|
2010-04-11 18:44:42 +00:00
|
|
|
/* We looked at previously-unmatched inclusions already. */
|
|
|
|
if (match->matches > 0
|
|
|
|
&& match_inclusion(match, pathname)) {
|
|
|
|
match->matches++;
|
|
|
|
return (0);
|
2004-04-05 21:32:18 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If there were inclusions, default is to exclude. */
|
|
|
|
if (matching->inclusions != NULL)
|
|
|
|
return (1);
|
|
|
|
|
|
|
|
/* No explicit inclusions, default is to match. */
|
|
|
|
return (0);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This is a little odd, but it matches the default behavior of
|
|
|
|
* gtar. In particular, 'a*b' will match 'foo/a1111/222b/bar'
|
|
|
|
*
|
|
|
|
*/
|
2009-03-08 05:22:50 +00:00
|
|
|
static int
|
2004-04-05 21:32:18 +00:00
|
|
|
match_exclusion(struct match *match, const char *pathname)
|
|
|
|
{
|
2010-02-07 02:00:26 +00:00
|
|
|
return (lafe_pathmatch(match->pattern,
|
|
|
|
pathname,
|
|
|
|
PATHMATCH_NO_ANCHOR_START | PATHMATCH_NO_ANCHOR_END));
|
2004-04-05 21:32:18 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Again, mimic gtar: inclusions are always anchored (have to match
|
|
|
|
* the beginning of the path) even though exclusions are not anchored.
|
|
|
|
*/
|
2010-02-07 02:00:26 +00:00
|
|
|
static int
|
2004-04-05 21:32:18 +00:00
|
|
|
match_inclusion(struct match *match, const char *pathname)
|
|
|
|
{
|
2010-02-07 02:00:26 +00:00
|
|
|
return (lafe_pathmatch(match->pattern, pathname, PATHMATCH_NO_ANCHOR_END));
|
2004-04-05 21:32:18 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
2010-02-07 02:00:26 +00:00
|
|
|
lafe_cleanup_exclusions(struct lafe_matching **matching)
|
2004-04-05 21:32:18 +00:00
|
|
|
{
|
|
|
|
struct match *p, *q;
|
|
|
|
|
2010-02-07 02:00:26 +00:00
|
|
|
if (*matching == NULL)
|
|
|
|
return;
|
|
|
|
|
|
|
|
for (p = (*matching)->inclusions; p != NULL; ) {
|
|
|
|
q = p;
|
|
|
|
p = p->next;
|
|
|
|
free(q);
|
2004-04-05 21:32:18 +00:00
|
|
|
}
|
2010-02-07 02:00:26 +00:00
|
|
|
|
|
|
|
for (p = (*matching)->exclusions; p != NULL; ) {
|
|
|
|
q = p;
|
|
|
|
p = p->next;
|
|
|
|
free(q);
|
|
|
|
}
|
|
|
|
|
|
|
|
free(*matching);
|
|
|
|
*matching = NULL;
|
2004-04-05 21:32:18 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
2010-02-07 02:00:26 +00:00
|
|
|
initialize_matching(struct lafe_matching **matching)
|
2004-04-05 21:32:18 +00:00
|
|
|
{
|
2010-02-07 02:00:26 +00:00
|
|
|
*matching = calloc(sizeof(**matching), 1);
|
|
|
|
if (*matching == NULL)
|
2010-02-06 19:44:37 +00:00
|
|
|
bsdtar_errc(1, errno, "No memory");
|
2004-04-05 21:32:18 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
int
|
2010-02-07 02:00:26 +00:00
|
|
|
lafe_unmatched_inclusions(struct lafe_matching *matching)
|
2004-04-05 21:32:18 +00:00
|
|
|
{
|
|
|
|
|
|
|
|
if (matching == NULL)
|
|
|
|
return (0);
|
|
|
|
return (matching->inclusions_unmatched_count);
|
|
|
|
}
|
2004-12-22 06:08:04 +00:00
|
|
|
|
2008-05-26 17:10:10 +00:00
|
|
|
int
|
2010-02-07 02:00:26 +00:00
|
|
|
lafe_unmatched_inclusions_warn(struct lafe_matching *matching, const char *msg)
|
2008-05-26 17:10:10 +00:00
|
|
|
{
|
|
|
|
struct match *p;
|
|
|
|
|
|
|
|
if (matching == NULL)
|
|
|
|
return (0);
|
|
|
|
|
2010-02-07 02:00:26 +00:00
|
|
|
for (p = matching->inclusions; p != NULL; p = p->next) {
|
|
|
|
if (p->matches == 0)
|
|
|
|
bsdtar_warnc(0, "%s: %s", p->pattern, msg);
|
2008-08-18 04:58:54 +00:00
|
|
|
}
|
2008-05-26 17:10:10 +00:00
|
|
|
|
2010-02-07 02:00:26 +00:00
|
|
|
return (matching->inclusions_unmatched_count);
|
2004-12-22 06:08:04 +00:00
|
|
|
}
|