[PATCH v6] erofs-utils: introduce exclude dirs and files

Gao Xiang gaoxiang25 at huawei.com
Tue Feb 18 13:32:17 AEDT 2020


On Mon, Feb 17, 2020 at 09:16:53PM +0800, Li Guifu wrote:
> From: Li GuiFu <bluce.lee at aliyun.com>
> 
> Add excluded file feature "--exclude-path=" and '--exclude-regex=',
> which can be used to build EROFS image without some user specific
> files or dirs. Note that you may give multiple '--exclude-path'
> or '--exclude-regex' options.
> 
> Signed-off-by: Gao Xiang <gaoxiang25 at huawei.com>
> Signed-off-by: Li Guifu <bluce.lee at aliyun.com>
> ---
>  change since v6, fix as comments suggested by Gao Xiang
>   - update a new email address
>   - refact regex and pattern match
> 
>  include/erofs/exclude.h |  26 ++++++++
>  lib/Makefile.am         |   2 +-
>  lib/exclude.c           | 136 ++++++++++++++++++++++++++++++++++++++++
>  lib/inode.c             |   5 ++
>  man/mkfs.erofs.1        |   8 +++
>  mkfs/main.c             |  36 +++++++++--
>  6 files changed, 206 insertions(+), 7 deletions(-)
>  create mode 100644 include/erofs/exclude.h
>  create mode 100644 lib/exclude.c
> 
> diff --git a/include/erofs/exclude.h b/include/erofs/exclude.h
> new file mode 100644
> index 0000000..0a82dbe
> --- /dev/null
> +++ b/include/erofs/exclude.h
> @@ -0,0 +1,26 @@
> +/* SPDX-License-Identifier: GPL-2.0+ */
> +/*
> + * erofs-utils/include/erofs/exclude.h
> + *
> + * Created by Li Guifu <bluce.lee at aliyun.com>
> + */
> +#ifndef __EROFS_EXCLUDE_H
> +#define __EROFS_EXCLUDE_H
> +#include <sys/types.h>
> +#include <regex.h>
> +
> +struct erofs_exclude_rule {
> +	struct list_head list;
> +
> +	char *pattern;		/* save original pattern for exact or regex match */
> +	regex_t reg;
> +};
> +
> +void erofs_exclude_set_root(const char *rootdir);
> +void erofs_cleanup_exclude_rules(void);
> +
> +int erofs_parse_exclude_path(const char *args, bool is_regex);
> +struct erofs_exclude_rule *erofs_is_exclude_path(const char *dir,
> +						 const char *name);
> +#endif
> +
> diff --git a/lib/Makefile.am b/lib/Makefile.am
> index 1ff81f9..e4b51e6 100644
> --- a/lib/Makefile.am
> +++ b/lib/Makefile.am
> @@ -3,7 +3,7 @@
>  
>  noinst_LTLIBRARIES = liberofs.la
>  liberofs_la_SOURCES = config.c io.c cache.c inode.c xattr.c \
> -		      compress.c compressor.c
> +		      compress.c compressor.c exclude.c
>  liberofs_la_CFLAGS = -Wall -Werror -I$(top_srcdir)/include
>  if ENABLE_LZ4
>  liberofs_la_CFLAGS += ${LZ4_CFLAGS}
> diff --git a/lib/exclude.c b/lib/exclude.c
> new file mode 100644
> index 0000000..6dae67e
> --- /dev/null
> +++ b/lib/exclude.c
> @@ -0,0 +1,136 @@
> +// SPDX-License-Identifier: GPL-2.0+
> +/*
> + * erofs-utils/lib/exclude.c
> + *
> + * Created by Li Guifu <bluce.lee at aliyun.com>
> + */
> +#include <string.h>
> +#include <stdlib.h>
> +#include "erofs/err.h"
> +#include "erofs/list.h"
> +#include "erofs/print.h"
> +#include "erofs/exclude.h"
> +
> +#define EXCLUDE_RULE_EXACT_SIZE	offsetof(struct erofs_exclude_rule, reg)
> +#define EXCLUDE_RULE_REGEX_SIZE	sizeof(struct erofs_exclude_rule)
> +
> +static LIST_HEAD(exclude_head);
> +static LIST_HEAD(regex_exclude_head);
> +
> +static unsigned int rpathlen;		/* root directory prefix length */
> +
> +void erofs_exclude_set_root(const char *rootdir)
> +{
> +	rpathlen = strlen(rootdir);
> +}
> +
> +static void dump_regerror(int errcode, const char *s, const regex_t *preg)
> +{
> +	char str[1024]; /* overflow safe */
> +
> +	regerror(errcode, preg, str, 1024);


Still some minor issues here.

You could send the new version or I will fix them myself later.

Maybe it's better to "

char msg[1024];

regerror(errcode, preg, msg, sizeof(msg));

"


> +	erofs_err("invalid regex %s,because %s\n", s, str);
> +}
> +
> +static struct erofs_exclude_rule *erofs_insert_exclude(const char *s,
> +						       bool is_regex)
> +{
> +	int ret = -ENOMEM;
> +	struct erofs_exclude_rule *r;
> +	struct list_head *h;
> +	unsigned int size;
> +
> +	size = is_regex ? EXCLUDE_RULE_REGEX_SIZE : EXCLUDE_RULE_EXACT_SIZE;
> +	r = malloc(size);
> +	if (!r)
> +		return ERR_PTR(-ENOMEM);
> +
> +	r->pattern = strdup(s);
> +	if (!r->pattern)
> +		goto err_rule;
> +
> +	if (is_regex) {
> +		ret = regcomp(&r->reg, s, REG_EXTENDED|REG_NOSUB);
> +		if(ret) {
> +			dump_regerror(ret, s, &r->reg);
> +			goto err_rule;
> +		}
> +		h = &regex_exclude_head;
> +	} else {
> +		h = &exclude_head;
> +	}
> +
> +	list_add_tail(&r->list, h);
> +	erofs_info("Insert exclude:[%s]\n", s);
> +	return r;
> +
> +err_rule:
> +	free(r);
> +	return ERR_PTR(ret);
> +}
> +
> +static inline void erofs_free_exclude_rules(struct list_head *h)
> +{
> +	struct erofs_exclude_rule *r, *n;
> +
> +	list_for_each_entry_safe(r, n, h, list) {
> +		list_del(&r->list);
> +		free(r->pattern);
> +		free(r);
> +	}
> +}
> +
> +void erofs_cleanup_exclude_rules(void)
> +{
> +	erofs_free_exclude_rules(&exclude_head);
> +	erofs_free_exclude_rules(&regex_exclude_head);

For regular expression, it needs to regfree(&r->reg) anyway.

> +}
> +
> +int erofs_parse_exclude_path(const char *args, bool is_regex)
> +{
> +	struct erofs_exclude_rule *r = erofs_insert_exclude(args, is_regex);
> +
> +	if (IS_ERR(r)) {
> +		erofs_cleanup_exclude_rules();
> +		return PTR_ERR(r);
> +	}
> +	return 0;
> +}
> +
> +struct erofs_exclude_rule *erofs_is_exclude_path(const char *dir,
> +						 const char *name)
> +{
> +	char buf[PATH_MAX];
> +	const char *s;
> +	struct erofs_exclude_rule *r;
> +
> +	if (!dir) {
> +		/* no prefix */
> +		s = name;
> +	} else {
> +		sprintf(buf, "%s/%s", dir, name);
> +		s = buf;
> +	}
> +
> +	s += rpathlen;
> +	while (*s == '/')
> +		s++;
> +
> +	list_for_each_entry(r, &exclude_head, list) {
> +		if (!strcmp(r->pattern, s))
> +			return r;
> +	}
> +
> +	list_for_each_entry(r, &regex_exclude_head, list) {
> +		int ret = regexec(&r->reg, s, (size_t)0, NULL, 0);
> +
> +		if(!ret)
> +			return r;
> +		else if (ret != REG_NOMATCH)
> +			dump_regerror(ret, s, &r->reg);
> +
> +	}
> +
> +	return NULL;
> +}
> +
> diff --git a/lib/inode.c b/lib/inode.c
> index bd0652b..7114023 100644
> --- a/lib/inode.c
> +++ b/lib/inode.c
> @@ -20,6 +20,7 @@
>  #include "erofs/io.h"
>  #include "erofs/compress.h"
>  #include "erofs/xattr.h"
> +#include "erofs/exclude.h"
>  
>  struct erofs_sb_info sbi;
>  
> @@ -877,6 +878,10 @@ struct erofs_inode *erofs_mkfs_build_tree(struct erofs_inode *dir)
>  		    !strncmp(dp->d_name, "lost+found", strlen("lost+found")))
>  			continue;
>  
> +		/* skip if it's a exclude file */
> +		if (erofs_is_exclude_path(dir->i_srcpath, dp->d_name))
> +			continue;
> +
>  		d = erofs_d_alloc(dir, dp->d_name);
>  		if (IS_ERR(d)) {
>  			ret = PTR_ERR(d);
> diff --git a/man/mkfs.erofs.1 b/man/mkfs.erofs.1
> index d6bf828..ab19927 100644
> --- a/man/mkfs.erofs.1
> +++ b/man/mkfs.erofs.1
> @@ -52,6 +52,14 @@ Forcely generate extended inodes (64-byte inodes) to output.
>  Set all files to the given UNIX timestamp. Reproducible builds requires setting
>  all to a specific one.
>  .TP
> +.BI "\-\-exclude-path=" path
> +Ignore file that matches the exact literal path.
> +You may give multiple `--exclude-path' options.
> +.TP
> +.BI "\-\-exclude-regex=" path
> +Ignore file that matches the exact literal path given by a regex expression
> +You may give multiple `--exclude-regex` options

Didn't handle the previous comment of this.

(Regular expression is not a exact literal path.)

> +.TP
>  .B \-\-help
>  Display this help and exit.
>  .SH AUTHOR
> diff --git a/mkfs/main.c b/mkfs/main.c
> index 817a6c1..d0c9869 100644
> --- a/mkfs/main.c
> +++ b/mkfs/main.c
> @@ -21,6 +21,7 @@
>  #include "erofs/io.h"
>  #include "erofs/compress.h"
>  #include "erofs/xattr.h"
> +#include "erofs/exclude.h"
>  
>  #ifdef HAVE_LIBUUID
>  #include <uuid/uuid.h>
> @@ -30,6 +31,8 @@
>  
>  static struct option long_options[] = {
>  	{"help", no_argument, 0, 1},
> +	{"exclude-path", required_argument, NULL, 2},
> +	{"exclude-regex", required_argument, NULL, 3},
>  	{0, 0, 0, 0},
>  };
>  
> @@ -50,12 +53,14 @@ static void usage(void)
>  {
>  	fputs("usage: [options] FILE DIRECTORY\n\n"
>  	      "Generate erofs image from DIRECTORY to FILE, and [options] are:\n"
> -	      " -zX[,Y]   X=compressor (Y=compression level, optional)\n"
> -	      " -d#       set output message level to # (maximum 9)\n"
> -	      " -x#       set xattr tolerance to # (< 0, disable xattrs; default 2)\n"
> -	      " -EX[,...] X=extended options\n"
> -	      " -T#       set a fixed UNIX timestamp # to all files\n"
> -	      " --help    display this help and exit\n"
> +	      " -zX[,Y]          X=compressor (Y=compression level, optional)\n"
> +	      " -d#              set output message level to # (maximum 9)\n"
> +	      " -x#              set xattr tolerance to # (< 0, disable xattrs; default 2)\n"
> +	      " -EX[,...]        X=extended options\n"
> +	      " -T#              set a fixed UNIX timestamp # to all files\n"
> +	      " --exclude-path=X avoid including file X (X = exact literal path)\n"
> +	      " --exclude-regex=X avoid including file X (X = exact literal path of a regex)\n"

Didn't handle this as well.

Thanks,
Gao Xiang



More information about the Linux-erofs mailing list