From: Andre Noll Date: Sun, 1 Jun 2008 15:50:41 +0000 (+0200) Subject: Move the code for the select command to its own file. X-Git-Tag: v0.0.2~16 X-Git-Url: http://git.tuebingen.mpg.de/?a=commitdiff_plain;ds=sidebyside;h=cab88f141a9550dcceee0ad8eab978660e0ae0de;p=adu.git Move the code for the select command to its own file. --- diff --git a/Makefile b/Makefile index ef94fcc..68e6443 100644 --- a/Makefile +++ b/Makefile @@ -1,4 +1,4 @@ -objects := adu.o string.o cmdline.o fd.o +objects := adu.o string.o cmdline.o fd.o select.o all: adu DEBUG_CPPFLAGS += -Wno-sign-compare -g -Wunused -Wundef -W diff --git a/adu.c b/adu.c index c3a278e..9a0e513 100644 --- a/adu.c +++ b/adu.c @@ -12,33 +12,21 @@ DEFINE_ERRLIST; int osl_errno; -/** Command line and config file options. */ -static struct gengetopt_args_info conf; - -enum uid_info_flags { - /** whether this slot of the hash table is used. */ - UI_FL_SLOT_USED = 1, - /** whether this uid should be taken into account. */ - UI_FL_ADMISSIBLE = 2, -}; - -struct user_info { - uint32_t uid; - uint32_t flags; - char *pw_name; - struct osl_table *table; - uint64_t files; - uint64_t bytes; - uint64_t dirs; - struct osl_table_description *desc; -}; +/** In case a signal is received, its number is stored here. */ +static int signum; -/** The decimal representation of an uint64_t never exceeds that size. */ -#define FORMATED_VALUE_SIZE 25 +/** Command line and config file options. */ +struct gengetopt_args_info conf; -#define FOR_EACH_USER(ui) for (ui = uid_hash_table; ui && ui < uid_hash_table \ - + uid_hash_table_size; ui++) +/** Global dir count. */ +uint64_t num_dirs = 0; +/** Global files count. */ +uint64_t num_files = 0; +/** Global bytes count. */ +uint64_t num_bytes = 0; +/** The number of different uids found so far. */ +uint32_t num_uids = 0; /** * Contains info for each user that owns at least one regular file. @@ -47,113 +35,20 @@ struct user_info { * option occupy a slot in this hash table. 
This allows to find out * quicky whether a uid is admissible. And yes, this has to be fast. */ -static struct user_info *uid_hash_table; - -/* these get filled in by the select command. */ -static char count_unit_buf[4] = "( )", size_unit_buf[4] = "( )"; - -static inline int ui_used(struct user_info *ui) -{ - return ui->flags & UI_FL_SLOT_USED; -} - -static inline int ui_admissible(struct user_info *ui) -{ - return ui->flags & UI_FL_ADMISSIBLE; -} - -struct uid_range { - uint32_t low; - uint32_t high; -}; - -static struct uid_range *admissible_uids; - -static inline int check_uid_arg(const char *arg, uint32_t *uid) -{ - const uint32_t max = ~0U; - /* - * we need an 64-bit int for string -> uid conversion because strtoll() - * returns a signed value. - */ - int64_t val; - int ret = atoi64(arg, &val); - - if (ret < 0) - return ret; - if (val < 0 || val > max) - return -ERRNO_TO_ERROR(EINVAL); - *uid = val; - return 1; -} - -static int parse_uid_range(const char *orig_arg, struct uid_range *ur) -{ - int ret; - char *arg = adu_strdup(orig_arg), *p = strchr(arg, '-'); - - if (!p || p == arg) { /* -42 or 42 */ - ret = check_uid_arg(p? p + 1 : arg, &ur->high); - if (ret < 0) - goto out; - ur->low = p? 0 : ur->high; - ret = 1; - goto out; - } - /* 42- or 42-4711 */ - *p = '\0'; - p++; - ret = check_uid_arg(arg, &ur->low); - if (ret < 0) - goto out; - ur->high = ~0U; - if (*p) { /* 42-4711 */ - ret = check_uid_arg(p, &ur->high); - if (ret < 0) - goto out; - } - if (ur->low > ur->high) - ret = -ERRNO_TO_ERROR(EINVAL); -out: - if (ret < 0) - ERROR_LOG("bad uid option: %s\n", orig_arg); - else - INFO_LOG("admissible uid range: %u - %u\n", ur->low, - ur->high); - free(arg); - return ret; -} +struct user_info *uid_hash_table = NULL; -/** evaluates to 1 if x < y, to -1 if x > y and to 0 if x == y */ -#define NUM_COMPARE(x, y) ((int)((x) < (y)) - (int)((x) > (y))) +/** + * The table containing the directory names and statistics. 
+ */ +struct osl_table *dir_table = NULL; /** - * The log function. - * - * \param ll Loglevel. - * \param fml Usual format string. - * - * All XXX_LOG() macros use this function. + * The array of all uid ranges that were given at the command line. */ -__printf_2_3 void __log(int ll, const char* fmt,...) -{ - va_list argp; - FILE *outfd; - struct tm *tm; - time_t t1; - char str[255] = ""; +struct uid_range *admissible_uids; - if (ll < conf.loglevel_arg) - return; - outfd = stderr; - time(&t1); - tm = localtime(&t1); - strftime(str, sizeof(str), "%b %d %H:%M:%S", tm); - fprintf(outfd, "%s ", str); - va_start(argp, fmt); - vfprintf(outfd, fmt, argp); - va_end(argp); -} +/** Evaluates to 1 if x < y, to -1 if x > y and to 0 if x == y. */ +#define NUM_COMPARE(x, y) ((int)((x) < (y)) - (int)((x) > (y))) /** * Compare the size of two directories @@ -200,22 +95,6 @@ static int uint64_compare(const struct osl_object *obj1, return 0; } -/** The columns of the directory table. */ -enum dir_table_columns { - /** The name of the directory. */ - DT_NAME, - /** The dir count number. */ - DT_NUM, - /** The number of the parent directory. */ - DT_PARENT_NUM, - /** The number of bytes of all regular files. */ - DT_BYTES, - /** The number of all regular files. */ - DT_FILES, - /** Number of columns in this table. */ - NUM_DT_COLUMNS -}; - static struct osl_column_description dir_table_cols[] = { [DT_NAME] = { .storage_type = OSL_MAPPED_STORAGE, @@ -259,18 +138,6 @@ static struct osl_table_description dir_table_desc = { .column_descriptions = dir_table_cols, }; -/** The columns of the id table. */ -enum user_table_columns { - /** The numer of the directory. */ - UT_DIR_NUM, - /** The number of bytes of all regular files in this dir owned by this id. */ - UT_BYTES, - /** The number of files in this dir owned by this id. */ - UT_FILES, - /** Number of columns in this table. 
*/ - NUM_UT_COLUMNS -}; - static struct osl_column_description user_table_cols[] = { [UT_DIR_NUM] = { .storage_type = OSL_MAPPED_STORAGE, @@ -295,7 +162,88 @@ static struct osl_column_description user_table_cols[] = { }, }; -static struct osl_table *dir_table; +static int check_uid_arg(const char *arg, uint32_t *uid) +{ + const uint32_t max = ~0U; + /* + * we need an 64-bit int for string -> uid conversion because strtoll() + * returns a signed value. + */ + int64_t val; + int ret = atoi64(arg, &val); + + if (ret < 0) + return ret; + if (val < 0 || val > max) + return -ERRNO_TO_ERROR(EINVAL); + *uid = val; + return 1; +} + +static int parse_uid_range(const char *orig_arg, struct uid_range *ur) +{ + int ret; + char *arg = adu_strdup(orig_arg), *p = strchr(arg, '-'); + + if (!p || p == arg) { /* -42 or 42 */ + ret = check_uid_arg(p? p + 1 : arg, &ur->high); + if (ret < 0) + goto out; + ur->low = p? 0 : ur->high; + ret = 1; + goto out; + } + /* 42- or 42-4711 */ + *p = '\0'; + p++; + ret = check_uid_arg(arg, &ur->low); + if (ret < 0) + goto out; + ur->high = ~0U; + if (*p) { /* 42-4711 */ + ret = check_uid_arg(p, &ur->high); + if (ret < 0) + goto out; + } + if (ur->low > ur->high) + ret = -ERRNO_TO_ERROR(EINVAL); +out: + if (ret < 0) + ERROR_LOG("bad uid option: %s\n", orig_arg); + else + INFO_LOG("admissible uid range: %u - %u\n", ur->low, + ur->high); + free(arg); + return ret; +} + +/** + * The log function. + * + * \param ll Loglevel. + * \param fml Usual format string. + * + * All XXX_LOG() macros use this function. + */ +__printf_2_3 void __log(int ll, const char* fmt,...) 
+{ + va_list argp; + FILE *outfd; + struct tm *tm; + time_t t1; + char str[255] = ""; + + if (ll < conf.loglevel_arg) + return; + outfd = stderr; + time(&t1); + tm = localtime(&t1); + strftime(str, sizeof(str), "%b %d %H:%M:%S", tm); + fprintf(outfd, "%s ", str); + va_start(argp, fmt); + vfprintf(outfd, fmt, argp); + va_end(argp); +} static int add_directory(char *dirname, uint64_t *dir_num, uint64_t *parent_dir_num, uint64_t *dir_size, uint64_t *dir_files) @@ -316,8 +264,6 @@ static int add_directory(char *dirname, uint64_t *dir_num, uint64_t *parent_dir_ return osl(osl_add_row(dir_table, dir_objects)); } -static uint32_t num_uids; - static int open_user_table(struct user_info *ui, int create) { int ret; @@ -359,11 +305,11 @@ err: } #define uid_hash_bits 8 -static uint32_t uid_hash_table_size = 1 << uid_hash_bits; +uint32_t uid_hash_table_size = 1 << uid_hash_bits; #define PRIME1 0x811c9dc5 #define PRIME2 0x01000193 -static void create_hash_table(void) +void create_hash_table(void) { uid_hash_table = adu_calloc(uid_hash_table_size * sizeof(struct user_info)); @@ -430,21 +376,19 @@ static void close_user_tables(void) close_user_table(ui); } -static void close_all_tables(void) +void close_all_tables(void) { close_dir_table(); close_user_tables(); free_hash_table(); } -static int signum; - static void signal_handler(int s) { signum = s; } -static void check_signals(void) +void check_signals(void) { if (likely(!signum)) return; @@ -484,11 +428,6 @@ static uint32_t double_hash(uint32_t uid, uint32_t probe_num) % uid_hash_table_size; } -enum search_uid_flags { - OPEN_USER_TABLE = 1, - CREATE_USER_TABLE = 2, -}; - static int uid_is_admissible(uint32_t uid) { int i; @@ -505,7 +444,7 @@ static int uid_is_admissible(uint32_t uid) return i; } -static int search_uid(uint32_t uid, enum search_uid_flags flags, +int search_uid(uint32_t uid, enum search_uid_flags flags, struct user_info **ui_ptr) { uint32_t p; @@ -582,10 +521,6 @@ static int update_user_row(struct osl_table *t, 
uint64_t dir_num, } } -static uint64_t num_dirs; -static uint64_t num_files; -static uint64_t num_bytes; - /* id of the device containing the base dir. */ static dev_t device_id; @@ -660,441 +595,7 @@ out: return ret; } -static int get_dir_name_by_number(uint64_t *dirnum, char **name) -{ - char *result = NULL, *tmp; - struct osl_row *row; - uint64_t val = *dirnum; - struct osl_object obj = {.data = &val, .size = sizeof(val)}; - int ret; - -again: - ret = osl(osl_get_row(dir_table, DT_NUM, &obj, &row)); - if (ret < 0) - goto out; - ret = osl(osl_get_object(dir_table, row, DT_NAME, &obj)); - if (ret < 0) - goto out; - if (result) { - tmp = make_message("%s/%s", (char *)obj.data, result); - free(result); - result = tmp; - } else - result = adu_strdup((char *)obj.data); - ret = osl(osl_get_object(dir_table, row, DT_PARENT_NUM, &obj)); - if (ret < 0) - goto out; - val = *(uint64_t *)obj.data; - if (val) - goto again; -out: - if (ret < 0) { - free(result); - *name = NULL; - } else - *name = result; - return ret; -} - -static int get_dir_name_of_row(struct osl_row *dir_table_row, char **name) -{ - struct osl_object obj; - int ret; - char *this_dir, *prefix = NULL; - - *name = NULL; - ret = osl(osl_get_object(dir_table, dir_table_row, DT_NAME, &obj)); - if (ret < 0) - return ret; - this_dir = adu_strdup((char *)obj.data); - ret = osl(osl_get_object(dir_table, dir_table_row, DT_PARENT_NUM, &obj)); - if (ret < 0) - goto out; - if (!*(uint64_t *)obj.data) { - *name = this_dir; - return 1; - } - ret = get_dir_name_by_number((uint64_t *)obj.data, &prefix); - if (ret < 0) - goto out; - *name = make_message("%s/%s", prefix, this_dir); - free(prefix); - ret = 1; -out: - free(this_dir); - return ret; -} - -const uint64_t size_unit_divisors[] = { - [size_unit_arg_b] = 1ULL, - [size_unit_arg_k] = 1024ULL, - [size_unit_arg_m] = 1024ULL * 1024ULL, - [size_unit_arg_g] = 1024ULL * 1024ULL * 1024ULL, - [size_unit_arg_t] = 1024ULL * 1024ULL * 1024ULL * 1024ULL, -}; - -const uint64_t 
count_unit_divisors[] = { - - [count_unit_arg_n] = 1ULL, - [count_unit_arg_k] = 1000ULL, - [count_unit_arg_m] = 1000ULL * 1000ULL, - [count_unit_arg_g] = 1000ULL * 1000ULL * 1000ULL, - [count_unit_arg_t] = 1000ULL * 1000ULL * 1000ULL * 1000ULL, -}; - -const char size_unit_abbrevs[] = " BKMGT"; -const char count_unit_abbrevs[] = " kmgt"; - -static enum enum_size_unit format_size_value(enum enum_size_unit unit, - uint64_t value, int print_unit, char *result) -{ - enum enum_size_unit u = unit; - char unit_buf[2] = "\0\0"; - - if (unit == size_unit_arg_h) /* human readable */ - for (u = size_unit_arg_b; u < size_unit_arg_t && - value > size_unit_divisors[u + 1]; u++) - ; /* nothing */ - if (print_unit) - unit_buf[0] = size_unit_abbrevs[u]; - sprintf(result, "%llu%s", - (long long unsigned)value / size_unit_divisors[u], unit_buf); - return u; -} - -static enum enum_count_unit format_count_value(enum enum_count_unit unit, - uint64_t value, int print_unit, char *result) -{ - enum enum_count_unit u = unit; - char unit_buf[2] = "\0\0"; - - if (unit == count_unit_arg_h) /* human readable */ - for (u = count_unit_arg_n; u < count_unit_arg_t && - value > count_unit_divisors[u + 1]; u++) - ; /* nothing */ - if (print_unit) - unit_buf[0] = count_unit_abbrevs[u]; - sprintf(result, "%llu%s", - (long long unsigned)value / count_unit_divisors[u], unit_buf); - return u; -} - -enum global_stats_flags { - GSF_PRINT_DIRNAME = 1, - GSF_PRINT_BYTES = 2, - GSF_PRINT_FILES = 4, - GSF_COMPUTE_SUMMARY = 8, -}; - -struct global_stats_info { - uint32_t count; - int ret; - int osl_errno; - enum global_stats_flags flags; -}; - -static int global_stats_loop_function(struct osl_row *row, void *data) -{ - struct global_stats_info *gsi = data; - struct osl_object obj; - char *dirname, formated_value[FORMATED_VALUE_SIZE]; - int ret, summary = gsi->flags & GSF_COMPUTE_SUMMARY; - - check_signals(); - if (!gsi->count && !summary) { - ret = -E_LOOP_COMPLETE; - goto err; - } - if (summary || (gsi->count && 
(gsi->flags & GSF_PRINT_FILES))) { - uint64_t files; - ret = osl(osl_get_object(dir_table, row, DT_FILES, &obj)); - if (ret < 0) - goto err; - files = *(uint64_t *)obj.data; - if (gsi->count && (gsi->flags & GSF_PRINT_FILES)) { - format_count_value(conf.count_unit_arg, files, - conf.count_unit_arg == count_unit_arg_h, - formated_value); - printf("\t%s%s", formated_value, - (gsi->flags & (GSF_PRINT_BYTES | GSF_PRINT_DIRNAME))? - "\t" : "\n"); - } - if (summary) - num_files += files; - } - if (summary || (gsi->count && (gsi->flags & GSF_PRINT_BYTES))) { - uint64_t bytes; - ret = osl(osl_get_object(dir_table, row, DT_BYTES, &obj)); - if (ret < 0) - goto err; - bytes = *(uint64_t *)obj.data; - if (gsi->count && (gsi->flags & GSF_PRINT_BYTES)) { - format_size_value(conf.size_unit_arg, bytes, - conf.size_unit_arg == size_unit_arg_h, - formated_value); - printf("%s%s%s", - (gsi->flags & GSF_PRINT_FILES)? "" : "\t", - formated_value, - (gsi->flags & GSF_PRINT_DIRNAME)? "\t" : "\n" - ); - } - if (summary) { - num_bytes += bytes; - num_dirs++; - } - } - if (gsi->count && (gsi->flags & GSF_PRINT_DIRNAME)) { - ret = get_dir_name_of_row(row, &dirname); - if (ret < 0) - goto err; - printf("%s%s\n", - (gsi->flags & (GSF_PRINT_BYTES | GSF_PRINT_FILES))? "" : "\t", - dirname); - free(dirname); - } - if (gsi->count > 0) - gsi->count--; - return 1; -err: - gsi->ret = ret; - gsi->osl_errno = (ret == -E_OSL)? 
osl_errno : 0; - return -1; -} - -static void print_id_stats(void) -{ - struct user_info *ui; - - printf("User summary " - "(pw_name/uid/dirs%s/files%s/size%s):\n", - count_unit_buf, count_unit_buf, size_unit_buf); - FOR_EACH_USER(ui) { - char formated_dir_count[FORMATED_VALUE_SIZE], - formated_file_count[FORMATED_VALUE_SIZE], - formated_bytes[FORMATED_VALUE_SIZE ]; - if (!ui_used(ui) || !ui_admissible(ui)) - continue; - format_count_value(conf.count_unit_arg, ui->dirs, - conf.count_unit_arg == count_unit_arg_h, - formated_dir_count); - format_count_value(conf.count_unit_arg, ui->files, - conf.count_unit_arg == count_unit_arg_h, - formated_file_count); - format_size_value(conf.size_unit_arg, ui->bytes, - conf.size_unit_arg == size_unit_arg_h, - formated_bytes); - printf("\t%s\t%u\t%s\t%s\t%s\n", - ui->pw_name? ui->pw_name : "?", - (unsigned)ui->uid, - formated_dir_count, - formated_file_count, - formated_bytes - ); - } -} - -enum user_stats_flags { - USF_PRINT_DIRNAME = 1, - USF_PRINT_BYTES = 2, - USF_PRINT_FILES = 4, - USF_COMPUTE_SUMMARY = 8, -}; - -struct user_stats_info { - uint32_t count; - enum user_stats_flags flags; - int ret; - int osl_errno; - struct user_info *ui; -}; - -static int user_stats_loop_function(struct osl_row *row, void *data) -{ - struct user_stats_info *usi = data; - struct osl_object obj; - int ret, summary = usi->flags & GSF_COMPUTE_SUMMARY; - char formated_value[FORMATED_VALUE_SIZE]; - - check_signals(); - if (!usi->count && !summary) { - ret = -E_LOOP_COMPLETE; - goto err; - } - if (summary || (usi->count && (usi->flags & USF_PRINT_FILES))) { - uint64_t files; - ret = osl(osl_get_object(usi->ui->table, row, UT_FILES, &obj)); - if (ret < 0) - goto err; - files = *(uint64_t *)obj.data; - if (usi->count && (usi->flags & USF_PRINT_FILES)) { - format_count_value(conf.count_unit_arg, files, - conf.count_unit_arg == count_unit_arg_h, - formated_value); - printf("\t%s%s", formated_value, - (usi->flags & (USF_PRINT_BYTES | USF_PRINT_DIRNAME))? 
- "\t" : "\n" - ); - } - if (summary) - usi->ui->files += files; - } - if (summary || (usi->count && (usi->flags & USF_PRINT_BYTES))) { - uint64_t bytes; - ret = osl(osl_get_object(usi->ui->table, row, UT_BYTES, &obj)); - if (ret < 0) - goto err; - bytes = *(uint64_t *)obj.data; - if (usi->count && (usi->flags & USF_PRINT_BYTES)) { - format_size_value(conf.size_unit_arg, bytes, - conf.size_unit_arg == size_unit_arg_h, - formated_value); - printf("%s%s%s", - (usi->flags & USF_PRINT_FILES)? "" : "\t", - formated_value, - usi->flags & USF_PRINT_DIRNAME? "\t" : "\n" - ); - } - if (summary) { - usi->ui->bytes += bytes; - usi->ui->dirs++; - } - - } - if (usi->count && (usi->flags & USF_PRINT_DIRNAME)) { - char *dirname; - ret = osl(osl_get_object(usi->ui->table, row, UT_DIR_NUM, &obj)); - if (ret < 0) - goto err; - ret = get_dir_name_by_number((uint64_t *)obj.data, &dirname); - if (ret < 0) - goto err; - printf("%s%s\n", - (usi->flags & (USF_PRINT_BYTES | USF_PRINT_FILES))? "" : "\t", - dirname); - free(dirname); - } - if (usi->count > 0) - usi->count--; - return 1; -err: - usi->ret = ret; - usi->osl_errno = (ret == -E_OSL)? osl_errno : 0; - return -1; -} - -static int check_loop_return(int ret, int loop_ret, int loop_osl_errno) -{ - if (ret >= 0) - return ret; - assert(ret == -E_OSL); - if (osl_errno != E_OSL_LOOP) - /* error not caused by loop function returning negative. 
*/ - return ret; - assert(loop_ret < 0); - if (loop_ret == -E_LOOP_COMPLETE) /* no error */ - return 1; - if (loop_ret == -E_OSL) { /* osl error in loop function */ - assert(loop_osl_errno); - osl_errno = loop_osl_errno; - } - return loop_ret; -} - -static int adu_loop_reverse(struct osl_table *t, unsigned col_num, void *private_data, - osl_rbtree_loop_func *func, int *loop_ret, int *loop_osl_errno) -{ - int ret = osl(osl_rbtree_loop_reverse(t, col_num, private_data, func)); - return check_loop_return(ret, *loop_ret, *loop_osl_errno); -} - -static int print_user_stats(void) -{ - struct user_info *ui; - int ret; - - FOR_EACH_USER(ui) { - struct user_stats_info usi = { - .count = conf.limit_arg, - .ui = ui - }; - if (!ui_used(ui) || !ui_admissible(ui)) - continue; - usi.flags = USF_PRINT_DIRNAME | USF_PRINT_BYTES | USF_COMPUTE_SUMMARY; - printf("%s (uid %u), by size%s:\n", - ui->pw_name? ui->pw_name : "?", (unsigned)ui->uid, - size_unit_buf); - ret = adu_loop_reverse(ui->table, UT_BYTES, &usi, user_stats_loop_function, - &usi.ret, &usi.osl_errno); - if (ret < 0) - return ret; - printf("\n%s (uid %u), by file count%s:\n", - ui->pw_name? 
ui->pw_name : "?", (unsigned)ui->uid, - count_unit_buf); - usi.count = conf.limit_arg, - usi.flags = USF_PRINT_DIRNAME | USF_PRINT_FILES; - ret = adu_loop_reverse(ui->table, UT_FILES, &usi, user_stats_loop_function, - &usi.ret, &usi.osl_errno); - if (ret < 0) - return ret; - printf("\n"); - } - return 1; -} - -static void print_global_summary(void) -{ - char d[FORMATED_VALUE_SIZE], f[FORMATED_VALUE_SIZE], - s[FORMATED_VALUE_SIZE]; - enum enum_count_unit ud, uf; - enum enum_size_unit us; - - ud = format_count_value(conf.count_unit_arg, num_dirs, 0, d); - uf = format_count_value(conf.count_unit_arg, num_files, 0, f); - us = format_size_value(conf.size_unit_arg, num_bytes, 0, s); - - printf("Global summary " - "(dirs(%c)/files(%c)/size(%c))\n" - "\t%s\t%s\t%s\n\n", - count_unit_abbrevs[ud], - count_unit_abbrevs[uf], - size_unit_abbrevs[us], - d, f, s - ); - -} - -static int print_statistics(void) -{ - int ret; - struct global_stats_info gsi = { - .count = conf.limit_arg, - .flags = GSF_PRINT_DIRNAME | GSF_PRINT_BYTES | GSF_COMPUTE_SUMMARY - }; - - printf("By size%s:\n", - size_unit_buf); - ret = adu_loop_reverse(dir_table, DT_BYTES, &gsi, - global_stats_loop_function, &gsi.ret, &gsi.osl_errno); - if (ret < 0) - return ret; - printf("\n"); - - gsi.count = conf.limit_arg; - gsi.flags = GSF_PRINT_DIRNAME | GSF_PRINT_FILES; - printf("By file count%s:\n", - count_unit_buf); - ret = adu_loop_reverse(dir_table, DT_FILES, &gsi, - global_stats_loop_function, &gsi.ret, &gsi.osl_errno); - if (ret < 0) - return ret; - printf("\n"); - print_global_summary(); - print_user_stats(); - print_id_stats(); - return 1; -} - -static char *get_uid_list_name(void) +char *get_uid_list_name(void) { return make_message("%s/uid_list", conf.database_dir_arg); } @@ -1123,7 +624,7 @@ static int write_uid_list(void) return ret; } -static int open_dir_table(void) +int open_dir_table(void) { if (!dir_table_desc.dir) /* we did not create the table */ dir_table_desc.dir = 
adu_strdup(conf.database_dir_arg); @@ -1157,63 +658,6 @@ out: return ret; } -static int read_uid_file(void) -{ - size_t size; - uint32_t n; - char *filename = get_uid_list_name(), *map; - int ret = mmap_full_file(filename, O_RDONLY, (void **)&map, &size, NULL); - - if (ret < 0) { - INFO_LOG("failed to map %s\n", filename); - free(filename); - return ret; - } - num_uids = size / 4; - INFO_LOG("found %u uids in %s\n", (unsigned)num_uids, filename); - free(filename); - /* hash table size should be a power of two and larger than the number of uids */ - uid_hash_table_size = 4; - while (uid_hash_table_size < num_uids) - uid_hash_table_size *= 2; - create_hash_table(); - for (n = 0; n < num_uids; n++) { - uint32_t uid = read_u32(map + n * sizeof(uid)); - ret = search_uid(uid, OPEN_USER_TABLE, NULL); - if (ret < 0) - goto out; - } -out: - adu_munmap(map, size); - return ret; -} - -static int com_select(void) -{ - int ret; - - if (conf.count_unit_arg != count_unit_arg_h) - count_unit_buf[1] = count_unit_abbrevs[conf.count_unit_arg]; - else - count_unit_buf[0] = '\0'; - if (conf.size_unit_arg != size_unit_arg_h) - size_unit_buf[1] = size_unit_abbrevs[conf.size_unit_arg]; - else - size_unit_buf[0] = '\0'; - - ret = open_dir_table(); - if (ret < 0) - return ret; - check_signals(); - ret = read_uid_file(); - if (ret < 0) - return ret; - check_signals(); - ret = print_statistics(); - close_all_tables(); - return ret; -} - static int check_args(void) { int i, ret; diff --git a/adu.h b/adu.h index 775af7f..69488a4 100644 --- a/adu.h +++ b/adu.h @@ -4,7 +4,7 @@ * Licensed under the GPL v2. For licencing details see COPYING. */ -/** \file para.h global paraslash definitions */ +/** \file adu.h Global definitions. */ #include #include @@ -26,13 +26,6 @@ #include #include "gcc-compat.h" -/** compute the minimum of \a a and \a b */ -#define MIN(a,b) ((a) < (b) ? (a) : (b)) -/** compute the maximum of \a a and \a b */ -#define MAX(a,b) ((a) > (b) ? 
(a) : (b)) -/** compute the absolute value of \a a */ -#define ABS(a) ((a) > 0 ? (a) : -(a)) - /** debug loglevel, gets really noisy */ #define DEBUG 1 /** still noisy, but won't fill your disk */ @@ -94,7 +87,6 @@ #define EMERG_LOG(...) #endif /** \endcond */ -__printf_2_3 void __log(int, const char*, ...); /** * Write a log message to a dynamically allocated string. @@ -125,3 +117,94 @@ __printf_2_3 void __log(int, const char*, ...); p = adu_realloc(p, size); \ } \ } + +#define FOR_EACH_USER(ui) for (ui = uid_hash_table; ui && ui < uid_hash_table \ + + uid_hash_table_size; ui++) + +/** The columns of the directory table. */ +enum dir_table_columns { + /** The name of the directory. */ + DT_NAME, + /** The dir count number. */ + DT_NUM, + /** The number of the parent directory. */ + DT_PARENT_NUM, + /** The number of bytes of all regular files. */ + DT_BYTES, + /** The number of all regular files. */ + DT_FILES, + /** Number of columns in this table. */ + NUM_DT_COLUMNS +}; + +/** The columns of the id table. */ +enum user_table_columns { + /** The numer of the directory. */ + UT_DIR_NUM, + /** The number of bytes of all regular files in this dir owned by this id. */ + UT_BYTES, + /** The number of files in this dir owned by this id. */ + UT_FILES, + /** Number of columns in this table. */ + NUM_UT_COLUMNS +}; + +enum uid_info_flags { + /** Whether this slot of the hash table is used. */ + UI_FL_SLOT_USED = 1, + /** Whether this uid should be taken into account. 
*/ + UI_FL_ADMISSIBLE = 2, +}; + +struct user_info { + uint32_t uid; + uint32_t flags; + char *pw_name; + struct osl_table *table; + uint64_t files; + uint64_t bytes; + uint64_t dirs; + struct osl_table_description *desc; +}; + +struct uid_range { + uint32_t low; + uint32_t high; +}; + +enum search_uid_flags { + OPEN_USER_TABLE = 1, + CREATE_USER_TABLE = 2, +}; + +extern uint32_t num_uids; +extern uint32_t uid_hash_table_size; +extern struct osl_table *dir_table; +extern struct user_info *uid_hash_table; +extern uint64_t num_dirs; +extern uint64_t num_files; +extern uint64_t num_bytes; +extern struct gengetopt_args_info conf; + +/* adu.c */ +__printf_2_3 void __log(int, const char*, ...); +int open_dir_table(void); +void check_signals(void); +void close_all_tables(void); +char *get_uid_list_name(void); +void create_hash_table(void); +int search_uid(uint32_t uid, enum search_uid_flags flags, + struct user_info **ui_ptr); + +/* select.c */ +int com_select(void); + +static inline int ui_used(struct user_info *ui) +{ + return ui->flags & UI_FL_SLOT_USED; +} + +static inline int ui_admissible(struct user_info *ui) +{ + return ui->flags & UI_FL_ADMISSIBLE; +} diff --git a/select.c b/select.c new file mode 100644 index 0000000..b394676 --- /dev/null +++ b/select.c @@ -0,0 +1,512 @@ +/* + * Copyright (C) 2008 Andre Noll + * + * Licensed under the GPL v2. For licencing details see COPYING. + */ + +/** \file select.c The select mode of adu. */ + +#include /* readdir() */ +#include "adu.h" +#include "gcc-compat.h" +#include "cmdline.h" +#include "fd.h" +#include "string.h" +#include "error.h" +#include "portable_io.h" + +/** The decimal representation of an uint64_t never exceeds that size. */ +#define FORMATED_VALUE_SIZE 25 + +/* these get filled in by the select command. 
*/ +static char count_unit_buf[4] = "( )", size_unit_buf[4] = "( )"; + +enum global_stats_flags { + GSF_PRINT_DIRNAME = 1, + GSF_PRINT_BYTES = 2, + GSF_PRINT_FILES = 4, + GSF_COMPUTE_SUMMARY = 8, +}; + +struct global_stats_info { + uint32_t count; + int ret; + int osl_errno; + enum global_stats_flags flags; +}; + +enum user_stats_flags { + USF_PRINT_DIRNAME = 1, + USF_PRINT_BYTES = 2, + USF_PRINT_FILES = 4, + USF_COMPUTE_SUMMARY = 8, +}; + +struct user_stats_info { + uint32_t count; + enum user_stats_flags flags; + int ret; + int osl_errno; + struct user_info *ui; +}; + +static const uint64_t size_unit_divisors[] = { + [size_unit_arg_b] = 1ULL, + [size_unit_arg_k] = 1024ULL, + [size_unit_arg_m] = 1024ULL * 1024ULL, + [size_unit_arg_g] = 1024ULL * 1024ULL * 1024ULL, + [size_unit_arg_t] = 1024ULL * 1024ULL * 1024ULL * 1024ULL, +}; + +static const uint64_t count_unit_divisors[] = { + + [count_unit_arg_n] = 1ULL, + [count_unit_arg_k] = 1000ULL, + [count_unit_arg_m] = 1000ULL * 1000ULL, + [count_unit_arg_g] = 1000ULL * 1000ULL * 1000ULL, + [count_unit_arg_t] = 1000ULL * 1000ULL * 1000ULL * 1000ULL, +}; + +static const char size_unit_abbrevs[] = " BKMGT"; +static const char count_unit_abbrevs[] = " kmgt"; + +static enum enum_size_unit format_size_value(enum enum_size_unit unit, + uint64_t value, int print_unit, char *result) +{ + enum enum_size_unit u = unit; + char unit_buf[2] = "\0\0"; + + if (unit == size_unit_arg_h) /* human readable */ + for (u = size_unit_arg_b; u < size_unit_arg_t && + value > size_unit_divisors[u + 1]; u++) + ; /* nothing */ + if (print_unit) + unit_buf[0] = size_unit_abbrevs[u]; + sprintf(result, "%llu%s", + (long long unsigned)value / size_unit_divisors[u], unit_buf); + return u; +} + +static enum enum_count_unit format_count_value(enum enum_count_unit unit, + uint64_t value, int print_unit, char *result) +{ + enum enum_count_unit u = unit; + char unit_buf[2] = "\0\0"; + + if (unit == count_unit_arg_h) /* human readable */ + for (u = 
count_unit_arg_n; u < count_unit_arg_t && + value > count_unit_divisors[u + 1]; u++) + ; /* nothing */ + if (print_unit) + unit_buf[0] = count_unit_abbrevs[u]; + sprintf(result, "%llu%s", + (long long unsigned)value / count_unit_divisors[u], unit_buf); + return u; +} + /* get_dir_name_by_number(): Build the path of the directory whose number is *dirnum. Each pass looks up a row of dir_table via DT_NUM, puts that row's DT_NAME in front of the path collected so far and then continues with the row's DT_PARENT_NUM until that number is zero. On success *name is a string the caller must free(). On error *name is set to NULL and the negative code is returned. */ +static int get_dir_name_by_number(uint64_t *dirnum, char **name) +{ + char *result = NULL, *tmp; + struct osl_row *row; + uint64_t val = *dirnum; + struct osl_object obj = {.data = &val, .size = sizeof(val)}; + int ret; + +again: + ret = osl(osl_get_row(dir_table, DT_NUM, &obj, &row)); + if (ret < 0) + goto out; + ret = osl(osl_get_object(dir_table, row, DT_NAME, &obj)); + if (ret < 0) + goto out; + if (result) { /* not the first pass: prepend this ancestor's name and a slash */ + tmp = make_message("%s/%s", (char *)obj.data, result); + free(result); + result = tmp; + } else + result = adu_strdup((char *)obj.data); + ret = osl(osl_get_object(dir_table, row, DT_PARENT_NUM, &obj)); + if (ret < 0) + goto out; + val = *(uint64_t *)obj.data; + if (val) /* non-zero parent number: climb one level */ + goto again; +out: + if (ret < 0) { + free(result); + *name = NULL; + } else + *name = result; + return ret; +} + /* get_dir_name_of_row(): Compute the path of the directory described by dir_table_row. If the row's DT_PARENT_NUM is zero the path is just the row's DT_NAME, otherwise it is the parent's path as returned by get_dir_name_by_number(), a slash and DT_NAME. Returns 1 and stores a string the caller must free() in *name, or returns a negative code and leaves *name NULL. */ +static int get_dir_name_of_row(struct osl_row *dir_table_row, char **name) +{ + struct osl_object obj; + int ret; + char *this_dir, *prefix = NULL; + + *name = NULL; + ret = osl(osl_get_object(dir_table, dir_table_row, DT_NAME, &obj)); + if (ret < 0) + return ret; + this_dir = adu_strdup((char *)obj.data); + ret = osl(osl_get_object(dir_table, dir_table_row, DT_PARENT_NUM, &obj)); + if (ret < 0) + goto out; + if (!*(uint64_t *)obj.data) { + *name = this_dir; /* this_dir is handed to the caller, so the free() at out must be skipped */ + return 1; + } + ret = get_dir_name_by_number((uint64_t *)obj.data, &prefix); + if (ret < 0) + goto out; + *name = make_message("%s/%s", prefix, this_dir); + free(prefix); + ret = 1; +out: + free(this_dir); + return ret; +} /* user_stats_loop_function(): Row callback that print_user_stats() hands to adu_loop_reverse(); data points to a struct user_stats_info. While usi->count is non-zero the columns selected by usi->flags are printed for the row. If the summary flag is set the row is also added to the files, bytes and dirs totals of usi->ui. Returns 1 to go on with the next row. Returns -1 after storing the reason in usi->ret and usi->osl_errno, either because a lookup failed or, with -E_LOOP_COMPLETE, because the count is used up and no summary is wanted. */ +static int user_stats_loop_function(struct osl_row *row, void *data) +{ + struct user_stats_info *usi = data; + struct osl_object obj; + int ret, summary = usi->flags & GSF_COMPUTE_SUMMARY; /* NOTE(review): tests the GSF_ flag although print_user_stats() sets USF_COMPUTE_SUMMARY; confirm that both constants have the same value */ + char 
formated_value[FORMATED_VALUE_SIZE]; + + check_signals(); + if (!usi->count && !summary) { /* nothing left to print and no totals to collect: end the loop */ + ret = -E_LOOP_COMPLETE; + goto err; + } + if (summary || (usi->count && (usi->flags & USF_PRINT_FILES))) { + uint64_t files; + ret = osl(osl_get_object(usi->ui->table, row, UT_FILES, &obj)); + if (ret < 0) + goto err; + files = *(uint64_t *)obj.data; + if (usi->count && (usi->flags & USF_PRINT_FILES)) { + format_count_value(conf.count_unit_arg, files, + conf.count_unit_arg == count_unit_arg_h, + formated_value); + printf("\t%s%s", formated_value, + (usi->flags & (USF_PRINT_BYTES | USF_PRINT_DIRNAME))? + "\t" : "\n" + ); + } + if (summary) + usi->ui->files += files; + } + if (summary || (usi->count && (usi->flags & USF_PRINT_BYTES))) { + uint64_t bytes; + ret = osl(osl_get_object(usi->ui->table, row, UT_BYTES, &obj)); + if (ret < 0) + goto err; + bytes = *(uint64_t *)obj.data; + if (usi->count && (usi->flags & USF_PRINT_BYTES)) { + format_size_value(conf.size_unit_arg, bytes, + conf.size_unit_arg == size_unit_arg_h, + formated_value); + printf("%s%s%s", + (usi->flags & USF_PRINT_FILES)? "" : "\t", + formated_value, + usi->flags & USF_PRINT_DIRNAME? "\t" : "\n" + ); + } + if (summary) { + usi->ui->bytes += bytes; + usi->ui->dirs++; /* every row visited adds one to this user's dirs total */ + } + + } + if (usi->count && (usi->flags & USF_PRINT_DIRNAME)) { + char *dirname; + ret = osl(osl_get_object(usi->ui->table, row, UT_DIR_NUM, &obj)); + if (ret < 0) + goto err; + ret = get_dir_name_by_number((uint64_t *)obj.data, &dirname); + if (ret < 0) + goto err; + printf("%s%s\n", + (usi->flags & (USF_PRINT_BYTES | USF_PRINT_FILES))? "" : "\t", + dirname); + free(dirname); + } + if (usi->count > 0) /* only a positive count is decremented; a negative one would never run out, presumably meaning no limit (TODO confirm) */ + usi->count--; + return 1; +err: /* store the code where the starter of the loop can read it */ + usi->ret = ret; + usi->osl_errno = (ret == -E_OSL)? 
osl_errno : 0; + return -1; +} + /* global_stats_loop_function(): Row callback that print_statistics() hands to adu_loop_reverse() for dir_table; data points to a struct global_stats_info. While gsi->count is non-zero the columns selected by gsi->flags are printed for the row. If GSF_COMPUTE_SUMMARY is set the row is also added to the global totals num_files, num_bytes and num_dirs. Returns 1 to go on with the next row. Returns -1 after storing the reason in gsi->ret and gsi->osl_errno, either because a lookup failed or, with -E_LOOP_COMPLETE, because the count is used up and no summary is wanted. */ +static int global_stats_loop_function(struct osl_row *row, void *data) +{ + struct global_stats_info *gsi = data; + struct osl_object obj; + char *dirname, formated_value[FORMATED_VALUE_SIZE]; + int ret, summary = gsi->flags & GSF_COMPUTE_SUMMARY; + + check_signals(); + if (!gsi->count && !summary) { /* nothing left to print and no totals to collect: end the loop */ + ret = -E_LOOP_COMPLETE; + goto err; + } + if (summary || (gsi->count && (gsi->flags & GSF_PRINT_FILES))) { + uint64_t files; + ret = osl(osl_get_object(dir_table, row, DT_FILES, &obj)); + if (ret < 0) + goto err; + files = *(uint64_t *)obj.data; + if (gsi->count && (gsi->flags & GSF_PRINT_FILES)) { + format_count_value(conf.count_unit_arg, files, + conf.count_unit_arg == count_unit_arg_h, + formated_value); + printf("\t%s%s", formated_value, + (gsi->flags & (GSF_PRINT_BYTES | GSF_PRINT_DIRNAME))? + "\t" : "\n"); + } + if (summary) + num_files += files; + } + if (summary || (gsi->count && (gsi->flags & GSF_PRINT_BYTES))) { + uint64_t bytes; + ret = osl(osl_get_object(dir_table, row, DT_BYTES, &obj)); + if (ret < 0) + goto err; + bytes = *(uint64_t *)obj.data; + if (gsi->count && (gsi->flags & GSF_PRINT_BYTES)) { + format_size_value(conf.size_unit_arg, bytes, + conf.size_unit_arg == size_unit_arg_h, + formated_value); + printf("%s%s%s", + (gsi->flags & GSF_PRINT_FILES)? "" : "\t", + formated_value, + (gsi->flags & GSF_PRINT_DIRNAME)? "\t" : "\n" + ); + } + if (summary) { + num_bytes += bytes; + num_dirs++; /* every row visited adds one to the global directory count */ + } + } + if (gsi->count && (gsi->flags & GSF_PRINT_DIRNAME)) { + ret = get_dir_name_of_row(row, &dirname); + if (ret < 0) + goto err; + printf("%s%s\n", + (gsi->flags & (GSF_PRINT_BYTES | GSF_PRINT_FILES))? "" : "\t", + dirname); + free(dirname); + } + if (gsi->count > 0) /* only a positive count is decremented; a negative one would never run out, presumably meaning no limit (TODO confirm) */ + gsi->count--; + return 1; +err: /* store the code where the starter of the loop can read it */ + gsi->ret = ret; + gsi->osl_errno = (ret == -E_OSL)? 
osl_errno : 0; + return -1; +} + /* check_loop_return(): Turn the result of a loop over a table into the final return value. ret is the result of the loop call, loop_ret and loop_osl_errno are the values the loop function stored before it stopped. A non-negative ret is returned unchanged, and so is an error whose osl_errno is not E_OSL_LOOP. Otherwise the loop function stopped the loop: -E_LOOP_COMPLETE is reported as 1, any other code is returned as is, and for -E_OSL the saved loop_osl_errno is written back to osl_errno first. */ +static int check_loop_return(int ret, int loop_ret, int loop_osl_errno) +{ + if (ret >= 0) + return ret; + assert(ret == -E_OSL); + if (osl_errno != E_OSL_LOOP) + /* error not caused by loop function returning negative. */ + return ret; + assert(loop_ret < 0); + if (loop_ret == -E_LOOP_COMPLETE) /* no error */ + return 1; + if (loop_ret == -E_OSL) { /* osl error in loop function */ + assert(loop_osl_errno); + osl_errno = loop_osl_errno; + } + return loop_ret; +} + /* adu_loop_reverse(): Call osl_rbtree_loop_reverse() for column col_num of table t with func and private_data, then pass the result through check_loop_return(). loop_ret and loop_osl_errno point to the locations func writes its status to; they are read only after the loop call has returned. */ +static int adu_loop_reverse(struct osl_table *t, unsigned col_num, void *private_data, + osl_rbtree_loop_func *func, int *loop_ret, int *loop_osl_errno) +{ + int ret = osl(osl_rbtree_loop_reverse(t, col_num, private_data, func)); + return check_loop_return(ret, *loop_ret, *loop_osl_errno); +} + /* print_global_summary(): Print the global totals num_dirs, num_files and num_bytes. The values are formatted with print_unit set to 0; the unit returned by each format call is shown as a single character in the header line instead. */ +static void print_global_summary(void) +{ + char d[FORMATED_VALUE_SIZE], f[FORMATED_VALUE_SIZE], + s[FORMATED_VALUE_SIZE]; + enum enum_count_unit ud, uf; + enum enum_size_unit us; + + ud = format_count_value(conf.count_unit_arg, num_dirs, 0, d); + uf = format_count_value(conf.count_unit_arg, num_files, 0, f); + us = format_size_value(conf.size_unit_arg, num_bytes, 0, s); + + printf("Global summary " + "(dirs(%c)/files(%c)/size(%c))\n" + "\t%s\t%s\t%s\n\n", + count_unit_abbrevs[ud], + count_unit_abbrevs[uf], + size_unit_abbrevs[us], + d, f, s + ); + +} + /* print_id_stats(): Print a header and then one line per user that is both used and admissible, showing pw_name (or "?" if it is NULL), uid and the dirs, files and bytes totals stored in the user_info. A unit is appended to a value only when the corresponding unit option is the h unit. */ +static void print_id_stats(void) +{ + struct user_info *ui; + + printf("User summary " + "(pw_name/uid/dirs%s/files%s/size%s):\n", + count_unit_buf, count_unit_buf, size_unit_buf); + FOR_EACH_USER(ui) { + char formated_dir_count[FORMATED_VALUE_SIZE], + formated_file_count[FORMATED_VALUE_SIZE], + formated_bytes[FORMATED_VALUE_SIZE ]; + if (!ui_used(ui) || !ui_admissible(ui)) + continue; + format_count_value(conf.count_unit_arg, ui->dirs, + conf.count_unit_arg == count_unit_arg_h, + formated_dir_count); + format_count_value(conf.count_unit_arg, ui->files, + conf.count_unit_arg == count_unit_arg_h, + formated_file_count); + 
format_size_value(conf.size_unit_arg, ui->bytes, + conf.size_unit_arg == size_unit_arg_h, + formated_bytes); + printf("\t%s\t%u\t%s\t%s\t%s\n", + ui->pw_name? ui->pw_name : "?", + (unsigned)ui->uid, + formated_dir_count, + formated_file_count, + formated_bytes + ); + } +} + /* print_user_stats(): For every used and admissible user, loop over the user's table twice in reverse order: first on UT_BYTES, printing size and directory name, then on UT_FILES, printing file count and directory name. Both passes start with a count of conf.limit_arg. Only the first pass sets USF_COMPUTE_SUMMARY, so the per-user totals are accumulated once. Returns 1, or the negative code of the first loop that fails. */ +static int print_user_stats(void) +{ + struct user_info *ui; + int ret; + + FOR_EACH_USER(ui) { + struct user_stats_info usi = { + .count = conf.limit_arg, + .ui = ui + }; + if (!ui_used(ui) || !ui_admissible(ui)) + continue; + usi.flags = USF_PRINT_DIRNAME | USF_PRINT_BYTES | USF_COMPUTE_SUMMARY; + printf("%s (uid %u), by size%s:\n", + ui->pw_name? ui->pw_name : "?", (unsigned)ui->uid, + size_unit_buf); + ret = adu_loop_reverse(ui->table, UT_BYTES, &usi, user_stats_loop_function, + &usi.ret, &usi.osl_errno); + if (ret < 0) + return ret; + printf("\n%s (uid %u), by file count%s:\n", + ui->pw_name? ui->pw_name : "?", (unsigned)ui->uid, + count_unit_buf); + usi.count = conf.limit_arg, /* NOTE(review): comma operator here; both assignments still run, but a semicolon was presumably intended */ + usi.flags = USF_PRINT_DIRNAME | USF_PRINT_FILES; + ret = adu_loop_reverse(ui->table, UT_FILES, &usi, user_stats_loop_function, + &usi.ret, &usi.osl_errno); + if (ret < 0) + return ret; + printf("\n"); + } + return 1; +} + /* print_statistics(): Print the whole report: directories by size, directories by file count, the global summary, the per-user listings and the user summary. The first loop over dir_table sets GSF_COMPUTE_SUMMARY and so fills the global totals that print_global_summary() prints. Returns 1, or the negative code of a failing loop over dir_table. */ +static int print_statistics(void) +{ + int ret; + struct global_stats_info gsi = { + .count = conf.limit_arg, + .flags = GSF_PRINT_DIRNAME | GSF_PRINT_BYTES | GSF_COMPUTE_SUMMARY + }; + + printf("By size%s:\n", + size_unit_buf); + ret = adu_loop_reverse(dir_table, DT_BYTES, &gsi, + global_stats_loop_function, &gsi.ret, &gsi.osl_errno); + if (ret < 0) + return ret; + printf("\n"); + + gsi.count = conf.limit_arg; + gsi.flags = GSF_PRINT_DIRNAME | GSF_PRINT_FILES; + printf("By file count%s:\n", + count_unit_buf); + ret = adu_loop_reverse(dir_table, DT_FILES, &gsi, + global_stats_loop_function, &gsi.ret, &gsi.osl_errno); + if (ret < 0) + return ret; + printf("\n"); + print_global_summary(); + print_user_stats(); /* NOTE(review): the return value is ignored, so a failing user table loop is not reported. This call must precede print_id_stats() because it accumulates the per-user totals printed there. */ + print_id_stats(); + return 1; +} + /* read_uid_file(): Map the uid list file, set num_uids and uid_hash_table_size from its size, create the hash table and call search_uid() with OPEN_USER_TABLE for every uid found in the file. Returns the negative code of the failed mapping or of the first failing search_uid() call; otherwise the result of the last call made. The mapping is released before returning. */ +static int read_uid_file(void) +{ + size_t size; + 
uint32_t n; + char *filename = get_uid_list_name(), *map; + int ret = mmap_full_file(filename, O_RDONLY, (void **)&map, &size, NULL); + + if (ret < 0) { + INFO_LOG("failed to map %s\n", filename); + free(filename); + return ret; + } + num_uids = size / 4; /* the file is read below as consecutive 32 bit uids */ + INFO_LOG("found %u uids in %s\n", (unsigned)num_uids, filename); + free(filename); + /* hash table size should be a power of two and larger than the number of uids */ + uid_hash_table_size = 4; + while (uid_hash_table_size < num_uids) /* NOTE(review): stops as soon as the size is equal to num_uids, so the size is not always strictly larger */ + uid_hash_table_size *= 2; + create_hash_table(); + for (n = 0; n < num_uids; n++) { + uint32_t uid = read_u32(map + n * sizeof(uid)); + ret = search_uid(uid, OPEN_USER_TABLE, NULL); + if (ret < 0) + goto out; + } +out: + adu_munmap(map, size); + return ret; +} + /* com_select(): Entry point of the select command. Prepares the unit strings used in the headers, opens the dir table, reads the uid file, prints the statistics and closes all tables. Returns the result of print_statistics(), or the negative code of the step that failed before it. */ +int com_select(void) +{ + int ret; + + if (conf.count_unit_arg != count_unit_arg_h) + count_unit_buf[1] = count_unit_abbrevs[conf.count_unit_arg]; /* fixed unit: store its abbreviation at index 1 of the buffer */ + else + count_unit_buf[0] = '\0'; /* h unit: make the buffer an empty string, so the headers show no unit */ + if (conf.size_unit_arg != size_unit_arg_h) + size_unit_buf[1] = size_unit_abbrevs[conf.size_unit_arg]; + else + size_unit_buf[0] = '\0'; + + ret = open_dir_table(); + if (ret < 0) + return ret; + check_signals(); + ret = read_uid_file(); + if (ret < 0) /* NOTE(review): returns without calling close_all_tables() although open_dir_table() succeeded; confirm whether cleanup is needed on this path */ + return ret; + check_signals(); + ret = print_statistics(); + close_all_tables(); + return ret; +}