-/*
- * Map (uid, probe_num) to a slot index of the uid hash table.
- *
- * The start position is uid * PRIME1 and each further probe advances by
- * (uid * PRIME2) | 1, i.e. a step width whose lowest bit is always set.
- * The sum is reduced modulo uid_hash_table_size.
- */
-static uint32_t double_hash(uint32_t uid, uint32_t probe_num)
-{
-	return (uid * PRIME1 + probe_num * ((uid * PRIME2) | 1))
-		% uid_hash_table_size;
-}
-
-/*
- * Iterate over every slot of the uid hash table, used or not.
- *
- * The loop body is never entered if uid_hash_table is NULL. Callers which
- * only care about populated slots have to test ui_used() themselves.
- * The macro argument is parenthesized so that arbitrary lvalue expressions
- * may be passed safely.
- */
-#define FOR_EACH_USER(ui) \
-	for ((ui) = uid_hash_table; \
-		(ui) && (ui) < uid_hash_table + uid_hash_table_size; \
-		(ui)++)
-
-/* Flags for search_uid(). Passing no flag at all means "lookup only". */
-enum search_uid_flags {
-	/* Any non-zero flag lets search_uid() claim a free slot for a new uid. */
-	OPEN_USER_TABLE = 1 << 0,
-	/* Forwarded by search_uid() as second argument of open_user_table(). */
-	CREATE_USER_TABLE = 1 << 1,
-};
-
-/*
- * Check whether the given uid is covered by the configured uid ranges.
- *
- * If no uid range was given (conf.uid_given is zero), every uid is
- * admissible. Otherwise the uid must lie within [low, high] of at least
- * one entry of admissible_uids.
- *
- * Returns 1 if the uid is admissible, 0 otherwise.
- */
-static int uid_is_admissible(uint32_t uid)
-{
-	int k, admissible = !conf.uid_given;
-
-	/* stop at the first range that contains the uid */
-	for (k = 0; !admissible && k < conf.uid_given; k++) {
-		struct uid_range *range = &admissible_uids[k];
-
-		admissible = range->low <= uid && range->high >= uid;
-	}
-	DEBUG_LOG("uid %u is %sadmissible\n", (unsigned)uid,
-		admissible? "" : "not ");
-	return admissible;
-}
-
-/*
- * Look up a uid in the uid hash table, optionally inserting it.
- *
- * The table is probed with double_hash() until either a slot holding the
- * uid or an unused slot is found.
- *
- * uid: The user ID to look up.
- * flags: If zero, only existing entries are found. Otherwise an unused
- *	slot is claimed for a uid which is not yet in the table, and, if the
- *	uid is admissible, open_user_table() is called with the
- *	CREATE_USER_TABLE bit of flags.
- * ui_ptr: If non-NULL, receives the slot on every non-negative return.
- *
- * Returns 1 if a new slot was claimed and its table was opened, 0 if the
- * uid was already present or if a new slot was claimed for a uid that is
- * not admissible (in which case no table is opened). Negative return
- * values: -E_BAD_UID if the uid is not in the table and flags is zero,
- * -E_HASH_TABLE_OVERFLOW if all slots are taken, or the error returned
- * by open_user_table().
- */
-static int search_uid(uint32_t uid, enum search_uid_flags flags,
-		struct user_info **ui_ptr)
-{
-	uint32_t p;
-
-	for (p = 0; p < uid_hash_table_size; p++) {
-		struct user_info *ui = uid_hash_table + double_hash(uid, p);
-		int ret;
-
-		if (ui_used(ui)) {
-			if (ui->uid != uid)
-				continue; /* slot taken by another uid, probe on */
-			if (ui_ptr)
-				*ui_ptr = ui;
-			return 0;
-		}
-		/* Unused slot reached: the uid is not in the table. */
-		if (!flags)
-			return -E_BAD_UID;
-		ui->uid = uid;
-		ui->flags |= UI_FL_SLOT_USED;
-		if (!uid_is_admissible(uid)) {
-			/*
-			 * Hand the slot back also in this case so that the
-			 * caller never sees a successful return with *ui_ptr
-			 * left untouched.
-			 */
-			if (ui_ptr)
-				*ui_ptr = ui;
-			return 0;
-		}
-		ui->flags |= UI_FL_ADMISSIBLE;
-		ret = open_user_table(ui, flags & CREATE_USER_TABLE);
-		if (ret < 0)
-			return ret;
-		if (ui_ptr)
-			*ui_ptr = ui;
-		return 1;
-	}
-	return flags? -E_HASH_TABLE_OVERFLOW : -E_BAD_UID;
-}
-
-/*
- * Account one more file of size *add to directory dir_num in user table t.
- *
- * If the table has no row for dir_num yet, a new row is added with *add
- * bytes and a file count of one. Otherwise the UT_BYTES object of the
- * existing row is increased by *add and the UT_FILES object by one.
- *
- * Returns the (negative) error of the failing osl call, or the return
- * value of the last osl call on success.
- */
-static int update_user_row(struct osl_table *t, uint64_t dir_num,
-		uint64_t *add)
-{
-	struct osl_row *row;
-	struct osl_object key = {.data = &dir_num, .size = sizeof(dir_num)};
-	int ret = osl(osl_get_row(t, UT_DIR_NUM, &key, &row));
-
-	/* Any osl error other than "key not found" is fatal. */
-	if (ret == -E_OSL && osl_errno != E_OSL_RB_KEY_NOT_FOUND)
-		return ret;
-	if (ret >= 0) { /* row exists: add size and increment file count */
-		uint64_t num;
-		struct osl_object cur;
-		struct osl_object upd = {.data = &num, .size = sizeof(num)};
-
-		ret = osl(osl_get_object(t, row, UT_BYTES, &cur));
-		if (ret < 0)
-			return ret;
-		num = *(uint64_t *)cur.data + *add;
-		ret = osl(osl_update_object(t, row, UT_BYTES, &upd));
-		if (ret < 0)
-			return ret;
-		ret = osl(osl_get_object(t, row, UT_FILES, &cur));
-		if (ret < 0)
-			return ret;
-		num = *(uint64_t *)cur.data + 1;
-		return osl(osl_update_object(t, row, UT_FILES, &upd));
-	}
-	/* this is the first file we add for this directory */
-	{
-		struct osl_object objects[NUM_UT_COLUMNS];
-		uint64_t first_count = 1;
-
-		objects[UT_FILES].data = &first_count;
-		objects[UT_FILES].size = sizeof(first_count);
-		objects[UT_BYTES].data = add;
-		objects[UT_BYTES].size = sizeof(*add);
-		objects[UT_DIR_NUM].data = &dir_num;
-		objects[UT_DIR_NUM].size = sizeof(dir_num);
-		INFO_LOG("######################### ret: %d\n", ret);
-		ret = osl(osl_add_row(t, objects));
-		INFO_LOG("######################### ret: %d\n", ret);
-		return ret;
-	}
-}
-
-/*
- * Global totals. They are incremented by scan_dir() while walking the
- * file system and by global_stats_loop_function() when it runs in summary
- * mode; print_global_summary() prints them.
- */
-static uint64_t num_dirs;
-static uint64_t num_files;
-static uint64_t num_bytes;
-
-/*
- * Recursively scan a directory and record its regular files.
- *
- * dirname: Directory to scan. Entries are passed to lstat() and to the
- *	recursive call by their bare name, so this relies on para_opendir()
- *	having changed into dirname (NOTE(review): presumably it does, since it
- *	hands back cwd_fd which is restored through para_fchdir() - confirm).
- * parent_dir_num: Number of the parent directory, passed on to
- *	add_directory().
- *
- * Every regular file is added to the global counters and to the totals of
- * this directory. Per-user accounting is only done for admissible uids,
- * because search_uid() opens a user table only for those.
- *
- * Only regular files and directories are considered; entries that can not
- * be lstat()ed are skipped with a warning. A directory which can not be
- * opened due to EACCES is skipped with a warning and 1 is returned.
- *
- * Returns the return value of add_directory() on success, negative on
- * errors.
- */
-int scan_dir(char *dirname, uint64_t *parent_dir_num)
-{
-	DIR *dir;
-	struct dirent *entry;
-	int ret, cwd_fd, ret2;
-	uint64_t dir_size = 0, dir_files = 0;
-	uint64_t this_dir_num = ++num_dirs;
-
-	DEBUG_LOG("----------------- %llu: %s\n", (long long unsigned)num_dirs, dirname);
-	ret = para_opendir(dirname, &dir, &cwd_fd);
-	if (ret < 0) {
-		if (ret != -ERRNO_TO_ERROR(EACCES))
-			return ret;
-		WARNING_LOG("permission denied for %s\n", dirname);
-		return 1;
-	}
-	while ((entry = readdir(dir))) {
-		mode_t m;
-		struct stat s;
-		uint32_t uid;
-		uint64_t size;
-		struct user_info *ui = NULL;
-
-		if (!strcmp(entry->d_name, "."))
-			continue;
-		if (!strcmp(entry->d_name, ".."))
-			continue;
-		if (lstat(entry->d_name, &s) == -1) {
-			WARNING_LOG("lstat error for %s/%s\n", dirname,
-				entry->d_name);
-			continue;
-		}
-		m = s.st_mode;
-		if (!S_ISREG(m) && !S_ISDIR(m))
-			continue;
-		if (S_ISDIR(m)) {
-			ret = scan_dir(entry->d_name, &this_dir_num);
-			if (ret < 0)
-				goto out;
-			continue;
-		}
-		/* regular file */
-		size = s.st_size;
-		dir_size += size;
-		num_bytes += size;
-		dir_files++;
-		num_files++;
-		uid = s.st_uid;
-		ret = search_uid(uid, CREATE_USER_TABLE | OPEN_USER_TABLE, &ui);
-		if (ret < 0)
-			goto out;
-		/*
-		 * search_uid() returns 0 for uids which are not admissible.
-		 * No user table exists for these, and ui might not even have
-		 * been set, so skip the per-user accounting.
-		 */
-		if (!ui || !(ui->flags & UI_FL_ADMISSIBLE))
-			continue;
-		ui->bytes += size;
-		ui->files++;
-		ret = update_user_row(ui->table, this_dir_num, &size);
-		if (ret < 0)
-			goto out;
-	}
-	ret = add_directory(dirname, &this_dir_num, parent_dir_num,
-		&dir_size, &dir_files);
-out:
-	closedir(dir);
-	/* Go back to where we came from, but do not mask an earlier error. */
-	ret2 = para_fchdir(cwd_fd);
-	if (ret2 < 0 && ret >= 0)
-		ret = ret2;
-	close(cwd_fd);
-	return ret;
-}
-
-/*
- * Build the path of the directory with the given number.
- *
- * Starting at *dirnum, the dir table is walked upwards via DT_PARENT_NUM
- * until a parent number of zero is found. The DT_NAME of each visited
- * row is prepended to the result, separated by a slash.
- *
- * On success *name points to an allocated string which the caller must
- * free. On errors the negative error code of the failing osl call is
- * returned and *name is set to NULL.
- */
-static int get_dir_name_by_number(uint64_t *dirnum, char **name)
-{
-	char *path = NULL;
-	struct osl_row *row;
-	uint64_t val = *dirnum;
-	struct osl_object obj = {.data = &val, .size = sizeof(val)};
-	int ret;
-
-	for (;;) {
-		/*
-		 * In the first round obj refers to val, later on it refers
-		 * to the parent number object fetched at the end of the
-		 * previous round.
-		 */
-		ret = osl(osl_get_row(dir_table, DT_NUM, &obj, &row));
-		if (ret < 0)
-			break;
-		ret = osl(osl_get_object(dir_table, row, DT_NAME, &obj));
-		if (ret < 0)
-			break;
-		if (!path)
-			path = para_strdup((char *)obj.data);
-		else {
-			char *longer = make_message("%s/%s", (char *)obj.data, path);
-
-			free(path);
-			path = longer;
-		}
-		ret = osl(osl_get_object(dir_table, row, DT_PARENT_NUM, &obj));
-		if (ret < 0)
-			break;
-		val = *(uint64_t *)obj.data;
-		if (!val) /* no parent, we are done */
-			break;
-	}
-	if (ret >= 0) {
-		*name = path;
-		return ret;
-	}
-	free(path);
-	*name = NULL;
-	return ret;
-}
-
-/*
- * Compute the path of the directory described by a row of the dir table.
- *
- * If the parent number of the row is zero, the path is just the DT_NAME
- * of the row. Otherwise the path of the parent directory, as computed by
- * get_dir_name_by_number(), is prepended.
- *
- * Returns 1 on success, in which case *name is an allocated string the
- * caller must free. On errors, a negative value is returned and *name is
- * NULL.
- */
-static int get_dir_name_of_row(struct osl_row *dir_table_row, char **name)
-{
-	struct osl_object obj;
-	char *leaf, *parent_path = NULL;
-	int ret;
-
-	*name = NULL;
-	ret = osl(osl_get_object(dir_table, dir_table_row, DT_NAME, &obj));
-	if (ret < 0)
-		return ret;
-	leaf = para_strdup((char *)obj.data);
-	ret = osl(osl_get_object(dir_table, dir_table_row, DT_PARENT_NUM, &obj));
-	if (ret >= 0) {
-		if (*(uint64_t *)obj.data == 0) {
-			/* no parent: hand over ownership of leaf */
-			*name = leaf;
-			return 1;
-		}
-		ret = get_dir_name_by_number((uint64_t *)obj.data, &parent_path);
-	}
-	if (ret >= 0) {
-		*name = make_message("%s/%s", parent_path, leaf);
-		free(parent_path);
-		ret = 1;
-	}
-	free(leaf);
-	return ret;
-}
-
-/* Divisors for byte counts (powers of 1024), indexed by size unit. */
-const uint64_t size_unit_divisors[] = {
-	[size_unit_arg_b] = 1ULL,
-	[size_unit_arg_k] = 1ULL << 10,
-	[size_unit_arg_m] = 1ULL << 20,
-	[size_unit_arg_g] = 1ULL << 30,
-	[size_unit_arg_t] = 1ULL << 40,
-};
-
-/* Divisors for file/dir counts (powers of 1000), indexed by count unit. */
-const uint64_t count_unit_divisors[] = {
-	[count_unit_arg_n] = 1ULL,
-	[count_unit_arg_k] = 1000ULL,
-	[count_unit_arg_m] = 1000000ULL,
-	[count_unit_arg_g] = 1000000000ULL,
-	[count_unit_arg_t] = 1000000000000ULL,
-};
-
-/*
- * One-character unit suffixes. format_size_value(), format_count_value()
- * and print_global_summary() index these strings with the unit enum value.
- * NOTE(review): index 0 is a blank, presumably the slot of the "human
- * readable" unit which never gets printed itself - confirm against the
- * enum definitions.
- */
-const char size_unit_abbrevs[] = " BKMGT";
-const char count_unit_abbrevs[] = " kmgt";
-
-/*
- * Write a byte count, scaled to the given unit, into result.
- *
- * unit: The unit to scale to. For size_unit_arg_h the unit is chosen
- *	automatically: starting at bytes, the next larger unit is taken as
- *	long as the value exceeds that unit's divisor.
- * value: The number of bytes.
- * print_unit: If non-zero, the one-character unit suffix is appended.
- * result: Output buffer. It is written with sprintf(), so the caller has
- *	to supply enough room for the digits, the suffix and the terminator.
- *
- * Returns the unit that was actually used.
- */
-static enum enum_size_unit format_size_value(enum enum_size_unit unit,
-		uint64_t value, int print_unit, char *result)
-{
-	enum enum_size_unit u = unit;
-	char suffix[2] = {'\0', '\0'};
-
-	if (unit == size_unit_arg_h) { /* human readable */
-		u = size_unit_arg_b;
-		while (u < size_unit_arg_t && value > size_unit_divisors[u + 1])
-			u++;
-	}
-	if (print_unit)
-		suffix[0] = size_unit_abbrevs[u];
-	sprintf(result, "%llu%s",
-		(long long unsigned)value / size_unit_divisors[u], suffix);
-	return u;
-}
-
-/*
- * Write a count, scaled to the given unit, into result.
- *
- * unit: The unit to scale to. For count_unit_arg_h the unit is chosen
- *	automatically: starting at count_unit_arg_n, the next larger unit is
- *	taken as long as the value exceeds that unit's divisor.
- * value: The count to format.
- * print_unit: If non-zero, the one-character unit suffix is appended.
- * result: Output buffer. It is written with sprintf(), so the caller has
- *	to supply enough room for the digits, the suffix and the terminator.
- *
- * Returns the unit that was actually used.
- */
-static enum enum_count_unit format_count_value(enum enum_count_unit unit,
-		uint64_t value, int print_unit, char *result)
-{
-	enum enum_count_unit u = unit;
-	char suffix[2] = {'\0', '\0'};
-
-	if (unit == count_unit_arg_h) { /* human readable */
-		u = count_unit_arg_n;
-		while (u < count_unit_arg_t && value > count_unit_divisors[u + 1])
-			u++;
-	}
-	if (print_unit)
-		suffix[0] = count_unit_abbrevs[u];
-	sprintf(result, "%llu%s",
-		(long long unsigned)value / count_unit_divisors[u], suffix);
-	return u;
-}
-
-/* Bits which control what global_stats_loop_function() does per row. */
-enum global_stats_flags {
-	/* print the path of the directory */
-	GSF_PRINT_DIRNAME = 1 << 0,
-	/* print the DT_BYTES value of the row */
-	GSF_PRINT_BYTES = 1 << 1,
-	/* print the DT_FILES value of the row */
-	GSF_PRINT_FILES = 1 << 2,
-	/* add each row to num_dirs, num_files and num_bytes */
-	GSF_COMPUTE_SUMMARY = 1 << 3,
-};
-
-/* State passed as private data to global_stats_loop_function(). */
-struct global_stats_info {
- /* Number of rows still to be printed, decremented for each row. */
- uint32_t count;
- /* Set by the loop function to its error code before it returns -1. */
- int ret;
- /* Copy of osl_errno if ret is -E_OSL, zero otherwise. */
- int osl_errno;
- /* What to print and whether to accumulate the global summary. */
- enum global_stats_flags flags;
-};
-
-/*
- * Loop callback for the dir table: print one row and/or add it to the
- * global summary.
- *
- * row: The current row of dir_table.
- * data: Pointer to a struct global_stats_info.
- *
- * As long as gsi->count is positive, the columns selected by gsi->flags
- * are printed and the count is decremented. If GSF_COMPUTE_SUMMARY is
- * set, each row is added to num_files, num_bytes and num_dirs, also
- * after the count has dropped to zero.
- *
- * Returns 1 to continue the loop. Returns -1 to stop it, with the reason
- * stored in gsi->ret and gsi->osl_errno. The reason is -E_LOOP_COMPLETE
- * if nothing is left to print and no summary was requested.
- */
-static int global_stats_loop_function(struct osl_row *row, void *data)
-{
-	struct global_stats_info *gsi = data;
-	struct osl_object obj;
-	char *dirname, formated_value[FORMATED_VALUE_SIZE];
-	int ret, summary = gsi->flags & GSF_COMPUTE_SUMMARY;
-
-	if (!gsi->count && !summary) {
-		ret = -E_LOOP_COMPLETE;
-		goto err;
-	}
-	if (summary || (gsi->count && (gsi->flags & GSF_PRINT_FILES))) {
-		uint64_t files;
-		ret = osl(osl_get_object(dir_table, row, DT_FILES, &obj));
-		if (ret < 0)
-			goto err;
-		files = *(uint64_t *)obj.data;
-		if (gsi->count && (gsi->flags & GSF_PRINT_FILES)) {
-			format_count_value(conf.count_unit_arg, files,
-				conf.count_unit_arg == count_unit_arg_h,
-				formated_value);
-			/* end the line here if no other column follows */
-			printf("\t%s%s", formated_value,
-				(gsi->flags & (GSF_PRINT_BYTES | GSF_PRINT_DIRNAME))?
-					"\t" : "\n");
-		}
-		if (summary)
-			num_files += files;
-	}
-	if (summary || (gsi->count && (gsi->flags & GSF_PRINT_BYTES))) {
-		uint64_t bytes;
-		ret = osl(osl_get_object(dir_table, row, DT_BYTES, &obj));
-		if (ret < 0)
-			goto err;
-		bytes = *(uint64_t *)obj.data;
-		if (gsi->count && (gsi->flags & GSF_PRINT_BYTES)) {
-			format_size_value(conf.size_unit_arg, bytes,
-				conf.size_unit_arg == size_unit_arg_h,
-				formated_value);
-			printf("%s%s%s",
-				(gsi->flags & GSF_PRINT_FILES)? "" : "\t",
-				formated_value,
-				(gsi->flags & GSF_PRINT_DIRNAME)? "\t" : "\n"
-			);
-		}
-		if (summary) {
-			num_bytes += bytes;
-			num_dirs++;
-		}
-	}
-	if (gsi->count && (gsi->flags & GSF_PRINT_DIRNAME)) {
-		ret = get_dir_name_of_row(row, &dirname);
-		if (ret < 0)
-			goto err;
-		printf("%s%s\n",
-			(gsi->flags & (GSF_PRINT_BYTES | GSF_PRINT_FILES))? "" : "\t",
-			dirname);
-		/* the name was allocated by get_dir_name_of_row() */
-		free(dirname);
-	}
-	if (gsi->count > 0)
-		gsi->count--;
-	return 1;
-err:
-	gsi->ret = ret;
-	gsi->osl_errno = (ret == -E_OSL)? osl_errno : 0;
-	return -1;
-}
-
-/*
- * Print one summary line (uid, dirs, files, size) for each user whose
- * hash table slot is both used and admissible.
- */
-static void print_id_stats(void)
-{
-	struct user_info *ui;
-	const int count_suffix = conf.count_unit_arg == count_unit_arg_h;
-	const int size_suffix = conf.size_unit_arg == size_unit_arg_h;
-
-	printf("User summary "
-		"(uid/dirs%s/files%s/size%s):\n",
-		count_unit_buf, count_unit_buf, size_unit_buf);
-	FOR_EACH_USER(ui) {
-		char dirs_str[FORMATED_VALUE_SIZE];
-		char files_str[FORMATED_VALUE_SIZE];
-		char bytes_str[FORMATED_VALUE_SIZE];
-
-		if (!ui_used(ui) || !ui_admissible(ui))
-			continue;
-		format_count_value(conf.count_unit_arg, ui->dirs,
-			count_suffix, dirs_str);
-		format_count_value(conf.count_unit_arg, ui->files,
-			count_suffix, files_str);
-		format_size_value(conf.size_unit_arg, ui->bytes,
-			size_suffix, bytes_str);
-		printf("\t%u\t%s\t%s\t%s\n", (unsigned)ui->uid,
-			dirs_str, files_str, bytes_str);
-	}
-}
-
-/* Bits which control what user_stats_loop_function() does per row. */
-enum user_stats_flags {
-	/* print the path of the directory */
-	USF_PRINT_DIRNAME = 1 << 0,
-	/* print the UT_BYTES value of the row */
-	USF_PRINT_BYTES = 1 << 1,
-	/* print the UT_FILES value of the row */
-	USF_PRINT_FILES = 1 << 2,
-	/* add each row to the totals of the user */
-	USF_COMPUTE_SUMMARY = 1 << 3,
-};
-
-/* State passed as private data to user_stats_loop_function(). */
-struct user_stats_info {
- /* Number of rows still to be printed, decremented for each row. */
- uint32_t count;
- /* What to print and whether to accumulate the per-user summary. */
- enum user_stats_flags flags;
- /* Set by the loop function to its error code before it returns -1. */
- int ret;
- /* Copy of osl_errno if ret is -E_OSL, zero otherwise. */
- int osl_errno;
- /* The user whose table is being looped over. */
- struct user_info *ui;
-};
-
-/*
- * Loop callback for a user table: print one row and/or add it to the
- * totals of the user.
- *
- * row: The current row of usi->ui->table.
- * data: Pointer to a struct user_stats_info.
- *
- * As long as usi->count is positive, the columns selected by usi->flags
- * are printed and the count is decremented. If USF_COMPUTE_SUMMARY is
- * set, each row is added to the files, bytes and dirs fields of usi->ui,
- * also after the count has dropped to zero.
- *
- * Returns 1 to continue the loop. Returns -1 to stop it, with the reason
- * stored in usi->ret and usi->osl_errno. The reason is -E_LOOP_COMPLETE
- * if nothing is left to print and no summary was requested.
- */
-static int user_stats_loop_function(struct osl_row *row, void *data)
-{
-	struct user_stats_info *usi = data;
-	struct osl_object obj;
-	int ret, summary = usi->flags & USF_COMPUTE_SUMMARY;
-	char formated_value[FORMATED_VALUE_SIZE];
-
-	if (!usi->count && !summary) {
-		ret = -E_LOOP_COMPLETE;
-		goto err;
-	}
-	if (summary || (usi->count && (usi->flags & USF_PRINT_FILES))) {
-		uint64_t files;
-		ret = osl(osl_get_object(usi->ui->table, row, UT_FILES, &obj));
-		if (ret < 0)
-			goto err;
-		files = *(uint64_t *)obj.data;
-		if (usi->count && (usi->flags & USF_PRINT_FILES)) {
-			format_count_value(conf.count_unit_arg, files,
-				conf.count_unit_arg == count_unit_arg_h,
-				formated_value);
-			/* end the line here if no other column follows */
-			printf("\t%s%s", formated_value,
-				(usi->flags & (USF_PRINT_BYTES | USF_PRINT_DIRNAME))?
-					"\t" : "\n"
-			);
-		}
-		if (summary)
-			usi->ui->files += files;
-	}
-	if (summary || (usi->count && (usi->flags & USF_PRINT_BYTES))) {
-		uint64_t bytes;
-		ret = osl(osl_get_object(usi->ui->table, row, UT_BYTES, &obj));
-		if (ret < 0)
-			goto err;
-		bytes = *(uint64_t *)obj.data;
-		if (usi->count && (usi->flags & USF_PRINT_BYTES)) {
-			format_size_value(conf.size_unit_arg, bytes,
-				conf.size_unit_arg == size_unit_arg_h,
-				formated_value);
-			printf("%s%s%s",
-				(usi->flags & USF_PRINT_FILES)? "" : "\t",
-				formated_value,
-				usi->flags & USF_PRINT_DIRNAME? "\t" : "\n"
-			);
-		}
-		if (summary) {
-			usi->ui->bytes += bytes;
-			usi->ui->dirs++;
-		}
-	}
-	if (usi->count && (usi->flags & USF_PRINT_DIRNAME)) {
-		char *dirname;
-		ret = osl(osl_get_object(usi->ui->table, row, UT_DIR_NUM, &obj));
-		if (ret < 0)
-			goto err;
-		ret = get_dir_name_by_number((uint64_t *)obj.data, &dirname);
-		if (ret < 0)
-			goto err;
-		printf("%s%s\n",
-			(usi->flags & (USF_PRINT_BYTES | USF_PRINT_FILES))? "" : "\t",
-			dirname);
-		/* the name was allocated by get_dir_name_by_number() */
-		free(dirname);
-	}
-	if (usi->count > 0)
-		usi->count--;
-	return 1;
-err:
-	usi->ret = ret;
-	usi->osl_errno = (ret == -E_OSL)? osl_errno : 0;
-	return -1;
-}
-
-/*
- * Translate the return value of an osl loop into the error code that
- * should be reported to the caller.
- *
- * ret: Return value of the osl loop call.
- * loop_ret: Error code stored by the loop function.
- * loop_osl_errno: The osl_errno value stored by the loop function.
- *
- * A non-negative ret is passed through, and so is an osl error which was
- * not caused by the loop function returning negative. If the loop
- * function stopped the loop with -E_LOOP_COMPLETE, this is not an error
- * and 1 is returned. Otherwise the loop function's own error code is
- * returned, with osl_errno restored if that error is -E_OSL.
- */
-static int check_loop_return(int ret, int loop_ret, int loop_osl_errno)
-{
-	if (ret < 0) {
-		assert(ret == -E_OSL);
-		if (osl_errno == E_OSL_LOOP) {
-			/* the loop function returned negative */
-			assert(loop_ret < 0);
-			if (loop_ret == -E_LOOP_COMPLETE) /* no error */
-				return 1;
-			if (loop_ret == -E_OSL) { /* osl error in loop function */
-				assert(loop_osl_errno);
-				osl_errno = loop_osl_errno;
-			}
-			return loop_ret;
-		}
-	}
-	return ret;
-}
-
-/*
- * Run osl_rbtree_loop_reverse() on column col_num of table t and
- * post-process its return value with check_loop_return().
- *
- * loop_ret and loop_osl_errno point to the locations where func stores
- * its error information. They are read only after the loop has returned.
- */
-static int adu_loop_reverse(struct osl_table *t, unsigned col_num, void *private_data,
-		osl_rbtree_loop_func *func, int *loop_ret, int *loop_osl_errno)
-{
-	int osl_ret;
-
-	osl_ret = osl(osl_rbtree_loop_reverse(t, col_num, private_data, func));
-	return check_loop_return(osl_ret, *loop_ret, *loop_osl_errno);
-}
-
-/*
- * Print the per-user directory statistics for every used and admissible
- * user.
- *
- * For each user, the user table is looped over twice in reverse order:
- * first by UT_BYTES, printing directory name and size, and then by
- * UT_FILES, printing directory name and file count. Each listing is
- * limited to conf.limit_arg entries. The first pass also runs with
- * USF_COMPUTE_SUMMARY set, which makes the loop function add every row
- * to the totals of the user.
- *
- * Returns 1 on success, negative on errors.
- */
-static int print_user_stats(void)
-{
-	struct user_info *ui;
-	int ret;
-
-	FOR_EACH_USER(ui) {
-		struct user_stats_info usi = {
-			.count = conf.limit_arg,
-			.ui = ui
-		};
-		if (!ui_used(ui) || !ui_admissible(ui))
-			continue;
-		usi.flags = USF_PRINT_DIRNAME | USF_PRINT_BYTES | USF_COMPUTE_SUMMARY;
-		printf("uid %u, by size%s:\n",
-			(unsigned) ui->uid, size_unit_buf);
-		ret = adu_loop_reverse(ui->table, UT_BYTES, &usi, user_stats_loop_function,
-			&usi.ret, &usi.osl_errno);
-		if (ret < 0)
-			return ret;
-		printf("\nuid %u, by file count%s:\n",
-			(unsigned) ui->uid, count_unit_buf);
-		/* the first pass has counted down, start over */
-		usi.count = conf.limit_arg;
-		usi.flags = USF_PRINT_DIRNAME | USF_PRINT_FILES;
-		ret = adu_loop_reverse(ui->table, UT_FILES, &usi, user_stats_loop_function,
-			&usi.ret, &usi.osl_errno);
-		if (ret < 0)
-			return ret;
-		printf("\n");
-	}
-	return 1;
-}
-
-/*
- * Print the global totals (num_dirs, num_files, num_bytes), each scaled
- * to the configured unit. The unit characters are shown in the heading
- * rather than appended to the values.
- */
-static void print_global_summary(void)
-{
-	char dirs_str[FORMATED_VALUE_SIZE];
-	char files_str[FORMATED_VALUE_SIZE];
-	char bytes_str[FORMATED_VALUE_SIZE];
-	enum enum_count_unit dirs_unit, files_unit;
-	enum enum_size_unit bytes_unit;
-
-	/* no suffix in the values, the units go into the heading */
-	dirs_unit = format_count_value(conf.count_unit_arg, num_dirs, 0,
-		dirs_str);
-	files_unit = format_count_value(conf.count_unit_arg, num_files, 0,
-		files_str);
-	bytes_unit = format_size_value(conf.size_unit_arg, num_bytes, 0,
-		bytes_str);
-
-	printf("Global summary "
-		"(dirs(%c)/files(%c)/size(%c))\n"
-		"\t%s\t%s\t%s\n\n",
-		count_unit_abbrevs[dirs_unit],
-		count_unit_abbrevs[files_unit],
-		size_unit_abbrevs[bytes_unit],
-		dirs_str, files_str, bytes_str
-	);
-}
-
-static int print_statistics(void)