// Setting _DEFAULT_SOURCE is necessary to activate visibility of // certain header file contents on GNU/Linux systems. #define _DEFAULT_SOURCE #include #include #include #include #include #include #include #include #include "job_queue.h" pthread_mutex_t stdout_mutex = PTHREAD_MUTEX_INITIALIZER; // err.h contains various nonstandard BSD extensions, but they are // very handy. #include #include "histogram.h" int global_histogram[8] = { 0 }; struct job_queue q; pthread_mutex_t mutex = PTHREAD_MUTEX_INITIALIZER; void update_histogram_mt(int local_histogram[8]) { pthread_mutex_lock(&mutex); merge_histogram(local_histogram, global_histogram); print_histogram(global_histogram); pthread_mutex_unlock(&mutex); } int fhistogram_mt(char const *path) { FILE *f = fopen(path, "r"); int local_histogram[8] = { 0 }; if (f == NULL) { fflush(stdout); warn("failed to open %s", path); return -1; } int i = 0; char c; while (fread(&c, sizeof(c), 1, f) == 1) { i++; update_histogram(local_histogram, c); if ((i % 100000) == 0) { update_histogram_mt(local_histogram); } } fclose(f); update_histogram_mt(local_histogram); return 0; } void* fhistogram_thread() { char const* path; while (job_queue_pop(&q, (void**) &path) == 0) { fhistogram_mt(path); } return NULL; } int main(int argc, char * const *argv) { if (argc < 2) { err(1, "usage: paths..."); exit(1); } int num_threads = 1; char * const *paths = &argv[1]; if (argc > 3 && strcmp(argv[1], "-n") == 0) { // Since atoi() simply returns zero on syntax errors, we cannot // distinguish between the user entering a zero, or some // non-numeric garbage. In fact, we cannot even tell whether the // given option is suffixed by garbage, i.e. '123foo' returns // '123'. A more robust solution would use strtol(), but its // interface is more complicated, so here we are. num_threads = atoi(argv[2]); if (num_threads < 1) { err(1, "invalid thread count: %s", argv[2]); } paths = &argv[3]; } else { paths = &argv[1]; } job_queue_init(&q, 64); pthread_t threads[num_threads]; for (int i = 0 ; i < num_threads ; i++) { //printf("Initializing thread %i\n", i); pthread_create(&threads[i], NULL, fhistogram_thread, NULL); } // FTS_LOGICAL = follow symbolic links // FTS_NOCHDIR = do not change the working directory of the process // // (These are not particularly important distinctions for our simple // uses.) int fts_options = FTS_LOGICAL | FTS_NOCHDIR; FTS *ftsp; if ((ftsp = fts_open(paths, fts_options, NULL)) == NULL) { err(1, "fts_open() failed"); return -1; } FTSENT *p; while ((p = fts_read(ftsp)) != NULL) { switch (p->fts_info) { case FTS_D: break; case FTS_F: job_queue_push(&q, strdup(p->fts_path)); break; default: break; } } fts_close(ftsp); job_queue_destroy(&q); //printf("done destroying jobqueue\n"); for (int i = 0 ; i < num_threads ; i++) { pthread_join(threads[i], NULL); } move_lines(9); return 0; }