feat: watch: paterns

This commit is contained in:
2025-04-03 22:57:55 +00:00
parent d680e080ad
commit 5ab0833d78

View File

@@ -5,39 +5,144 @@
#include <sys/stat.h> #include <sys/stat.h>
#include <sys/select.h> #include <sys/select.h>
#include <time.h> #include <time.h>
#include <dirent.h>
#include <fnmatch.h>
#include <getopt.h>
#include <ctype.h> #include <ctype.h>
#include <limits.h>
#ifndef PATH_MAX #ifndef PATH_MAX
#define PATH_MAX 4096 #define PATH_MAX 4096
#endif #endif
#define MAX_FILES 1024 #define MAX_DIRS 1024
#define POLL_INTERVAL_MS 100 // milliseconds #define MAX_FILES 10240
#define MAX_PATTERNS 32
#define POLL_INTERVAL_MS 100
void print_usage(const char *prog_name) { void print_usage(const char *prog_name) {
fprintf(stderr, "Usage: %s <command> <file1> [file2] ...\n", prog_name); fprintf(stderr, "Usage: %s <command> [-p <pattern1>] [-p <pattern2>] ... <dir1> [dir2] ...\n", prog_name);
fprintf(stderr, " or: find <pattern> | %s <command>\n", prog_name); fprintf(stderr, " or: find . -type d | %s <command> [-p <pattern1>] [-p <pattern2>] ...\n", prog_name);
fprintf(stderr, "Options:\n");
fprintf(stderr, " -p <pattern> File pattern to watch (can be used multiple times)\n");
fprintf(stderr, " -h Show this help message\n");
fprintf(stderr, "Examples:\n");
fprintf(stderr, " %s 'make' -p '*.c' -p '*.h' ./src\n", prog_name);
fprintf(stderr, " find . -type d | %s 'echo changed' -p '*.py'\n", prog_name);
exit(EXIT_FAILURE); exit(EXIT_FAILURE);
} }
struct file_info { struct file_info {
char *path; char *path;
time_t last_mtime; time_t mtime;
int exists;
};
struct dir_info {
char *path;
time_t mtime;
struct stat st; struct stat st;
}; };
int check_file_modified(struct file_info *file) { struct file_hash {
struct file_info **items;
int size;
int count;
};
void hash_init(struct file_hash *hash, int size) {
hash->size = size;
hash->count = 0;
hash->items = calloc(size, sizeof(struct file_info*));
}
unsigned int hash_function(const char *str) {
unsigned int hash = 5381;
int c;
while ((c = *str++))
hash = ((hash << 5) + hash) + c;
return hash;
}
void hash_insert(struct file_hash *hash, struct file_info *item) {
if (hash->count >= hash->size * 0.75) {
fprintf(stderr, "Warning: Hash table full, performance may degrade\n");
}
unsigned int index = hash_function(item->path) % hash->size;
while (hash->items[index] != NULL) {
if (strcmp(hash->items[index]->path, item->path) == 0) {
hash->items[index]->mtime = item->mtime;
hash->items[index]->exists = item->exists;
free(item->path);
free(item);
return;
}
index = (index + 1) % hash->size;
}
hash->items[index] = item;
hash->count++;
}
struct file_info *hash_find(struct file_hash *hash, const char *path) {
unsigned int index = hash_function(path) % hash->size;
int i = 0;
while (hash->items[index] != NULL && i < hash->size) {
if (strcmp(hash->items[index]->path, path) == 0) {
return hash->items[index];
}
index = (index + 1) % hash->size;
i++;
}
return NULL;
}
void hash_remove_nonexistent(struct file_hash *hash) {
for (int i = 0; i < hash->size; i++) {
if (hash->items[i] != NULL && hash->items[i]->exists == 0) {
free(hash->items[i]->path);
free(hash->items[i]);
hash->items[i] = NULL;
hash->count--;
}
}
}
void hash_free(struct file_hash *hash) {
for (int i = 0; i < hash->size; i++) {
if (hash->items[i] != NULL) {
free(hash->items[i]->path);
free(hash->items[i]);
}
}
free(hash->items);
}
int is_dir(const char *path) {
struct stat st;
if (stat(path, &st) != 0)
return 0;
return S_ISDIR(st.st_mode);
}
int check_dir_modified(struct dir_info *dir) {
struct stat new_st; struct stat new_st;
if (stat(file->path, &new_st) != 0) { if (stat(dir->path, &new_st) != 0) {
perror("stat"); perror("stat");
return -1; return -1;
} }
// Check if file was modified return 1;
if (new_st.st_mtime != file->st.st_mtime) { }
file->st = new_st;
return 1; int match_any_pattern(const char *filename, char **patterns, int num_patterns) {
for (int i = 0; i < num_patterns; i++) {
if (fnmatch(patterns[i], filename, 0) == 0) {
return 1;
}
} }
return 0; return 0;
} }
@@ -48,89 +153,223 @@ int main(int argc, char *argv[]) {
} }
char *command = argv[1]; char *command = argv[1];
struct file_info files[MAX_FILES]; char **patterns = malloc(MAX_PATTERNS * sizeof(char*));
int num_files = 0; int num_patterns = 0;
// Check if we're getting input from stdin (find command) optind = 2;
int opt;
while ((opt = getopt(argc, argv, "p:h")) != -1) {
switch (opt) {
case 'p':
if (num_patterns < MAX_PATTERNS) {
patterns[num_patterns++] = strdup(optarg);
} else {
fprintf(stderr, "Too many patterns (max %d)\n", MAX_PATTERNS);
exit(EXIT_FAILURE);
}
break;
case 'h':
print_usage(argv[0]);
break;
default:
fprintf(stderr, "Unknown option: %c\n", opt);
print_usage(argv[0]);
}
}
if (num_patterns == 0) {
fprintf(stderr, "No patterns specified. Use -p option to specify patterns.\n");
print_usage(argv[0]);
}
struct dir_info dirs[MAX_DIRS];
int num_dirs = 0;
struct file_hash files;
hash_init(&files, MAX_FILES);
// Check if we're getting input from stdin
if (!isatty(fileno(stdin))) { if (!isatty(fileno(stdin))) {
// Read files from stdin // Read directories from stdin
char line[PATH_MAX]; char line[PATH_MAX];
while (fgets(line, sizeof(line), stdin) && num_files < MAX_FILES) { while (fgets(line, sizeof(line), stdin) && num_dirs < MAX_DIRS) {
// Remove newline and any whitespace // Remove newline and any whitespace
line[strcspn(line, "\n")] = 0; line[strcspn(line, "\n")] = 0;
char *end = line + strlen(line) - 1; char *end = line + strlen(line) - 1;
while (end >= line && isspace(*end)) end--; while (end >= line && isspace(*end)) end--;
*(end + 1) = 0; *(end + 1) = 0;
if (strlen(line) > 0) { if (strlen(line) > 0 && is_dir(line)) {
files[num_files].path = strdup(line); dirs[num_dirs].path = strdup(line);
if (!files[num_files].path) { if (!dirs[num_dirs].path) {
perror("strdup"); perror("strdup");
exit(EXIT_FAILURE); exit(EXIT_FAILURE);
} }
if (stat(files[num_files].path, &files[num_files].st) != 0) { if (stat(dirs[num_dirs].path, &dirs[num_dirs].st) != 0) {
perror("stat"); perror("stat");
fprintf(stderr, "Skipping invalid path: %s\n", line); fprintf(stderr, "Skipping invalid directory: %s\n", line);
free(files[num_files].path); free(dirs[num_dirs].path);
continue; continue;
} }
num_files++; num_dirs++;
} }
} }
} else { } else {
// No stdin input, use command line arguments for (int i = optind; i < argc && num_dirs < MAX_DIRS; i++) {
if (argc < 3) { if (is_dir(argv[i])) {
print_usage(argv[0]); dirs[num_dirs].path = strdup(argv[i]);
} if (!dirs[num_dirs].path) {
for (int i = 2; i < argc && num_files < MAX_FILES; i++) { perror("strdup");
files[num_files].path = strdup(argv[i]); exit(EXIT_FAILURE);
if (!files[num_files].path) { }
perror("strdup"); if (stat(dirs[num_dirs].path, &dirs[num_dirs].st) != 0) {
exit(EXIT_FAILURE); perror("stat");
fprintf(stderr, "Skipping invalid directory: %s\n", argv[i]);
free(dirs[num_dirs].path);
continue;
}
num_dirs++;
} else {
fprintf(stderr, "Skipping non-directory: %s\n", argv[i]);
} }
if (stat(files[num_files].path, &files[num_files].st) != 0) {
perror("stat");
fprintf(stderr, "Skipping invalid path: %s\n", argv[i]);
free(files[num_files].path);
continue;
}
num_files++;
} }
} }
if (num_files == 0) { if (num_dirs == 0) {
fprintf(stderr, "No files to watch\n"); fprintf(stderr, "No directories to watch\n");
exit(EXIT_FAILURE); exit(EXIT_FAILURE);
} }
// Print the files we're watching // Print the directories and patterns we're watching
fprintf(stderr, "Watching %d files:\n", num_files); fprintf(stderr, "Watching %d directories for files matching: ", num_dirs);
for (int i = 0; i < num_files; i++) { for (int i = 0; i < num_patterns; i++) {
fprintf(stderr, " %s\n", files[i].path); fprintf(stderr, "'%s'%s", patterns[i], (i < num_patterns - 1) ? ", " : "\n");
} }
for (int i = 0; i < num_dirs; i++) {
fprintf(stderr, " %s\n", dirs[i].path);
}
for (int i = 0; i < num_dirs; i++) {
DIR *dir = opendir(dirs[i].path);
if (!dir) {
perror("opendir");
continue;
}
struct dirent *entry;
while ((entry = readdir(dir)) != NULL) {
if (entry->d_name[0] == '.') continue;
if (match_any_pattern(entry->d_name, patterns, num_patterns)) {
char filepath[PATH_MAX];
snprintf(filepath, PATH_MAX, "%s/%s", dirs[i].path, entry->d_name);
struct stat st;
if (stat(filepath, &st) != 0) continue;
if (S_ISDIR(st.st_mode)) continue;
struct file_info *file = malloc(sizeof(struct file_info));
file->path = strdup(filepath);
file->mtime = st.st_mtime;
file->exists = 1;
hash_insert(&files, file);
}
}
closedir(dir);
}
fprintf(stderr, "Initially found %d matching files\n", files.count);
fprintf(stderr, "Waiting for file modifications...\n"); fprintf(stderr, "Waiting for file modifications...\n");
struct timeval tv; struct timeval tv;
tv.tv_sec = 0; tv.tv_sec = 0;
tv.tv_usec = POLL_INTERVAL_MS * 1000; // Convert to microseconds tv.tv_usec = POLL_INTERVAL_MS * 1000;
for (int i = 0; i < files.size; i++) {
if (files.items[i] != NULL) {
files.items[i]->exists = 1;
}
}
tv.tv_sec = 1;
select(0, NULL, NULL, NULL, &tv);
tv.tv_sec = 0;
tv.tv_usec = POLL_INTERVAL_MS * 1000;
int first_scan = 1;
while (1) { while (1) {
// Use select to wait for the specified interval
select(0, NULL, NULL, NULL, &tv); select(0, NULL, NULL, NULL, &tv);
int any_modified = 0; int any_changes = 0;
for (int i = 0; i < num_files; i++) {
int modified = check_file_modified(&files[i]); for (int i = 0; i < files.size; i++) {
if (modified > 0) { if (files.items[i] != NULL) {
fprintf(stderr, "File modified: %s\n", files[i].path); files.items[i]->exists = 0;
any_modified = 1;
} else if (modified < 0) {
fprintf(stderr, "Error checking file: %s\n", files[i].path);
} }
} }
if (any_modified) { for (int i = 0; i < num_dirs; i++) {
DIR *dir = opendir(dirs[i].path);
if (!dir) {
perror("opendir");
continue;
}
struct dirent *entry;
while ((entry = readdir(dir)) != NULL) {
if (entry->d_name[0] == '.') continue;
if (match_any_pattern(entry->d_name, patterns, num_patterns)) {
char filepath[PATH_MAX];
snprintf(filepath, PATH_MAX, "%s/%s", dirs[i].path, entry->d_name);
struct stat st;
if (stat(filepath, &st) != 0) continue;
if (S_ISDIR(st.st_mode)) continue;
struct file_info *existing = hash_find(&files, filepath);
if (existing) {
existing->exists = 1;
if (existing->mtime != st.st_mtime) {
if (!first_scan) {
fprintf(stderr, "File modified: %s\n", filepath);
any_changes = 1;
}
existing->mtime = st.st_mtime;
}
} else {
if (!first_scan) {
fprintf(stderr, "New file: %s\n", filepath);
any_changes = 1;
}
struct file_info *file = malloc(sizeof(struct file_info));
file->path = strdup(filepath);
file->mtime = st.st_mtime;
file->exists = 1;
hash_insert(&files, file);
}
}
}
closedir(dir);
}
for (int i = 0; i < files.size; i++) {
if (files.items[i] != NULL && files.items[i]->exists == 0) {
if (!first_scan) {
fprintf(stderr, "File deleted: %s\n", files.items[i]->path);
any_changes = 1;
}
}
}
hash_remove_nonexistent(&files);
if (any_changes) {
fprintf(stderr, "Executing command: %s\n", command); fprintf(stderr, "Executing command: %s\n", command);
int res = system(command); int res = system(command);
if (res != 0) { if (res != 0) {
@@ -139,14 +378,20 @@ int main(int argc, char *argv[]) {
} }
} }
// Reset timeout for next iteration
tv.tv_sec = 0; tv.tv_sec = 0;
tv.tv_usec = POLL_INTERVAL_MS * 1000; tv.tv_usec = POLL_INTERVAL_MS * 1000;
first_scan = 0;
} }
// Cleanup for (int i = 0; i < num_dirs; i++) {
for (int i = 0; i < num_files; i++) { free(dirs[i].path);
free(files[i].path);
} }
for (int i = 0; i < num_patterns; i++) {
free(patterns[i]);
}
free(patterns);
hash_free(&files);
return 0; return 0;
} }