diff options
| -rw-r--r-- | cache.c | 359 | ||||
| -rw-r--r-- | cache.h | 33 | ||||
| -rw-r--r-- | cgit.c | 166 | ||||
| -rw-r--r-- | cgit.h | 1 | ||||
| -rwxr-xr-x | tests/setup.sh | 2 | ||||
| -rwxr-xr-x | tests/t0020-validate-cache.sh | 67 |
6 files changed, 418 insertions, 210 deletions
| @@ -4,117 +4,340 @@ | |||
| 4 | * | 4 | * |
| 5 | * Licensed under GNU General Public License v2 | 5 | * Licensed under GNU General Public License v2 |
| 6 | * (see COPYING for full license text) | 6 | * (see COPYING for full license text) |
| 7 | * | ||
| 8 | * | ||
| 9 | * The cache is just a directory structure where each file is a cache slot, | ||
| 10 | * and each filename is based on the hash of some key (e.g. the cgit url). | ||
| 11 | * Each file contains the full key followed by the cached content for that | ||
| 12 | * key. | ||
| 13 | * | ||
| 7 | */ | 14 | */ |
| 8 | 15 | ||
| 9 | #include "cgit.h" | 16 | #include "cgit.h" |
| 10 | #include "cache.h" | 17 | #include "cache.h" |
| 11 | 18 | ||
| 12 | const int NOLOCK = -1; | 19 | #define CACHE_BUFSIZE (1024 * 4) |
| 20 | |||
| 21 | struct cache_slot { | ||
| 22 | const char *key; | ||
| 23 | int keylen; | ||
| 24 | int ttl; | ||
| 25 | cache_fill_fn fn; | ||
| 26 | void *cbdata; | ||
| 27 | int cache_fd; | ||
| 28 | int lock_fd; | ||
| 29 | const char *cache_name; | ||
| 30 | const char *lock_name; | ||
| 31 | int match; | ||
| 32 | struct stat cache_st; | ||
| 33 | struct stat lock_st; | ||
| 34 | int bufsize; | ||
| 35 | char buf[CACHE_BUFSIZE]; | ||
| 36 | }; | ||
| 13 | 37 | ||
| 14 | char *cache_safe_filename(const char *unsafe) | 38 | /* Open an existing cache slot and fill the cache buffer with |
| 39 | * (part of) the content of the cache file. Return 0 on success | ||
| 40 | * and errno otherwise. | ||
| 41 | */ | ||
| 42 | static int open_slot(struct cache_slot *slot) | ||
| 15 | { | 43 | { |
| 16 | static char buf[4][PATH_MAX]; | 44 | char *bufz; |
| 17 | static int bufidx; | 45 | int bufkeylen = -1; |
| 18 | char *s; | 46 | |
| 19 | char c; | 47 | slot->cache_fd = open(slot->cache_name, O_RDONLY); |
| 20 | 48 | if (slot->cache_fd == -1) | |
| 21 | bufidx++; | 49 | return errno; |
| 22 | bufidx &= 3; | 50 | |
| 23 | s = buf[bufidx]; | 51 | if (fstat(slot->cache_fd, &slot->cache_st)) |
| 24 | 52 | return errno; | |
| 25 | while(unsafe && (c = *unsafe++) != 0) { | 53 | |
| 26 | if (c == '/' || c == ' ' || c == '&' || c == '|' || | 54 | slot->bufsize = read(slot->cache_fd, slot->buf, sizeof(slot->buf)); |
| 27 | c == '>' || c == '<' || c == '.') | 55 | if (slot->bufsize == 0) |
| 28 | c = '_'; | 56 | return errno; |
| 29 | *s++ = c; | 57 | |
| 30 | } | 58 | bufz = memchr(slot->buf, 0, slot->bufsize); |
| 31 | *s = '\0'; | 59 | if (bufz) |
| 32 | return buf[bufidx]; | 60 | bufkeylen = bufz - slot->buf; |
| 61 | |||
| 62 | slot->match = bufkeylen == slot->keylen && | ||
| 63 | !memcmp(slot->key, slot->buf, bufkeylen + 1); | ||
| 64 | |||
| 65 | return 0; | ||
| 33 | } | 66 | } |
| 34 | 67 | ||
| 35 | int cache_exist(struct cacheitem *item) | 68 | /* Close the active cache slot */ |
| 69 | static void close_slot(struct cache_slot *slot) | ||
| 36 | { | 70 | { |
| 37 | if (stat(item->name, &item->st)) { | 71 | if (slot->cache_fd > 0) { |
| 38 | item->st.st_mtime = 0; | 72 | close(slot->cache_fd); |
| 39 | return 0; | 73 | slot->cache_fd = -1; |
| 40 | } | 74 | } |
| 41 | return 1; | ||
| 42 | } | 75 | } |
| 43 | 76 | ||
| 44 | int cache_create_dirs() | 77 | /* Print the content of the active cache slot (but skip the key). */ |
| 78 | static int print_slot(struct cache_slot *slot) | ||
| 45 | { | 79 | { |
| 46 | char *path; | 80 | ssize_t i, j = 0; |
| 81 | |||
| 82 | i = lseek(slot->cache_fd, slot->keylen + 1, SEEK_SET); | ||
| 83 | if (i != slot->keylen + 1) | ||
| 84 | return errno; | ||
| 47 | 85 | ||
| 48 | path = fmt("%s", ctx.cfg.cache_root); | 86 | while((i=read(slot->cache_fd, slot->buf, sizeof(slot->buf))) > 0) |
| 49 | if (mkdir(path, S_IRWXU) && errno!=EEXIST) | 87 | j = write(STDOUT_FILENO, slot->buf, i); |
| 88 | |||
| 89 | if (j < 0) | ||
| 90 | return errno; | ||
| 91 | else | ||
| 50 | return 0; | 92 | return 0; |
| 93 | } | ||
| 51 | 94 | ||
| 52 | if (!ctx.repo) | 95 | /* Check if the slot has expired */ |
| 96 | static int is_expired(struct cache_slot *slot) | ||
| 97 | { | ||
| 98 | if (slot->ttl < 0) | ||
| 53 | return 0; | 99 | return 0; |
| 100 | else | ||
| 101 | return slot->cache_st.st_mtime + slot->ttl*60 < time(NULL); | ||
| 102 | } | ||
| 54 | 103 | ||
| 55 | path = fmt("%s/%s", ctx.cfg.cache_root, | 104 | /* Check if the slot has been modified since we opened it. |
| 56 | cache_safe_filename(ctx.repo->url)); | 105 | * NB: If stat() fails, we pretend the file is modified. |
| 106 | */ | ||
| 107 | static int is_modified(struct cache_slot *slot) | ||
| 108 | { | ||
| 109 | struct stat st; | ||
| 57 | 110 | ||
| 58 | if (mkdir(path, S_IRWXU) && errno!=EEXIST) | 111 | if (stat(slot->cache_name, &st)) |
| 59 | return 0; | 112 | return 1; |
| 113 | return (st.st_ino != slot->cache_st.st_ino || | ||
| 114 | st.st_mtime != slot->cache_st.st_mtime || | ||
| 115 | st.st_size != slot->cache_st.st_size); | ||
| 116 | } | ||
| 60 | 117 | ||
| 61 | if (ctx.qry.page) { | 118 | /* Close an open lockfile */ |
| 62 | path = fmt("%s/%s/%s", ctx.cfg.cache_root, | 119 | static void close_lock(struct cache_slot *slot) |
| 63 | cache_safe_filename(ctx.repo->url), | 120 | { |
| 64 | ctx.qry.page); | 121 | if (slot->lock_fd > 0) { |
| 65 | if (mkdir(path, S_IRWXU) && errno!=EEXIST) | 122 | close(slot->lock_fd); |
| 66 | return 0; | 123 | slot->lock_fd = -1; |
| 67 | } | 124 | } |
| 68 | return 1; | ||
| 69 | } | 125 | } |
| 70 | 126 | ||
| 71 | int cache_refill_overdue(const char *lockfile) | 127 | /* Create a lockfile used to store the generated content for a cache |
| 128 | * slot, and write the slot key + \0 into it. | ||
| 129 | * Returns 0 on success and errno otherwise. | ||
| 130 | */ | ||
| 131 | static int lock_slot(struct cache_slot *slot) | ||
| 72 | { | 132 | { |
| 73 | struct stat st; | 133 | slot->lock_fd = open(slot->lock_name, O_RDWR|O_CREAT|O_EXCL, |
| 134 | S_IRUSR|S_IWUSR); | ||
| 135 | if (slot->lock_fd == -1) | ||
| 136 | return errno; | ||
| 137 | write(slot->lock_fd, slot->key, slot->keylen + 1); | ||
| 138 | return 0; | ||
| 139 | } | ||
| 74 | 140 | ||
| 75 | if (stat(lockfile, &st)) | 141 | /* Release the current lockfile. If `replace_old_slot` is set the |
| 76 | return 0; | 142 | * lockfile replaces the old cache slot, otherwise the lockfile is |
| 143 | * just deleted. | ||
| 144 | */ | ||
| 145 | static int unlock_slot(struct cache_slot *slot, int replace_old_slot) | ||
| 146 | { | ||
| 147 | int err; | ||
| 148 | |||
| 149 | if (replace_old_slot) | ||
| 150 | err = rename(slot->lock_name, slot->cache_name); | ||
| 77 | else | 151 | else |
| 78 | return (time(NULL) - st.st_mtime > ctx.cfg.cache_max_create_time); | 152 | err = unlink(slot->lock_name); |
| 153 | return err; | ||
| 79 | } | 154 | } |
| 80 | 155 | ||
| 81 | int cache_lock(struct cacheitem *item) | 156 | /* Generate the content for the current cache slot by redirecting |
| 157 | * stdout to the lock-fd and invoking the callback function | ||
| 158 | */ | ||
| 159 | static int fill_slot(struct cache_slot *slot) | ||
| 82 | { | 160 | { |
| 83 | int i = 0; | 161 | int tmp; |
| 84 | char *lockfile = xstrdup(fmt("%s.lock", item->name)); | ||
| 85 | 162 | ||
| 86 | top: | 163 | /* Preserve stdout */ |
| 87 | if (++i > ctx.cfg.max_lock_attempts) | 164 | tmp = dup(STDOUT_FILENO); |
| 88 | die("cache_lock: unable to lock %s: %s", | 165 | if (tmp == -1) |
| 89 | item->name, strerror(errno)); | 166 | return errno; |
| 90 | 167 | ||
| 91 | item->fd = open(lockfile, O_WRONLY|O_CREAT|O_EXCL, S_IRUSR|S_IWUSR); | 168 | /* Redirect stdout to lockfile */ |
| 169 | if (dup2(slot->lock_fd, STDOUT_FILENO) == -1) | ||
| 170 | return errno; | ||
| 92 | 171 | ||
| 93 | if (item->fd == NOLOCK && errno == ENOENT && cache_create_dirs()) | 172 | /* Generate cache content */ |
| 94 | goto top; | 173 | slot->fn(slot->cbdata); |
| 95 | 174 | ||
| 96 | if (item->fd == NOLOCK && errno == EEXIST && | 175 | /* Restore stdout */ |
| 97 | cache_refill_overdue(lockfile) && !unlink(lockfile)) | 176 | if (dup2(tmp, STDOUT_FILENO) == -1) |
| 98 | goto top; | 177 | return errno; |
| 99 | 178 | ||
| 100 | free(lockfile); | 179 | /* Close the temporary filedescriptor */ |
| 101 | return (item->fd > 0); | 180 | close(tmp); |
| 181 | return 0; | ||
| 102 | } | 182 | } |
| 103 | 183 | ||
| 104 | int cache_unlock(struct cacheitem *item) | 184 | /* Crude implementation of 32-bit FNV-1 hash algorithm, |
| 185 | * see http://www.isthe.com/chongo/tech/comp/fnv/ for details | ||
| 186 | * about the magic numbers. | ||
| 187 | */ | ||
| 188 | #define FNV_OFFSET 0x811c9dc5 | ||
| 189 | #define FNV_PRIME 0x01000193 | ||
| 190 | |||
| 191 | unsigned long hash_str(const char *str) | ||
| 105 | { | 192 | { |
| 106 | close(item->fd); | 193 | unsigned long h = FNV_OFFSET; |
| 107 | return (rename(fmt("%s.lock", item->name), item->name) == 0); | 194 | unsigned char *s = (unsigned char *)str; |
| 195 | |||
| 196 | if (!s) | ||
| 197 | return h; | ||
| 198 | |||
| 199 | while(*s) { | ||
| 200 | h *= FNV_PRIME; | ||
| 201 | h ^= *s++; | ||
| 202 | } | ||
| 203 | return h; | ||
| 108 | } | 204 | } |
| 109 | 205 | ||
| 110 | int cache_cancel_lock(struct cacheitem *item) | 206 | static int process_slot(struct cache_slot *slot) |
| 111 | { | 207 | { |
| 112 | return (unlink(fmt("%s.lock", item->name)) == 0); | 208 | int err; |
| 209 | |||
| 210 | err = open_slot(slot); | ||
| 211 | if (!err && slot->match) { | ||
| 212 | if (is_expired(slot)) { | ||
| 213 | if (!lock_slot(slot)) { | ||
| 214 | /* If the cachefile has been replaced between | ||
| 215 | * `open_slot` and `lock_slot`, we'll just | ||
| 216 | * serve the stale content from the original | ||
| 217 | * cachefile. This way we avoid pruning the | ||
| 218 | * newly generated slot. The same code-path | ||
| 219 | * is chosen if fill_slot() fails for some | ||
| 220 | * reason. | ||
| 221 | * | ||
| 222 | * TODO? check if the new slot contains the | ||
| 223 | * same key as the old one, since we would | ||
| 224 | * prefer to serve the newest content. | ||
| 225 | * This will require us to open yet another | ||
| 226 | * file-descriptor and read and compare the | ||
| 227 | * key from the new file, so for now we're | ||
| 228 | * lazy and just ignore the new file. | ||
| 229 | */ | ||
| 230 | if (is_modified(slot) || fill_slot(slot)) { | ||
| 231 | unlock_slot(slot, 0); | ||
| 232 | close_lock(slot); | ||
| 233 | } else { | ||
| 234 | close_slot(slot); | ||
