]> git.proxmox.com Git - libgit2.git/blob - src/filebuf.c
New upstream version 1.3.0+dfsg.1
[libgit2.git] / src / filebuf.c
1 /*
2 * Copyright (C) the libgit2 contributors. All rights reserved.
3 *
4 * This file is part of libgit2, distributed under the GNU GPL v2 with
5 * a Linking Exception. For full terms see the included COPYING file.
6 */
7
8 #include "filebuf.h"
9
10 #include "futils.h"
11
12 static const size_t WRITE_BUFFER_SIZE = (4096 * 2);
13
14 enum buferr_t {
15 BUFERR_OK = 0,
16 BUFERR_WRITE,
17 BUFERR_ZLIB,
18 BUFERR_MEM
19 };
20
21 #define ENSURE_BUF_OK(buf) if ((buf)->last_error != BUFERR_OK) { return -1; }
22
23 static int verify_last_error(git_filebuf *file)
24 {
25 switch (file->last_error) {
26 case BUFERR_WRITE:
27 git_error_set(GIT_ERROR_OS, "failed to write out file");
28 return -1;
29
30 case BUFERR_MEM:
31 git_error_set_oom();
32 return -1;
33
34 case BUFERR_ZLIB:
35 git_error_set(GIT_ERROR_ZLIB,
36 "Buffer error when writing out ZLib data");
37 return -1;
38
39 default:
40 return 0;
41 }
42 }
43
44 static int lock_file(git_filebuf *file, int flags, mode_t mode)
45 {
46 if (git_path_exists(file->path_lock) == true) {
47 git_error_clear(); /* actual OS error code just confuses */
48 git_error_set(GIT_ERROR_OS,
49 "failed to lock file '%s' for writing", file->path_lock);
50 return GIT_ELOCKED;
51 }
52
53 /* create path to the file buffer is required */
54 if (flags & GIT_FILEBUF_CREATE_LEADING_DIRS) {
55 /* XXX: Should dirmode here be configurable? Or is 0777 always fine? */
56 file->fd = git_futils_creat_locked_withpath(file->path_lock, 0777, mode);
57 } else {
58 file->fd = git_futils_creat_locked(file->path_lock, mode);
59 }
60
61 if (file->fd < 0)
62 return file->fd;
63
64 file->fd_is_open = true;
65
66 if ((flags & GIT_FILEBUF_APPEND) && git_path_exists(file->path_original) == true) {
67 git_file source;
68 char buffer[FILEIO_BUFSIZE];
69 ssize_t read_bytes;
70 int error = 0;
71
72 source = p_open(file->path_original, O_RDONLY);
73 if (source < 0) {
74 git_error_set(GIT_ERROR_OS,
75 "failed to open file '%s' for reading",
76 file->path_original);
77 return -1;
78 }
79
80 while ((read_bytes = p_read(source, buffer, sizeof(buffer))) > 0) {
81 if ((error = p_write(file->fd, buffer, read_bytes)) < 0)
82 break;
83 if (file->compute_digest)
84 git_hash_update(&file->digest, buffer, read_bytes);
85 }
86
87 p_close(source);
88
89 if (read_bytes < 0) {
90 git_error_set(GIT_ERROR_OS, "failed to read file '%s'", file->path_original);
91 return -1;
92 } else if (error < 0) {
93 git_error_set(GIT_ERROR_OS, "failed to write file '%s'", file->path_lock);
94 return -1;
95 }
96 }
97
98 return 0;
99 }
100
101 void git_filebuf_cleanup(git_filebuf *file)
102 {
103 if (file->fd_is_open && file->fd >= 0)
104 p_close(file->fd);
105
106 if (file->created_lock && !file->did_rename && file->path_lock && git_path_exists(file->path_lock))
107 p_unlink(file->path_lock);
108
109 if (file->compute_digest) {
110 git_hash_ctx_cleanup(&file->digest);
111 file->compute_digest = 0;
112 }
113
114 if (file->buffer)
115 git__free(file->buffer);
116
117 /* use the presence of z_buf to decide if we need to deflateEnd */
118 if (file->z_buf) {
119 git__free(file->z_buf);
120 deflateEnd(&file->zs);
121 }
122
123 if (file->path_original)
124 git__free(file->path_original);
125 if (file->path_lock)
126 git__free(file->path_lock);
127
128 memset(file, 0x0, sizeof(git_filebuf));
129 file->fd = -1;
130 }
131
132 GIT_INLINE(int) flush_buffer(git_filebuf *file)
133 {
134 int result = file->write(file, file->buffer, file->buf_pos);
135 file->buf_pos = 0;
136 return result;
137 }
138
139 int git_filebuf_flush(git_filebuf *file)
140 {
141 return flush_buffer(file);
142 }
143
144 static int write_normal(git_filebuf *file, void *source, size_t len)
145 {
146 if (len > 0) {
147 if (p_write(file->fd, (void *)source, len) < 0) {
148 file->last_error = BUFERR_WRITE;
149 return -1;
150 }
151
152 if (file->compute_digest)
153 git_hash_update(&file->digest, source, len);
154 }
155
156 return 0;
157 }
158
159 static int write_deflate(git_filebuf *file, void *source, size_t len)
160 {
161 z_stream *zs = &file->zs;
162
163 if (len > 0 || file->flush_mode == Z_FINISH) {
164 zs->next_in = source;
165 zs->avail_in = (uInt)len;
166
167 do {
168 size_t have;
169
170 zs->next_out = file->z_buf;
171 zs->avail_out = (uInt)file->buf_size;
172
173 if (deflate(zs, file->flush_mode) == Z_STREAM_ERROR) {
174 file->last_error = BUFERR_ZLIB;
175 return -1;
176 }
177
178 have = file->buf_size - (size_t)zs->avail_out;
179
180 if (p_write(file->fd, file->z_buf, have) < 0) {
181 file->last_error = BUFERR_WRITE;
182 return -1;
183 }
184
185 } while (zs->avail_out == 0);
186
187 GIT_ASSERT(zs->avail_in == 0);
188
189 if (file->compute_digest)
190 git_hash_update(&file->digest, source, len);
191 }
192
193 return 0;
194 }
195
196 #define MAX_SYMLINK_DEPTH 5
197
198 static int resolve_symlink(git_buf *out, const char *path)
199 {
200 int i, error, root;
201 ssize_t ret;
202 struct stat st;
203 git_buf curpath = GIT_BUF_INIT, target = GIT_BUF_INIT;
204
205 if ((error = git_buf_grow(&target, GIT_PATH_MAX + 1)) < 0 ||
206 (error = git_buf_puts(&curpath, path)) < 0)
207 return error;
208
209 for (i = 0; i < MAX_SYMLINK_DEPTH; i++) {
210 error = p_lstat(curpath.ptr, &st);
211 if (error < 0 && errno == ENOENT) {
212 error = git_buf_puts(out, curpath.ptr);
213 goto cleanup;
214 }
215
216 if (error < 0) {
217 git_error_set(GIT_ERROR_OS, "failed to stat '%s'", curpath.ptr);
218 error = -1;
219 goto cleanup;
220 }
221
222 if (!S_ISLNK(st.st_mode)) {
223 error = git_buf_puts(out, curpath.ptr);
224 goto cleanup;
225 }
226
227 ret = p_readlink(curpath.ptr, target.ptr, GIT_PATH_MAX);
228 if (ret < 0) {
229 git_error_set(GIT_ERROR_OS, "failed to read symlink '%s'", curpath.ptr);
230 error = -1;
231 goto cleanup;
232 }
233
234 if (ret == GIT_PATH_MAX) {
235 git_error_set(GIT_ERROR_INVALID, "symlink target too long");
236 error = -1;
237 goto cleanup;
238 }
239
240 /* readlink(2) won't NUL-terminate for us */
241 target.ptr[ret] = '\0';
242 target.size = ret;
243
244 root = git_path_root(target.ptr);
245 if (root >= 0) {
246 if ((error = git_buf_sets(&curpath, target.ptr)) < 0)
247 goto cleanup;
248 } else {
249 git_buf dir = GIT_BUF_INIT;
250
251 if ((error = git_path_dirname_r(&dir, curpath.ptr)) < 0)
252 goto cleanup;
253
254 git_buf_swap(&curpath, &dir);
255 git_buf_dispose(&dir);
256
257 if ((error = git_path_apply_relative(&curpath, target.ptr)) < 0)
258 goto cleanup;
259 }
260 }
261
262 git_error_set(GIT_ERROR_INVALID, "maximum symlink depth reached");
263 error = -1;
264
265 cleanup:
266 git_buf_dispose(&curpath);
267 git_buf_dispose(&target);
268 return error;
269 }
270
271 int git_filebuf_open(git_filebuf *file, const char *path, int flags, mode_t mode)
272 {
273 return git_filebuf_open_withsize(file, path, flags, mode, WRITE_BUFFER_SIZE);
274 }
275
276 int git_filebuf_open_withsize(git_filebuf *file, const char *path, int flags, mode_t mode, size_t size)
277 {
278 int compression, error = -1;
279 size_t path_len, alloc_len;
280
281 GIT_ASSERT_ARG(file);
282 GIT_ASSERT_ARG(path);
283 GIT_ASSERT(file->buffer == NULL);
284
285 memset(file, 0x0, sizeof(git_filebuf));
286
287 if (flags & GIT_FILEBUF_DO_NOT_BUFFER)
288 file->do_not_buffer = true;
289
290 if (flags & GIT_FILEBUF_FSYNC)
291 file->do_fsync = true;
292
293 file->buf_size = size;
294 file->buf_pos = 0;
295 file->fd = -1;
296 file->last_error = BUFERR_OK;
297
298 /* Allocate the main cache buffer */
299 if (!file->do_not_buffer) {
300 file->buffer = git__malloc(file->buf_size);
301 GIT_ERROR_CHECK_ALLOC(file->buffer);
302 }
303
304 /* If we are hashing on-write, allocate a new hash context */
305 if (flags & GIT_FILEBUF_HASH_CONTENTS) {
306 file->compute_digest = 1;
307
308 if (git_hash_ctx_init(&file->digest) < 0)
309 goto cleanup;
310 }
311
312 compression = flags >> GIT_FILEBUF_DEFLATE_SHIFT;
313
314 /* If we are deflating on-write, */
315 if (compression != 0) {
316 /* Initialize the ZLib stream */
317 if (deflateInit(&file->zs, compression) != Z_OK) {
318 git_error_set(GIT_ERROR_ZLIB, "failed to initialize zlib");
319 goto cleanup;
320 }
321
322 /* Allocate the Zlib cache buffer */
323 file->z_buf = git__malloc(file->buf_size);
324 GIT_ERROR_CHECK_ALLOC(file->z_buf);
325
326 /* Never flush */
327 file->flush_mode = Z_NO_FLUSH;
328 file->write = &write_deflate;
329 } else {
330 file->write = &write_normal;
331 }
332
333 /* If we are writing to a temp file */
334 if (flags & GIT_FILEBUF_TEMPORARY) {
335 git_buf tmp_path = GIT_BUF_INIT;
336
337 /* Open the file as temporary for locking */
338 file->fd = git_futils_mktmp(&tmp_path, path, mode);
339
340 if (file->fd < 0) {
341 git_buf_dispose(&tmp_path);
342 goto cleanup;
343 }
344 file->fd_is_open = true;
345 file->created_lock = true;
346
347 /* No original path */
348 file->path_original = NULL;
349 file->path_lock = git_buf_detach(&tmp_path);
350 GIT_ERROR_CHECK_ALLOC(file->path_lock);
351 } else {
352 git_buf resolved_path = GIT_BUF_INIT;
353
354 if ((error = resolve_symlink(&resolved_path, path)) < 0)
355 goto cleanup;
356
357 /* Save the original path of the file */
358 path_len = resolved_path.size;
359 file->path_original = git_buf_detach(&resolved_path);
360
361 /* create the locking path by appending ".lock" to the original */
362 GIT_ERROR_CHECK_ALLOC_ADD(&alloc_len, path_len, GIT_FILELOCK_EXTLENGTH);
363 file->path_lock = git__malloc(alloc_len);
364 GIT_ERROR_CHECK_ALLOC(file->path_lock);
365
366 memcpy(file->path_lock, file->path_original, path_len);
367 memcpy(file->path_lock + path_len, GIT_FILELOCK_EXTENSION, GIT_FILELOCK_EXTLENGTH);
368
369 if (git_path_isdir(file->path_original)) {
370 git_error_set(GIT_ERROR_FILESYSTEM, "path '%s' is a directory", file->path_original);
371 error = GIT_EDIRECTORY;
372 goto cleanup;
373 }
374
375 /* open the file for locking */
376 if ((error = lock_file(file, flags, mode)) < 0)
377 goto cleanup;
378
379 file->created_lock = true;
380 }
381
382 return 0;
383
384 cleanup:
385 git_filebuf_cleanup(file);
386 return error;
387 }
388
389 int git_filebuf_hash(git_oid *oid, git_filebuf *file)
390 {
391 GIT_ASSERT_ARG(oid);
392 GIT_ASSERT_ARG(file);
393 GIT_ASSERT_ARG(file->compute_digest);
394
395 flush_buffer(file);
396
397 if (verify_last_error(file) < 0)
398 return -1;
399
400 git_hash_final(oid, &file->digest);
401 git_hash_ctx_cleanup(&file->digest);
402 file->compute_digest = 0;
403
404 return 0;
405 }
406
407 int git_filebuf_commit_at(git_filebuf *file, const char *path)
408 {
409 git__free(file->path_original);
410 file->path_original = git__strdup(path);
411 GIT_ERROR_CHECK_ALLOC(file->path_original);
412
413 return git_filebuf_commit(file);
414 }
415
416 int git_filebuf_commit(git_filebuf *file)
417 {
418 /* temporary files cannot be committed */
419 GIT_ASSERT_ARG(file);
420 GIT_ASSERT(file->path_original);
421
422 file->flush_mode = Z_FINISH;
423 flush_buffer(file);
424
425 if (verify_last_error(file) < 0)
426 goto on_error;
427
428 file->fd_is_open = false;
429
430 if (file->do_fsync && p_fsync(file->fd) < 0) {
431 git_error_set(GIT_ERROR_OS, "failed to fsync '%s'", file->path_lock);
432 goto on_error;
433 }
434
435 if (p_close(file->fd) < 0) {
436 git_error_set(GIT_ERROR_OS, "failed to close file at '%s'", file->path_lock);
437 goto on_error;
438 }
439
440 file->fd = -1;
441
442 if (p_rename(file->path_lock, file->path_original) < 0) {
443 git_error_set(GIT_ERROR_OS, "failed to rename lockfile to '%s'", file->path_original);
444 goto on_error;
445 }
446
447 if (file->do_fsync && git_futils_fsync_parent(file->path_original) < 0)
448 goto on_error;
449
450 file->did_rename = true;
451
452 git_filebuf_cleanup(file);
453 return 0;
454
455 on_error:
456 git_filebuf_cleanup(file);
457 return -1;
458 }
459
460 GIT_INLINE(void) add_to_cache(git_filebuf *file, const void *buf, size_t len)
461 {
462 memcpy(file->buffer + file->buf_pos, buf, len);
463 file->buf_pos += len;
464 }
465
466 int git_filebuf_write(git_filebuf *file, const void *buff, size_t len)
467 {
468 const unsigned char *buf = buff;
469
470 ENSURE_BUF_OK(file);
471
472 if (file->do_not_buffer)
473 return file->write(file, (void *)buff, len);
474
475 for (;;) {
476 size_t space_left = file->buf_size - file->buf_pos;
477
478 /* cache if it's small */
479 if (space_left > len) {
480 add_to_cache(file, buf, len);
481 return 0;
482 }
483
484 add_to_cache(file, buf, space_left);
485 if (flush_buffer(file) < 0)
486 return -1;
487
488 len -= space_left;
489 buf += space_left;
490 }
491 }
492
493 int git_filebuf_reserve(git_filebuf *file, void **buffer, size_t len)
494 {
495 size_t space_left = file->buf_size - file->buf_pos;
496
497 *buffer = NULL;
498
499 ENSURE_BUF_OK(file);
500
501 if (len > file->buf_size) {
502 file->last_error = BUFERR_MEM;
503 return -1;
504 }
505
506 if (space_left <= len) {
507 if (flush_buffer(file) < 0)
508 return -1;
509 }
510
511 *buffer = (file->buffer + file->buf_pos);
512 file->buf_pos += len;
513
514 return 0;
515 }
516
517 int git_filebuf_printf(git_filebuf *file, const char *format, ...)
518 {
519 va_list arglist;
520 size_t space_left, len, alloclen;
521 int written, res;
522 char *tmp_buffer;
523
524 ENSURE_BUF_OK(file);
525
526 space_left = file->buf_size - file->buf_pos;
527
528 do {
529 va_start(arglist, format);
530 written = p_vsnprintf((char *)file->buffer + file->buf_pos, space_left, format, arglist);
531 va_end(arglist);
532
533 if (written < 0) {
534 file->last_error = BUFERR_MEM;
535 return -1;
536 }
537
538 len = written;
539 if (len + 1 <= space_left) {
540 file->buf_pos += len;
541 return 0;
542 }
543
544 if (flush_buffer(file) < 0)
545 return -1;
546
547 space_left = file->buf_size - file->buf_pos;
548
549 } while (len + 1 <= space_left);
550
551 if (GIT_ADD_SIZET_OVERFLOW(&alloclen, len, 1) ||
552 !(tmp_buffer = git__malloc(alloclen))) {
553 file->last_error = BUFERR_MEM;
554 return -1;
555 }
556
557 va_start(arglist, format);
558 written = p_vsnprintf(tmp_buffer, len + 1, format, arglist);
559 va_end(arglist);
560
561 if (written < 0) {
562 git__free(tmp_buffer);
563 file->last_error = BUFERR_MEM;
564 return -1;
565 }
566
567 res = git_filebuf_write(file, tmp_buffer, len);
568 git__free(tmp_buffer);
569
570 return res;
571 }
572
573 int git_filebuf_stats(time_t *mtime, size_t *size, git_filebuf *file)
574 {
575 int res;
576 struct stat st;
577
578 if (file->fd_is_open)
579 res = p_fstat(file->fd, &st);
580 else
581 res = p_stat(file->path_original, &st);
582
583 if (res < 0) {
584 git_error_set(GIT_ERROR_OS, "could not get stat info for '%s'",
585 file->path_original);
586 return res;
587 }
588
589 if (mtime)
590 *mtime = st.st_mtime;
591 if (size)
592 *size = (size_t)st.st_size;
593
594 return 0;
595 }