2 * Copyright (C) the libgit2 contributors. All rights reserved.
4 * This file is part of libgit2, distributed under the GNU GPL v2 with
5 * a Linking Exception. For full terms see the included COPYING file.
10 #include "git2/common.h"
11 #include "git2/object.h"
12 #include "git2/repository.h"
13 #include "git2/odb_backend.h"
18 const void *git_blob_rawcontent(const git_blob
*blob
)
20 GIT_ASSERT_ARG_WITH_RETVAL(blob
, NULL
);
23 return blob
->data
.raw
.data
;
25 return git_odb_object_data(blob
->data
.odb
);
28 git_object_size_t
git_blob_rawsize(const git_blob
*blob
)
33 return blob
->data
.raw
.size
;
35 return (git_object_size_t
)git_odb_object_size(blob
->data
.odb
);
38 int git_blob__getbuf(git_buf
*buffer
, git_blob
*blob
)
40 git_object_size_t size
= git_blob_rawsize(blob
);
42 GIT_ERROR_CHECK_BLOBSIZE(size
);
43 return git_buf_set(buffer
, git_blob_rawcontent(blob
), (size_t)size
);
46 void git_blob__free(void *_blob
)
48 git_blob
*blob
= (git_blob
*) _blob
;
50 git_odb_object_free(blob
->data
.odb
);
54 int git_blob__parse_raw(void *_blob
, const char *data
, size_t size
)
56 git_blob
*blob
= (git_blob
*) _blob
;
61 blob
->data
.raw
.data
= data
;
62 blob
->data
.raw
.size
= size
;
66 int git_blob__parse(void *_blob
, git_odb_object
*odb_obj
)
68 git_blob
*blob
= (git_blob
*) _blob
;
72 git_cached_obj_incref((git_cached_obj
*)odb_obj
);
74 blob
->data
.odb
= odb_obj
;
78 int git_blob_create_from_buffer(
79 git_oid
*id
, git_repository
*repo
, const void *buffer
, size_t len
)
83 git_odb_stream
*stream
;
88 if ((error
= git_repository_odb__weakptr(&odb
, repo
)) < 0 ||
89 (error
= git_odb_open_wstream(&stream
, odb
, len
, GIT_OBJECT_BLOB
)) < 0)
92 if ((error
= git_odb_stream_write(stream
, buffer
, len
)) == 0)
93 error
= git_odb_stream_finalize_write(id
, stream
);
95 git_odb_stream_free(stream
);
99 static int write_file_stream(
100 git_oid
*id
, git_odb
*odb
, const char *path
, git_object_size_t file_size
)
103 char buffer
[FILEIO_BUFSIZE
];
104 git_odb_stream
*stream
= NULL
;
105 ssize_t read_len
= -1;
106 git_object_size_t written
= 0;
108 if ((error
= git_odb_open_wstream(
109 &stream
, odb
, file_size
, GIT_OBJECT_BLOB
)) < 0)
112 if ((fd
= git_futils_open_ro(path
)) < 0) {
113 git_odb_stream_free(stream
);
117 while (!error
&& (read_len
= p_read(fd
, buffer
, sizeof(buffer
))) > 0) {
118 error
= git_odb_stream_write(stream
, buffer
, read_len
);
124 if (written
!= file_size
|| read_len
< 0) {
125 git_error_set(GIT_ERROR_OS
, "failed to read file into stream");
130 error
= git_odb_stream_finalize_write(id
, stream
);
132 git_odb_stream_free(stream
);
136 static int write_file_filtered(
138 git_object_size_t
*size
,
140 const char *full_path
,
142 git_repository
* repo
)
145 git_buf tgt
= GIT_BUF_INIT
;
147 error
= git_filter_list_apply_to_file(&tgt
, fl
, repo
, full_path
);
149 /* Write the file to disk if it was properly filtered */
153 error
= git_odb_write(id
, odb
, tgt
.ptr
, tgt
.size
, GIT_OBJECT_BLOB
);
156 git_buf_dispose(&tgt
);
160 static int write_symlink(
161 git_oid
*id
, git_odb
*odb
, const char *path
, size_t link_size
)
167 link_data
= git__malloc(link_size
);
168 GIT_ERROR_CHECK_ALLOC(link_data
);
170 read_len
= p_readlink(path
, link_data
, link_size
);
171 if (read_len
!= (ssize_t
)link_size
) {
172 git_error_set(GIT_ERROR_OS
, "failed to create blob: cannot read symlink '%s'", path
);
173 git__free(link_data
);
177 error
= git_odb_write(id
, odb
, (void *)link_data
, link_size
, GIT_OBJECT_BLOB
);
178 git__free(link_data
);
182 int git_blob__create_from_paths(
185 git_repository
*repo
,
186 const char *content_path
,
187 const char *hint_path
,
189 bool try_load_filters
)
194 git_object_size_t size
;
196 git_buf path
= GIT_BUF_INIT
;
198 GIT_ASSERT_ARG(hint_path
|| !try_load_filters
);
201 if (git_repository_workdir_path(&path
, repo
, hint_path
) < 0)
204 content_path
= path
.ptr
;
207 if ((error
= git_path_lstat(content_path
, &st
)) < 0 ||
208 (error
= git_repository_odb(&odb
, repo
)) < 0)
211 if (S_ISDIR(st
.st_mode
)) {
212 git_error_set(GIT_ERROR_ODB
, "cannot create blob from '%s': it is a directory", content_path
);
213 error
= GIT_EDIRECTORY
;
218 memcpy(out_st
, &st
, sizeof(st
));
221 mode
= hint_mode
? hint_mode
: st
.st_mode
;
224 error
= write_symlink(id
, odb
, content_path
, (size_t)size
);
226 git_filter_list
*fl
= NULL
;
228 if (try_load_filters
)
229 /* Load the filters for writing this file to the ODB */
230 error
= git_filter_list_load(
231 &fl
, repo
, NULL
, hint_path
,
232 GIT_FILTER_TO_ODB
, GIT_FILTER_DEFAULT
);
235 /* well, that didn't work */;
237 /* No filters need to be applied to the document: we can stream
238 * directly from disk */
239 error
= write_file_stream(id
, odb
, content_path
, size
);
241 /* We need to apply one or more filters */
242 error
= write_file_filtered(id
, &size
, odb
, content_path
, fl
, repo
);
244 git_filter_list_free(fl
);
248 * TODO: eventually support streaming filtered files, for files
249 * which are bigger than a given threshold. This is not a priority
250 * because applying a filter in streaming mode changes the final
251 * size of the blob, and without knowing its final size, the blob
252 * cannot be written in stream mode to the ODB.
254 * The plan is to do streaming writes to a tempfile on disk and then
255 * opening streaming that file to the ODB, using
256 * `write_file_stream`.
258 * CAREFULLY DESIGNED APIS YO
264 git_buf_dispose(&path
);
269 int git_blob_create_from_workdir(
270 git_oid
*id
, git_repository
*repo
, const char *path
)
272 return git_blob__create_from_paths(id
, NULL
, repo
, NULL
, path
, 0, true);
275 int git_blob_create_from_disk(
276 git_oid
*id
, git_repository
*repo
, const char *path
)
279 git_buf full_path
= GIT_BUF_INIT
;
280 const char *workdir
, *hintpath
= NULL
;
282 if ((error
= git_path_prettify(&full_path
, path
, NULL
)) < 0) {
283 git_buf_dispose(&full_path
);
287 workdir
= git_repository_workdir(repo
);
289 if (workdir
&& !git__prefixcmp(full_path
.ptr
, workdir
))
290 hintpath
= full_path
.ptr
+ strlen(workdir
);
292 error
= git_blob__create_from_paths(
293 id
, NULL
, repo
, git_buf_cstr(&full_path
), hintpath
, 0, !!hintpath
);
295 git_buf_dispose(&full_path
);
300 git_writestream parent
;
302 git_repository
*repo
;
306 static int blob_writestream_close(git_writestream
*_stream
)
308 blob_writestream
*stream
= (blob_writestream
*) _stream
;
310 git_filebuf_cleanup(&stream
->fbuf
);
314 static void blob_writestream_free(git_writestream
*_stream
)
316 blob_writestream
*stream
= (blob_writestream
*) _stream
;
318 git_filebuf_cleanup(&stream
->fbuf
);
319 git__free(stream
->hintpath
);
323 static int blob_writestream_write(git_writestream
*_stream
, const char *buffer
, size_t len
)
325 blob_writestream
*stream
= (blob_writestream
*) _stream
;
327 return git_filebuf_write(&stream
->fbuf
, buffer
, len
);
330 int git_blob_create_from_stream(git_writestream
**out
, git_repository
*repo
, const char *hintpath
)
333 git_buf path
= GIT_BUF_INIT
;
334 blob_writestream
*stream
;
337 GIT_ASSERT_ARG(repo
);
339 stream
= git__calloc(1, sizeof(blob_writestream
));
340 GIT_ERROR_CHECK_ALLOC(stream
);
343 stream
->hintpath
= git__strdup(hintpath
);
344 GIT_ERROR_CHECK_ALLOC(stream
->hintpath
);
348 stream
->parent
.write
= blob_writestream_write
;
349 stream
->parent
.close
= blob_writestream_close
;
350 stream
->parent
.free
= blob_writestream_free
;
352 if ((error
= git_repository_item_path(&path
, repo
, GIT_REPOSITORY_ITEM_OBJECTS
)) < 0
353 || (error
= git_buf_joinpath(&path
, path
.ptr
, "streamed")) < 0)
356 if ((error
= git_filebuf_open_withsize(&stream
->fbuf
, git_buf_cstr(&path
), GIT_FILEBUF_TEMPORARY
,
357 0666, 2 * 1024 * 1024)) < 0)
360 *out
= (git_writestream
*) stream
;
364 blob_writestream_free((git_writestream
*) stream
);
366 git_buf_dispose(&path
);
370 int git_blob_create_from_stream_commit(git_oid
*out
, git_writestream
*_stream
)
373 blob_writestream
*stream
= (blob_writestream
*) _stream
;
376 * We can make this more officient by avoiding writing to
377 * disk, but for now let's re-use the helper functions we
380 if ((error
= git_filebuf_flush(&stream
->fbuf
)) < 0)
383 error
= git_blob__create_from_paths(out
, NULL
, stream
->repo
, stream
->fbuf
.path_lock
,
384 stream
->hintpath
, 0, !!stream
->hintpath
);
387 blob_writestream_free(_stream
);
392 int git_blob_is_binary(const git_blob
*blob
)
394 git_buf content
= GIT_BUF_INIT
;
395 git_object_size_t size
;
397 GIT_ASSERT_ARG(blob
);
399 size
= git_blob_rawsize(blob
);
401 git_buf_attach_notowned(&content
, git_blob_rawcontent(blob
),
402 (size_t)min(size
, GIT_FILTER_BYTES_TO_CHECK_NUL
));
403 return git_buf_is_binary(&content
);
406 int git_blob_filter_options_init(
407 git_blob_filter_options
*opts
,
408 unsigned int version
)
410 GIT_INIT_STRUCTURE_FROM_TEMPLATE(opts
, version
,
411 git_blob_filter_options
, GIT_BLOB_FILTER_OPTIONS_INIT
);
419 git_blob_filter_options
*given_opts
)
422 git_filter_list
*fl
= NULL
;
423 git_blob_filter_options opts
= GIT_BLOB_FILTER_OPTIONS_INIT
;
424 git_filter_options filter_opts
= GIT_FILTER_OPTIONS_INIT
;
426 GIT_ASSERT_ARG(blob
);
427 GIT_ASSERT_ARG(path
);
430 GIT_ERROR_CHECK_VERSION(
431 given_opts
, GIT_BLOB_FILTER_OPTIONS_VERSION
, "git_blob_filter_options");
433 if (git_buf_sanitize(out
) < 0)
436 if (given_opts
!= NULL
)
437 memcpy(&opts
, given_opts
, sizeof(git_blob_filter_options
));
439 if ((opts
.flags
& GIT_BLOB_FILTER_CHECK_FOR_BINARY
) != 0 &&
440 git_blob_is_binary(blob
))
443 if ((opts
.flags
& GIT_BLOB_FILTER_NO_SYSTEM_ATTRIBUTES
) != 0)
444 filter_opts
.flags
|= GIT_FILTER_NO_SYSTEM_ATTRIBUTES
;
446 if ((opts
.flags
& GIT_BLOB_FILTER_ATTRIBUTES_FROM_HEAD
) != 0)
447 filter_opts
.flags
|= GIT_FILTER_ATTRIBUTES_FROM_HEAD
;
449 if ((opts
.flags
& GIT_BLOB_FILTER_ATTRIBUTES_FROM_COMMIT
) != 0) {
450 filter_opts
.flags
|= GIT_FILTER_ATTRIBUTES_FROM_COMMIT
;
452 #ifndef GIT_DEPRECATE_HARD
454 git_oid_cpy(&filter_opts
.attr_commit_id
, opts
.commit_id
);
457 git_oid_cpy(&filter_opts
.attr_commit_id
, &opts
.attr_commit_id
);
460 if (!(error
= git_filter_list_load_ext(
461 &fl
, git_blob_owner(blob
), blob
, path
,
462 GIT_FILTER_TO_WORKTREE
, &filter_opts
))) {
464 error
= git_filter_list_apply_to_blob(out
, fl
, blob
);
466 git_filter_list_free(fl
);
472 /* Deprecated functions */
474 #ifndef GIT_DEPRECATE_HARD
475 int git_blob_create_frombuffer(
476 git_oid
*id
, git_repository
*repo
, const void *buffer
, size_t len
)
478 return git_blob_create_from_buffer(id
, repo
, buffer
, len
);
481 int git_blob_create_fromworkdir(git_oid
*id
, git_repository
*repo
, const char *relative_path
)
483 return git_blob_create_from_workdir(id
, repo
, relative_path
);
486 int git_blob_create_fromdisk(git_oid
*id
, git_repository
*repo
, const char *path
)
488 return git_blob_create_from_disk(id
, repo
, path
);
491 int git_blob_create_fromstream(
492 git_writestream
**out
,
493 git_repository
*repo
,
494 const char *hintpath
)
496 return git_blob_create_from_stream(out
, repo
, hintpath
);
499 int git_blob_create_fromstream_commit(
501 git_writestream
*stream
)
503 return git_blob_create_from_stream_commit(out
, stream
);
506 int git_blob_filtered_content(
510 int check_for_binary_data
)
512 git_blob_filter_options opts
= GIT_BLOB_FILTER_OPTIONS_INIT
;
514 if (check_for_binary_data
)
515 opts
.flags
|= GIT_BLOB_FILTER_CHECK_FOR_BINARY
;
517 opts
.flags
&= ~GIT_BLOB_FILTER_CHECK_FOR_BINARY
;
519 return git_blob_filter(out
, blob
, path
, &opts
);