2 * Copyright (c) 2011, Google Inc.
6 #include "repository.h"
7 #include "object-store.h"
8 #include "replace-object.h"
18 typedef int (*open_istream_fn
)(struct git_istream
*,
20 const struct object_id
*,
22 typedef int (*close_istream_fn
)(struct git_istream
*);
23 typedef ssize_t (*read_istream_fn
)(struct git_istream
*, char *, size_t);
26 close_istream_fn close
;
30 #define open_method_decl(name) \
31 int open_istream_ ##name \
32 (struct git_istream *st, struct object_info *oi, \
33 const struct object_id *oid, \
34 enum object_type *type)
36 #define close_method_decl(name) \
37 int close_istream_ ##name \
38 (struct git_istream *st)
40 #define read_method_decl(name) \
41 ssize_t read_istream_ ##name \
42 (struct git_istream *st, char *buf, size_t sz)
44 /* forward declaration */
45 static open_method_decl(incore
);
46 static open_method_decl(loose
);
47 static open_method_decl(pack_non_delta
);
48 static struct git_istream
*attach_stream_filter(struct git_istream
*st
,
49 struct stream_filter
*filter
);
52 static open_istream_fn open_istream_tbl
[] = {
55 open_istream_pack_non_delta
,
58 #define FILTER_BUFFER (1024*16)
60 struct filtered_istream
{
61 struct git_istream
*upstream
;
62 struct stream_filter
*filter
;
63 char ibuf
[FILTER_BUFFER
];
64 char obuf
[FILTER_BUFFER
];
71 const struct stream_vtbl
*vtbl
;
72 unsigned long size
; /* inflated size of full object */
74 enum { z_unused
, z_used
, z_done
, z_error
} z_state
;
78 char *buf
; /* from read_object() */
79 unsigned long read_ptr
;
84 unsigned long mapsize
;
91 struct packed_git
*pack
;
95 struct filtered_istream filtered
;
99 int close_istream(struct git_istream
*st
)
101 int r
= st
->vtbl
->close(st
);
106 ssize_t
read_istream(struct git_istream
*st
, void *buf
, size_t sz
)
108 return st
->vtbl
->read(st
, buf
, sz
);
111 static enum input_source
istream_source(const struct object_id
*oid
,
112 enum object_type
*type
,
113 struct object_info
*oi
)
120 status
= oid_object_info_extended(the_repository
, oid
, oi
, 0);
124 switch (oi
->whence
) {
128 if (!oi
->u
.packed
.is_delta
&& big_file_threshold
< size
)
129 return pack_non_delta
;
136 struct git_istream
*open_istream(const struct object_id
*oid
,
137 enum object_type
*type
,
139 struct stream_filter
*filter
)
141 struct git_istream
*st
;
142 struct object_info oi
= OBJECT_INFO_INIT
;
143 const struct object_id
*real
= lookup_replace_object(the_repository
, oid
);
144 enum input_source src
= istream_source(real
, type
, &oi
);
149 st
= xmalloc(sizeof(*st
));
150 if (open_istream_tbl
[src
](st
, &oi
, real
, type
)) {
151 if (open_istream_incore(st
, &oi
, real
, type
)) {
157 /* Add "&& !is_null_stream_filter(filter)" for performance */
158 struct git_istream
*nst
= attach_stream_filter(st
, filter
);
171 /*****************************************************************
175 *****************************************************************/
177 static void close_deflated_stream(struct git_istream
*st
)
179 if (st
->z_state
== z_used
)
180 git_inflate_end(&st
->z
);
184 /*****************************************************************
188 *****************************************************************/
190 static close_method_decl(filtered
)
192 free_stream_filter(st
->u
.filtered
.filter
);
193 return close_istream(st
->u
.filtered
.upstream
);
196 static read_method_decl(filtered
)
198 struct filtered_istream
*fs
= &(st
->u
.filtered
);
202 /* do we already have filtered output? */
203 if (fs
->o_ptr
< fs
->o_end
) {
204 size_t to_move
= fs
->o_end
- fs
->o_ptr
;
207 memcpy(buf
+ filled
, fs
->obuf
+ fs
->o_ptr
, to_move
);
208 fs
->o_ptr
+= to_move
;
213 fs
->o_end
= fs
->o_ptr
= 0;
215 /* do we have anything to feed the filter with? */
216 if (fs
->i_ptr
< fs
->i_end
) {
217 size_t to_feed
= fs
->i_end
- fs
->i_ptr
;
218 size_t to_receive
= FILTER_BUFFER
;
219 if (stream_filter(fs
->filter
,
220 fs
->ibuf
+ fs
->i_ptr
, &to_feed
,
221 fs
->obuf
, &to_receive
))
223 fs
->i_ptr
= fs
->i_end
- to_feed
;
224 fs
->o_end
= FILTER_BUFFER
- to_receive
;
228 /* tell the filter to drain upon no more input */
229 if (fs
->input_finished
) {
230 size_t to_receive
= FILTER_BUFFER
;
231 if (stream_filter(fs
->filter
,
233 fs
->obuf
, &to_receive
))
235 fs
->o_end
= FILTER_BUFFER
- to_receive
;
240 fs
->i_end
= fs
->i_ptr
= 0;
242 /* refill the input from the upstream */
243 if (!fs
->input_finished
) {
244 fs
->i_end
= read_istream(fs
->upstream
, fs
->ibuf
, FILTER_BUFFER
);
250 fs
->input_finished
= 1;
255 static struct stream_vtbl filtered_vtbl
= {
256 close_istream_filtered
,
257 read_istream_filtered
,
260 static struct git_istream
*attach_stream_filter(struct git_istream
*st
,
261 struct stream_filter
*filter
)
263 struct git_istream
*ifs
= xmalloc(sizeof(*ifs
));
264 struct filtered_istream
*fs
= &(ifs
->u
.filtered
);
266 ifs
->vtbl
= &filtered_vtbl
;
269 fs
->i_end
= fs
->i_ptr
= 0;
270 fs
->o_end
= fs
->o_ptr
= 0;
271 fs
->input_finished
= 0;
272 ifs
->size
= -1; /* unknown */
276 /*****************************************************************
278 * Loose object stream
280 *****************************************************************/
282 static read_method_decl(loose
)
284 size_t total_read
= 0;
286 switch (st
->z_state
) {
295 if (st
->u
.loose
.hdr_used
< st
->u
.loose
.hdr_avail
) {
296 size_t to_copy
= st
->u
.loose
.hdr_avail
- st
->u
.loose
.hdr_used
;
299 memcpy(buf
, st
->u
.loose
.hdr
+ st
->u
.loose
.hdr_used
, to_copy
);
300 st
->u
.loose
.hdr_used
+= to_copy
;
301 total_read
+= to_copy
;
304 while (total_read
< sz
) {
307 st
->z
.next_out
= (unsigned char *)buf
+ total_read
;
308 st
->z
.avail_out
= sz
- total_read
;
309 status
= git_inflate(&st
->z
, Z_FINISH
);
311 total_read
= st
->z
.next_out
- (unsigned char *)buf
;
313 if (status
== Z_STREAM_END
) {
314 git_inflate_end(&st
->z
);
315 st
->z_state
= z_done
;
318 if (status
!= Z_OK
&& (status
!= Z_BUF_ERROR
|| total_read
< sz
)) {
319 git_inflate_end(&st
->z
);
320 st
->z_state
= z_error
;
327 static close_method_decl(loose
)
329 close_deflated_stream(st
);
330 munmap(st
->u
.loose
.mapped
, st
->u
.loose
.mapsize
);
334 static struct stream_vtbl loose_vtbl
= {
339 static open_method_decl(loose
)
341 st
->u
.loose
.mapped
= map_sha1_file(the_repository
,
342 oid
->hash
, &st
->u
.loose
.mapsize
);
343 if (!st
->u
.loose
.mapped
)
345 if ((unpack_sha1_header(&st
->z
,
349 sizeof(st
->u
.loose
.hdr
)) < 0) ||
350 (parse_sha1_header(st
->u
.loose
.hdr
, &st
->size
) < 0)) {
351 git_inflate_end(&st
->z
);
352 munmap(st
->u
.loose
.mapped
, st
->u
.loose
.mapsize
);
356 st
->u
.loose
.hdr_used
= strlen(st
->u
.loose
.hdr
) + 1;
357 st
->u
.loose
.hdr_avail
= st
->z
.total_out
;
358 st
->z_state
= z_used
;
360 st
->vtbl
= &loose_vtbl
;
365 /*****************************************************************
367 * Non-delta packed object stream
369 *****************************************************************/
371 static read_method_decl(pack_non_delta
)
373 size_t total_read
= 0;
375 switch (st
->z_state
) {
377 memset(&st
->z
, 0, sizeof(st
->z
));
378 git_inflate_init(&st
->z
);
379 st
->z_state
= z_used
;
389 while (total_read
< sz
) {
391 struct pack_window
*window
= NULL
;
392 unsigned char *mapped
;
394 mapped
= use_pack(st
->u
.in_pack
.pack
, &window
,
395 st
->u
.in_pack
.pos
, &st
->z
.avail_in
);
397 st
->z
.next_out
= (unsigned char *)buf
+ total_read
;
398 st
->z
.avail_out
= sz
- total_read
;
399 st
->z
.next_in
= mapped
;
400 status
= git_inflate(&st
->z
, Z_FINISH
);
402 st
->u
.in_pack
.pos
+= st
->z
.next_in
- mapped
;
403 total_read
= st
->z
.next_out
- (unsigned char *)buf
;
406 if (status
== Z_STREAM_END
) {
407 git_inflate_end(&st
->z
);
408 st
->z_state
= z_done
;
413 * Unlike the loose object case, we do not have to worry here
414 * about running out of input bytes and spinning infinitely. If
415 * we get Z_BUF_ERROR due to too few input bytes, then we'll
416 * replenish them in the next use_pack() call when we loop. If
417 * we truly hit the end of the pack (i.e., because it's corrupt
418 * or truncated), then use_pack() catches that and will die().
420 if (status
!= Z_OK
&& status
!= Z_BUF_ERROR
) {
421 git_inflate_end(&st
->z
);
422 st
->z_state
= z_error
;
429 static close_method_decl(pack_non_delta
)
431 close_deflated_stream(st
);
435 static struct stream_vtbl pack_non_delta_vtbl
= {
436 close_istream_pack_non_delta
,
437 read_istream_pack_non_delta
,
440 static open_method_decl(pack_non_delta
)
442 struct pack_window
*window
;
443 enum object_type in_pack_type
;
445 st
->u
.in_pack
.pack
= oi
->u
.packed
.pack
;
446 st
->u
.in_pack
.pos
= oi
->u
.packed
.offset
;
449 in_pack_type
= unpack_object_header(st
->u
.in_pack
.pack
,
454 switch (in_pack_type
) {
456 return -1; /* we do not do deltas for now */
463 st
->z_state
= z_unused
;
464 st
->vtbl
= &pack_non_delta_vtbl
;
469 /*****************************************************************
473 *****************************************************************/
475 static close_method_decl(incore
)
477 free(st
->u
.incore
.buf
);
481 static read_method_decl(incore
)
483 size_t read_size
= sz
;
484 size_t remainder
= st
->size
- st
->u
.incore
.read_ptr
;
486 if (remainder
<= read_size
)
487 read_size
= remainder
;
489 memcpy(buf
, st
->u
.incore
.buf
+ st
->u
.incore
.read_ptr
, read_size
);
490 st
->u
.incore
.read_ptr
+= read_size
;
495 static struct stream_vtbl incore_vtbl
= {
496 close_istream_incore
,
500 static open_method_decl(incore
)
502 st
->u
.incore
.buf
= read_object_file_extended(the_repository
, oid
, type
, &st
->size
, 0);
503 st
->u
.incore
.read_ptr
= 0;
504 st
->vtbl
= &incore_vtbl
;
506 return st
->u
.incore
.buf
? 0 : -1;
510 /****************************************************************
511 * Users of streaming interface
512 ****************************************************************/
514 int stream_blob_to_fd(int fd
, const struct object_id
*oid
, struct stream_filter
*filter
,
517 struct git_istream
*st
;
518 enum object_type type
;
523 st
= open_istream(oid
, &type
, &sz
, filter
);
526 free_stream_filter(filter
);
529 if (type
!= OBJ_BLOB
)
533 ssize_t wrote
, holeto
;
534 ssize_t readlen
= read_istream(st
, buf
, sizeof(buf
));
540 if (can_seek
&& sizeof(buf
) == readlen
) {
541 for (holeto
= 0; holeto
< readlen
; holeto
++)
544 if (readlen
== holeto
) {
550 if (kept
&& lseek(fd
, kept
, SEEK_CUR
) == (off_t
) -1)
554 wrote
= write_in_full(fd
, buf
, readlen
);
559 if (kept
&& (lseek(fd
, kept
- 1, SEEK_CUR
) == (off_t
) -1 ||
560 xwrite(fd
, "", 1) != 1))