2 * Bucket -> Object converter
4 * (c) 2004, Robert Spalek <robert@ucw.cz>
8 #include "lib/unaligned.h"
10 #include "lib/fastbuf.h"
11 #include "charset/unicode.h"
12 #include "lib/object.h"
13 #include "lib/bucket.h"
14 #include "lib/lizard.h"
15 #include "lib/buck2obj.h"
/* Constant slack added to the raw buffer size on top of the scaled maximum object length. */
21 #define MAX_HEADER_SIZE 1024 // extra space for the header not counted in MaxObjSize
/* Sets errno to num and makes the enclosing function return NULL.
 * Uses the GNU statement-expression extension ({ ... }); intended for
 * functions whose failure value is NULL. */
22 #define RET_ERR(num) ({ errno = num; return NULL; })
/* NOTE(review): accessed below as buf->lizard, so this looks like a member of
 * struct buck2obj_buf -- the enclosing declaration is not visible here. */
28 struct lizard_buffer *lizard;
/*
 * Set up the raw buffer of buf for objects of up to max_len bytes.
 * Stores max_len, derives raw_len from it and allocates raw_len bytes
 * with xmalloc().
 * NOTE(review): no release of a previous buf->raw is visible here; callers
 * that re-run this on a live buffer should be checked for a leak.
 */
33 buck2obj_alloc_internal(struct buck2obj_buf *buf, uns max_len)
35 buf->max_len = max_len;
// raw_len = max_len scaled by LIZARD_MAX_MULTIPLY, plus LIZARD_MAX_ADD, plus header slack.
// The two LIZARD_* constants are defined elsewhere (presumably the size bounds
// of the lizard compressor -- confirm against lib/lizard.h).
42 buf->raw_len = max_len * LIZARD_MAX_MULTIPLY + LIZARD_MAX_ADD + MAX_HEADER_SIZE;
43 buf->raw = xmalloc(buf->raw_len);
/*
 * Create a new bucket-to-object conversion buffer.
 * The structure itself is allocated with xmalloc(). Its raw buffer starts at
 * the minimum size (max_len 0, i.e. only LIZARD_MAX_ADD + MAX_HEADER_SIZE bytes)
 * and is enlarged on demand through buck2obj_realloc(). A lizard buffer is
 * obtained from lizard_alloc(0).
 * NOTE(review): obj_read_bucket() reads buf->mp, so mp is presumably stored in
 * the buffer on a line not shown here -- confirm.
 */
47 buck2obj_alloc(struct mempool *mp)
49 struct buck2obj_buf *buf = xmalloc(sizeof(struct buck2obj_buf));
// max_len of 0: the raw buffer holds just the constant part of raw_len.
50 buck2obj_alloc_internal(buf, 0);
51 buf->lizard = lizard_alloc(0);
/*
 * Release a buffer created by buck2obj_alloc().
 * Frees the attached lizard buffer with lizard_free().
 * NOTE(review): buf->raw and buf itself come from xmalloc(); confirm that
 * they are released here as well.
 */
57 buck2obj_free(struct buck2obj_buf *buf)
59 lizard_free(buf->lizard);
/*
 * Enlarge the raw buffer so that it can hold objects of up to max_len bytes.
 * A request that does not exceed the current buf->max_len is detected first;
 * otherwise the new capacity is at least twice the old one.
 */
66 buck2obj_realloc(struct buck2obj_buf *buf, uns max_len)
// Current capacity already suffices (presumably an early return -- confirm).
68 if (max_len <= buf->max_len)
// Growing by at least a factor of two bounds the number of reallocations
// logarithmically in the final size (once max_len is non-zero).
70 if (max_len < 2*buf->max_len) // to ensure amortized logarithmic complexity
71 max_len = 2*buf->max_len;
// NOTE(review): buck2obj_alloc_internal() overwrites buf->raw; confirm the
// old block is freed before this call.
74 buck2obj_alloc_internal(buf, max_len);
/*
 * Decode the attributes found between ptr and end and add them to object o.
 * can_overwrite selects how each attribute value is handed over:
 *   >= 2  the value is referenced in place through obj_add_attr_ref()
 *   == 1  the value is passed to obj_add_attr()
 *   else  the value is first copied into o->pool and the copy is referenced
 * obj_read_bucket() assigns the result back to its read pointer.
 * NOTE(review): the difference between obj_add_attr() and obj_add_attr_ref()
 * (copy vs. keep the pointer) is assumed from their names -- confirm against
 * lib/object.h.
 */
78 decode_attributes(byte *ptr, byte *end, struct odes *o, uns can_overwrite)
80 if (can_overwrite >= 2)
90 obj_add_attr_ref(o, type, ptr);
94 else if (can_overwrite == 1)
// The type byte is read from just past the len bytes of the value.
101 byte type = ptr[len];
104 obj_add_attr(o, type, ptr);
116 byte type = ptr[len];
// Room for len bytes plus one extra byte (presumably a terminator written
// on a line not shown here); only len bytes are copied by the memcpy below.
118 byte *dup = mp_alloc_fast_noalign(o->pool, len+1);
119 memcpy(dup, ptr, len);
121 obj_add_attr_ref(o, type, dup);
/*
 * Read one bucket from the fastbuf body and convert it into an object created
 * with obj_new(buf->mp).
 * buck_type selects the format:
 *   - types below BUCKET_TYPE_V33 are read by obj_read_multi() when want_body
 *     is set (the other branch is not shown here);
 *   - BUCKET_TYPE_V33 and BUCKET_TYPE_V33_LIZARD are fetched into a single
 *     buffer and decoded by decode_attributes(); for the LIZARD type the part
 *     after the header is decompressed through buf->lizard first.
 * NOTE(review): failures are presumably reported as NULL with errno set (see
 * RET_ERR); the return statements are not visible here.
 */
129 obj_read_bucket(struct buck2obj_buf *buf, uns buck_type, struct fastbuf *body, uns want_body)
131 struct odes *o = obj_new(buf->mp);
133 if (buck_type < BUCKET_TYPE_V33)
135 if (want_body) // ignore empty lines, read until EOF
136 obj_read_multi(body, o);
137 else // end on EOF or the first empty line
142 /* Compute the length of the bucket. We cannot fetch this attribute
143 * directly due to remote indexing. */
144 bseek(body, 0, SEEK_END);
145 sh_off_t buck_len = btell(body);
148 /* Read all the bucket into 1 buffer, 0-copy if possible. */
149 int can_overwrite = bconfig(body, BCONFIG_CAN_OVERWRITE, 0);
// A negative bconfig() result gets special handling (presumably treated as
// "cannot overwrite" -- confirm).
150 if (can_overwrite < 0)
154 uns len = bdirect_read_prepare(body, &ptr);
156 || (can_overwrite < 2 && buck_type == BUCKET_TYPE_V33))
158 /* Copy if the original buffer is too small.
159 * If it is write-protected, copy it also if it is uncompressed. */
// NOTE(review): buck_len is sh_off_t but is compared with, and passed as,
// an uns; verify that oversized buckets are rejected before this point.
160 if (buck_len > buf->raw_len)
161 buck2obj_realloc(buf, buck_len);
162 len = bread(body, buf->raw, buck_len);
// Remember whether the source buffer may be modified in place by decoding.
168 overwritten = can_overwrite > 1;
171 ptr = decode_attributes(ptr, end, o, can_overwrite);// header
174 if (buck_type == BUCKET_TYPE_V33)
176 else if (buck_type == BUCKET_TYPE_V33_LIZARD) // decompression
// The decompressor's result is checked against the expected length len.
182 res = lizard_decompress_safe(ptr, buf->lizard, len);
183 if (res != (int) len)
// EFBIG: enlarge the lizard buffer to len (presumably followed by a retry).
187 else if (errno == EFBIG)
189 lizard_realloc(buf->lizard, len);
// Decoding of the body continues from the decompressed data.
195 ptr = buf->lizard->ptr;
199 else // unknown bucket type
201 ASSERT(can_overwrite == 2); // because of the policy and decompression
202 ptr = decode_attributes(ptr, end, o, 2); // body
206 /* If (overwritten), bflush(body) might be needed. */