summaryrefslogtreecommitdiff
path: root/pbstream.c
diff options
context:
space:
mode:
authorJoshua Haberman <joshua@reverberate.org>2009-05-25 18:31:27 -0700
committerJoshua Haberman <joshua@reverberate.org>2009-05-25 18:31:27 -0700
commit0c80c384756a48d5f731eeafa62b6cd5f3861749 (patch)
treec723951c40b0dd7aea5ccd24e9b55fb0167ffb48 /pbstream.c
parentfdcefd68b17a62c7129e910351f5b323044f835d (diff)
A flurry of activity. Doesn't compile yet.
- a descriptor.c that describes the data structures in descriptor.proto using the data structures in descriptor.h. - everything renamed pbstream -> upb. - modularization rethought. - Doesn't compile yet, but should once things settle back down.
Diffstat (limited to 'pbstream.c')
-rw-r--r--pbstream.c403
1 files changed, 0 insertions, 403 deletions
diff --git a/pbstream.c b/pbstream.c
deleted file mode 100644
index b613e33..0000000
--- a/pbstream.c
+++ /dev/null
@@ -1,403 +0,0 @@
-/*
- * pbstream - a stream-oriented implementation of protocol buffers.
- *
- * Copyright (c) 2008-2009 Joshua Haberman. See LICENSE for details.
- */
-
-#include <assert.h>
-#include <stdlib.h>
-#include <string.h>
-#include "pbstream.h"
-#include "pbstream_lowlevel.h"
-
-/* Branch prediction hints for GCC. */
-#ifdef __GNUC__
-#define likely(x) __builtin_expect((x),1)
-#define unlikely(x) __builtin_expect((x),0)
-#else
-#define likely(x) (x)
-#define unlikely(x) (x)
-#endif
-
-#define CHECK(func) do { /* evaluate func once and bail out of the enclosing function on failure */ \
- pbstream_status_t status = func; \
- if(status != PBSTREAM_STATUS_OK) return status; /* this return leaves the function that used CHECK */ \
- } while (0)
-
-/* Lowest-level functions -- these read integers from the input buffer.
- * To avoid branches, none of these do bounds checking. So we force clients
- * to overallocate their buffers by >=9 bytes. */
-
-static pbstream_status_t get_v_uint64_t(uint8_t *restrict *buf,
- uint64_t *restrict val)
-{ /* Decodes one varint of at most ten bytes starting at *buf into *val. */
- uint8_t *ptr = *buf, b;
- uint32_t part0 = 0, part1 = 0, part2 = 0;
-
- /* From the original proto2 implementation: each byte contributes its low 7 bits and a clear 0x80 bit ends the varint; part0 and part1 collect 28 bits each, part2 the remainder. */
- b = *(ptr++); part0 = (b & 0x7F) ; if (!(b & 0x80)) goto done;
- b = *(ptr++); part0 |= (b & 0x7F) << 7; if (!(b & 0x80)) goto done;
- b = *(ptr++); part0 |= (b & 0x7F) << 14; if (!(b & 0x80)) goto done;
- b = *(ptr++); part0 |= (b & 0x7F) << 21; if (!(b & 0x80)) goto done;
- b = *(ptr++); part1 = (b & 0x7F) ; if (!(b & 0x80)) goto done;
- b = *(ptr++); part1 |= (b & 0x7F) << 7; if (!(b & 0x80)) goto done;
- b = *(ptr++); part1 |= (b & 0x7F) << 14; if (!(b & 0x80)) goto done;
- b = *(ptr++); part1 |= (b & 0x7F) << 21; if (!(b & 0x80)) goto done;
- b = *(ptr++); part2 = (b & 0x7F) ; if (!(b & 0x80)) goto done;
- b = *(ptr++); part2 |= (b & 0x7F) << 7; if (!(b & 0x80)) goto done;
- return PBSTREAM_ERROR_UNTERMINATED_VARINT; /* all ten bytes had the continuation bit set; *buf and *val are left untouched */
-
-done:
- *buf = ptr; /* advance the caller's pointer past the varint */
- *val = (uint64_t)part0 | ((uint64_t)part1 << 28) | ((uint64_t)part2 << 56);
- return PBSTREAM_STATUS_OK;
-}
-
-static pbstream_status_t skip_v_uint64_t(uint8_t **buf)
-{ /* Advances *buf past one varint of at most ten bytes without decoding its value. */
- uint8_t *ptr = *buf, b;
- b = *(ptr++); if (!(b & 0x80)) goto done; /* a clear 0x80 bit marks the final byte */
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- b = *(ptr++); if (!(b & 0x80)) goto done;
- return PBSTREAM_ERROR_UNTERMINATED_VARINT; /* ten continuation bytes in a row; *buf is left untouched */
-
-done:
- *buf = (uint8_t*)ptr; /* ptr is one past the final varint byte */
- return PBSTREAM_STATUS_OK;
-}
-
-static pbstream_status_t get_v_uint32_t(uint8_t *restrict *buf,
- uint32_t *restrict val)
-{ /* Decodes one varint of at most five bytes starting at *buf into *val. */
- uint8_t *ptr = *buf, b;
- uint32_t result;
-
- /* From the original proto2 implementation: each byte contributes its low 7 bits and a clear 0x80 bit ends the varint. */
- b = *(ptr++); result = (b & 0x7F) ; if (!(b & 0x80)) goto done;
- b = *(ptr++); result |= (b & 0x7F) << 7; if (!(b & 0x80)) goto done;
- b = *(ptr++); result |= (b & 0x7F) << 14; if (!(b & 0x80)) goto done;
- b = *(ptr++); result |= (b & 0x7F) << 21; if (!(b & 0x80)) goto done;
- b = *(ptr++); result |= (uint32_t)(b & 0x7F) << 28; if (!(b & 0x80)) goto done; /* OR into the low 28 bits rather than overwrite them; the cast keeps the shift unsigned, bits past 31 are dropped */
- return PBSTREAM_ERROR_UNTERMINATED_VARINT; /* five continuation bytes in a row; *buf and *val are left untouched */
-
-done:
- *buf = ptr; /* advance the caller's pointer past the varint */
- *val = result;
- return PBSTREAM_STATUS_OK;
-}
-
-static pbstream_status_t get_f_uint32_t(uint8_t *restrict *buf,
- uint32_t *restrict val)
-{ /* Reads a fixed 4-byte value, least-significant byte first, and advances *buf by 4. Always returns OK. */
- uint8_t *b = *buf;
-#define SHL(val, bits) ((uint32_t)val << bits)
- *val = SHL(b[0], 0) | SHL(b[1], 8) | SHL(b[2], 16) | SHL(b[3], 24); /* byte-wise assembly, independent of host endianness */
-#undef SHL
- *buf += sizeof(uint32_t);
- return PBSTREAM_STATUS_OK;
-}
-
-static pbstream_status_t skip_f_uint32_t(uint8_t **buf)
-{ /* Advances *buf past a fixed 4-byte value without reading it. Always returns OK. */
- *buf += sizeof(uint32_t);
- return PBSTREAM_STATUS_OK;
-}
-
-static pbstream_status_t get_f_uint64_t(uint8_t *restrict *buf,
- uint64_t *restrict val)
-{ /* Reads a fixed 8-byte value, least-significant byte first, and advances *buf by 8. Always returns OK. */
- uint8_t *b = *buf;
- /* TODO: is this worth 32/64 specializing? */
-#define SHL(val, bits) ((uint64_t)val << bits)
- *val = SHL(b[0], 0) | SHL(b[1], 8) | SHL(b[2], 16) | SHL(b[3], 24) |
- SHL(b[4], 32) | SHL(b[5], 40) | SHL(b[6], 48) | SHL(b[7], 56); /* byte-wise assembly, independent of host endianness */
-#undef SHL
- *buf += sizeof(uint64_t);
- return PBSTREAM_STATUS_OK;
-}
-
-static pbstream_status_t skip_f_uint64_t(uint8_t **buf)
-{ /* Advances *buf past a fixed 8-byte value without reading it. Always returns OK. */
- *buf += sizeof(uint64_t);
- return PBSTREAM_STATUS_OK;
-}
-
-static int32_t zz_decode_32(uint32_t n) { return (n >> 1) ^ -(int32_t)(n & 1); } /* zigzag decode: 0->0, 1->-1, 2->1, 3->-2, ... (low bit selects the sign) */
-static int64_t zz_decode_64(uint64_t n) { return (n >> 1) ^ -(int64_t)(n & 1); } /* same mapping for 64-bit values */
-
-/* Functions for reading wire values and converting them to values. These
- * are generated with macros because they follow a highly consistent pattern. */
-
-#define WVTOV(type, wire_t, val_t) /* signature of the wire-value -> value converter for one field type */ \
- static void wvtov_ ## type(wire_t s, val_t *d)
-
-#define GET(type, v_or_f, wire_t, val_t, member_name) /* defines get_<type>: read a wire value, convert it, advance s->offset */ \
- static pbstream_status_t get_ ## type(struct pbstream_parse_state *s, \
- uint8_t *buf, \
- struct pbstream_tagged_value *d) { \
- wire_t tmp; \
- uint8_t *b = buf; \
- CHECK(get_ ## v_or_f ## _ ## wire_t(&b, &tmp)); /* v_or_f picks the varint ("v") or fixed-width ("f") reader */ \
- wvtov_ ## type(tmp, &d->v.member_name); \
- s->offset += (b-buf); /* number of bytes the reader consumed */ \
- return PBSTREAM_STATUS_OK; \
- }
-
-#define T(type, v_or_f, wire_t, val_t, member_name) /* expands to prototype + getter + converter header; the braces after each T(...) use are the converter body */ \
- WVTOV(type, wire_t, val_t); /* prototype for GET below */ \
- GET(type, v_or_f, wire_t, val_t, member_name) \
- WVTOV(type, wire_t, val_t)
-
-T(DOUBLE, f, uint64_t, double, _double) { memcpy(d, &s, sizeof(double)); } /* copies the raw bits; no numeric conversion */
-T(FLOAT, f, uint32_t, float, _float) { memcpy(d, &s, sizeof(float)); } /* copies the raw bits; no numeric conversion */
-T(INT32, v, uint32_t, int32_t, int32) { *d = (int32_t)s; }
-T(INT64, v, uint64_t, int64_t, int64) { *d = (int64_t)s; }
-T(UINT32, v, uint32_t, uint32_t, uint32) { *d = s; }
-T(UINT64, v, uint64_t, uint64_t, uint64) { *d = s; }
-T(SINT32, v, uint32_t, int32_t, int32) { *d = zz_decode_32(s); }
-T(SINT64, v, uint64_t, int64_t, int64) { *d = zz_decode_64(s); }
-T(FIXED32, f, uint32_t, uint32_t, uint32) { *d = s; }
-T(FIXED64, f, uint64_t, uint64_t, uint64) { *d = s; }
-T(SFIXED32, f, uint32_t, int32_t, int32) { *d = (int32_t)s; }
-T(SFIXED64, f, uint64_t, int64_t, int64) { *d = (int64_t)s; }
-T(BOOL, v, uint32_t, bool, _bool) { *d = (bool)s; }
-T(ENUM, v, uint32_t, int32_t, int32) { *d = (int32_t)s; }
-#undef WVTOV
-#undef GET
-#undef T
-
-static void wvtov_delimited(uint32_t s, struct pbstream_delimited *d, size_t o)
-{ /* Records a delimited region in *d: s is its length, o the stream offset where it starts. */
- d->offset = o;
- d->len = s;
-}
-
-/* Use BYTES version for both STRING and BYTES, leave UTF-8 checks to client. */
-static pbstream_status_t get_BYTES(struct pbstream_parse_state *s, uint8_t *buf,
- struct pbstream_tagged_value *d) { /* Reads the length prefix at buf, records offset/len in d->v.delimited, and moves s->offset past the payload. */
- uint32_t tmp;
- uint8_t *b = buf;
- CHECK(get_v_uint32_t(&b, &tmp));
- s->offset += (b-buf); /* advance past length varint. */
- wvtov_delimited(tmp, &d->v.delimited, s->offset); /* the recorded offset is the first payload byte */
- size_t new_offset = s->offset + d->v.delimited.len; /* skip bytes */
- if (unlikely(new_offset < s->offset)) return PBSTREAM_ERROR_OVERFLOW; /* size_t addition wrapped around */
- s->offset = new_offset;
- return PBSTREAM_STATUS_OK;
-}
-
-static pbstream_status_t get_MESSAGE(struct pbstream_parse_state *s, uint8_t *buf,
- struct pbstream_tagged_value *d) { /* Reads a sub-message length prefix and pushes a stack frame covering the sub-message. */
- /* We're entering a sub-message. */
- uint32_t tmp;
- uint8_t *b = buf;
- CHECK(get_v_uint32_t(&b, &tmp));
- s->offset += (b-buf); /* advance past length varint. */
- wvtov_delimited(tmp, &d->v.delimited, s->offset);
- /* Unlike STRING and BYTES, we *don't* advance past delimited here. */
- if (unlikely(++s->top == s->limit)) return PBSTREAM_ERROR_STACK_OVERFLOW; /* note: s->top stays incremented on this error path */
- s->top->fieldset = d->field->fieldset; /* d->field must already be set; pbstream_parse_field assigns it before dispatching here */
- s->top->end_offset = d->v.delimited.offset + d->v.delimited.len;
- if (unlikely(s->top->end_offset < s->offset)) return PBSTREAM_ERROR_OVERFLOW; /* size_t addition wrapped; the frame has already been pushed */
- return PBSTREAM_STATUS_OK;
-}
-
-struct pbstream_type_info { /* per-field-type parsing info */
- pbstream_wire_type_t expected_wire_type; /* a tag with any other wire type is reported as MISMATCHED_TYPE by pbstream_parse_field */
- pbstream_status_t (*get)(struct pbstream_parse_state *s, uint8_t *buf,
- struct pbstream_tagged_value *d); /* reads the value that follows the tag */
-};
-static struct pbstream_type_info type_info[] = { /* indexed by fd->type; NOTE(review): entry order presumably mirrors the field type enum in pbstream.h -- confirm */
- {PBSTREAM_WIRE_TYPE_64BIT, get_DOUBLE},
- {PBSTREAM_WIRE_TYPE_32BIT, get_FLOAT},
- {PBSTREAM_WIRE_TYPE_VARINT, get_INT32},
- {PBSTREAM_WIRE_TYPE_VARINT, get_INT64},
- {PBSTREAM_WIRE_TYPE_VARINT, get_UINT32},
- {PBSTREAM_WIRE_TYPE_VARINT, get_UINT64},
- {PBSTREAM_WIRE_TYPE_VARINT, get_SINT32},
- {PBSTREAM_WIRE_TYPE_VARINT, get_SINT64},
- {PBSTREAM_WIRE_TYPE_32BIT, get_FIXED32},
- {PBSTREAM_WIRE_TYPE_64BIT, get_FIXED64},
- {PBSTREAM_WIRE_TYPE_32BIT, get_SFIXED32},
- {PBSTREAM_WIRE_TYPE_64BIT, get_SFIXED64},
- {PBSTREAM_WIRE_TYPE_VARINT, get_BOOL},
- {PBSTREAM_WIRE_TYPE_DELIMITED, get_BYTES}, /* STRING and BYTES share get_BYTES; which of these two rows is which is not visible here */
- {PBSTREAM_WIRE_TYPE_DELIMITED, get_BYTES},
- {PBSTREAM_WIRE_TYPE_VARINT, get_ENUM},
- {PBSTREAM_WIRE_TYPE_DELIMITED, get_MESSAGE}
-};
-
-pbstream_status_t parse_tag(uint8_t **buf, struct pbstream_tag *tag)
-{ /* Reads one varint tag at *buf, advances *buf past it, and splits it into wire type and field number. */
- uint32_t tag_int;
- CHECK(get_v_uint32_t(buf, &tag_int));
- tag->wire_type = (pbstream_wire_type_t)(tag_int & 0x07); /* low three bits */
- tag->field_number = tag_int >> 3; /* remaining high bits */
- return PBSTREAM_STATUS_OK;
-}
-
-pbstream_status_t parse_wire_value(uint8_t *buf, size_t *offset,
- pbstream_wire_type_t wt,
- union pbstream_wire_value *wv)
-{ /* Reads one value of wire type wt starting at buf into *wv and advances *offset past it; group wire types are rejected. */
-#define READ(expr) CHECK(expr); *offset += (b-buf)
- uint8_t *b = buf;
- switch(wt) {
- case PBSTREAM_WIRE_TYPE_VARINT:
- READ(get_v_uint64_t(&b, &wv->varint)); break;
- case PBSTREAM_WIRE_TYPE_64BIT:
- READ(get_f_uint64_t(&b, &wv->_64bit)); break;
- case PBSTREAM_WIRE_TYPE_32BIT:
- READ(get_f_uint32_t(&b, &wv->_32bit)); break;
- case PBSTREAM_WIRE_TYPE_DELIMITED:
- wv->delimited.offset = *offset; /* NOTE(review): recorded before the length varint is consumed, whereas get_BYTES records the payload start -- confirm which is intended */
- READ(get_v_uint32_t(&b, &wv->delimited.len));
- size_t new_offset = *offset + wv->delimited.len; /* *offset is already past the length varint here */
- if (new_offset < *offset) return PBSTREAM_ERROR_OVERFLOW; /* size_t addition wrapped around */
- *offset = new_offset; /* assign, not add: new_offset already includes the current offset */
- break;
- case PBSTREAM_WIRE_TYPE_START_GROUP:
- case PBSTREAM_WIRE_TYPE_END_GROUP:
- return PBSTREAM_ERROR_GROUP; /* deprecated, no plans to support. */
- } /* a wire type value matching none of the cases falls through and reports OK without consuming input */
- return PBSTREAM_STATUS_OK;
-}
-
-pbstream_status_t skip_wire_value(uint8_t *buf, size_t *offset,
- pbstream_wire_type_t wt)
-{ /* Advances *offset past one value of wire type wt starting at buf without storing it; group wire types are rejected. */
- uint8_t *b = buf;
- switch(wt) {
- case PBSTREAM_WIRE_TYPE_VARINT:
- READ(skip_v_uint64_t(&b)); break;
- case PBSTREAM_WIRE_TYPE_64BIT:
- READ(skip_f_uint64_t(&b)); break;
- case PBSTREAM_WIRE_TYPE_32BIT:
- READ(skip_f_uint32_t(&b)); break;
- case PBSTREAM_WIRE_TYPE_DELIMITED: {
- /* Have to get (not skip) the length to skip the bytes. */
- uint32_t len;
- READ(get_v_uint32_t(&b, &len));
- size_t new_offset = *offset + len; /* *offset is already past the length varint here */
- if (new_offset < *offset) return PBSTREAM_ERROR_OVERFLOW; /* size_t addition wrapped around */
- *offset = new_offset; /* assign, not add: new_offset already includes the current offset */
- break;
- }
- case PBSTREAM_WIRE_TYPE_START_GROUP:
- case PBSTREAM_WIRE_TYPE_END_GROUP:
- return PBSTREAM_ERROR_GROUP; /* deprecated, no plans to support. */
- } /* a wire type value matching none of the cases falls through and reports OK without consuming input */
- return PBSTREAM_STATUS_OK;
-#undef READ
-}
-
-struct pbstream_field *pbstream_find_field(struct pbstream_fieldset* fs,
- pbstream_field_number_t num)
-{ /* Returns the field registered under number num in fs, or NULL when there is none. */
- /* TODO: the hashtable part. Until then, numbers outside 1..array_size (including 0 from a malformed tag) are reported as unknown instead of indexing past the array. */
- return (num >= 1 && num <= fs->array_size) ? fs->array[num-1] : NULL;
-}
-
-/* Parses and processes the next value from buf. */
-pbstream_status_t pbstream_parse_field(struct pbstream_parse_state *s,
- uint8_t *buf,
- pbstream_field_number_t *fieldnum,
- struct pbstream_tagged_value *val,
- struct pbstream_tagged_wire_value *wv)
-{ /* On OK, *fieldnum and *val describe the parsed field; on UNKNOWN_VALUE or MISMATCHED_TYPE, *wv holds the raw wire value instead. */
- /* Check for end-of-message at the current stack depth. */
- if(unlikely(s->offset >= s->top->end_offset)) {
- /* If the end offset isn't an exact field boundary, the pb is corrupt. */
- if(unlikely(s->offset != s->top->end_offset))
- return PBSTREAM_ERROR_BAD_SUBMESSAGE_END;
- s->top--; /* pop the finished sub-message's frame */
- return PBSTREAM_STATUS_SUBMESSAGE_END;
- }
-
- struct pbstream_tag tag;
- uint8_t *b = buf;
- CHECK(parse_tag(&b, &tag));
- s->offset += (b-buf); /* account for the tag bytes; b now points at the value */
- struct pbstream_field *fd = pbstream_find_field(s->top->fieldset,
- tag.field_number);
- pbstream_status_t unknown_value_status;
- if(unlikely(!fd)) {
- unknown_value_status = PBSTREAM_ERROR_UNKNOWN_VALUE;
- goto unknown_value;
- }
- struct pbstream_type_info *info = &type_info[fd->type];
- if(unlikely(tag.wire_type != info->expected_wire_type)) {
- unknown_value_status = PBSTREAM_ERROR_MISMATCHED_TYPE;
- goto unknown_value;
- }
-
- *fieldnum = tag.field_number;
- val->field = fd; /* get_MESSAGE reads val->field, so set it before dispatching */
- CHECK(info->get(s, b, val));
- return PBSTREAM_STATUS_OK;
-
-unknown_value:
- wv->type = tag.wire_type;
- CHECK(parse_wire_value(b, &s->offset, tag.wire_type, &wv->v)); /* start at b (after the tag), not buf, so the tag bytes are not re-read as the value */
- return unknown_value_status;
-}
-
-void pbstream_init_parser(
- struct pbstream_parse_state *state,
- struct pbstream_fieldset *toplevel_fieldset)
-{ /* Resets state to offset 0 with a single stack frame for the top-level message. */
- state->offset = 0;
- state->top = state->stack;
- state->limit = state->top + PBSTREAM_MAX_STACK; /* get_MESSAGE reports STACK_OVERFLOW when top reaches this */
- state->top->fieldset = toplevel_fieldset;
- state->top->end_offset = SIZE_MAX; /* keeps the end-of-message check in pbstream_parse_field from firing until offset reaches SIZE_MAX */
-}
-
-static int compare_fields(const void *f1, const void *f2)
-{ /* qsort comparator: orders struct pbstream_field elements by ascending field_number. */
- return ((struct pbstream_field*)f1)->field_number -
- ((struct pbstream_field*)f2)->field_number; /* the sign of the difference gives the order */
-}
-
-void pbstream_init_fieldset(struct pbstream_fieldset *fieldset,
- struct pbstream_field *fields,
- int num_fields)
-{ /* Sorts fields in place by number, copies them into fieldset, and builds the lookup array indexed by field_number-1. */
- qsort(fields, num_fields, sizeof(*fields), compare_fields);
-
- /* Find the largest n for which at least half the fieldnums <n are used.
- * Start at 8 to avoid noise of small numbers. */
- pbstream_field_number_t n = 0, maybe_n;
- for(int i = 0; i < num_fields; i++) {
- maybe_n = fields[i].field_number;
- if(maybe_n > 8 && maybe_n/(i+1) >= 2) break; /* stop once the array would be at most half full */
- n = maybe_n;
- }
-
- fieldset->num_fields = num_fields;
- fieldset->fields = malloc(sizeof(*fieldset->fields)*num_fields); /* NOTE(review): allocation results are used unchecked */
- memcpy(fieldset->fields, fields, sizeof(*fields)*num_fields);
-
- fieldset->array_size = n;
- fieldset->array = malloc(sizeof(*fieldset->array)*n);
- memset(fieldset->array, 0, sizeof(*fieldset->array)*n); /* unused slots stay NULL */
-
- for (int i = 0; i < num_fields && fields[i].field_number <= n; i++)
- fieldset->array[fields[i].field_number-1] = &fieldset->fields[i]; /* point into the fieldset's own copy, not the caller's array */
-
- /* Until we support the hashtable part... An empty fieldset has no last element to compare against. */
- assert(num_fields == 0 || n == fields[num_fields-1].field_number);
-}
-
-void pbstream_free_fieldset(struct pbstream_fieldset *fieldset)
-{ /* Releases the two buffers allocated by pbstream_init_fieldset; the fieldset struct itself is not freed. */
- free(fieldset->fields);
- free(fieldset->array);
-}
generated by cgit on debian on lair
contact matthew@masot.net with questions or feedback