/* * upb - a minimalist implementation of protocol buffers. * * Copyright (c) 2010 Joshua Haberman. See LICENSE for details. * * upb_sink is a general purpose interface for pushing the contents of a * protobuf from one component to another in a streaming fashion. We call the * component that calls a upb_sink a "source". By "pushing" we mean that the * source calls into the sink; the opposite (where a sink calls into the * source) is known as "pull". In the push model the source gets the main * loop; in a pull model the sink does. * * This interface is used as general-purpose glue in upb. For example, the * parser interface works by implementing a source. Likewise the serialization * simply implements a sink. Copying one protobuf to another is just a matter * of using one message as a source and another as a sink. * * In terms of efficiency, we would generally expect "push" to be faster if the * source had more state to track, and "pull" to be faster if the sink had more * state. The reason is that whoever has the main loop can keep state on the * stack (and possibly even in callee-save registers), whereas the the * component that is "called into" always needs to reload its state from * memory. * * In terms of programming complexity, it is easier and simpler to have the * main loop, because you can store state in local variables. * * So the assumption inherent in using the push model is that sources are * generally more complicated and stateful than consumers. For example, in the * parser case, it has to deal with malformed input and associated errors; in * comparison, the serializer deals with known-good input. */ #ifndef UPB_SINK_H #define UPB_SINK_H #include "upb_def.h" #ifdef __cplusplus extern "C" { #endif // Each of the upb_sink callbacks returns a status of this type. typedef enum { // The normal case, where the consumer wants to continue consuming. UPB_SINK_CONTINUE, // The sink did not consume this value, and wants to halt further processing. // If the source is resumable, it should save the current state so that when // resumed, the value that was just provided will be replayed. UPB_SINK_STOP, // The consumer wants to skip to the end of the current submessage and // continue consuming. If we are at the top-level, the rest of the // data is discarded. UPB_SINK_SKIP } upb_sink_status; typedef struct { struct upb_sink_callbacks *vtbl; } upb_sink; /* upb_sink callbacks *********************************************************/ // The value callback is called for a regular value (ie. not a string or // submessage). typedef upb_sink_status (*upb_value_cb)(upb_sink *s, upb_fielddef *f, upb_value val, upb_status *status); // The string callback is called for string data. "str" is the string in which // the data lives, but it may contain more data than the effective string. // "start" and "end" indicate the substring of "str" that is the effective // string. If "start" is <0, this string is a continuation of the previous // string for this field. If end > upb_strlen(str) then there is more data to // follow for this string. "end" can also be used as a hint for how much data // follows, but this is only a hint and is not guaranteed. // // The data is supplied this way to give you the opportunity to reference this // data instead of copying it (perhaps using upb_strslice), or to minimize // copying if it is unavoidable. typedef upb_sink_status (*upb_str_cb)(upb_sink *s, upb_fielddef *f, upb_strptr str, int32_t start, uint32_t end, upb_status *status); // The start and end callbacks are called when a submessage begins and ends, // respectively. The caller is responsible for ensuring that the nesting // level never exceeds UPB_MAX_NESTING. typedef upb_sink_status (*upb_start_cb)(upb_sink *s, upb_fielddef *f, upb_status *status); typedef upb_sink_status (*upb_end_cb)(upb_sink *s, upb_fielddef *f, upb_status *status); /* upb_sink implementation ****************************************************/ typedef struct upb_sink_callbacks { upb_value_cb value_cb; upb_str_cb str_cb; upb_start_cb start_cb; upb_end_cb end_cb; } upb_sink_callbacks; // These macros implement a mini virtual function dispatch for upb_sink instances. // This allows functions that call upb_sinks to just write: // // upb_sink_onvalue(sink, field, val); // // The macro will handle the virtual function lookup and dispatch. We could // potentially define these later to also be capable of calling a C++ virtual // method instead of doing the virtual dispatch manually. This would make it // possible to write C++ sinks in a more natural style without loss of // efficiency. We could have a flag in upb_sink defining whether it is a C // sink or a C++ one. #define upb_sink_onvalue(s, f, val, status) s->vtbl->value_cb(s, f, val, status) #define upb_sink_onstr(s, f, str, start, end, status) s->vtbl->str_cb(s, f, str, start, end, status) #define upb_sink_onstart(s, f, status) s->vtbl->start_cb(s, f, status) #define upb_sink_onend(s, f, status) s->vtbl->end_cb(s, f, status) // Initializes a plain C visitor with the given vtbl. The sink must have been // allocated separately. INLINE void upb_sink_init(upb_sink *s, upb_sink_callbacks *vtbl) { s->vtbl = vtbl; } /* upb_bytesink ***************************************************************/ // A upb_bytesink is like a upb_sync, but for bytes instead of structured // protobuf data. Parsers implement upb_bytesink and push to a upb_sink, // serializers do the opposite (implement upb_sink and push to upb_bytesink). // // The two simplest kinds of sinks are "write to string" and "write to FILE*". // A forward declaration solely for the benefit of declaring upb_byte_cb below. // Always prefer upb_bytesink (without the "struct" keyword) instead. struct _upb_bytesink; // The single bytesink callback; it takes the bytes to be written and returns // how many were successfully written. If the return value is <0, the caller // should stop processing. typedef int32_t (*upb_byte_cb)(struct _upb_bytesink *s, upb_strptr str, uint32_t start, uint32_t end, upb_status *status); typedef struct _upb_bytesink { upb_byte_cb *cb; } upb_bytesink; #ifdef __cplusplus } /* extern "C" */ #endif #endif