pb_encode.c 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664
  1. /* pb_encode.c -- encode a protobuf using minimal resources
  2. *
  3. * 2011 Petteri Aimonen <jpa@kapsi.fi>
  4. */
  5. #include "pb.h"
  6. #include "pb_encode.h"
  7. #include "pb_common.h"
  /* Ask GCC (3.4.0 and newer) to warn whenever a return value is silently
   * dropped, so that failures are always propagated to the caller. Every other
   * compiler, and any older gcc, gets an empty annotation instead.
   */
  #if defined(__GNUC__) && ((__GNUC__ > 3) || (__GNUC__ == 3 && __GNUC_MINOR__ >= 4))
  #define checkreturn __attribute__((warn_unused_result))
  #else
  #define checkreturn
  #endif
  17. /**************************************
  18. * Declarations internal to this file *
  19. **************************************/
  20. typedef bool (*pb_encoder_t)(pb_ostream_t *stream, const pb_field_t *field, const void *src) checkreturn;
  21. static bool checkreturn buf_write(pb_ostream_t *stream, const uint8_t *buf, size_t count);
  22. static bool checkreturn encode_array(pb_ostream_t *stream, const pb_field_t *field, const void *pData, size_t count, pb_encoder_t func);
  23. static bool checkreturn encode_field(pb_ostream_t *stream, const pb_field_t *field, const void *pData);
  24. static bool checkreturn default_extension_encoder(pb_ostream_t *stream, const pb_extension_t *extension);
  25. static bool checkreturn encode_extension_field(pb_ostream_t *stream, const pb_field_t *field, const void *pData);
  26. static bool checkreturn pb_enc_varint(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  27. static bool checkreturn pb_enc_uvarint(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  28. static bool checkreturn pb_enc_svarint(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  29. static bool checkreturn pb_enc_fixed32(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  30. static bool checkreturn pb_enc_fixed64(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  31. static bool checkreturn pb_enc_bytes(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  32. static bool checkreturn pb_enc_string(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  33. static bool checkreturn pb_enc_submessage(pb_ostream_t *stream, const pb_field_t *field, const void *src);
  34. /* --- Function pointers to field encoders ---
  35. * Order in the array must match pb_action_t LTYPE numbering.
  36. */
  37. static const pb_encoder_t PB_ENCODERS[PB_LTYPES_COUNT] = {
  38. &pb_enc_varint,
  39. &pb_enc_uvarint,
  40. &pb_enc_svarint,
  41. &pb_enc_fixed32,
  42. &pb_enc_fixed64,
  43. &pb_enc_bytes,
  44. &pb_enc_string,
  45. &pb_enc_submessage,
  46. NULL /* extensions */
  47. };
  48. /*******************************
  49. * pb_ostream_t implementation *
  50. *******************************/
  51. static bool checkreturn buf_write(pb_ostream_t *stream, const uint8_t *buf, size_t count)
  52. {
  53. uint8_t *dest = (uint8_t*)stream->state;
  54. stream->state = dest + count;
  55. while (count--)
  56. *dest++ = *buf++;
  57. return true;
  58. }
  59. pb_ostream_t pb_ostream_from_buffer(uint8_t *buf, size_t bufsize)
  60. {
  61. pb_ostream_t stream;
  62. #ifdef PB_BUFFER_ONLY
  63. stream.callback = (void*)1; /* Just a marker value */
  64. #else
  65. stream.callback = &buf_write;
  66. #endif
  67. stream.state = buf;
  68. stream.max_size = bufsize;
  69. stream.bytes_written = 0;
  70. #ifndef PB_NO_ERRMSG
  71. stream.errmsg = NULL;
  72. #endif
  73. return stream;
  74. }
  75. bool checkreturn pb_write(pb_ostream_t *stream, const uint8_t *buf, size_t count)
  76. {
  77. if (stream->callback != NULL)
  78. {
  79. if (stream->bytes_written + count > stream->max_size)
  80. PB_RETURN_ERROR(stream, "stream full");
  81. #ifdef PB_BUFFER_ONLY
  82. if (!buf_write(stream, buf, count))
  83. PB_RETURN_ERROR(stream, "io error");
  84. #else
  85. if (!stream->callback(stream, buf, count))
  86. PB_RETURN_ERROR(stream, "io error");
  87. #endif
  88. }
  89. stream->bytes_written += count;
  90. return true;
  91. }
  92. /*************************
  93. * Encode a single field *
  94. *************************/
  95. /* Encode a static array. Handles the size calculations and possible packing. */
  96. static bool checkreturn encode_array(pb_ostream_t *stream, const pb_field_t *field,
  97. const void *pData, size_t count, pb_encoder_t func)
  98. {
  99. size_t i;
  100. const void *p;
  101. size_t size;
  102. if (count == 0)
  103. return true;
  104. if (PB_ATYPE(field->type) != PB_ATYPE_POINTER && count > field->array_size)
  105. PB_RETURN_ERROR(stream, "array max size exceeded");
  106. /* We always pack arrays if the datatype allows it. */
  107. if (PB_LTYPE(field->type) <= PB_LTYPE_LAST_PACKABLE)
  108. {
  109. if (!pb_encode_tag(stream, PB_WT_STRING, field->tag))
  110. return false;
  111. /* Determine the total size of packed array. */
  112. if (PB_LTYPE(field->type) == PB_LTYPE_FIXED32)
  113. {
  114. size = 4 * count;
  115. }
  116. else if (PB_LTYPE(field->type) == PB_LTYPE_FIXED64)
  117. {
  118. size = 8 * count;
  119. }
  120. else
  121. {
  122. pb_ostream_t sizestream = PB_OSTREAM_SIZING;
  123. p = pData;
  124. for (i = 0; i < count; i++)
  125. {
  126. if (!func(&sizestream, field, p))
  127. return false;
  128. p = (const char*)p + field->data_size;
  129. }
  130. size = sizestream.bytes_written;
  131. }
  132. if (!pb_encode_varint(stream, (uint64_t)size))
  133. return false;
  134. if (stream->callback == NULL)
  135. return pb_write(stream, NULL, size); /* Just sizing.. */
  136. /* Write the data */
  137. p = pData;
  138. for (i = 0; i < count; i++)
  139. {
  140. if (!func(stream, field, p))
  141. return false;
  142. p = (const char*)p + field->data_size;
  143. }
  144. }
  145. else
  146. {
  147. p = pData;
  148. for (i = 0; i < count; i++)
  149. {
  150. if (!pb_encode_tag_for_field(stream, field))
  151. return false;
  152. /* Normally the data is stored directly in the array entries, but
  153. * for pointer-type string and bytes fields, the array entries are
  154. * actually pointers themselves also. So we have to dereference once
  155. * more to get to the actual data. */
  156. if (PB_ATYPE(field->type) == PB_ATYPE_POINTER &&
  157. (PB_LTYPE(field->type) == PB_LTYPE_STRING ||
  158. PB_LTYPE(field->type) == PB_LTYPE_BYTES))
  159. {
  160. if (!func(stream, field, *(const void* const*)p))
  161. return false;
  162. }
  163. else
  164. {
  165. if (!func(stream, field, p))
  166. return false;
  167. }
  168. p = (const char*)p + field->data_size;
  169. }
  170. }
  171. return true;
  172. }
  173. /* Encode a field with static or pointer allocation, i.e. one whose data
  174. * is available to the encoder directly. */
  175. static bool checkreturn encode_basic_field(pb_ostream_t *stream,
  176. const pb_field_t *field, const void *pData)
  177. {
  178. pb_encoder_t func;
  179. const void *pSize;
  180. bool implicit_has = true;
  181. func = PB_ENCODERS[PB_LTYPE(field->type)];
  182. if (field->size_offset)
  183. pSize = (const char*)pData + field->size_offset;
  184. else
  185. pSize = &implicit_has;
  186. if (PB_ATYPE(field->type) == PB_ATYPE_POINTER)
  187. {
  188. /* pData is a pointer to the field, which contains pointer to
  189. * the data. If the 2nd pointer is NULL, it is interpreted as if
  190. * the has_field was false.
  191. */
  192. pData = *(const void* const*)pData;
  193. implicit_has = (pData != NULL);
  194. }
  195. switch (PB_HTYPE(field->type))
  196. {
  197. case PB_HTYPE_REQUIRED:
  198. if (!pData)
  199. PB_RETURN_ERROR(stream, "missing required field");
  200. if (!pb_encode_tag_for_field(stream, field))
  201. return false;
  202. if (!func(stream, field, pData))
  203. return false;
  204. break;
  205. case PB_HTYPE_OPTIONAL:
  206. if (*(const bool*)pSize)
  207. {
  208. if (!pb_encode_tag_for_field(stream, field))
  209. return false;
  210. if (!func(stream, field, pData))
  211. return false;
  212. }
  213. break;
  214. case PB_HTYPE_REPEATED:
  215. if (!encode_array(stream, field, pData, *(const pb_size_t*)pSize, func))
  216. return false;
  217. break;
  218. default:
  219. PB_RETURN_ERROR(stream, "invalid field type");
  220. }
  221. return true;
  222. }
  223. /* Encode a field with callback semantics. This means that a user function is
  224. * called to provide and encode the actual data. */
  225. static bool checkreturn encode_callback_field(pb_ostream_t *stream,
  226. const pb_field_t *field, const void *pData)
  227. {
  228. const pb_callback_t *callback = (const pb_callback_t*)pData;
  229. #ifdef PB_OLD_CALLBACK_STYLE
  230. const void *arg = callback->arg;
  231. #else
  232. void * const *arg = &(callback->arg);
  233. #endif
  234. if (callback->funcs.encode != NULL)
  235. {
  236. if (!callback->funcs.encode(stream, field, arg))
  237. PB_RETURN_ERROR(stream, "callback error");
  238. }
  239. return true;
  240. }
  241. /* Encode a single field of any callback or static type. */
  242. static bool checkreturn encode_field(pb_ostream_t *stream,
  243. const pb_field_t *field, const void *pData)
  244. {
  245. switch (PB_ATYPE(field->type))
  246. {
  247. case PB_ATYPE_STATIC:
  248. case PB_ATYPE_POINTER:
  249. return encode_basic_field(stream, field, pData);
  250. case PB_ATYPE_CALLBACK:
  251. return encode_callback_field(stream, field, pData);
  252. default:
  253. PB_RETURN_ERROR(stream, "invalid field type");
  254. }
  255. }
  256. /* Default handler for extension fields. Expects to have a pb_field_t
  257. * pointer in the extension->type->arg field. */
  258. static bool checkreturn default_extension_encoder(pb_ostream_t *stream,
  259. const pb_extension_t *extension)
  260. {
  261. const pb_field_t *field = (const pb_field_t*)extension->type->arg;
  262. return encode_field(stream, field, extension->dest);
  263. }
  264. /* Walk through all the registered extensions and give them a chance
  265. * to encode themselves. */
  266. static bool checkreturn encode_extension_field(pb_ostream_t *stream,
  267. const pb_field_t *field, const void *pData)
  268. {
  269. const pb_extension_t *extension = *(const pb_extension_t* const *)pData;
  270. PB_UNUSED(field);
  271. while (extension)
  272. {
  273. bool status;
  274. if (extension->type->encode)
  275. status = extension->type->encode(stream, extension);
  276. else
  277. status = default_extension_encoder(stream, extension);
  278. if (!status)
  279. return false;
  280. extension = extension->next;
  281. }
  282. return true;
  283. }
  284. /*********************
  285. * Encode all fields *
  286. *********************/
  /* Return `p` as a non-const pointer. The conversion goes through a union
   * rather than a cast. It exists so that the encoder can use the common field
   * iterator logic, which is shared with decoding.
   */
  static void *remove_const(const void *p)
  {
      union {
          const void *as_const;
          void *as_mutable;
      } pun;

      pun.as_const = p;
      return pun.as_mutable;
  }
  298. bool checkreturn pb_encode(pb_ostream_t *stream, const pb_field_t fields[], const void *src_struct)
  299. {
  300. pb_field_iter_t iter;
  301. if (!pb_field_iter_begin(&iter, fields, remove_const(src_struct)))
  302. return true; /* Empty message type */
  303. do {
  304. if (PB_LTYPE(iter.pos->type) == PB_LTYPE_EXTENSION)
  305. {
  306. /* Special case for the extension field placeholder */
  307. if (!encode_extension_field(stream, iter.pos, iter.pData))
  308. return false;
  309. }
  310. else
  311. {
  312. /* Regular field */
  313. if (!encode_field(stream, iter.pos, iter.pData))
  314. return false;
  315. }
  316. } while (pb_field_iter_next(&iter));
  317. return true;
  318. }
  319. bool pb_encode_delimited(pb_ostream_t *stream, const pb_field_t fields[], const void *src_struct)
  320. {
  321. return pb_encode_submessage(stream, fields, src_struct);
  322. }
  323. bool pb_get_encoded_size(size_t *size, const pb_field_t fields[], const void *src_struct)
  324. {
  325. pb_ostream_t stream = PB_OSTREAM_SIZING;
  326. if (!pb_encode(&stream, fields, src_struct))
  327. return false;
  328. *size = stream.bytes_written;
  329. return true;
  330. }
  331. /********************
  332. * Helper functions *
  333. ********************/
  334. bool checkreturn pb_encode_varint(pb_ostream_t *stream, uint64_t value)
  335. {
  336. uint8_t buffer[10];
  337. size_t i = 0;
  338. if (value == 0)
  339. return pb_write(stream, (uint8_t*)&value, 1);
  340. while (value)
  341. {
  342. buffer[i] = (uint8_t)((value & 0x7F) | 0x80);
  343. value >>= 7;
  344. i++;
  345. }
  346. buffer[i-1] &= 0x7F; /* Unset top bit on last byte */
  347. return pb_write(stream, buffer, i);
  348. }
  349. bool checkreturn pb_encode_svarint(pb_ostream_t *stream, int64_t value)
  350. {
  351. uint64_t zigzagged;
  352. if (value < 0)
  353. zigzagged = ~((uint64_t)value << 1);
  354. else
  355. zigzagged = (uint64_t)value << 1;
  356. return pb_encode_varint(stream, zigzagged);
  357. }
  358. bool checkreturn pb_encode_fixed32(pb_ostream_t *stream, const void *value)
  359. {
  360. #ifdef __BIG_ENDIAN__
  361. const uint8_t *bytes = value;
  362. uint8_t lebytes[4];
  363. lebytes[0] = bytes[3];
  364. lebytes[1] = bytes[2];
  365. lebytes[2] = bytes[1];
  366. lebytes[3] = bytes[0];
  367. return pb_write(stream, lebytes, 4);
  368. #else
  369. return pb_write(stream, (const uint8_t*)value, 4);
  370. #endif
  371. }
  372. bool checkreturn pb_encode_fixed64(pb_ostream_t *stream, const void *value)
  373. {
  374. #ifdef __BIG_ENDIAN__
  375. const uint8_t *bytes = value;
  376. uint8_t lebytes[8];
  377. lebytes[0] = bytes[7];
  378. lebytes[1] = bytes[6];
  379. lebytes[2] = bytes[5];
  380. lebytes[3] = bytes[4];
  381. lebytes[4] = bytes[3];
  382. lebytes[5] = bytes[2];
  383. lebytes[6] = bytes[1];
  384. lebytes[7] = bytes[0];
  385. return pb_write(stream, lebytes, 8);
  386. #else
  387. return pb_write(stream, (const uint8_t*)value, 8);
  388. #endif
  389. }
  390. bool checkreturn pb_encode_tag(pb_ostream_t *stream, pb_wire_type_t wiretype, uint32_t field_number)
  391. {
  392. uint64_t tag = ((uint64_t)field_number << 3) | wiretype;
  393. return pb_encode_varint(stream, tag);
  394. }
  395. bool checkreturn pb_encode_tag_for_field(pb_ostream_t *stream, const pb_field_t *field)
  396. {
  397. pb_wire_type_t wiretype;
  398. switch (PB_LTYPE(field->type))
  399. {
  400. case PB_LTYPE_VARINT:
  401. case PB_LTYPE_UVARINT:
  402. case PB_LTYPE_SVARINT:
  403. wiretype = PB_WT_VARINT;
  404. break;
  405. case PB_LTYPE_FIXED32:
  406. wiretype = PB_WT_32BIT;
  407. break;
  408. case PB_LTYPE_FIXED64:
  409. wiretype = PB_WT_64BIT;
  410. break;
  411. case PB_LTYPE_BYTES:
  412. case PB_LTYPE_STRING:
  413. case PB_LTYPE_SUBMESSAGE:
  414. wiretype = PB_WT_STRING;
  415. break;
  416. default:
  417. PB_RETURN_ERROR(stream, "invalid field type");
  418. }
  419. return pb_encode_tag(stream, wiretype, field->tag);
  420. }
  421. bool checkreturn pb_encode_string(pb_ostream_t *stream, const uint8_t *buffer, size_t size)
  422. {
  423. if (!pb_encode_varint(stream, (uint64_t)size))
  424. return false;
  425. return pb_write(stream, buffer, size);
  426. }
  427. bool checkreturn pb_encode_submessage(pb_ostream_t *stream, const pb_field_t fields[], const void *src_struct)
  428. {
  429. /* First calculate the message size using a non-writing substream. */
  430. pb_ostream_t substream = PB_OSTREAM_SIZING;
  431. size_t size;
  432. bool status;
  433. if (!pb_encode(&substream, fields, src_struct))
  434. {
  435. #ifndef PB_NO_ERRMSG
  436. stream->errmsg = substream.errmsg;
  437. #endif
  438. return false;
  439. }
  440. size = substream.bytes_written;
  441. if (!pb_encode_varint(stream, (uint64_t)size))
  442. return false;
  443. if (stream->callback == NULL)
  444. return pb_write(stream, NULL, size); /* Just sizing */
  445. if (stream->bytes_written + size > stream->max_size)
  446. PB_RETURN_ERROR(stream, "stream full");
  447. /* Use a substream to verify that a callback doesn't write more than
  448. * what it did the first time. */
  449. substream.callback = stream->callback;
  450. substream.state = stream->state;
  451. substream.max_size = size;
  452. substream.bytes_written = 0;
  453. #ifndef PB_NO_ERRMSG
  454. substream.errmsg = NULL;
  455. #endif
  456. status = pb_encode(&substream, fields, src_struct);
  457. stream->bytes_written += substream.bytes_written;
  458. stream->state = substream.state;
  459. #ifndef PB_NO_ERRMSG
  460. stream->errmsg = substream.errmsg;
  461. #endif
  462. if (substream.bytes_written != size)
  463. PB_RETURN_ERROR(stream, "submsg size changed");
  464. return status;
  465. }
  466. /* Field encoders */
  467. static bool checkreturn pb_enc_varint(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  468. {
  469. int64_t value = 0;
  470. /* Cases 1 and 2 are for compilers that have smaller types for bool
  471. * or enums. */
  472. switch (field->data_size)
  473. {
  474. case 1: value = *(const int8_t*)src; break;
  475. case 2: value = *(const int16_t*)src; break;
  476. case 4: value = *(const int32_t*)src; break;
  477. case 8: value = *(const int64_t*)src; break;
  478. default: PB_RETURN_ERROR(stream, "invalid data_size");
  479. }
  480. return pb_encode_varint(stream, (uint64_t)value);
  481. }
  482. static bool checkreturn pb_enc_uvarint(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  483. {
  484. uint64_t value = 0;
  485. switch (field->data_size)
  486. {
  487. case 4: value = *(const uint32_t*)src; break;
  488. case 8: value = *(const uint64_t*)src; break;
  489. default: PB_RETURN_ERROR(stream, "invalid data_size");
  490. }
  491. return pb_encode_varint(stream, value);
  492. }
  493. static bool checkreturn pb_enc_svarint(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  494. {
  495. int64_t value = 0;
  496. switch (field->data_size)
  497. {
  498. case 4: value = *(const int32_t*)src; break;
  499. case 8: value = *(const int64_t*)src; break;
  500. default: PB_RETURN_ERROR(stream, "invalid data_size");
  501. }
  502. return pb_encode_svarint(stream, value);
  503. }
  504. static bool checkreturn pb_enc_fixed64(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  505. {
  506. PB_UNUSED(field);
  507. return pb_encode_fixed64(stream, src);
  508. }
  509. static bool checkreturn pb_enc_fixed32(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  510. {
  511. PB_UNUSED(field);
  512. return pb_encode_fixed32(stream, src);
  513. }
  514. static bool checkreturn pb_enc_bytes(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  515. {
  516. const pb_bytes_array_t *bytes = (const pb_bytes_array_t*)src;
  517. if (src == NULL)
  518. {
  519. /* Threat null pointer as an empty bytes field */
  520. return pb_encode_string(stream, NULL, 0);
  521. }
  522. if (PB_ATYPE(field->type) == PB_ATYPE_STATIC &&
  523. PB_BYTES_ARRAY_T_ALLOCSIZE(bytes->size) > field->data_size)
  524. {
  525. PB_RETURN_ERROR(stream, "bytes size exceeded");
  526. }
  527. return pb_encode_string(stream, bytes->bytes, bytes->size);
  528. }
  529. static bool checkreturn pb_enc_string(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  530. {
  531. size_t size = 0;
  532. size_t max_size = field->data_size;
  533. const char *p = (const char*)src;
  534. if (PB_ATYPE(field->type) == PB_ATYPE_POINTER)
  535. max_size = (size_t)-1;
  536. if (src == NULL)
  537. {
  538. size = 0; /* Threat null pointer as an empty string */
  539. }
  540. else
  541. {
  542. /* strnlen() is not always available, so just use a loop */
  543. while (size < max_size && *p != '\0')
  544. {
  545. size++;
  546. p++;
  547. }
  548. }
  549. return pb_encode_string(stream, (const uint8_t*)src, size);
  550. }
  551. static bool checkreturn pb_enc_submessage(pb_ostream_t *stream, const pb_field_t *field, const void *src)
  552. {
  553. if (field->ptr == NULL)
  554. PB_RETURN_ERROR(stream, "invalid field descriptor");
  555. return pb_encode_submessage(stream, (const pb_field_t*)field->ptr, src);
  556. }