[PATCH 1/2] pulse: Add a JSON-parsing library

tanuk@xxxxxx (Tanu Kaskinen) · Mon, 23 May 2016 18:01:09 +0300

On Tue, 2016-04-26 at 17:47 +0530, arun at accosted.net wrote:
> From: Arun Raghavan <git at arunraghavan.net>
> 
> Adding this to be able to drop dependency on json-c.
> 
> Fixes: https://bugs.freedesktop.org/show_bug.cgi?id=95135
> ---
>  src/Makefile.am       |   8 +
>  src/pulse/json.c      | 476 ++++++++++++++++++++++++++++++++++++++++++++++++++
>  src/pulse/json.h      |  57 ++++++
>  src/tests/json-test.c | 240 +++++++++++++++++++++++++
>  4 files changed, 781 insertions(+)
>  create mode 100644 src/pulse/json.c
>  create mode 100644 src/pulse/json.h
>  create mode 100644 src/tests/json-test.c

This patch could also add src/json-test to .gitignore.

> diff --git a/src/Makefile.am b/src/Makefile.am
> index b600dfb..9d952fc 100644
> --- a/src/Makefile.am
> +++ b/src/Makefile.am
> @@ -248,6 +248,7 @@ TESTS_default = \
> Â 		thread-mainloop-test \
> Â 		utf8-test \
> Â 		format-test \
> +		json-test \
> Â 		get-binary-name-test \
> Â 		hook-list-test \
> Â 		memblock-test \
> @@ -375,6 +376,12 @@ format_test_CFLAGS = $(AM_CFLAGS) $(LIBCHECK_CFLAGS)
> Â format_test_LDADD = $(AM_LDADD) libpulsecore- at PA_MAJORMINOR@.la libpulse.la libpulsecommon- at PA_MAJORMINOR@.la
> Â format_test_LDFLAGS = $(AM_LDFLAGS) $(BINLDFLAGS) $(LIBCHECK_LIBS)
> Â 
> +json_test_SOURCES = tests/json-test.c
> +json_test_CFLAGS = $(AM_CFLAGS) $(LIBCHECK_CFLAGS)
> +json_test_LDADD = $(AM_LDADD) libpulse.la libpulsecommon- at PA_MAJORMINOR@.la
> +json_test_LDFLAGS = $(AM_LDFLAGS) $(BINLDFLAGS) $(LIBCHECK_LIBS)
> +
> +srbchannel_test_SOURCES = tests/srbchannel-test.c
> Â srbchannel_test_SOURCES = tests/srbchannel-test.c

It's probably sufficient to set srbchannel_test_SOURCES just once.

> Â srbchannel_test_CFLAGS = $(AM_CFLAGS) $(LIBCHECK_CFLAGS)
> Â srbchannel_test_LDADD = $(AM_LDADD) libpulse.la libpulsecommon- at PA_MAJORMINOR@.la
> @@ -646,6 +653,7 @@ libpulsecommon_ at PA_MAJORMINOR@_la_SOURCES = \
> Â 		pulse/client-conf.c pulse/client-conf.h \
> Â 		pulse/fork-detect.c pulse/fork-detect.h \
> Â 		pulse/format.c pulse/format.h \
> +		pulse/json.c pulse/json.h \
> Â 		pulse/xmalloc.c pulse/xmalloc.h \
> Â 		pulse/proplist.c pulse/proplist.h \
> Â 		pulse/utf8.c pulse/utf8.h \
> diff --git a/src/pulse/json.c b/src/pulse/json.c
> new file mode 100644
> index 0000000..0e53902
> --- /dev/null
> +++ b/src/pulse/json.c
> @@ -0,0 +1,476 @@
> +/***
> +  This file is part of PulseAudio.
> +
> +  Copyright 2016 Arun Raghavan <mail at arunraghavan.net>
> +
> +  PulseAudio is free software; you can redistribute it and/or modify
> +  it under the terms of the GNU Lesser General Public License as published
> +  by the Free Software Foundation; either version 2.1 of the License,
> +  or (at your option) any later version.
> +
> +  PulseAudio is distributed in the hope that it will be useful, but
> +  WITHOUT ANY WARRANTY; without even the implied warranty of
> +  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
> +  General Public License for more details.
> +
> +  You should have received a copy of the GNU Lesser General Public License
> +  along with PulseAudio; if not, see <http://www.gnu.org/licenses/>.
> +***/
> +
> +#include 
> +
> +#include 
> +#include 
> +#include 
> +#include 
> +
> +struct pa_json_object {
> +Â Â Â Â PA_REFCNT_DECLARE;
> +Â Â Â Â pa_json_type type;
> +
> +Â Â Â Â union {
> +Â Â Â Â Â Â Â Â int int_value;
> +Â Â Â Â Â Â Â Â double double_value;
> +Â Â Â Â Â Â Â Â bool bool_value;
> +Â Â Â Â Â Â Â Â char *string_value;
> +Â Â Â Â Â Â Â Â pa_hashmap *object_values; /* name -> object */
> +Â Â Â Â Â Â Â Â pa_idxset *array_values; /* objects */
> +Â Â Â Â };
> +};
> +
> +#define JSON_OBJECT_TYPE(o) ((o)->type)

What's the rationale for this macro? Why is using the macro better than
using o->type directly?

> +
> +static const char* parse_value(const char *str, const char *end, pa_json_object **obj);
> +
> +static pa_json_object* json_object_new(void) {
> +Â Â Â Â pa_json_object *obj;
> +
> +Â Â Â Â obj = pa_xnew0(pa_json_object, 1);
> +
> +Â Â Â Â return obj;
> +}
> +
> +static bool is_whitespace(char c) {
> +Â Â Â Â return c == '\t' || c == '\f' || c == '\r' || c == ' ';
> +}
> +
> +static bool is_digit(char c) {
> +Â Â Â Â return c >= '0' && c <= '9';
> +}
> +
> +static bool is_end(const char c, const char *end) {
> +Â Â Â Â if (!end)
> +Â Â Â Â Â Â Â Â return c == '\0';
> +Â Â Â Â elseÂ Â {
> +Â Â Â Â Â Â Â Â while (*end) {
> +Â Â Â Â Â Â Â Â Â Â Â Â if (c == *end)
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â return true;
> +Â Â Â Â Â Â Â Â Â Â Â Â end++;
> +Â Â Â Â Â Â Â Â }
> +Â Â Â Â }
> +
> +Â Â Â Â return false;
> +}
> +
> +static const char* consume_string(const char *str, const char *expect)
> +{

The opening brace got misplaced.

> +Â Â Â Â while (*expect) {
> +Â Â Â Â Â Â Â Â if (*str != *expect)
> +Â Â Â Â Â Â Â Â Â Â Â Â return NULL;
> +
> +Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â Â Â Â Â expect++;
> +Â Â Â Â }
> +
> +Â Â Â Â return str;
> +}
> +
> +static const char* parse_null(const char *str, pa_json_object *obj) {
> +Â Â Â Â str = consume_string(str, "null");
> +
> +Â Â Â Â if (str)
> +Â Â Â Â Â Â Â Â obj->type = PA_JSON_TYPE_NULL;
> +
> +Â Â Â Â return str;
> +}
> +
> +static const char* parse_boolean(const char *str, pa_json_object *obj) {
> +Â Â Â Â const char *tmp;
> +
> +Â Â Â Â tmp = consume_string(str, "true");
> +
> +Â Â Â Â if (tmp) {
> +Â Â Â Â Â Â Â Â obj->type = PA_JSON_TYPE_BOOL;
> +Â Â Â Â Â Â Â Â obj->bool_value = true;
> +Â Â Â Â } else {
> +Â Â Â Â Â Â Â Â tmp = consume_string(str, "false");
> +
> +Â Â Â Â Â Â Â Â if (str) {
> +Â Â Â Â Â Â Â Â Â Â Â Â obj->type = PA_JSON_TYPE_BOOL;
> +Â Â Â Â Â Â Â Â Â Â Â Â obj->bool_value = false;
> +Â Â Â Â Â Â Â Â }
> +Â Â Â Â }
> +
> +Â Â Â Â return tmp;
> +}
> +
> +static const char* parse_string(const char *str, pa_json_object *obj) {
> +Â Â Â Â pa_strbuf *buf = pa_strbuf_new();
> +
> +Â Â Â Â str++; /* Consume leading '"' */
> +
> +Â Â Â Â while (*str != '"') {
> +Â Â Â Â Â Â Â Â if (*str != '\\') {
> +Â Â Â Â Â Â Â Â Â Â Â Â /* Normal character, juts consume */
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_strbuf_putc(buf, *str);

Control characters 0x00 <= *str <= 0x1F should cause an error, since
they are disallowed by the JSON spec (0x00 is maybe special, since it
signifies end-of-string, but that should cause an error nevertheless).

Also, JSON data can be UTF-8, UTF-16 or UTF-32 encoded, but this code
doesn't take that into account. If we are fed valid multi-byte
sequences, this code probably can get confused. I feel it would be
safest to only support 7-bit ASCII, and disallow any characters above
0x7F.

> +Â Â Â Â Â Â Â Â } else {
> +Â Â Â Â Â Â Â Â Â Â Â Â /* Need to unescape */
> +Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â switch (*str) {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case '"':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case '\\':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case '/':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_strbuf_putc(buf, *str);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case 'b':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_strbuf_putc(buf, '\b' /* backspace */);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case 'f':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_strbuf_putc(buf, '\f' /* form feed */);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case 'n':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_strbuf_putc(buf, '\n' /* new line */);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case 'r':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_strbuf_putc(buf, '\r' /* carriage return */);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case 't':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_strbuf_putc(buf, '\t' /* horizontal tab */);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â case 'u':
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_log("Unicode code points are currently unsupported");
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â goto error;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â default:
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_log("Unexepcted escape value: %c", *str);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â goto error;
> +Â Â Â Â Â Â Â Â Â Â Â Â }
> +Â Â Â Â Â Â Â Â }
> +
> +Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â }
> +
> +Â Â Â Â if (*str != '"') {
> +Â Â Â Â Â Â Â Â pa_log("Failed to parse remainder of string: %s", str);
> +Â Â Â Â Â Â Â Â goto error;
> +Â Â Â Â }
> +
> +Â Â Â Â str++;
> +
> +Â Â Â Â obj->type = PA_JSON_TYPE_STRING;
> +Â Â Â Â obj->string_value = pa_strbuf_to_string_free(buf);
> +
> +Â Â Â Â return str;
> +
> +error:
> +Â Â Â Â pa_strbuf_free(buf);
> +Â Â Â Â return NULL;
> +}
> +
> +static const char* parse_number(const char *str, pa_json_object *obj) {
> +Â Â Â Â bool negative = false, has_fraction = false, has_exponent = false;
> +Â Â Â Â unsigned int integer = 0;
> +Â Â Â Â unsigned int fraction = 0;
> +Â Â Â Â unsigned int fraction_digits = 0;
> +Â Â Â Â int exponent = 0;
> +
> +Â Â Â Â if (*str == '-') {
> +Â Â Â Â Â Â Â Â negative = true;
> +Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â }
> +
> +Â Â Â Â if (*str == '0') {
> +Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â Â Â Â Â goto fraction;
> +Â Â Â Â }
> +
> +Â Â Â Â while (is_digit(*str)) {
> +Â Â Â Â Â Â Â Â integer = (integer * 10) + (*str - '0');
> +Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â }

Missing overflow checking (imagine "12341234123412341234123412341234").

> +
> +fraction:
> +Â Â Â Â if (*str == '.') {
> +Â Â Â Â Â Â Â Â has_fraction = true;
> +Â Â Â Â Â Â Â Â str++;
> +
> +Â Â Â Â Â Â Â Â while (is_digit(*str)) {
> +Â Â Â Â Â Â Â Â Â Â Â Â fraction = (fraction * 10) + (*str - '0');
> +Â Â Â Â Â Â Â Â Â Â Â Â fraction_digits++;
> +Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â Â Â Â Â }

Missing overflow checking.

> +Â Â Â Â }
> +
> +Â Â Â Â if (*str == 'e' || *str == 'E') {
> +Â Â Â Â Â Â Â Â bool exponent_negative = false;
> +
> +Â Â Â Â Â Â Â Â has_exponent = true;
> +Â Â Â Â Â Â Â Â str++;
> +
> +Â Â Â Â Â Â Â Â if (*str == '-') {
> +Â Â Â Â Â Â Â Â Â Â Â Â exponent_negative = true;
> +Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â Â Â Â Â } else if (*str == '+')
> +Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +
> +Â Â Â Â Â Â Â Â while (is_digit(*str)) {
> +Â Â Â Â Â Â Â Â Â Â Â Â exponent = (exponent * 10) + (*str - '0');
> +Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â Â Â Â Â }

Missing overflow checking.

> +
> +Â Â Â Â Â Â Â Â if (exponent_negative)
> +Â Â Â Â Â Â Â Â Â Â Â Â exponent *= -1;
> +Â Â Â Â }
> +
> +Â Â Â Â if (has_fraction || has_exponent) {
> +Â Â Â Â Â Â Â Â obj->type = PA_JSON_TYPE_DOUBLE;
> +Â Â Â Â Â Â Â Â obj->double_value =
> +Â Â Â Â Â Â Â Â Â Â Â Â (negative ? -1.0 : 1.0) * (integer + (double) fraction / pow(10, fraction_digits)) * pow(10, exponent);
> +Â Â Â Â } else {
> +Â Â Â Â Â Â Â Â obj->type = PA_JSON_TYPE_INT;
> +Â Â Â Â Â Â Â Â obj->int_value = (negative ? -1 : 1) * integer;
> +Â Â Â Â }
> +
> +Â Â Â Â return str;
> +}

parse_number() doesn't seem to ever fail. Surely we should check that
we're not fed any random crap that happens to start with "-" or with a
digit? Maybe the idea is that parse_value() will fail if there's any
non-whitespace stuff left after parse_number() returns. In that case, I
think it would be good to have a comment about that in parse_number(),
and at least those cases need to be checked where some mandatory
content is missing (like "-", "1.", "1.e3" or "1e").

> +
> +static const char *parse_object(const char *str, pa_json_object *obj) {
> +Â Â Â Â pa_json_object *name, *value;
> +
> +Â Â Â Â obj->object_values = pa_hashmap_new_full(pa_idxset_string_hash_func, pa_idxset_string_compare_func,
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â pa_xfree, (pa_free_cb_t) pa_json_object_unref);
> +
> +Â Â Â Â while (*str != '}') {
> +Â Â Â Â Â Â Â Â str++; /* Consume leading '{' or ',' */
> +
> +Â Â Â Â Â Â Â Â str = parse_value(str, ":", &name);
> +Â Â Â Â Â Â Â Â if (!str || JSON_OBJECT_TYPE(name) != PA_JSON_TYPE_STRING) {
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_log("Could not parse key for object: %s", str);

str is either NULL or points just past the parsed non-string value. Is
that really what you want to log?

> +Â Â Â Â Â Â Â Â Â Â Â Â goto error;
> +Â Â Â Â Â Â Â Â }
> +
> +Â Â Â Â Â Â Â Â /* Consume the ':' */
> +Â Â Â Â Â Â Â Â str++;
> +
> +Â Â Â Â Â Â Â Â str = parse_value(str, ",}", &value);

As we parse nested objects, maybe we should check that we don't recurse
too deeply. Consider {"a":{"a":{"a":{"a":{.... I remember libdbus used to
be vulnerable to this kind of attack, which made libdbus use such a
deep stack that it crashed the application.

> +Â Â Â Â Â Â Â Â if (!str) {
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_log("Could not parse value for object: %s", str);

str is NULL, don't log it.

> +Â Â Â Â Â Â Â Â Â Â Â Â goto error;
> +Â Â Â Â Â Â Â Â }
> +
> +Â Â Â Â Â Â Â Â pa_hashmap_put(obj->object_values, pa_xstrdup(pa_json_object_get_string(name)), value);
> +Â Â Â Â Â Â Â Â pa_json_object_unref(name);
> +Â Â Â Â }
> +
> +Â Â Â Â /* Drop trailing '}' */
> +Â Â Â Â str++;
> +
> +Â Â Â Â /* We now know the value was correctly parsed */
> +Â Â Â Â obj->type = PA_JSON_TYPE_OBJECT;
> +
> +Â Â Â Â return str;
> +
> +error:
> +Â Â Â Â pa_hashmap_free(obj->object_values);

obj->object_values should be set to NULL.

> +Â Â Â Â return NULL;
> +}
> +
> +static const char *parse_array(const char *str, pa_json_object *obj) {
> +Â Â Â Â pa_json_object *value;
> +
> +Â Â Â Â obj->array_values = pa_idxset_new(NULL, NULL);
> +
> +Â Â Â Â while (*str != ']') {
> +Â Â Â Â Â Â Â Â str++; /* Consume leading '[' or ',' */
> +
> +Â Â Â Â Â Â Â Â /* Need to chew up whitespaces as a special case to deal with the
> +Â Â Â Â Â Â Â Â Â * possibility of an empty array */
> +Â Â Â Â Â Â Â Â while (is_whitespace(*str))
> +Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +
> +Â Â Â Â Â Â Â Â if (*str == ']')
> +Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â str = parse_value(str, ",]", &value);
> +Â Â Â Â Â Â Â Â if (!str) {
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_log("Could not parse value for array: %s", str);

str is NULL, don't log it.

> +Â Â Â Â Â Â Â Â Â Â Â Â goto error;
> +Â Â Â Â Â Â Â Â }
> +
> +Â Â Â Â Â Â Â Â pa_idxset_put(obj->array_values, value, NULL);
> +Â Â Â Â }
> +
> +Â Â Â Â /* Drop trailing ']' */
> +Â Â Â Â str++;
> +
> +Â Â Â Â /* We now know the value was correctly parsed */
> +Â Â Â Â obj->type = PA_JSON_TYPE_ARRAY;
> +
> +Â Â Â Â return str;
> +
> +error:
> +Â Â Â Â pa_idxset_free(obj->array_values, (pa_free_cb_t) pa_json_object_unref);

obj->array_values should be set to NULL.

> +Â Â Â Â return NULL;
> +}
> +
> +typedef enum {
> +Â Â Â Â JSON_PARSER_STATE_INIT,
> +Â Â Â Â JSON_PARSER_STATE_FINISH,
> +} json_parser_state;
> +
> +static const char* parse_value(const char *str, const char *end, pa_json_object **obj) {
> +Â Â Â Â json_parser_state state = JSON_PARSER_STATE_INIT;
> +
> +Â Â Â Â pa_return_val_if_fail(str != NULL, NULL);

I think a regular assertion would fit better here.

> +
> +Â Â Â Â *obj = json_object_new();

I think it's better style to assign to obj only after the parsing has
succeeded. Now you're returning a pointer to freed data in case of
failure.

> +
> +Â Â Â Â while (!is_end(*str, end)) {
> +Â Â Â Â Â Â Â Â switch (state) {
> +Â Â Â Â Â Â Â Â Â Â Â Â case JSON_PARSER_STATE_INIT:
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â if (is_whitespace(*str)) {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â } else if (*str == 'n') {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str = parse_null(str, *obj);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â state = JSON_PARSER_STATE_FINISH;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â } else if (*str == 't' || *str == 'f') {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str = parse_boolean(str, *obj);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â state = JSON_PARSER_STATE_FINISH;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â } else if (*str == '"') {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str = parse_string(str, *obj);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â state = JSON_PARSER_STATE_FINISH;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â } else if (is_digit(*str) || *str == '-') {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str = parse_number(str, *obj);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â state = JSON_PARSER_STATE_FINISH;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â } else if (*str == '{') {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str = parse_object(str, *obj);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â state = JSON_PARSER_STATE_FINISH;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â } else if (*str == '[') {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str = parse_array(str, *obj);
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â state = JSON_PARSER_STATE_FINISH;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â }

There's no final "else" branch here. If none of these checks evaluate
to true, that should be an error.

> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â if (!str)
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â goto error;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â Â Â Â Â case JSON_PARSER_STATE_FINISH:
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â /* Consume trailing whitespaces */
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â if (is_whitespace(*str)) {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â str++;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â } else {
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â goto error;
> +Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â Â }
> +Â Â Â Â Â Â Â Â }
> +Â Â Â Â }
> +
> +Â Â Â Â if (JSON_OBJECT_TYPE(*obj) == PA_JSON_TYPE_INIT) {
> +Â Â Â Â Â Â Â Â /* We didn't actually get any data */
> +Â Â Â Â Â Â Â Â pa_log("No data while parsing json string: '%s' till '%s'", str, end);

end can be NULL so maybe use pa_strnull()? I don't know if this is
required. I think glibc handles NULL gracefully, but the manual page
for printf appears silent on this, so probably this is undefined
behaviour.

> +Â Â Â Â Â Â Â Â goto error;
> +Â Â Â Â }
> +
> +Â Â Â Â return str;
> +
> +error:
> +Â Â Â Â pa_json_object_unref(*obj);
> +Â Â Â Â return NULL;
> +}
> +
> +
> +pa_json_object* pa_json_parse(const char *str) {
> +Â Â Â Â pa_json_object *obj;
> +
> +Â Â Â Â str = parse_value(str, NULL, &obj);
> +Â Â Â Â pa_assert(*str == '\0');

This will crash on any parse failure...

> +
> +Â Â Â Â return obj;
> +}
> +
> +pa_json_type pa_json_object_get_type(const pa_json_object *obj) {
> +Â Â Â Â return JSON_OBJECT_TYPE(obj);
> +}
> +
> +void pa_json_object_unref(pa_json_object *obj) {
> +Â Â Â Â if (PA_REFCNT_DEC(obj) > 0)
> +Â Â Â Â Â Â Â Â return;
> +
> +Â Â Â Â switch (JSON_OBJECT_TYPE(obj)) {
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_INIT:
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_INT:
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_DOUBLE:
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_BOOL:
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_NULL:
> +Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_STRING:
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_xfree(obj->string_value);
> +Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_OBJECT:
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_hashmap_free(obj->object_values);
> +Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â case PA_JSON_TYPE_ARRAY:
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_idxset_free(obj->array_values, (pa_free_cb_t) pa_json_object_unref);
> +Â Â Â Â Â Â Â Â Â Â Â Â break;
> +
> +Â Â Â Â Â Â Â Â default:
> +Â Â Â Â Â Â Â Â Â Â Â Â pa_assert_not_reached();
> +Â Â Â Â }
> +
> +Â Â Â Â pa_xfree(obj);
> +}
> +
> +int pa_json_object_get_int(const pa_json_object *o) {
> +Â Â Â Â pa_return_val_if_fail(JSON_OBJECT_TYPE(o) == PA_JSON_TYPE_INT, 0);

Is it a programming error to call this function with a non-int object? If
yes, a regular assertion should be used. If not, then shouldn't the
caller decide whether to log something or not? (In case you didn't
know, pa_return_val_if_fail() prints "Assertion %s failed..." at debug
log level.)

This same comment applies to the following functions too.

> +Â Â Â Â return o->int_value;
> +}
> +
> +double pa_json_object_get_double(const pa_json_object *o) {
> +Â Â Â Â pa_return_val_if_fail(JSON_OBJECT_TYPE(o) == PA_JSON_TYPE_DOUBLE, 0);
> +Â Â Â Â return o->double_value;
> +}
> +
> +bool pa_json_object_get_bool(const pa_json_object *o) {
> +Â Â Â Â pa_return_val_if_fail(JSON_OBJECT_TYPE(o) == PA_JSON_TYPE_BOOL, false);
> +Â Â Â Â return o->bool_value;
> +}
> +
> +const char* pa_json_object_get_string(const pa_json_object *o) {
> +Â Â Â Â pa_return_val_if_fail(JSON_OBJECT_TYPE(o) == PA_JSON_TYPE_STRING, NULL);
> +Â Â Â Â return o->string_value;
> +}
> +
> +const pa_json_object* pa_json_object_get_object_member(const pa_json_object *o, const char *name) {
> +Â Â Â Â pa_return_val_if_fail(JSON_OBJECT_TYPE(o) == PA_JSON_TYPE_OBJECT, NULL);
> +Â Â Â Â return pa_hashmap_get(o->object_values, name);
> +}
> +
> +int pa_json_object_get_array_length(const pa_json_object *o) {
> +Â Â Â Â pa_return_val_if_fail(JSON_OBJECT_TYPE(o) == PA_JSON_TYPE_ARRAY, 0);
> +Â Â Â Â return pa_idxset_size(o->array_values);
> +}
> +
> +const pa_json_object* pa_json_object_get_array_member(const pa_json_object *o, int index) {
> +Â Â Â Â pa_return_val_if_fail(JSON_OBJECT_TYPE(o) == PA_JSON_TYPE_ARRAY, NULL);
> +Â Â Â Â return pa_idxset_get_by_index(o->array_values, index);
> +}
> diff --git a/src/pulse/json.h b/src/pulse/json.h
> new file mode 100644
> index 0000000..6eba9a9
> --- /dev/null
> +++ b/src/pulse/json.h
> @@ -0,0 +1,57 @@
> +/***
> +  This file is part of PulseAudio.
> +
> +  Copyright 2016 Arun Raghavan <mail at arunraghavan.net>
> +
> +  PulseAudio is free software; you can redistribute it and/or modify
> +  it under the terms of the GNU Lesser General Public License as published
> +  by the Free Software Foundation; either version 2.1 of the License,
> +  or (at your option) any later version.
> +
> +  PulseAudio is distributed in the hope that it will be useful, but
> +  WITHOUT ANY WARRANTY; without even the implied warranty of
> +  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
> +  General Public License for more details.
> +
> +  You should have received a copy of the GNU Lesser General Public License
> +  along with PulseAudio; if not, see <http://www.gnu.org/licenses/>.
> +***/
> +
> +#ifdef HAVE_CONFIG_H
> +#include 
> +#endif

This belongs in the .c file (if it's needed at all).

> +
> +#include 
> +
> +PA_C_DECL_BEGIN

This isn't a public API, so this seems unnecessary.

> diff --git a/src/tests/json-test.c b/src/tests/json-test.c
> new file mode 100644
> index 0000000..9be4dac
> --- /dev/null
> +++ b/src/tests/json-test.c
> +START_TEST(object_test) {
> +Â Â Â Â pa_json_object *o;
> +Â Â Â Â const pa_json_object *v;
> +
> +Â Â Â Â o = pa_json_parse(" { \"name\" : \"A Person\" } ");
> +
> +Â Â Â Â fail_unless(o != NULL);
> +Â Â Â Â fail_unless(pa_json_object_get_type(o) == PA_JSON_TYPE_OBJECT);
> +
> +Â Â Â Â v = pa_json_object_get_object_member(o, "name");
> +Â Â Â Â fail_unless(v != NULL);
> +Â Â Â Â fail_unless(pa_json_object_get_type(v) == PA_JSON_TYPE_STRING);
> +Â Â Â Â fail_unless(pa_streq(pa_json_object_get_string(v), "A Person"));
> +
> +Â Â Â Â pa_json_object_unref(o);
> +
> +Â Â Â Â o = pa_json_parse(" { \"age\" : -45.3e-0 } ");
> +
> +Â Â Â Â fail_unless(o != NULL);
> +Â Â Â Â fail_unless(pa_json_object_get_type(o) == PA_JSON_TYPE_OBJECT);
> +
> +Â Â Â Â v = pa_json_object_get_object_member(o, "age");
> +Â Â Â Â fail_unless(v != NULL);
> +Â Â Â Â fail_unless(pa_json_object_get_type(v) == PA_JSON_TYPE_DOUBLE);
> +Â Â Â Â fail_unless(IS_EQUAL(pa_json_object_get_double(v), -45.3));
> +
> +Â Â Â Â pa_json_object_unref(o);
> +
> +Â Â Â Â o = pa_json_parse("{\"person\":true}");
> +
> +Â Â Â Â fail_unless(o != NULL);
> +Â Â Â Â fail_unless(pa_json_object_get_type(o) == PA_JSON_TYPE_OBJECT);
> +
> +Â Â Â Â v = pa_json_object_get_object_member(o, "person");
> +Â Â Â Â fail_unless(v != NULL);
> +Â Â Â Â fail_unless(pa_json_object_get_type(v) == PA_JSON_TYPE_BOOL);
> +Â Â Â Â fail_unless(IS_EQUAL(pa_json_object_get_bool(v), true));

IS_EQUAL is only supposed to be used with floating point values, right?

-- 
Tanu