wireshark/wsutil/wsjsmn.c

194 lines
7.3 KiB
C

/* wsjsmn.c
* Utility to check if a payload is json using libjsmn
*
* Copyright 2016, Dario Lombardo
*
* Wireshark - Network traffic analyzer
* By Gerald Combs <gerald@wireshark.org>
* Copyright 1998 Gerald Combs
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation; either version 2
* of the License, or (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
*/
#include "wsjsmn.h"
#include <string.h>
#include <wsutil/jsmn.h>
#include <wsutil/str_util.h>
#include <wsutil/unicode-utils.h>
#include "log.h"
gboolean jsmn_is_json(const guint8* buf, const size_t len)
{
/* We expect no more than 1024 tokens */
guint max_tokens = 1024;
jsmntok_t* t;
jsmn_parser p;
gboolean ret = TRUE;
int rcode;
t = g_new0(jsmntok_t, max_tokens);
if (!t)
return FALSE;
jsmn_init(&p);
rcode = jsmn_parse(&p, buf, len, t, max_tokens);
if (rcode < 0) {
switch (rcode) {
case JSMN_ERROR_NOMEM:
g_log(LOG_DOMAIN_MAIN, G_LOG_LEVEL_DEBUG, "jsmn: not enough tokens were provided");
break;
case JSMN_ERROR_INVAL:
g_log(LOG_DOMAIN_MAIN, G_LOG_LEVEL_DEBUG, "jsmn: invalid character inside JSON string");
break;
case JSMN_ERROR_PART:
g_log(LOG_DOMAIN_MAIN, G_LOG_LEVEL_DEBUG, "jsmn: the string is not a full JSON packet, "
"more bytes expected");
break;
default:
g_log(LOG_DOMAIN_MAIN, G_LOG_LEVEL_DEBUG, "jsmn: unexpected error");
break;
}
ret = FALSE;
}
g_free(t);
return ret;
}
int wsjsmn_parse(const char *buf, jsmntok_t *tokens, unsigned int max_tokens)
{
jsmn_parser p;
jsmn_init(&p);
return jsmn_parse(&p, buf, strlen(buf), tokens, max_tokens);
}
gboolean wsjsmn_unescape_json_string(const char *input, char *output)
{
while (*input) {
char ch = *input++;
if (ch == '\\') {
ch = *input++;
switch (ch) {
case '\"':
case '\\':
case '/':
*output++ = ch;
break;
case 'b':
*output++ = '\b';
break;
case 'f':
*output++ = '\f';
break;
case 'n':
*output++ = '\n';
break;
case 'r':
*output++ = '\r';
break;
case 't':
*output++ = '\t';
break;
case 'u':
{
guint32 unicode_hex = 0;
int k;
int bin;
for (k = 0; k < 4; k++) {
unicode_hex <<= 4;
ch = *input++;
bin = ws_xton(ch);
if (bin == -1)
return FALSE;
unicode_hex |= bin;
}
if ((IS_LEAD_SURROGATE(unicode_hex))) {
guint16 lead_surrogate = unicode_hex;
guint16 trail_surrogate = 0;
if (input[0] != '\\' || input[1] != 'u')
return FALSE;
input += 2;
for (k = 0; k < 4; k++) {
trail_surrogate <<= 4;
ch = *input++;
bin = ws_xton(ch);
if (bin == -1)
return FALSE;
trail_surrogate |= bin;
}
if ((!IS_TRAIL_SURROGATE(trail_surrogate)))
return FALSE;
unicode_hex = SURROGATE_VALUE(lead_surrogate,trail_surrogate);
} else if ((IS_TRAIL_SURROGATE(unicode_hex))) {
return FALSE;
}
if (!g_unichar_validate(unicode_hex))
return FALSE;
/* Don't allow NUL byte injection. */
if (unicode_hex == 0)
return FALSE;
/* \uXXXX => 6 bytes, and g_unichar_to_utf8() requires to have output buffer at least 6 bytes -> OK. */
k = g_unichar_to_utf8(unicode_hex, output);
output += k;
break;
}
default:
return FALSE;
}
} else {
*output = ch;
output++;
}
}
*output = '\0';
return TRUE;
}
/*
* Editor modelines - https://www.wireshark.org/tools/modelines.html
*
* Local variables:
* c-basic-offset: 4
* tab-width: 8
* indent-tabs-mode: t
* End:
*
* vi: set shiftwidth=4 tabstop=8 noexpandtab:
* :indentSize=4:tabSize=8:noTabs=false:
*/