sync from xml.c: improve parsing whitespace after end tag names - extractjson - extract embedded JSON metadata from HTML pages
HTML git clone git://git.codemadness.org/extractjson
DIR Log
DIR Files
DIR Refs
DIR README
DIR LICENSE
---
DIR commit 64bf7c1c97f7de60a6358667d0836550fdf0ed49
DIR parent 1de46c41c6f72a1576352464a8458cfc70467094
HTML Author: Hiltjo Posthuma <hiltjo@codemadness.org>
Date: Sun, 30 Jun 2024 10:08:05 +0200
sync from xml.c: improve parsing whitespace after end tag names
Diffstat:
M extractjson.c | 2 ++
1 file changed, 2 insertions(+), 0 deletions(-)
---
DIR diff --git a/extractjson.c b/extractjson.c
@@ -269,6 +269,8 @@ xml_parse(XMLParser *x)
else if (c == '>' || ISSPACE(c)) {
x->tag[x->taglen] = '\0';
if (isend) { /* end tag, starts with </ */
+ while (c != '>' && c != EOF) /* skip until > */
+ c = GETNEXT();
x->tag[0] = '\0';
x->taglen = 0;
} else {