2 * Copyright (c) 2021 Omar Polo <op@omarpolo.com>
4 * Permission to use, copy, modify, and distribute this software for any
5 * purpose with or without fee is hereby granted, provided that the above
6 * copyright notice and this permission notice appear in all copies.
8 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
24 #include "telescope.h"
27 static int parser_foreach_line(struct buffer *, const char *, size_t);
30 parser_init(struct buffer *buffer, const struct parser *p)
34 memset(buffer->title, 0, sizeof(buffer->title));
36 buffer->mode = p->name;
37 buffer->parser_flags = p->initflags;
41 parser_parse(struct buffer *buffer, const char *chunk, size_t len)
43 const struct parser *p = buffer->parser;
46 return p->parse(buffer, chunk, len);
47 return parser_foreach_line(buffer, chunk, len);
51 parser_parsef(struct buffer *buffer, const char *fmt, ...)
58 r = vasprintf(&s, fmt, ap);
64 r = parser_parse(buffer, s, strlen(s));
70 parser_free(struct tab *tab)
72 struct buffer *buffer = &tab->buffer;
73 const struct parser *p = buffer->parser;
79 } else if (buffer->len != 0) {
81 r = p->parse(buffer, buffer->buf, buffer->len);
83 r = parser_foreach_line(buffer, buffer->buf,
91 if (*buffer->title != '\0')
95 * heuristic: see if there is a "tilde user" and use that as
96 * page title, using the full domain name as fallback.
98 if ((tilde = strstr(hist_cur(tab->hist), "/~")) != NULL) {
99 strlcpy(buffer->title, tilde+1, sizeof(buffer->title));
101 if ((slash = strchr(buffer->title, '/')) != NULL)
104 strlcpy(buffer->title, tab->iri.iri_host,
105 sizeof(buffer->title));
111 parser_serialize(struct buffer *b, FILE *fp)
113 const struct parser *p = b->parser;
118 if (p->serialize != NULL)
119 return p->serialize(b, fp);
121 /* a default implementation good enough for plain text */
122 TAILQ_FOREACH(line, &b->head, lines) {
123 if ((text = line->line) == NULL)
126 r = fprintf(fp, "%s\n", text);
135 parser_append(struct buffer *b, const char *buf, size_t len)
143 newlen = len + b->len;
144 t = xcalloc(1, newlen);
145 memcpy(t, b->buf, b->len);
146 memcpy(t + b->len, buf, len);
154 parser_set_buf(struct buffer *b, const char *buf, size_t len)
166 * p->buf and buf can (and probably almost always will)
170 tmp = xcalloc(1, len);
171 memcpy(tmp, buf, len);
179 parser_foreach_line(struct buffer *b, const char *buf, size_t size)
181 const struct parser *p = b->parser;
186 if (!parser_append(b, buf, size))
191 if (!(b->parser_flags & PARSER_IN_BODY) && len < 3)
194 if (!(b->parser_flags & PARSER_IN_BODY)) {
195 b->parser_flags |= PARSER_IN_BODY;
198 * drop the BOM: only UTF-8 is supported, and there
199 * it's useless; some editors may still add one
202 if (memmem(beg, len, "\xEF\xBB\xBF", 3) == beg) {
208 /* drop every "funny" ASCII character */
209 for (i = 0; i < len; ) {
211 if ((ch >= ' ' || ch == '\n' || ch == '\t')
212 && ch != 127) { /* del */
216 memmove(&beg[i], &beg[i+1], len - i - 1);
221 if ((end = memmem((char*)beg, len, "\n", 1)) == NULL)
225 if (!p->parseline(b, beg, l))
238 return parser_set_buf(b, beg, len);