From cd85eac0d3324555480b373df0e4051856a89f5e Mon Sep 17 00:00:00 2001 From: Nick Mathewson Date: Sat, 29 Dec 2007 17:36:03 +0000 Subject: r17433@catbus: nickm | 2007-12-29 12:35:57 -0500 Incomplete code to avoid doing needless pull-ups on HTTP. Also, use memstr instead of strstr to find the content-length header. svn:r13005 --- src/or/buffers.c | 112 ++++++++++++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 110 insertions(+), 2 deletions(-) (limited to 'src') diff --git a/src/or/buffers.c b/src/or/buffers.c index ea9ff3a2a..729b987b4 100644 --- a/src/or/buffers.c +++ b/src/or/buffers.c @@ -943,6 +943,93 @@ move_buf_to_buf(buf_t *buf_out, buf_t *buf_in, size_t *buf_flushlen) return cp; } +// #define BUFPOS +#ifdef BUFPOS +typedef struct buf_pos_t { + chunk_t *chunk; + int pos; + int pos_absolute; +}; + +static void +buf_pos_init(buf_t *buf, buf_pos_t *out) +{ + out->chunk = buf->head; + out->pos = 0; + out->pos_absolute = 0; +} + +static int +buf_find_pos_of_char(const buf_t *buf, char ch, buf_pos_t *out) +{ + chunk_t *chunk; + int offset = 0; + int pos = chunk->pos; + for (chunk = out->chunk; chunk; chunk = chunk->next) { + char *cp = memchr(chunk->data+pos, ch, chunk->datalen-pos); + if (cp) { + out->chunk = chunk; + out->pos = cp - chunk->data; + out->pos_absolute = offset + (cp - chunk->data); + return out->pos_absolute; + } else { + offset += chunk->datalen; + pos = 0; + } + } + return -1; +} + +static INLINE int +buf_pos_inc(buf_pos_t *pos) +{ + if (pos->pos == pos->chunk->datalen) { + if (!pos->chunk->next) + return -1; + pos->chunk = pos->chunk->next; + pos->pos = 0; + } else { + ++pos->pos; + } + ++pos->pos_absolute; +} + +static int +buf_matches_at_pos(const buf_t *buf, const buf_pos_t *pos, const char *s, + int n) +{ + buf_pos_t p; + memcpy(p, pos, sizeof(p)); + + while (n) { + char ch = p->chunk->data[p->pos]; + if (ch != *s) + return 0; + ++s; + --n; + if (buf_pos_inc(p)<0) + return 0; + } + return 1; +} + +static int +buf_find_string_offset(const char *buf, const char *s, int n) +{ + buf_pos_t pos; + buf_pos_init(buf, &pos); + while (buf_find_pos_of_char(buf, *s, &pos) >= 0) { + if (buf_matches_at_pos(buf, pos, s, n)) { + return pos->pos_absolute; + } else { + if (buf_pos_inc(pos)<0) + return -1; + } + } + return -1; +} +#endif + /** There is a (possibly incomplete) http statement on buf, of the * form "\%s\\r\\n\\r\\n\%s", headers, body. (body may contain nuls.) * If a) the headers include a Content-Length field and all bytes in @@ -968,14 +1055,33 @@ fetch_from_buf_http(buf_t *buf, char **body_out, size_t *body_used, size_t max_bodylen, int force_complete) { - char *headers, *body, *p; + char *headers, *p, *body; size_t headerlen, bodylen, contentlen; +#ifdef BUFPOS + int crlf_offset; +#endif check(); if (!buf->head) return 0; headers = buf->head->data; + +#ifdef BUFPOS + crlf_offset = buf_find_string_offset(buf, "\r\n\r\n", 4); + if (crlf_offset > max_headerlen || + (crlf_offset < 0 && buf->datalen > max_headerlen)) { + log_debug(LD_HTTP,"headers too long."); + return -1; + } else if (crlf_offset < 0) { + log_debug(LD_HTTP,"headers not all here yet."); + return 0; + } + if (buf->head->datalen < crlf_offset + 4) + buf_pullup(buf, crlf_offset+4, 0); + headerlen = crlf_offset + 4; + body = buf->data + headerlen; /*XXX020 unused. */ +#else /* See if CRLFCRLF is already in the head chunk. If it is, we don't need * to move or resize anything. */ body = (char*) tor_memmem(buf->head->data, buf->head->datalen, @@ -1001,6 +1107,8 @@ fetch_from_buf_http(buf_t *buf, } body += 4; /* Skip the the CRLFCRLF */ headerlen = body-headers; /* includes the CRLFCRLF */ +#endif + bodylen = buf->datalen - headerlen; log_debug(LD_HTTP,"headerlen %d, bodylen %d.", (int)headerlen, (int)bodylen); @@ -1016,7 +1124,7 @@ fetch_from_buf_http(buf_t *buf, } #define CONTENT_LENGTH "\r\nContent-Length: " - p = strstr(headers, CONTENT_LENGTH); + p = (char*) tor_memstr(headers, headerlen, CONTENT_LENGTH); if (p) { int i; i = atoi(p+strlen(CONTENT_LENGTH)); -- cgit v1.2.3