diff options
Diffstat (limited to 'lib/libfetch/http.c')
-rw-r--r-- | lib/libfetch/http.c | 461 |
1 files changed, 461 insertions, 0 deletions
diff --git a/lib/libfetch/http.c b/lib/libfetch/http.c new file mode 100644 index 0000000..5c49ec5 --- /dev/null +++ b/lib/libfetch/http.c @@ -0,0 +1,461 @@ +/*- + * Copyright (c) 1998 Dag-Erling Coïdan Smørgrav + * All rights reserved. + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions + * are met: + * 1. Redistributions of source code must retain the above copyright + * notice, this list of conditions and the following disclaimer + * in this position and unchanged. + * 2. Redistributions in binary form must reproduce the above copyright + * notice, this list of conditions and the following disclaimer in the + * documentation and/or other materials provided with the distribution. + * 3. The name of the author may not be used to endorse or promote products + * derived from this software without specific prior written permission + * + * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR + * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES + * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. + * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, + * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT + * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, + * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY + * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT + * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF + * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + * + * $Id: http.c,v 1.9 1998/12/16 11:44:31 des Exp $ + */ + +/* + * The base64 code in this file is based on code from MIT fetch, which + * has the following copyright and license: + * + *- + * Copyright 1997 Massachusetts Institute of Technology + * + * Permission to use, copy, modify, and distribute this software and + * its documentation for any purpose and without fee is hereby + * granted, provided that both the above copyright notice and this + * permission notice appear in all copies, that both the above + * copyright notice and this permission notice appear in all + * supporting documentation, and that the name of M.I.T. not be used + * in advertising or publicity pertaining to distribution of the + * software without specific, written prior permission. M.I.T. makes + * no representations about the suitability of this software for any + * purpose. It is provided "as is" without express or implied + * warranty. + * + * THIS SOFTWARE IS PROVIDED BY M.I.T. ``AS IS''. M.I.T. DISCLAIMS + * ALL EXPRESS OR IMPLIED WARRANTIES WITH REGARD TO THIS SOFTWARE, + * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF + * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT + * SHALL M.I.T. BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, + * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT + * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF + * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND + * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, + * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT + * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF + * SUCH DAMAGE. */ + +#include <sys/param.h> + +#include <err.h> +#include <ctype.h> +#include <stdarg.h> +#include <stdio.h> +#include <stdlib.h> +#include <string.h> +#include <unistd.h> + +#include "fetch.h" +#include "common.h" +#include "httperr.h" + +extern char *__progname; + +#define ENDL "\r\n" + +struct cookie +{ + FILE *real_f; +#define ENC_NONE 0 +#define ENC_CHUNKED 1 + int encoding; /* 1 = chunked, 0 = none */ +#define HTTPCTYPELEN 59 + char content_type[HTTPCTYPELEN+1]; + char *buf; + int b_cur, eof; + unsigned b_len, chunksize; +}; + +/* + * Send a formatted line; optionally echo to terminal + */ +static int +_http_cmd(FILE *f, char *fmt, ...) +{ + va_list ap; + + va_start(ap, fmt); + vfprintf(f, fmt, ap); +#ifndef NDEBUG + fprintf(stderr, "\033[1m>>> "); + vfprintf(stderr, fmt, ap); + fprintf(stderr, "\033[m"); +#endif + va_end(ap); + + return 0; /* XXX */ +} + +/* + * Fill the input buffer, do chunk decoding on the fly + */ +static char * +_http_fillbuf(struct cookie *c) +{ + char *ln; + unsigned int len; + + if (c->eof) + return NULL; + + if (c->encoding == ENC_NONE) { + c->buf = fgetln(c->real_f, &(c->b_len)); + c->b_cur = 0; + } else if (c->encoding == ENC_CHUNKED) { + if (c->chunksize == 0) { + ln = fgetln(c->real_f, &len); + DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): new chunk: " + "%*.*s\033[m\n", (int)len-2, (int)len-2, ln)); + sscanf(ln, "%x", &(c->chunksize)); + if (!c->chunksize) { + DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): " + "end of last chunk\033[m\n")); + c->eof = 1; + return NULL; + } + DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): " + "new chunk: %X\033[m\n", c->chunksize)); + } + c->buf = fgetln(c->real_f, &(c->b_len)); + if (c->b_len > c->chunksize) + c->b_len = c->chunksize; + c->chunksize -= c->b_len; + c->b_cur = 0; + } + else return NULL; /* unknown encoding */ + return c->buf; +} + +/* + * Read function + */ +static int +_http_readfn(struct cookie *c, char *buf, int len) +{ + int l, pos = 0; + while (len) { + /* empty buffer */ + if (!c->buf || (c->b_cur == c->b_len)) + if (!_http_fillbuf(c)) + break; + + l = c->b_len - c->b_cur; + if (len < l) l = len; + memcpy(buf + pos, c->buf + c->b_cur, l); + c->b_cur += l; + pos += l; + len -= l; + } + + if (ferror(c->real_f)) + return -1; + else return pos; +} + +/* + * Write function + */ +static int +_http_writefn(struct cookie *c, const char *buf, int len) +{ + size_t r = fwrite(buf, 1, (size_t)len, c->real_f); + return r ? r : -1; +} + +/* + * Close function + */ +static int +_http_closefn(struct cookie *c) +{ + int r = fclose(c->real_f); + free(c); + return (r == EOF) ? -1 : 0; +} + +/* + * Extract content type from cookie + */ +char * +fetchContentType(FILE *f) +{ + /* + * We have no way of making sure this really *is* one of our cookies, + * so just check for a null pointer and hope for the best. + */ + return f->_cookie ? (((struct cookie *)f->_cookie)->content_type) : NULL; +} + +/* + * Base64 encoding + */ +int +_http_base64(char *dst, char *src, int l) +{ + static const char base64[] = + "ABCDEFGHIJKLMNOPQRSTUVWXYZ" + "abcdefghijklmnopqrstuvwxyz" + "0123456789+/"; + int t, r = 0; + + while (l >= 3) { + t = (src[0] << 16) | (src[1] << 8) | src[2]; + dst[0] = base64[(t >> 18) & 0x3f]; + dst[1] = base64[(t >> 12) & 0x3f]; + dst[2] = base64[(t >> 6) & 0x3f]; + dst[3] = base64[(t >> 0) & 0x3f]; + src += 3; l -= 3; + dst += 4; r += 4; + } + + switch (l) { + case 2: + t = (src[0] << 16) | (src[1] << 8); + dst[0] = base64[(t >> 18) & 0x3f]; + dst[1] = base64[(t >> 12) & 0x3f]; + dst[2] = base64[(t >> 6) & 0x3f]; + dst[3] = '='; + dst += 4; + r += 4; + break; + case 1: + t = src[0] << 16; + dst[0] = base64[(t >> 18) & 0x3f]; + dst[1] = base64[(t >> 12) & 0x3f]; + dst[2] = dst[3] = '='; + dst += 4; + r += 4; + break; + case 0: + break; + } + + *dst = 0; + return r; +} + +/* + * Encode username and password + */ +char * +_http_auth(char *usr, char *pwd) +{ + int len, lu, lp; + char *str, *s; + + lu = strlen(usr); + lp = strlen(pwd); + + len = (lu * 4 + 2) / 3 /* user name, round up */ + + 1 /* colon */ + + (lp * 4 + 2) / 3 /* password, round up */ + + 1; /* null */ + + if ((s = str = (char *)malloc(len)) == NULL) + return NULL; + + s += _http_base64(s, usr, lu); + *s++ = ':'; + s += _http_base64(s, pwd, lp); + *s = 0; + + return str; +} + +/* + * Retrieve a file by HTTP + */ +FILE * +fetchGetHTTP(struct url *URL, char *flags) +{ + int sd = -1, e, i, enc = ENC_NONE, verbose; + struct cookie *c; + char *ln, *p, *px, *q; + FILE *f, *cf; + size_t len; + + verbose = (strchr(flags, 'v') != NULL); + + /* allocate cookie */ + if ((c = calloc(1, sizeof(struct cookie))) == NULL) + return NULL; + + /* check port */ + if (!URL->port) + URL->port = 80; /* default HTTP port */ + + /* attempt to connect to proxy server */ + if ((px = getenv("HTTP_PROXY")) != NULL) { + char host[MAXHOSTNAMELEN]; + int port = 3128; /* XXX I think 3128 is default... check? */ + + /* measure length */ + len = strcspn(px, ":"); + + /* get port (atoi is a little too tolerant perhaps?) */ + if (px[len] == ':') + port = atoi(px+len+1); + + /* get host name */ + if (len >= MAXHOSTNAMELEN) + len = MAXHOSTNAMELEN - 1; + strncpy(host, px, len); + host[len] = 0; + + /* connect */ + sd = _fetch_connect(host, port, verbose); + } + + /* if no proxy is configured or could be contacted, try direct */ + if (sd == -1) { + if ((sd = _fetch_connect(URL->host, URL->port, verbose)) == -1) + goto ouch; + } + + /* reopen as stream */ + if ((f = fdopen(sd, "r+")) == NULL) + goto ouch; + c->real_f = f; + + /* send request (proxies require absolute form, so use that) */ + if (verbose) + _fetch_info("requesting http://%s:%d%s", + URL->host, URL->port, URL->doc); + _http_cmd(f, "GET http://%s:%d%s HTTP/1.1" ENDL, + URL->host, URL->port, URL->doc); + + /* start sending headers away */ + if (URL->user[0] || URL->pwd[0]) { + char *auth_str = _http_auth(URL->user, URL->pwd); + if (!auth_str) + goto fouch; + _http_cmd(f, "Authorization: Basic %s" ENDL, auth_str); + free(auth_str); + } + _http_cmd(f, "Host: %s:%d" ENDL, URL->host, URL->port); + _http_cmd(f, "User-Agent: %s " _LIBFETCH_VER ENDL, __progname); + _http_cmd(f, "Connection: close" ENDL ENDL); + + /* get response */ + if ((ln = fgetln(f, &len)) == NULL) + goto fouch; + DEBUG(fprintf(stderr, "response: [\033[1m%*.*s\033[m]\n", + (int)len-2, (int)len-2, ln)); + + /* we can't use strchr() and friends since ln isn't NUL-terminated */ + p = ln; + while ((p < ln + len) && !isspace(*p)) + p++; + while ((p < ln + len) && !isdigit(*p)) + p++; + if (!isdigit(*p)) + goto fouch; + e = atoi(p); + DEBUG(fprintf(stderr, "code: [\033[1m%d\033[m]\n", e)); + + /* add code to handle redirects later */ + if (e != 200) { + _http_seterr(e); + goto fouch; + } + + /* browse through header */ + while (1) { + if ((ln = fgetln(f, &len)) == NULL) + goto fouch; + if ((ln[0] == '\r') || (ln[0] == '\n')) + break; + DEBUG(fprintf(stderr, "header: [\033[1m%*.*s\033[m]\n", + (int)len-2, (int)len-2, ln)); +#define XFERENC "Transfer-Encoding:" + if (strncasecmp(ln, XFERENC, sizeof(XFERENC)-1) == 0) { + p = ln + sizeof(XFERENC) - 1; + while ((p < ln + len) && isspace(*p)) + p++; + for (q = p; (q < ln + len) && !isspace(*q); q++) + /* VOID */ ; + *q = 0; + if (strcasecmp(p, "chunked") == 0) + enc = ENC_CHUNKED; + DEBUG(fprintf(stderr, "xferenc: [\033[1m%s\033[m]\n", p)); +#undef XFERENC +#define CONTTYPE "Content-Type:" + } else if (strncasecmp(ln, CONTTYPE, sizeof(CONTTYPE)-1) == 0) { + p = ln + sizeof(CONTTYPE) - 1; + while ((p < ln + len) && isspace(*p)) + p++; + for (i = 0; p < ln + len; p++) + if (i < HTTPCTYPELEN) + c->content_type[i++] = *p; + do c->content_type[i--] = 0; while (isspace(c->content_type[i])); + DEBUG(fprintf(stderr, "conttype: [\033[1m%s\033[m]\n", + c->content_type)); +#undef CONTTYPE + } + } + + /* only body remains */ + c->encoding = enc; + cf = funopen(c, + (int (*)(void *, char *, int))_http_readfn, + (int (*)(void *, const char *, int))_http_writefn, + (fpos_t (*)(void *, fpos_t, int))NULL, + (int (*)(void *))_http_closefn); + if (cf == NULL) + goto fouch; + return cf; + +ouch: + if (sd >= 0) + close(sd); + free(c); + _http_seterr(999); /* XXX do this properly RSN */ + return NULL; +fouch: + fclose(f); + free(c); + _http_seterr(999); /* XXX do this properly RSN */ + return NULL; +} + +FILE * +fetchPutHTTP(struct url *URL, char *flags) +{ + warnx("fetchPutHTTP(): not implemented"); + return NULL; +} + +/* + * Get an HTTP document's metadata + */ +int +fetchStatHTTP(struct url *url, struct url_stat *us, char *flags) +{ + warnx("fetchStatHTTP(): not implemented"); + return -1; +} |