14ca1ab94SDag-Erling Smørgrav /*- 24ca1ab94SDag-Erling Smørgrav * Copyright (c) 1998 Dag-Erling Co�dan Sm�rgrav 34ca1ab94SDag-Erling Smørgrav * All rights reserved. 44ca1ab94SDag-Erling Smørgrav * 54ca1ab94SDag-Erling Smørgrav * Redistribution and use in source and binary forms, with or without 64ca1ab94SDag-Erling Smørgrav * modification, are permitted provided that the following conditions 74ca1ab94SDag-Erling Smørgrav * are met: 84ca1ab94SDag-Erling Smørgrav * 1. Redistributions of source code must retain the above copyright 94ca1ab94SDag-Erling Smørgrav * notice, this list of conditions and the following disclaimer 104ca1ab94SDag-Erling Smørgrav * in this position and unchanged. 114ca1ab94SDag-Erling Smørgrav * 2. Redistributions in binary form must reproduce the above copyright 124ca1ab94SDag-Erling Smørgrav * notice, this list of conditions and the following disclaimer in the 134ca1ab94SDag-Erling Smørgrav * documentation and/or other materials provided with the distribution. 144ca1ab94SDag-Erling Smørgrav * 3. The name of the author may not be used to endorse or promote products 154ca1ab94SDag-Erling Smørgrav * derived from this software without specific prior written permission 164ca1ab94SDag-Erling Smørgrav * 174ca1ab94SDag-Erling Smørgrav * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 184ca1ab94SDag-Erling Smørgrav * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 194ca1ab94SDag-Erling Smørgrav * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 204ca1ab94SDag-Erling Smørgrav * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 214ca1ab94SDag-Erling Smørgrav * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 224ca1ab94SDag-Erling Smørgrav * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 234ca1ab94SDag-Erling Smørgrav * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 244ca1ab94SDag-Erling Smørgrav * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 254ca1ab94SDag-Erling Smørgrav * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 264ca1ab94SDag-Erling Smørgrav * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 274ca1ab94SDag-Erling Smørgrav * 287f3dea24SPeter Wemm * $FreeBSD$ 294ca1ab94SDag-Erling Smørgrav */ 304ca1ab94SDag-Erling Smørgrav 31f62e5228SDag-Erling Smørgrav /* 32f62e5228SDag-Erling Smørgrav * The base64 code in this file is based on code from MIT fetch, which 33f62e5228SDag-Erling Smørgrav * has the following copyright and license: 34f62e5228SDag-Erling Smørgrav * 35f62e5228SDag-Erling Smørgrav *- 36f62e5228SDag-Erling Smørgrav * Copyright 1997 Massachusetts Institute of Technology 37f62e5228SDag-Erling Smørgrav * 38f62e5228SDag-Erling Smørgrav * Permission to use, copy, modify, and distribute this software and 39f62e5228SDag-Erling Smørgrav * its documentation for any purpose and without fee is hereby 40f62e5228SDag-Erling Smørgrav * granted, provided that both the above copyright notice and this 41f62e5228SDag-Erling Smørgrav * permission notice appear in all copies, that both the above 42f62e5228SDag-Erling Smørgrav * copyright notice and this permission notice appear in all 43f62e5228SDag-Erling Smørgrav * supporting documentation, and that the name of M.I.T. not be used 44f62e5228SDag-Erling Smørgrav * in advertising or publicity pertaining to distribution of the 45f62e5228SDag-Erling Smørgrav * software without specific, written prior permission. M.I.T. makes 46f62e5228SDag-Erling Smørgrav * no representations about the suitability of this software for any 47f62e5228SDag-Erling Smørgrav * purpose. It is provided "as is" without express or implied 48f62e5228SDag-Erling Smørgrav * warranty. 49f62e5228SDag-Erling Smørgrav * 50f62e5228SDag-Erling Smørgrav * THIS SOFTWARE IS PROVIDED BY M.I.T. ``AS IS''. M.I.T. DISCLAIMS 51f62e5228SDag-Erling Smørgrav * ALL EXPRESS OR IMPLIED WARRANTIES WITH REGARD TO THIS SOFTWARE, 52f62e5228SDag-Erling Smørgrav * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF 53f62e5228SDag-Erling Smørgrav * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT 54f62e5228SDag-Erling Smørgrav * SHALL M.I.T. BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 55f62e5228SDag-Erling Smørgrav * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 56f62e5228SDag-Erling Smørgrav * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF 57f62e5228SDag-Erling Smørgrav * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND 58f62e5228SDag-Erling Smørgrav * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 59f62e5228SDag-Erling Smørgrav * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT 60f62e5228SDag-Erling Smørgrav * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 61f62e5228SDag-Erling Smørgrav * SUCH DAMAGE. */ 62f62e5228SDag-Erling Smørgrav 634ca1ab94SDag-Erling Smørgrav #include <sys/param.h> 644ca1ab94SDag-Erling Smørgrav 654ca1ab94SDag-Erling Smørgrav #include <err.h> 664ca1ab94SDag-Erling Smørgrav #include <ctype.h> 67e6182307SDag-Erling Smørgrav #include <netdb.h> 68f62e5228SDag-Erling Smørgrav #include <stdarg.h> 694ca1ab94SDag-Erling Smørgrav #include <stdio.h> 704ca1ab94SDag-Erling Smørgrav #include <stdlib.h> 714ca1ab94SDag-Erling Smørgrav #include <string.h> 724ca1ab94SDag-Erling Smørgrav #include <unistd.h> 734ca1ab94SDag-Erling Smørgrav 744ca1ab94SDag-Erling Smørgrav #include "fetch.h" 75842a95ccSDag-Erling Smørgrav #include "common.h" 760fba3a00SDag-Erling Smørgrav #include "httperr.h" 774ca1ab94SDag-Erling Smørgrav 784ca1ab94SDag-Erling Smørgrav extern char *__progname; 794ca1ab94SDag-Erling Smørgrav 804ca1ab94SDag-Erling Smørgrav #define ENDL "\r\n" 814ca1ab94SDag-Erling Smørgrav 823d2a8471SDag-Erling Smørgrav #define HTTP_OK 200 833d2a8471SDag-Erling Smørgrav #define HTTP_PARTIAL 206 843d2a8471SDag-Erling Smørgrav 854ca1ab94SDag-Erling Smørgrav struct cookie 864ca1ab94SDag-Erling Smørgrav { 874ca1ab94SDag-Erling Smørgrav FILE *real_f; 884ca1ab94SDag-Erling Smørgrav #define ENC_NONE 0 894ca1ab94SDag-Erling Smørgrav #define ENC_CHUNKED 1 904ca1ab94SDag-Erling Smørgrav int encoding; /* 1 = chunked, 0 = none */ 914ca1ab94SDag-Erling Smørgrav #define HTTPCTYPELEN 59 924ca1ab94SDag-Erling Smørgrav char content_type[HTTPCTYPELEN+1]; 934ca1ab94SDag-Erling Smørgrav char *buf; 944ca1ab94SDag-Erling Smørgrav int b_cur, eof; 954ca1ab94SDag-Erling Smørgrav unsigned b_len, chunksize; 964ca1ab94SDag-Erling Smørgrav }; 974ca1ab94SDag-Erling Smørgrav 98f62e5228SDag-Erling Smørgrav /* 99f62e5228SDag-Erling Smørgrav * Send a formatted line; optionally echo to terminal 100f62e5228SDag-Erling Smørgrav */ 101f62e5228SDag-Erling Smørgrav static int 102f62e5228SDag-Erling Smørgrav _http_cmd(FILE *f, char *fmt, ...) 103f62e5228SDag-Erling Smørgrav { 104f62e5228SDag-Erling Smørgrav va_list ap; 105f62e5228SDag-Erling Smørgrav 106f62e5228SDag-Erling Smørgrav va_start(ap, fmt); 107f62e5228SDag-Erling Smørgrav vfprintf(f, fmt, ap); 108f62e5228SDag-Erling Smørgrav #ifndef NDEBUG 109f62e5228SDag-Erling Smørgrav fprintf(stderr, "\033[1m>>> "); 110f62e5228SDag-Erling Smørgrav vfprintf(stderr, fmt, ap); 111f62e5228SDag-Erling Smørgrav fprintf(stderr, "\033[m"); 112f62e5228SDag-Erling Smørgrav #endif 113f62e5228SDag-Erling Smørgrav va_end(ap); 114f62e5228SDag-Erling Smørgrav 115f62e5228SDag-Erling Smørgrav return 0; /* XXX */ 116f62e5228SDag-Erling Smørgrav } 117f62e5228SDag-Erling Smørgrav 118f62e5228SDag-Erling Smørgrav /* 119f62e5228SDag-Erling Smørgrav * Fill the input buffer, do chunk decoding on the fly 120f62e5228SDag-Erling Smørgrav */ 1214ca1ab94SDag-Erling Smørgrav static char * 1224ca1ab94SDag-Erling Smørgrav _http_fillbuf(struct cookie *c) 1234ca1ab94SDag-Erling Smørgrav { 1244ca1ab94SDag-Erling Smørgrav char *ln; 1254ca1ab94SDag-Erling Smørgrav unsigned int len; 1264ca1ab94SDag-Erling Smørgrav 1274ca1ab94SDag-Erling Smørgrav if (c->eof) 1284ca1ab94SDag-Erling Smørgrav return NULL; 1294ca1ab94SDag-Erling Smørgrav 1304ca1ab94SDag-Erling Smørgrav if (c->encoding == ENC_NONE) { 1314ca1ab94SDag-Erling Smørgrav c->buf = fgetln(c->real_f, &(c->b_len)); 1324ca1ab94SDag-Erling Smørgrav c->b_cur = 0; 1334ca1ab94SDag-Erling Smørgrav } else if (c->encoding == ENC_CHUNKED) { 1344ca1ab94SDag-Erling Smørgrav if (c->chunksize == 0) { 1354ca1ab94SDag-Erling Smørgrav ln = fgetln(c->real_f, &len); 1364ca1ab94SDag-Erling Smørgrav DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): new chunk: " 1374ca1ab94SDag-Erling Smørgrav "%*.*s\033[m\n", (int)len-2, (int)len-2, ln)); 1384ca1ab94SDag-Erling Smørgrav sscanf(ln, "%x", &(c->chunksize)); 1394ca1ab94SDag-Erling Smørgrav if (!c->chunksize) { 1404ca1ab94SDag-Erling Smørgrav DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): " 1414ca1ab94SDag-Erling Smørgrav "end of last chunk\033[m\n")); 1424ca1ab94SDag-Erling Smørgrav c->eof = 1; 1434ca1ab94SDag-Erling Smørgrav return NULL; 1444ca1ab94SDag-Erling Smørgrav } 1454ca1ab94SDag-Erling Smørgrav DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): " 1464ca1ab94SDag-Erling Smørgrav "new chunk: %X\033[m\n", c->chunksize)); 1474ca1ab94SDag-Erling Smørgrav } 1484ca1ab94SDag-Erling Smørgrav c->buf = fgetln(c->real_f, &(c->b_len)); 1494ca1ab94SDag-Erling Smørgrav if (c->b_len > c->chunksize) 1504ca1ab94SDag-Erling Smørgrav c->b_len = c->chunksize; 1514ca1ab94SDag-Erling Smørgrav c->chunksize -= c->b_len; 1524ca1ab94SDag-Erling Smørgrav c->b_cur = 0; 1534ca1ab94SDag-Erling Smørgrav } 1544ca1ab94SDag-Erling Smørgrav else return NULL; /* unknown encoding */ 1554ca1ab94SDag-Erling Smørgrav return c->buf; 1564ca1ab94SDag-Erling Smørgrav } 1574ca1ab94SDag-Erling Smørgrav 158f62e5228SDag-Erling Smørgrav /* 159f62e5228SDag-Erling Smørgrav * Read function 160f62e5228SDag-Erling Smørgrav */ 1614ca1ab94SDag-Erling Smørgrav static int 1624ca1ab94SDag-Erling Smørgrav _http_readfn(struct cookie *c, char *buf, int len) 1634ca1ab94SDag-Erling Smørgrav { 1644ca1ab94SDag-Erling Smørgrav int l, pos = 0; 1654ca1ab94SDag-Erling Smørgrav while (len) { 1664ca1ab94SDag-Erling Smørgrav /* empty buffer */ 1674ca1ab94SDag-Erling Smørgrav if (!c->buf || (c->b_cur == c->b_len)) 1684ca1ab94SDag-Erling Smørgrav if (!_http_fillbuf(c)) 1694ca1ab94SDag-Erling Smørgrav break; 1704ca1ab94SDag-Erling Smørgrav 1714ca1ab94SDag-Erling Smørgrav l = c->b_len - c->b_cur; 1724ca1ab94SDag-Erling Smørgrav if (len < l) l = len; 1734ca1ab94SDag-Erling Smørgrav memcpy(buf + pos, c->buf + c->b_cur, l); 1744ca1ab94SDag-Erling Smørgrav c->b_cur += l; 1754ca1ab94SDag-Erling Smørgrav pos += l; 1764ca1ab94SDag-Erling Smørgrav len -= l; 1774ca1ab94SDag-Erling Smørgrav } 1784ca1ab94SDag-Erling Smørgrav 1794ca1ab94SDag-Erling Smørgrav if (ferror(c->real_f)) 1804ca1ab94SDag-Erling Smørgrav return -1; 1814ca1ab94SDag-Erling Smørgrav else return pos; 1824ca1ab94SDag-Erling Smørgrav } 1834ca1ab94SDag-Erling Smørgrav 184f62e5228SDag-Erling Smørgrav /* 185f62e5228SDag-Erling Smørgrav * Write function 186f62e5228SDag-Erling Smørgrav */ 1874ca1ab94SDag-Erling Smørgrav static int 1884ca1ab94SDag-Erling Smørgrav _http_writefn(struct cookie *c, const char *buf, int len) 1894ca1ab94SDag-Erling Smørgrav { 1904ca1ab94SDag-Erling Smørgrav size_t r = fwrite(buf, 1, (size_t)len, c->real_f); 1914ca1ab94SDag-Erling Smørgrav return r ? r : -1; 1924ca1ab94SDag-Erling Smørgrav } 1934ca1ab94SDag-Erling Smørgrav 194f62e5228SDag-Erling Smørgrav /* 195f62e5228SDag-Erling Smørgrav * Close function 196f62e5228SDag-Erling Smørgrav */ 1974ca1ab94SDag-Erling Smørgrav static int 1984ca1ab94SDag-Erling Smørgrav _http_closefn(struct cookie *c) 1994ca1ab94SDag-Erling Smørgrav { 2004ca1ab94SDag-Erling Smørgrav int r = fclose(c->real_f); 2014ca1ab94SDag-Erling Smørgrav free(c); 2024ca1ab94SDag-Erling Smørgrav return (r == EOF) ? -1 : 0; 2034ca1ab94SDag-Erling Smørgrav } 2044ca1ab94SDag-Erling Smørgrav 205f62e5228SDag-Erling Smørgrav /* 206f62e5228SDag-Erling Smørgrav * Extract content type from cookie 207f62e5228SDag-Erling Smørgrav */ 2084ca1ab94SDag-Erling Smørgrav char * 2094ca1ab94SDag-Erling Smørgrav fetchContentType(FILE *f) 2104ca1ab94SDag-Erling Smørgrav { 2114ca1ab94SDag-Erling Smørgrav /* 2124ca1ab94SDag-Erling Smørgrav * We have no way of making sure this really *is* one of our cookies, 2134ca1ab94SDag-Erling Smørgrav * so just check for a null pointer and hope for the best. 2144ca1ab94SDag-Erling Smørgrav */ 2154ca1ab94SDag-Erling Smørgrav return f->_cookie ? (((struct cookie *)f->_cookie)->content_type) : NULL; 2164ca1ab94SDag-Erling Smørgrav } 2174ca1ab94SDag-Erling Smørgrav 218f62e5228SDag-Erling Smørgrav /* 219f62e5228SDag-Erling Smørgrav * Base64 encoding 220f62e5228SDag-Erling Smørgrav */ 221f62e5228SDag-Erling Smørgrav int 222f62e5228SDag-Erling Smørgrav _http_base64(char *dst, char *src, int l) 223f62e5228SDag-Erling Smørgrav { 224f62e5228SDag-Erling Smørgrav static const char base64[] = 225f62e5228SDag-Erling Smørgrav "ABCDEFGHIJKLMNOPQRSTUVWXYZ" 226f62e5228SDag-Erling Smørgrav "abcdefghijklmnopqrstuvwxyz" 227f62e5228SDag-Erling Smørgrav "0123456789+/"; 228f62e5228SDag-Erling Smørgrav int t, r = 0; 229f62e5228SDag-Erling Smørgrav 230f62e5228SDag-Erling Smørgrav while (l >= 3) { 231f62e5228SDag-Erling Smørgrav t = (src[0] << 16) | (src[1] << 8) | src[2]; 232f62e5228SDag-Erling Smørgrav dst[0] = base64[(t >> 18) & 0x3f]; 233f62e5228SDag-Erling Smørgrav dst[1] = base64[(t >> 12) & 0x3f]; 234f62e5228SDag-Erling Smørgrav dst[2] = base64[(t >> 6) & 0x3f]; 235f62e5228SDag-Erling Smørgrav dst[3] = base64[(t >> 0) & 0x3f]; 236f62e5228SDag-Erling Smørgrav src += 3; l -= 3; 237f62e5228SDag-Erling Smørgrav dst += 4; r += 4; 238f62e5228SDag-Erling Smørgrav } 239f62e5228SDag-Erling Smørgrav 240f62e5228SDag-Erling Smørgrav switch (l) { 241f62e5228SDag-Erling Smørgrav case 2: 242f62e5228SDag-Erling Smørgrav t = (src[0] << 16) | (src[1] << 8); 243f62e5228SDag-Erling Smørgrav dst[0] = base64[(t >> 18) & 0x3f]; 244f62e5228SDag-Erling Smørgrav dst[1] = base64[(t >> 12) & 0x3f]; 245f62e5228SDag-Erling Smørgrav dst[2] = base64[(t >> 6) & 0x3f]; 246f62e5228SDag-Erling Smørgrav dst[3] = '='; 247f62e5228SDag-Erling Smørgrav dst += 4; 248f62e5228SDag-Erling Smørgrav r += 4; 249f62e5228SDag-Erling Smørgrav break; 250f62e5228SDag-Erling Smørgrav case 1: 251f62e5228SDag-Erling Smørgrav t = src[0] << 16; 252f62e5228SDag-Erling Smørgrav dst[0] = base64[(t >> 18) & 0x3f]; 253f62e5228SDag-Erling Smørgrav dst[1] = base64[(t >> 12) & 0x3f]; 254f62e5228SDag-Erling Smørgrav dst[2] = dst[3] = '='; 255f62e5228SDag-Erling Smørgrav dst += 4; 256f62e5228SDag-Erling Smørgrav r += 4; 257f62e5228SDag-Erling Smørgrav break; 258f62e5228SDag-Erling Smørgrav case 0: 259f62e5228SDag-Erling Smørgrav break; 260f62e5228SDag-Erling Smørgrav } 261f62e5228SDag-Erling Smørgrav 262f62e5228SDag-Erling Smørgrav *dst = 0; 263f62e5228SDag-Erling Smørgrav return r; 264f62e5228SDag-Erling Smørgrav } 265f62e5228SDag-Erling Smørgrav 266f62e5228SDag-Erling Smørgrav /* 267f62e5228SDag-Erling Smørgrav * Encode username and password 268f62e5228SDag-Erling Smørgrav */ 269f62e5228SDag-Erling Smørgrav char * 270f62e5228SDag-Erling Smørgrav _http_auth(char *usr, char *pwd) 271f62e5228SDag-Erling Smørgrav { 272f62e5228SDag-Erling Smørgrav int len, lu, lp; 273f62e5228SDag-Erling Smørgrav char *str, *s; 274f62e5228SDag-Erling Smørgrav 275f62e5228SDag-Erling Smørgrav lu = strlen(usr); 276f62e5228SDag-Erling Smørgrav lp = strlen(pwd); 277f62e5228SDag-Erling Smørgrav 278f62e5228SDag-Erling Smørgrav len = (lu * 4 + 2) / 3 /* user name, round up */ 279f62e5228SDag-Erling Smørgrav + 1 /* colon */ 280f62e5228SDag-Erling Smørgrav + (lp * 4 + 2) / 3 /* password, round up */ 281f62e5228SDag-Erling Smørgrav + 1; /* null */ 282f62e5228SDag-Erling Smørgrav 283f62e5228SDag-Erling Smørgrav if ((s = str = (char *)malloc(len)) == NULL) 284f62e5228SDag-Erling Smørgrav return NULL; 285f62e5228SDag-Erling Smørgrav 286f62e5228SDag-Erling Smørgrav s += _http_base64(s, usr, lu); 287f62e5228SDag-Erling Smørgrav *s++ = ':'; 288f62e5228SDag-Erling Smørgrav s += _http_base64(s, pwd, lp); 289f62e5228SDag-Erling Smørgrav *s = 0; 290f62e5228SDag-Erling Smørgrav 291f62e5228SDag-Erling Smørgrav return str; 292f62e5228SDag-Erling Smørgrav } 293f62e5228SDag-Erling Smørgrav 294f62e5228SDag-Erling Smørgrav /* 295d8acd8dcSDag-Erling Smørgrav * Retrieve a file by HTTP 296f62e5228SDag-Erling Smørgrav */ 2974ca1ab94SDag-Erling Smørgrav FILE * 298d8acd8dcSDag-Erling Smørgrav fetchGetHTTP(struct url *URL, char *flags) 2994ca1ab94SDag-Erling Smørgrav { 300f5f109a0SDag-Erling Smørgrav int sd = -1, e, i, enc = ENC_NONE, direct, verbose; 3014ca1ab94SDag-Erling Smørgrav struct cookie *c; 3023b7a6740SDag-Erling Smørgrav char *ln, *p, *px, *q; 3034ca1ab94SDag-Erling Smørgrav FILE *f, *cf; 3044ca1ab94SDag-Erling Smørgrav size_t len; 3053d2a8471SDag-Erling Smørgrav off_t pos = 0; 3064ca1ab94SDag-Erling Smørgrav 307f5f109a0SDag-Erling Smørgrav direct = (flags && strchr(flags, 'd')); 308f5f109a0SDag-Erling Smørgrav verbose = (flags && strchr(flags, 'v')); 3090fba3a00SDag-Erling Smørgrav 3104ca1ab94SDag-Erling Smørgrav /* allocate cookie */ 311e6182307SDag-Erling Smørgrav if ((c = calloc(1, sizeof *c)) == NULL) 3124ca1ab94SDag-Erling Smørgrav return NULL; 3134ca1ab94SDag-Erling Smørgrav 3144ca1ab94SDag-Erling Smørgrav /* check port */ 315e6182307SDag-Erling Smørgrav if (!URL->port) { 316e6182307SDag-Erling Smørgrav struct servent *se; 317e6182307SDag-Erling Smørgrav 318e6182307SDag-Erling Smørgrav if ((se = getservbyname("http", "tcp")) != NULL) 319e6182307SDag-Erling Smørgrav URL->port = ntohs(se->s_port); 320e6182307SDag-Erling Smørgrav else 321e6182307SDag-Erling Smørgrav URL->port = 80; 322e6182307SDag-Erling Smørgrav } 3234ca1ab94SDag-Erling Smørgrav 3244ca1ab94SDag-Erling Smørgrav /* attempt to connect to proxy server */ 325f5f109a0SDag-Erling Smørgrav if (!direct && (px = getenv("HTTP_PROXY")) != NULL) { 3263b7a6740SDag-Erling Smørgrav char host[MAXHOSTNAMELEN]; 327e6182307SDag-Erling Smørgrav int port = 0; 3284ca1ab94SDag-Erling Smørgrav 3294ca1ab94SDag-Erling Smørgrav /* measure length */ 3304ca1ab94SDag-Erling Smørgrav len = strcspn(px, ":"); 3314ca1ab94SDag-Erling Smørgrav 332f5f109a0SDag-Erling Smørgrav /* get port (XXX atoi is a little too tolerant perhaps?) */ 333e6182307SDag-Erling Smørgrav if (px[len] == ':') { 334e6182307SDag-Erling Smørgrav if (strspn(px+len+1, "0123456789") != strlen(px+len+1) 335e6182307SDag-Erling Smørgrav || strlen(px+len+1) > 5) { 336e6182307SDag-Erling Smørgrav /* XXX we should emit some kind of warning */ 337e6182307SDag-Erling Smørgrav } 3384ca1ab94SDag-Erling Smørgrav port = atoi(px+len+1); 339e6182307SDag-Erling Smørgrav if (port < 1 || port > 65535) { 340e6182307SDag-Erling Smørgrav /* XXX we should emit some kind of warning */ 341e6182307SDag-Erling Smørgrav } 342e6182307SDag-Erling Smørgrav } 343e6182307SDag-Erling Smørgrav if (!port) { 344e6182307SDag-Erling Smørgrav #if 0 345e6182307SDag-Erling Smørgrav /* 346e6182307SDag-Erling Smørgrav * commented out, since there is currently no service name 347e6182307SDag-Erling Smørgrav * for HTTP proxies 348e6182307SDag-Erling Smørgrav */ 349e6182307SDag-Erling Smørgrav struct servent *se; 350e6182307SDag-Erling Smørgrav 351e6182307SDag-Erling Smørgrav if ((se = getservbyname("xxxx", "tcp")) != NULL) 352e6182307SDag-Erling Smørgrav port = ntohs(se->s_port); 353e6182307SDag-Erling Smørgrav else 354e6182307SDag-Erling Smørgrav #endif 355e6182307SDag-Erling Smørgrav port = 3128; 356e6182307SDag-Erling Smørgrav } 3574ca1ab94SDag-Erling Smørgrav 3584ca1ab94SDag-Erling Smørgrav /* get host name */ 3594ca1ab94SDag-Erling Smørgrav if (len >= MAXHOSTNAMELEN) 3604ca1ab94SDag-Erling Smørgrav len = MAXHOSTNAMELEN - 1; 3614ca1ab94SDag-Erling Smørgrav strncpy(host, px, len); 3624ca1ab94SDag-Erling Smørgrav host[len] = 0; 3634ca1ab94SDag-Erling Smørgrav 3644ca1ab94SDag-Erling Smørgrav /* connect */ 365d941fd2dSDag-Erling Smørgrav sd = _fetch_connect(host, port, verbose); 3664ca1ab94SDag-Erling Smørgrav } 3674ca1ab94SDag-Erling Smørgrav 3684ca1ab94SDag-Erling Smørgrav /* if no proxy is configured or could be contacted, try direct */ 369ecc91352SDag-Erling Smørgrav if (sd == -1) { 370d941fd2dSDag-Erling Smørgrav if ((sd = _fetch_connect(URL->host, URL->port, verbose)) == -1) 3714ca1ab94SDag-Erling Smørgrav goto ouch; 3724ca1ab94SDag-Erling Smørgrav } 3734ca1ab94SDag-Erling Smørgrav 3744ca1ab94SDag-Erling Smørgrav /* reopen as stream */ 3758e3986eaSDag-Erling Smørgrav if ((f = fdopen(sd, "r+")) == NULL) 3764ca1ab94SDag-Erling Smørgrav goto ouch; 3774ca1ab94SDag-Erling Smørgrav c->real_f = f; 3784ca1ab94SDag-Erling Smørgrav 3794ca1ab94SDag-Erling Smørgrav /* send request (proxies require absolute form, so use that) */ 3800fba3a00SDag-Erling Smørgrav if (verbose) 3810fba3a00SDag-Erling Smørgrav _fetch_info("requesting http://%s:%d%s", 3820fba3a00SDag-Erling Smørgrav URL->host, URL->port, URL->doc); 383f62e5228SDag-Erling Smørgrav _http_cmd(f, "GET http://%s:%d%s HTTP/1.1" ENDL, 3844ca1ab94SDag-Erling Smørgrav URL->host, URL->port, URL->doc); 3854ca1ab94SDag-Erling Smørgrav 3864ca1ab94SDag-Erling Smørgrav /* start sending headers away */ 3874ca1ab94SDag-Erling Smørgrav if (URL->user[0] || URL->pwd[0]) { 388f62e5228SDag-Erling Smørgrav char *auth_str = _http_auth(URL->user, URL->pwd); 389f62e5228SDag-Erling Smørgrav if (!auth_str) 390f62e5228SDag-Erling Smørgrav goto fouch; 391f62e5228SDag-Erling Smørgrav _http_cmd(f, "Authorization: Basic %s" ENDL, auth_str); 392f62e5228SDag-Erling Smørgrav free(auth_str); 3934ca1ab94SDag-Erling Smørgrav } 394f62e5228SDag-Erling Smørgrav _http_cmd(f, "Host: %s:%d" ENDL, URL->host, URL->port); 395f62e5228SDag-Erling Smørgrav _http_cmd(f, "User-Agent: %s " _LIBFETCH_VER ENDL, __progname); 3963d2a8471SDag-Erling Smørgrav if (URL->offset) 3973d2a8471SDag-Erling Smørgrav _http_cmd(f, "Range: bytes=%lld-" ENDL, URL->offset); 398f62e5228SDag-Erling Smørgrav _http_cmd(f, "Connection: close" ENDL ENDL); 3994ca1ab94SDag-Erling Smørgrav 4004ca1ab94SDag-Erling Smørgrav /* get response */ 4014ca1ab94SDag-Erling Smørgrav if ((ln = fgetln(f, &len)) == NULL) 4024ca1ab94SDag-Erling Smørgrav goto fouch; 4034ca1ab94SDag-Erling Smørgrav DEBUG(fprintf(stderr, "response: [\033[1m%*.*s\033[m]\n", 4044ca1ab94SDag-Erling Smørgrav (int)len-2, (int)len-2, ln)); 4054ca1ab94SDag-Erling Smørgrav 4064ca1ab94SDag-Erling Smørgrav /* we can't use strchr() and friends since ln isn't NUL-terminated */ 4074ca1ab94SDag-Erling Smørgrav p = ln; 4084ca1ab94SDag-Erling Smørgrav while ((p < ln + len) && !isspace(*p)) 4094ca1ab94SDag-Erling Smørgrav p++; 4104ca1ab94SDag-Erling Smørgrav while ((p < ln + len) && !isdigit(*p)) 4114ca1ab94SDag-Erling Smørgrav p++; 4124ca1ab94SDag-Erling Smørgrav if (!isdigit(*p)) 4134ca1ab94SDag-Erling Smørgrav goto fouch; 4143b7a6740SDag-Erling Smørgrav e = atoi(p); 4153b7a6740SDag-Erling Smørgrav DEBUG(fprintf(stderr, "code: [\033[1m%d\033[m]\n", e)); 4164ca1ab94SDag-Erling Smørgrav 4174ca1ab94SDag-Erling Smørgrav /* add code to handle redirects later */ 4183d2a8471SDag-Erling Smørgrav if (e != (URL->offset ? HTTP_PARTIAL : HTTP_OK)) { 4193b7a6740SDag-Erling Smørgrav _http_seterr(e); 4204ca1ab94SDag-Erling Smørgrav goto fouch; 4218e3986eaSDag-Erling Smørgrav } 4224ca1ab94SDag-Erling Smørgrav 4234ca1ab94SDag-Erling Smørgrav /* browse through header */ 4244ca1ab94SDag-Erling Smørgrav while (1) { 4254ca1ab94SDag-Erling Smørgrav if ((ln = fgetln(f, &len)) == NULL) 4264ca1ab94SDag-Erling Smørgrav goto fouch; 4274ca1ab94SDag-Erling Smørgrav if ((ln[0] == '\r') || (ln[0] == '\n')) 4284ca1ab94SDag-Erling Smørgrav break; 4294ca1ab94SDag-Erling Smørgrav DEBUG(fprintf(stderr, "header: [\033[1m%*.*s\033[m]\n", 4304ca1ab94SDag-Erling Smørgrav (int)len-2, (int)len-2, ln)); 4314ca1ab94SDag-Erling Smørgrav #define XFERENC "Transfer-Encoding:" 432e6182307SDag-Erling Smørgrav if (strncasecmp(ln, XFERENC, sizeof XFERENC - 1) == 0) { 433e6182307SDag-Erling Smørgrav p = ln + sizeof XFERENC - 1; 4344ca1ab94SDag-Erling Smørgrav while ((p < ln + len) && isspace(*p)) 4354ca1ab94SDag-Erling Smørgrav p++; 4364ca1ab94SDag-Erling Smørgrav for (q = p; (q < ln + len) && !isspace(*q); q++) 4374ca1ab94SDag-Erling Smørgrav /* VOID */ ; 4384ca1ab94SDag-Erling Smørgrav *q = 0; 4394ca1ab94SDag-Erling Smørgrav if (strcasecmp(p, "chunked") == 0) 4404ca1ab94SDag-Erling Smørgrav enc = ENC_CHUNKED; 4414ca1ab94SDag-Erling Smørgrav DEBUG(fprintf(stderr, "xferenc: [\033[1m%s\033[m]\n", p)); 4424ca1ab94SDag-Erling Smørgrav #undef XFERENC 4434ca1ab94SDag-Erling Smørgrav #define CONTTYPE "Content-Type:" 444e6182307SDag-Erling Smørgrav } else if (strncasecmp(ln, CONTTYPE, sizeof CONTTYPE - 1) == 0) { 445e6182307SDag-Erling Smørgrav p = ln + sizeof CONTTYPE - 1; 4464ca1ab94SDag-Erling Smørgrav while ((p < ln + len) && isspace(*p)) 4474ca1ab94SDag-Erling Smørgrav p++; 4484ca1ab94SDag-Erling Smørgrav for (i = 0; p < ln + len; p++) 4494ca1ab94SDag-Erling Smørgrav if (i < HTTPCTYPELEN) 4504ca1ab94SDag-Erling Smørgrav c->content_type[i++] = *p; 4514ca1ab94SDag-Erling Smørgrav do c->content_type[i--] = 0; while (isspace(c->content_type[i])); 4524ca1ab94SDag-Erling Smørgrav DEBUG(fprintf(stderr, "conttype: [\033[1m%s\033[m]\n", 4534ca1ab94SDag-Erling Smørgrav c->content_type)); 4544ca1ab94SDag-Erling Smørgrav #undef CONTTYPE 4553d2a8471SDag-Erling Smørgrav #define CONTRANGE "Content-Range:" 4563d2a8471SDag-Erling Smørgrav #define BYTES "bytes " 4573d2a8471SDag-Erling Smørgrav } else if (strncasecmp(ln, CONTRANGE, sizeof CONTRANGE - 1) == 0) { 4583d2a8471SDag-Erling Smørgrav p = ln + sizeof CONTRANGE - 1; 4593d2a8471SDag-Erling Smørgrav while ((p < ln + len) && isspace(*p)) 4603d2a8471SDag-Erling Smørgrav p++; 4613d2a8471SDag-Erling Smørgrav if (strncasecmp(p, BYTES, sizeof BYTES - 1) != 0 4623d2a8471SDag-Erling Smørgrav || (p += 6) >= ln + len) 4633d2a8471SDag-Erling Smørgrav goto fouch; 4643d2a8471SDag-Erling Smørgrav while ((p < ln + len) && isdigit(*p)) 4653d2a8471SDag-Erling Smørgrav pos = pos * 10 + (*p++ - '0'); 4663d2a8471SDag-Erling Smørgrav /* XXX wouldn't hurt to be slightly more paranoid here */ 4673d2a8471SDag-Erling Smørgrav DEBUG(fprintf(stderr, "contrange: [\033[1m%lld-\033[m]\n", pos)); 4683d2a8471SDag-Erling Smørgrav if (pos > URL->offset) 4693d2a8471SDag-Erling Smørgrav goto fouch; 4703d2a8471SDag-Erling Smørgrav #undef BYTES 4713d2a8471SDag-Erling Smørgrav #undef CONTRANGE 4724ca1ab94SDag-Erling Smørgrav } 4734ca1ab94SDag-Erling Smørgrav } 4744ca1ab94SDag-Erling Smørgrav 4754ca1ab94SDag-Erling Smørgrav /* only body remains */ 4764ca1ab94SDag-Erling Smørgrav c->encoding = enc; 4774ca1ab94SDag-Erling Smørgrav cf = funopen(c, 4784ca1ab94SDag-Erling Smørgrav (int (*)(void *, char *, int))_http_readfn, 4794ca1ab94SDag-Erling Smørgrav (int (*)(void *, const char *, int))_http_writefn, 4804ca1ab94SDag-Erling Smørgrav (fpos_t (*)(void *, fpos_t, int))NULL, 4814ca1ab94SDag-Erling Smørgrav (int (*)(void *))_http_closefn); 4824ca1ab94SDag-Erling Smørgrav if (cf == NULL) 4834ca1ab94SDag-Erling Smørgrav goto fouch; 484e6182307SDag-Erling Smørgrav 4853d2a8471SDag-Erling Smørgrav while (pos < URL->offset) 4863d2a8471SDag-Erling Smørgrav if (fgetc(cf) == EOF) 4873d2a8471SDag-Erling Smørgrav goto cfouch; 4883d2a8471SDag-Erling Smørgrav 4894ca1ab94SDag-Erling Smørgrav return cf; 4904ca1ab94SDag-Erling Smørgrav 4914ca1ab94SDag-Erling Smørgrav ouch: 4928e3986eaSDag-Erling Smørgrav if (sd >= 0) 4938e3986eaSDag-Erling Smørgrav close(sd); 4944ca1ab94SDag-Erling Smørgrav free(c); 4950fba3a00SDag-Erling Smørgrav _http_seterr(999); /* XXX do this properly RSN */ 4964ca1ab94SDag-Erling Smørgrav return NULL; 4974ca1ab94SDag-Erling Smørgrav fouch: 4984ca1ab94SDag-Erling Smørgrav fclose(f); 4994ca1ab94SDag-Erling Smørgrav free(c); 5000fba3a00SDag-Erling Smørgrav _http_seterr(999); /* XXX do this properly RSN */ 5014ca1ab94SDag-Erling Smørgrav return NULL; 5023d2a8471SDag-Erling Smørgrav cfouch: 5033d2a8471SDag-Erling Smørgrav fclose(cf); 5043d2a8471SDag-Erling Smørgrav _http_seterr(999); /* XXX do this properly RSN */ 5053d2a8471SDag-Erling Smørgrav return NULL; 5064ca1ab94SDag-Erling Smørgrav } 5074ca1ab94SDag-Erling Smørgrav 5084ca1ab94SDag-Erling Smørgrav FILE * 509d8acd8dcSDag-Erling Smørgrav fetchPutHTTP(struct url *URL, char *flags) 5104ca1ab94SDag-Erling Smørgrav { 5114ca1ab94SDag-Erling Smørgrav warnx("fetchPutHTTP(): not implemented"); 5124ca1ab94SDag-Erling Smørgrav return NULL; 5134ca1ab94SDag-Erling Smørgrav } 514d8acd8dcSDag-Erling Smørgrav 515d8acd8dcSDag-Erling Smørgrav /* 516d8acd8dcSDag-Erling Smørgrav * Get an HTTP document's metadata 517d8acd8dcSDag-Erling Smørgrav */ 518d8acd8dcSDag-Erling Smørgrav int 519d8acd8dcSDag-Erling Smørgrav fetchStatHTTP(struct url *url, struct url_stat *us, char *flags) 520d8acd8dcSDag-Erling Smørgrav { 521d8acd8dcSDag-Erling Smørgrav warnx("fetchStatHTTP(): not implemented"); 522d8acd8dcSDag-Erling Smørgrav return -1; 523d8acd8dcSDag-Erling Smørgrav } 524ce71b736SDag-Erling Smørgrav 525ce71b736SDag-Erling Smørgrav /* 526ce71b736SDag-Erling Smørgrav * List a directory 527ce71b736SDag-Erling Smørgrav */ 528ce71b736SDag-Erling Smørgrav struct url_ent * 529ce71b736SDag-Erling Smørgrav fetchListHTTP(struct url *url, char *flags) 530ce71b736SDag-Erling Smørgrav { 531ce71b736SDag-Erling Smørgrav warnx("fetchListHTTP(): not implemented"); 532ce71b736SDag-Erling Smørgrav return NULL; 533ce71b736SDag-Erling Smørgrav } 534