xref: /freebsd/lib/libfetch/http.c (revision 3d2a847151d0d4b222e4abedaf8c6640b91200d6)
14ca1ab94SDag-Erling Smørgrav /*-
24ca1ab94SDag-Erling Smørgrav  * Copyright (c) 1998 Dag-Erling Co�dan Sm�rgrav
34ca1ab94SDag-Erling Smørgrav  * All rights reserved.
44ca1ab94SDag-Erling Smørgrav  *
54ca1ab94SDag-Erling Smørgrav  * Redistribution and use in source and binary forms, with or without
64ca1ab94SDag-Erling Smørgrav  * modification, are permitted provided that the following conditions
74ca1ab94SDag-Erling Smørgrav  * are met:
84ca1ab94SDag-Erling Smørgrav  * 1. Redistributions of source code must retain the above copyright
94ca1ab94SDag-Erling Smørgrav  *    notice, this list of conditions and the following disclaimer
104ca1ab94SDag-Erling Smørgrav  *    in this position and unchanged.
114ca1ab94SDag-Erling Smørgrav  * 2. Redistributions in binary form must reproduce the above copyright
124ca1ab94SDag-Erling Smørgrav  *    notice, this list of conditions and the following disclaimer in the
134ca1ab94SDag-Erling Smørgrav  *    documentation and/or other materials provided with the distribution.
144ca1ab94SDag-Erling Smørgrav  * 3. The name of the author may not be used to endorse or promote products
154ca1ab94SDag-Erling Smørgrav  *    derived from this software without specific prior written permission
164ca1ab94SDag-Erling Smørgrav  *
174ca1ab94SDag-Erling Smørgrav  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
184ca1ab94SDag-Erling Smørgrav  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
194ca1ab94SDag-Erling Smørgrav  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
204ca1ab94SDag-Erling Smørgrav  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
214ca1ab94SDag-Erling Smørgrav  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
224ca1ab94SDag-Erling Smørgrav  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
234ca1ab94SDag-Erling Smørgrav  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
244ca1ab94SDag-Erling Smørgrav  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
254ca1ab94SDag-Erling Smørgrav  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
264ca1ab94SDag-Erling Smørgrav  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
274ca1ab94SDag-Erling Smørgrav  *
287f3dea24SPeter Wemm  * $FreeBSD$
294ca1ab94SDag-Erling Smørgrav  */
304ca1ab94SDag-Erling Smørgrav 
31f62e5228SDag-Erling Smørgrav /*
32f62e5228SDag-Erling Smørgrav  * The base64 code in this file is based on code from MIT fetch, which
33f62e5228SDag-Erling Smørgrav  * has the following copyright and license:
34f62e5228SDag-Erling Smørgrav  *
35f62e5228SDag-Erling Smørgrav  *-
36f62e5228SDag-Erling Smørgrav  * Copyright 1997 Massachusetts Institute of Technology
37f62e5228SDag-Erling Smørgrav  *
38f62e5228SDag-Erling Smørgrav  * Permission to use, copy, modify, and distribute this software and
39f62e5228SDag-Erling Smørgrav  * its documentation for any purpose and without fee is hereby
40f62e5228SDag-Erling Smørgrav  * granted, provided that both the above copyright notice and this
41f62e5228SDag-Erling Smørgrav  * permission notice appear in all copies, that both the above
42f62e5228SDag-Erling Smørgrav  * copyright notice and this permission notice appear in all
43f62e5228SDag-Erling Smørgrav  * supporting documentation, and that the name of M.I.T. not be used
44f62e5228SDag-Erling Smørgrav  * in advertising or publicity pertaining to distribution of the
45f62e5228SDag-Erling Smørgrav  * software without specific, written prior permission.	 M.I.T. makes
46f62e5228SDag-Erling Smørgrav  * no representations about the suitability of this software for any
47f62e5228SDag-Erling Smørgrav  * purpose.  It is provided "as is" without express or implied
48f62e5228SDag-Erling Smørgrav  * warranty.
49f62e5228SDag-Erling Smørgrav  *
50f62e5228SDag-Erling Smørgrav  * THIS SOFTWARE IS PROVIDED BY M.I.T. ``AS IS''.  M.I.T. DISCLAIMS
51f62e5228SDag-Erling Smørgrav  * ALL EXPRESS OR IMPLIED WARRANTIES WITH REGARD TO THIS SOFTWARE,
52f62e5228SDag-Erling Smørgrav  * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
53f62e5228SDag-Erling Smørgrav  * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT
54f62e5228SDag-Erling Smørgrav  * SHALL M.I.T. BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
55f62e5228SDag-Erling Smørgrav  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
56f62e5228SDag-Erling Smørgrav  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
57f62e5228SDag-Erling Smørgrav  * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
58f62e5228SDag-Erling Smørgrav  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
59f62e5228SDag-Erling Smørgrav  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
60f62e5228SDag-Erling Smørgrav  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
61f62e5228SDag-Erling Smørgrav  * SUCH DAMAGE. */
62f62e5228SDag-Erling Smørgrav 
634ca1ab94SDag-Erling Smørgrav #include <sys/param.h>
644ca1ab94SDag-Erling Smørgrav 
654ca1ab94SDag-Erling Smørgrav #include <err.h>
664ca1ab94SDag-Erling Smørgrav #include <ctype.h>
67e6182307SDag-Erling Smørgrav #include <netdb.h>
68f62e5228SDag-Erling Smørgrav #include <stdarg.h>
694ca1ab94SDag-Erling Smørgrav #include <stdio.h>
704ca1ab94SDag-Erling Smørgrav #include <stdlib.h>
714ca1ab94SDag-Erling Smørgrav #include <string.h>
724ca1ab94SDag-Erling Smørgrav #include <unistd.h>
734ca1ab94SDag-Erling Smørgrav 
744ca1ab94SDag-Erling Smørgrav #include "fetch.h"
75842a95ccSDag-Erling Smørgrav #include "common.h"
760fba3a00SDag-Erling Smørgrav #include "httperr.h"
774ca1ab94SDag-Erling Smørgrav 
784ca1ab94SDag-Erling Smørgrav extern char *__progname;
794ca1ab94SDag-Erling Smørgrav 
804ca1ab94SDag-Erling Smørgrav #define ENDL "\r\n"
814ca1ab94SDag-Erling Smørgrav 
823d2a8471SDag-Erling Smørgrav #define HTTP_OK		200
833d2a8471SDag-Erling Smørgrav #define HTTP_PARTIAL	206
843d2a8471SDag-Erling Smørgrav 
854ca1ab94SDag-Erling Smørgrav struct cookie
864ca1ab94SDag-Erling Smørgrav {
874ca1ab94SDag-Erling Smørgrav     FILE *real_f;
884ca1ab94SDag-Erling Smørgrav #define ENC_NONE 0
894ca1ab94SDag-Erling Smørgrav #define ENC_CHUNKED 1
904ca1ab94SDag-Erling Smørgrav     int encoding;			/* 1 = chunked, 0 = none */
914ca1ab94SDag-Erling Smørgrav #define HTTPCTYPELEN 59
924ca1ab94SDag-Erling Smørgrav     char content_type[HTTPCTYPELEN+1];
934ca1ab94SDag-Erling Smørgrav     char *buf;
944ca1ab94SDag-Erling Smørgrav     int b_cur, eof;
954ca1ab94SDag-Erling Smørgrav     unsigned b_len, chunksize;
964ca1ab94SDag-Erling Smørgrav };
974ca1ab94SDag-Erling Smørgrav 
98f62e5228SDag-Erling Smørgrav /*
99f62e5228SDag-Erling Smørgrav  * Send a formatted line; optionally echo to terminal
100f62e5228SDag-Erling Smørgrav  */
101f62e5228SDag-Erling Smørgrav static int
102f62e5228SDag-Erling Smørgrav _http_cmd(FILE *f, char *fmt, ...)
103f62e5228SDag-Erling Smørgrav {
104f62e5228SDag-Erling Smørgrav     va_list ap;
105f62e5228SDag-Erling Smørgrav 
106f62e5228SDag-Erling Smørgrav     va_start(ap, fmt);
107f62e5228SDag-Erling Smørgrav     vfprintf(f, fmt, ap);
108f62e5228SDag-Erling Smørgrav #ifndef NDEBUG
109f62e5228SDag-Erling Smørgrav     fprintf(stderr, "\033[1m>>> ");
110f62e5228SDag-Erling Smørgrav     vfprintf(stderr, fmt, ap);
111f62e5228SDag-Erling Smørgrav     fprintf(stderr, "\033[m");
112f62e5228SDag-Erling Smørgrav #endif
113f62e5228SDag-Erling Smørgrav     va_end(ap);
114f62e5228SDag-Erling Smørgrav 
115f62e5228SDag-Erling Smørgrav     return 0; /* XXX */
116f62e5228SDag-Erling Smørgrav }
117f62e5228SDag-Erling Smørgrav 
118f62e5228SDag-Erling Smørgrav /*
119f62e5228SDag-Erling Smørgrav  * Fill the input buffer, do chunk decoding on the fly
120f62e5228SDag-Erling Smørgrav  */
1214ca1ab94SDag-Erling Smørgrav static char *
1224ca1ab94SDag-Erling Smørgrav _http_fillbuf(struct cookie *c)
1234ca1ab94SDag-Erling Smørgrav {
1244ca1ab94SDag-Erling Smørgrav     char *ln;
1254ca1ab94SDag-Erling Smørgrav     unsigned int len;
1264ca1ab94SDag-Erling Smørgrav 
1274ca1ab94SDag-Erling Smørgrav     if (c->eof)
1284ca1ab94SDag-Erling Smørgrav 	return NULL;
1294ca1ab94SDag-Erling Smørgrav 
1304ca1ab94SDag-Erling Smørgrav     if (c->encoding == ENC_NONE) {
1314ca1ab94SDag-Erling Smørgrav 	c->buf = fgetln(c->real_f, &(c->b_len));
1324ca1ab94SDag-Erling Smørgrav 	c->b_cur = 0;
1334ca1ab94SDag-Erling Smørgrav     } else if (c->encoding == ENC_CHUNKED) {
1344ca1ab94SDag-Erling Smørgrav 	if (c->chunksize == 0) {
1354ca1ab94SDag-Erling Smørgrav 	    ln = fgetln(c->real_f, &len);
1364ca1ab94SDag-Erling Smørgrav 	    DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): new chunk: "
1374ca1ab94SDag-Erling Smørgrav 			  "%*.*s\033[m\n", (int)len-2, (int)len-2, ln));
1384ca1ab94SDag-Erling Smørgrav 	    sscanf(ln, "%x", &(c->chunksize));
1394ca1ab94SDag-Erling Smørgrav 	    if (!c->chunksize) {
1404ca1ab94SDag-Erling Smørgrav 		DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): "
1414ca1ab94SDag-Erling Smørgrav 			      "end of last chunk\033[m\n"));
1424ca1ab94SDag-Erling Smørgrav 		c->eof = 1;
1434ca1ab94SDag-Erling Smørgrav 		return NULL;
1444ca1ab94SDag-Erling Smørgrav 	    }
1454ca1ab94SDag-Erling Smørgrav 	    DEBUG(fprintf(stderr, "\033[1m_http_fillbuf(): "
1464ca1ab94SDag-Erling Smørgrav 			  "new chunk: %X\033[m\n", c->chunksize));
1474ca1ab94SDag-Erling Smørgrav 	}
1484ca1ab94SDag-Erling Smørgrav 	c->buf = fgetln(c->real_f, &(c->b_len));
1494ca1ab94SDag-Erling Smørgrav 	if (c->b_len > c->chunksize)
1504ca1ab94SDag-Erling Smørgrav 	    c->b_len = c->chunksize;
1514ca1ab94SDag-Erling Smørgrav 	c->chunksize -= c->b_len;
1524ca1ab94SDag-Erling Smørgrav 	c->b_cur = 0;
1534ca1ab94SDag-Erling Smørgrav     }
1544ca1ab94SDag-Erling Smørgrav     else return NULL; /* unknown encoding */
1554ca1ab94SDag-Erling Smørgrav     return c->buf;
1564ca1ab94SDag-Erling Smørgrav }
1574ca1ab94SDag-Erling Smørgrav 
158f62e5228SDag-Erling Smørgrav /*
159f62e5228SDag-Erling Smørgrav  * Read function
160f62e5228SDag-Erling Smørgrav  */
1614ca1ab94SDag-Erling Smørgrav static int
1624ca1ab94SDag-Erling Smørgrav _http_readfn(struct cookie *c, char *buf, int len)
1634ca1ab94SDag-Erling Smørgrav {
1644ca1ab94SDag-Erling Smørgrav     int l, pos = 0;
1654ca1ab94SDag-Erling Smørgrav     while (len) {
1664ca1ab94SDag-Erling Smørgrav 	/* empty buffer */
1674ca1ab94SDag-Erling Smørgrav 	if (!c->buf || (c->b_cur == c->b_len))
1684ca1ab94SDag-Erling Smørgrav 	    if (!_http_fillbuf(c))
1694ca1ab94SDag-Erling Smørgrav 		break;
1704ca1ab94SDag-Erling Smørgrav 
1714ca1ab94SDag-Erling Smørgrav 	l = c->b_len - c->b_cur;
1724ca1ab94SDag-Erling Smørgrav 	if (len < l) l = len;
1734ca1ab94SDag-Erling Smørgrav 	memcpy(buf + pos, c->buf + c->b_cur, l);
1744ca1ab94SDag-Erling Smørgrav 	c->b_cur += l;
1754ca1ab94SDag-Erling Smørgrav 	pos += l;
1764ca1ab94SDag-Erling Smørgrav 	len -= l;
1774ca1ab94SDag-Erling Smørgrav     }
1784ca1ab94SDag-Erling Smørgrav 
1794ca1ab94SDag-Erling Smørgrav     if (ferror(c->real_f))
1804ca1ab94SDag-Erling Smørgrav 	return -1;
1814ca1ab94SDag-Erling Smørgrav     else return pos;
1824ca1ab94SDag-Erling Smørgrav }
1834ca1ab94SDag-Erling Smørgrav 
184f62e5228SDag-Erling Smørgrav /*
185f62e5228SDag-Erling Smørgrav  * Write function
186f62e5228SDag-Erling Smørgrav  */
1874ca1ab94SDag-Erling Smørgrav static int
1884ca1ab94SDag-Erling Smørgrav _http_writefn(struct cookie *c, const char *buf, int len)
1894ca1ab94SDag-Erling Smørgrav {
1904ca1ab94SDag-Erling Smørgrav     size_t r = fwrite(buf, 1, (size_t)len, c->real_f);
1914ca1ab94SDag-Erling Smørgrav     return r ? r : -1;
1924ca1ab94SDag-Erling Smørgrav }
1934ca1ab94SDag-Erling Smørgrav 
194f62e5228SDag-Erling Smørgrav /*
195f62e5228SDag-Erling Smørgrav  * Close function
196f62e5228SDag-Erling Smørgrav  */
1974ca1ab94SDag-Erling Smørgrav static int
1984ca1ab94SDag-Erling Smørgrav _http_closefn(struct cookie *c)
1994ca1ab94SDag-Erling Smørgrav {
2004ca1ab94SDag-Erling Smørgrav     int r = fclose(c->real_f);
2014ca1ab94SDag-Erling Smørgrav     free(c);
2024ca1ab94SDag-Erling Smørgrav     return (r == EOF) ? -1 : 0;
2034ca1ab94SDag-Erling Smørgrav }
2044ca1ab94SDag-Erling Smørgrav 
205f62e5228SDag-Erling Smørgrav /*
206f62e5228SDag-Erling Smørgrav  * Extract content type from cookie
207f62e5228SDag-Erling Smørgrav  */
2084ca1ab94SDag-Erling Smørgrav char *
2094ca1ab94SDag-Erling Smørgrav fetchContentType(FILE *f)
2104ca1ab94SDag-Erling Smørgrav {
2114ca1ab94SDag-Erling Smørgrav     /*
2124ca1ab94SDag-Erling Smørgrav      * We have no way of making sure this really *is* one of our cookies,
2134ca1ab94SDag-Erling Smørgrav      * so just check for a null pointer and hope for the best.
2144ca1ab94SDag-Erling Smørgrav      */
2154ca1ab94SDag-Erling Smørgrav     return f->_cookie ? (((struct cookie *)f->_cookie)->content_type) : NULL;
2164ca1ab94SDag-Erling Smørgrav }
2174ca1ab94SDag-Erling Smørgrav 
218f62e5228SDag-Erling Smørgrav /*
219f62e5228SDag-Erling Smørgrav  * Base64 encoding
220f62e5228SDag-Erling Smørgrav  */
221f62e5228SDag-Erling Smørgrav int
222f62e5228SDag-Erling Smørgrav _http_base64(char *dst, char *src, int l)
223f62e5228SDag-Erling Smørgrav {
224f62e5228SDag-Erling Smørgrav     static const char base64[] =
225f62e5228SDag-Erling Smørgrav 	"ABCDEFGHIJKLMNOPQRSTUVWXYZ"
226f62e5228SDag-Erling Smørgrav 	"abcdefghijklmnopqrstuvwxyz"
227f62e5228SDag-Erling Smørgrav 	"0123456789+/";
228f62e5228SDag-Erling Smørgrav     int t, r = 0;
229f62e5228SDag-Erling Smørgrav 
230f62e5228SDag-Erling Smørgrav     while (l >= 3) {
231f62e5228SDag-Erling Smørgrav 	t = (src[0] << 16) | (src[1] << 8) | src[2];
232f62e5228SDag-Erling Smørgrav 	dst[0] = base64[(t >> 18) & 0x3f];
233f62e5228SDag-Erling Smørgrav 	dst[1] = base64[(t >> 12) & 0x3f];
234f62e5228SDag-Erling Smørgrav 	dst[2] = base64[(t >> 6) & 0x3f];
235f62e5228SDag-Erling Smørgrav 	dst[3] = base64[(t >> 0) & 0x3f];
236f62e5228SDag-Erling Smørgrav 	src += 3; l -= 3;
237f62e5228SDag-Erling Smørgrav 	dst += 4; r += 4;
238f62e5228SDag-Erling Smørgrav     }
239f62e5228SDag-Erling Smørgrav 
240f62e5228SDag-Erling Smørgrav     switch (l) {
241f62e5228SDag-Erling Smørgrav     case 2:
242f62e5228SDag-Erling Smørgrav 	t = (src[0] << 16) | (src[1] << 8);
243f62e5228SDag-Erling Smørgrav 	dst[0] = base64[(t >> 18) & 0x3f];
244f62e5228SDag-Erling Smørgrav 	dst[1] = base64[(t >> 12) & 0x3f];
245f62e5228SDag-Erling Smørgrav 	dst[2] = base64[(t >> 6) & 0x3f];
246f62e5228SDag-Erling Smørgrav 	dst[3] = '=';
247f62e5228SDag-Erling Smørgrav 	dst += 4;
248f62e5228SDag-Erling Smørgrav 	r += 4;
249f62e5228SDag-Erling Smørgrav 	break;
250f62e5228SDag-Erling Smørgrav     case 1:
251f62e5228SDag-Erling Smørgrav 	t = src[0] << 16;
252f62e5228SDag-Erling Smørgrav 	dst[0] = base64[(t >> 18) & 0x3f];
253f62e5228SDag-Erling Smørgrav 	dst[1] = base64[(t >> 12) & 0x3f];
254f62e5228SDag-Erling Smørgrav 	dst[2] = dst[3] = '=';
255f62e5228SDag-Erling Smørgrav 	dst += 4;
256f62e5228SDag-Erling Smørgrav 	r += 4;
257f62e5228SDag-Erling Smørgrav 	break;
258f62e5228SDag-Erling Smørgrav     case 0:
259f62e5228SDag-Erling Smørgrav 	break;
260f62e5228SDag-Erling Smørgrav     }
261f62e5228SDag-Erling Smørgrav 
262f62e5228SDag-Erling Smørgrav     *dst = 0;
263f62e5228SDag-Erling Smørgrav     return r;
264f62e5228SDag-Erling Smørgrav }
265f62e5228SDag-Erling Smørgrav 
266f62e5228SDag-Erling Smørgrav /*
267f62e5228SDag-Erling Smørgrav  * Encode username and password
268f62e5228SDag-Erling Smørgrav  */
269f62e5228SDag-Erling Smørgrav char *
270f62e5228SDag-Erling Smørgrav _http_auth(char *usr, char *pwd)
271f62e5228SDag-Erling Smørgrav {
272f62e5228SDag-Erling Smørgrav     int len, lu, lp;
273f62e5228SDag-Erling Smørgrav     char *str, *s;
274f62e5228SDag-Erling Smørgrav 
275f62e5228SDag-Erling Smørgrav     lu = strlen(usr);
276f62e5228SDag-Erling Smørgrav     lp = strlen(pwd);
277f62e5228SDag-Erling Smørgrav 
278f62e5228SDag-Erling Smørgrav     len = (lu * 4 + 2) / 3	/* user name, round up */
279f62e5228SDag-Erling Smørgrav 	+ 1			/* colon */
280f62e5228SDag-Erling Smørgrav 	+ (lp * 4 + 2) / 3	/* password, round up */
281f62e5228SDag-Erling Smørgrav 	+ 1;			/* null */
282f62e5228SDag-Erling Smørgrav 
283f62e5228SDag-Erling Smørgrav     if ((s = str = (char *)malloc(len)) == NULL)
284f62e5228SDag-Erling Smørgrav 	return NULL;
285f62e5228SDag-Erling Smørgrav 
286f62e5228SDag-Erling Smørgrav     s += _http_base64(s, usr, lu);
287f62e5228SDag-Erling Smørgrav     *s++ = ':';
288f62e5228SDag-Erling Smørgrav     s += _http_base64(s, pwd, lp);
289f62e5228SDag-Erling Smørgrav     *s = 0;
290f62e5228SDag-Erling Smørgrav 
291f62e5228SDag-Erling Smørgrav     return str;
292f62e5228SDag-Erling Smørgrav }
293f62e5228SDag-Erling Smørgrav 
294f62e5228SDag-Erling Smørgrav /*
295d8acd8dcSDag-Erling Smørgrav  * Retrieve a file by HTTP
296f62e5228SDag-Erling Smørgrav  */
2974ca1ab94SDag-Erling Smørgrav FILE *
298d8acd8dcSDag-Erling Smørgrav fetchGetHTTP(struct url *URL, char *flags)
2994ca1ab94SDag-Erling Smørgrav {
300f5f109a0SDag-Erling Smørgrav     int sd = -1, e, i, enc = ENC_NONE, direct, verbose;
3014ca1ab94SDag-Erling Smørgrav     struct cookie *c;
3023b7a6740SDag-Erling Smørgrav     char *ln, *p, *px, *q;
3034ca1ab94SDag-Erling Smørgrav     FILE *f, *cf;
3044ca1ab94SDag-Erling Smørgrav     size_t len;
3053d2a8471SDag-Erling Smørgrav     off_t pos = 0;
3064ca1ab94SDag-Erling Smørgrav 
307f5f109a0SDag-Erling Smørgrav     direct = (flags && strchr(flags, 'd'));
308f5f109a0SDag-Erling Smørgrav     verbose = (flags && strchr(flags, 'v'));
3090fba3a00SDag-Erling Smørgrav 
3104ca1ab94SDag-Erling Smørgrav     /* allocate cookie */
311e6182307SDag-Erling Smørgrav     if ((c = calloc(1, sizeof *c)) == NULL)
3124ca1ab94SDag-Erling Smørgrav 	return NULL;
3134ca1ab94SDag-Erling Smørgrav 
3144ca1ab94SDag-Erling Smørgrav     /* check port */
315e6182307SDag-Erling Smørgrav     if (!URL->port) {
316e6182307SDag-Erling Smørgrav 	struct servent *se;
317e6182307SDag-Erling Smørgrav 
318e6182307SDag-Erling Smørgrav 	if ((se = getservbyname("http", "tcp")) != NULL)
319e6182307SDag-Erling Smørgrav 	    URL->port = ntohs(se->s_port);
320e6182307SDag-Erling Smørgrav 	else
321e6182307SDag-Erling Smørgrav 	    URL->port = 80;
322e6182307SDag-Erling Smørgrav     }
3234ca1ab94SDag-Erling Smørgrav 
3244ca1ab94SDag-Erling Smørgrav     /* attempt to connect to proxy server */
325f5f109a0SDag-Erling Smørgrav     if (!direct && (px = getenv("HTTP_PROXY")) != NULL) {
3263b7a6740SDag-Erling Smørgrav 	char host[MAXHOSTNAMELEN];
327e6182307SDag-Erling Smørgrav 	int port = 0;
3284ca1ab94SDag-Erling Smørgrav 
3294ca1ab94SDag-Erling Smørgrav 	/* measure length */
3304ca1ab94SDag-Erling Smørgrav 	len = strcspn(px, ":");
3314ca1ab94SDag-Erling Smørgrav 
332f5f109a0SDag-Erling Smørgrav 	/* get port (XXX atoi is a little too tolerant perhaps?) */
333e6182307SDag-Erling Smørgrav 	if (px[len] == ':') {
334e6182307SDag-Erling Smørgrav 	    if (strspn(px+len+1, "0123456789") != strlen(px+len+1)
335e6182307SDag-Erling Smørgrav 		|| strlen(px+len+1) > 5) {
336e6182307SDag-Erling Smørgrav 		/* XXX we should emit some kind of warning */
337e6182307SDag-Erling Smørgrav 	    }
3384ca1ab94SDag-Erling Smørgrav 	    port = atoi(px+len+1);
339e6182307SDag-Erling Smørgrav 	    if (port < 1 || port > 65535) {
340e6182307SDag-Erling Smørgrav 		/* XXX we should emit some kind of warning */
341e6182307SDag-Erling Smørgrav 	    }
342e6182307SDag-Erling Smørgrav 	}
343e6182307SDag-Erling Smørgrav 	if (!port) {
344e6182307SDag-Erling Smørgrav #if 0
345e6182307SDag-Erling Smørgrav 	    /*
346e6182307SDag-Erling Smørgrav 	     * commented out, since there is currently no service name
347e6182307SDag-Erling Smørgrav 	     * for HTTP proxies
348e6182307SDag-Erling Smørgrav 	     */
349e6182307SDag-Erling Smørgrav 	    struct servent *se;
350e6182307SDag-Erling Smørgrav 
351e6182307SDag-Erling Smørgrav 	    if ((se = getservbyname("xxxx", "tcp")) != NULL)
352e6182307SDag-Erling Smørgrav 		port = ntohs(se->s_port);
353e6182307SDag-Erling Smørgrav 	    else
354e6182307SDag-Erling Smørgrav #endif
355e6182307SDag-Erling Smørgrav 		port = 3128;
356e6182307SDag-Erling Smørgrav 	}
3574ca1ab94SDag-Erling Smørgrav 
3584ca1ab94SDag-Erling Smørgrav 	/* get host name */
3594ca1ab94SDag-Erling Smørgrav 	if (len >= MAXHOSTNAMELEN)
3604ca1ab94SDag-Erling Smørgrav 	    len = MAXHOSTNAMELEN - 1;
3614ca1ab94SDag-Erling Smørgrav 	strncpy(host, px, len);
3624ca1ab94SDag-Erling Smørgrav 	host[len] = 0;
3634ca1ab94SDag-Erling Smørgrav 
3644ca1ab94SDag-Erling Smørgrav 	/* connect */
365d941fd2dSDag-Erling Smørgrav 	sd = _fetch_connect(host, port, verbose);
3664ca1ab94SDag-Erling Smørgrav     }
3674ca1ab94SDag-Erling Smørgrav 
3684ca1ab94SDag-Erling Smørgrav     /* if no proxy is configured or could be contacted, try direct */
369ecc91352SDag-Erling Smørgrav     if (sd == -1) {
370d941fd2dSDag-Erling Smørgrav 	if ((sd = _fetch_connect(URL->host, URL->port, verbose)) == -1)
3714ca1ab94SDag-Erling Smørgrav 	    goto ouch;
3724ca1ab94SDag-Erling Smørgrav     }
3734ca1ab94SDag-Erling Smørgrav 
3744ca1ab94SDag-Erling Smørgrav     /* reopen as stream */
3758e3986eaSDag-Erling Smørgrav     if ((f = fdopen(sd, "r+")) == NULL)
3764ca1ab94SDag-Erling Smørgrav 	goto ouch;
3774ca1ab94SDag-Erling Smørgrav     c->real_f = f;
3784ca1ab94SDag-Erling Smørgrav 
3794ca1ab94SDag-Erling Smørgrav     /* send request (proxies require absolute form, so use that) */
3800fba3a00SDag-Erling Smørgrav     if (verbose)
3810fba3a00SDag-Erling Smørgrav 	_fetch_info("requesting http://%s:%d%s",
3820fba3a00SDag-Erling Smørgrav 		    URL->host, URL->port, URL->doc);
383f62e5228SDag-Erling Smørgrav     _http_cmd(f, "GET http://%s:%d%s HTTP/1.1" ENDL,
3844ca1ab94SDag-Erling Smørgrav 	      URL->host, URL->port, URL->doc);
3854ca1ab94SDag-Erling Smørgrav 
3864ca1ab94SDag-Erling Smørgrav     /* start sending headers away */
3874ca1ab94SDag-Erling Smørgrav     if (URL->user[0] || URL->pwd[0]) {
388f62e5228SDag-Erling Smørgrav 	char *auth_str = _http_auth(URL->user, URL->pwd);
389f62e5228SDag-Erling Smørgrav 	if (!auth_str)
390f62e5228SDag-Erling Smørgrav 	    goto fouch;
391f62e5228SDag-Erling Smørgrav 	_http_cmd(f, "Authorization: Basic %s" ENDL, auth_str);
392f62e5228SDag-Erling Smørgrav 	free(auth_str);
3934ca1ab94SDag-Erling Smørgrav     }
394f62e5228SDag-Erling Smørgrav     _http_cmd(f, "Host: %s:%d" ENDL, URL->host, URL->port);
395f62e5228SDag-Erling Smørgrav     _http_cmd(f, "User-Agent: %s " _LIBFETCH_VER ENDL, __progname);
3963d2a8471SDag-Erling Smørgrav     if (URL->offset)
3973d2a8471SDag-Erling Smørgrav 	_http_cmd(f, "Range: bytes=%lld-" ENDL, URL->offset);
398f62e5228SDag-Erling Smørgrav     _http_cmd(f, "Connection: close" ENDL ENDL);
3994ca1ab94SDag-Erling Smørgrav 
4004ca1ab94SDag-Erling Smørgrav     /* get response */
4014ca1ab94SDag-Erling Smørgrav     if ((ln = fgetln(f, &len)) == NULL)
4024ca1ab94SDag-Erling Smørgrav 	goto fouch;
4034ca1ab94SDag-Erling Smørgrav     DEBUG(fprintf(stderr, "response: [\033[1m%*.*s\033[m]\n",
4044ca1ab94SDag-Erling Smørgrav 		  (int)len-2, (int)len-2, ln));
4054ca1ab94SDag-Erling Smørgrav 
4064ca1ab94SDag-Erling Smørgrav     /* we can't use strchr() and friends since ln isn't NUL-terminated */
4074ca1ab94SDag-Erling Smørgrav     p = ln;
4084ca1ab94SDag-Erling Smørgrav     while ((p < ln + len) && !isspace(*p))
4094ca1ab94SDag-Erling Smørgrav 	p++;
4104ca1ab94SDag-Erling Smørgrav     while ((p < ln + len) && !isdigit(*p))
4114ca1ab94SDag-Erling Smørgrav 	p++;
4124ca1ab94SDag-Erling Smørgrav     if (!isdigit(*p))
4134ca1ab94SDag-Erling Smørgrav 	goto fouch;
4143b7a6740SDag-Erling Smørgrav     e = atoi(p);
4153b7a6740SDag-Erling Smørgrav     DEBUG(fprintf(stderr, "code:     [\033[1m%d\033[m]\n", e));
4164ca1ab94SDag-Erling Smørgrav 
4174ca1ab94SDag-Erling Smørgrav     /* add code to handle redirects later */
4183d2a8471SDag-Erling Smørgrav     if (e != (URL->offset ? HTTP_PARTIAL : HTTP_OK)) {
4193b7a6740SDag-Erling Smørgrav 	_http_seterr(e);
4204ca1ab94SDag-Erling Smørgrav 	goto fouch;
4218e3986eaSDag-Erling Smørgrav     }
4224ca1ab94SDag-Erling Smørgrav 
4234ca1ab94SDag-Erling Smørgrav     /* browse through header */
4244ca1ab94SDag-Erling Smørgrav     while (1) {
4254ca1ab94SDag-Erling Smørgrav 	if ((ln = fgetln(f, &len)) == NULL)
4264ca1ab94SDag-Erling Smørgrav 	    goto fouch;
4274ca1ab94SDag-Erling Smørgrav 	if ((ln[0] == '\r') || (ln[0] == '\n'))
4284ca1ab94SDag-Erling Smørgrav 	    break;
4294ca1ab94SDag-Erling Smørgrav 	DEBUG(fprintf(stderr, "header:	 [\033[1m%*.*s\033[m]\n",
4304ca1ab94SDag-Erling Smørgrav 		      (int)len-2, (int)len-2, ln));
4314ca1ab94SDag-Erling Smørgrav #define XFERENC "Transfer-Encoding:"
432e6182307SDag-Erling Smørgrav 	if (strncasecmp(ln, XFERENC, sizeof XFERENC - 1) == 0) {
433e6182307SDag-Erling Smørgrav 	    p = ln + sizeof XFERENC - 1;
4344ca1ab94SDag-Erling Smørgrav 	    while ((p < ln + len) && isspace(*p))
4354ca1ab94SDag-Erling Smørgrav 		p++;
4364ca1ab94SDag-Erling Smørgrav 	    for (q = p; (q < ln + len) && !isspace(*q); q++)
4374ca1ab94SDag-Erling Smørgrav 		/* VOID */ ;
4384ca1ab94SDag-Erling Smørgrav 	    *q = 0;
4394ca1ab94SDag-Erling Smørgrav 	    if (strcasecmp(p, "chunked") == 0)
4404ca1ab94SDag-Erling Smørgrav 		enc = ENC_CHUNKED;
4414ca1ab94SDag-Erling Smørgrav 	    DEBUG(fprintf(stderr, "xferenc:  [\033[1m%s\033[m]\n", p));
4424ca1ab94SDag-Erling Smørgrav #undef XFERENC
4434ca1ab94SDag-Erling Smørgrav #define CONTTYPE "Content-Type:"
444e6182307SDag-Erling Smørgrav 	} else if (strncasecmp(ln, CONTTYPE, sizeof CONTTYPE - 1) == 0) {
445e6182307SDag-Erling Smørgrav 	    p = ln + sizeof CONTTYPE - 1;
4464ca1ab94SDag-Erling Smørgrav 	    while ((p < ln + len) && isspace(*p))
4474ca1ab94SDag-Erling Smørgrav 		p++;
4484ca1ab94SDag-Erling Smørgrav 	    for (i = 0; p < ln + len; p++)
4494ca1ab94SDag-Erling Smørgrav 		if (i < HTTPCTYPELEN)
4504ca1ab94SDag-Erling Smørgrav 		    c->content_type[i++] = *p;
4514ca1ab94SDag-Erling Smørgrav 	    do c->content_type[i--] = 0; while (isspace(c->content_type[i]));
4524ca1ab94SDag-Erling Smørgrav 	    DEBUG(fprintf(stderr, "conttype: [\033[1m%s\033[m]\n",
4534ca1ab94SDag-Erling Smørgrav 			  c->content_type));
4544ca1ab94SDag-Erling Smørgrav #undef CONTTYPE
4553d2a8471SDag-Erling Smørgrav #define CONTRANGE "Content-Range:"
4563d2a8471SDag-Erling Smørgrav #define BYTES "bytes "
4573d2a8471SDag-Erling Smørgrav 	} else if (strncasecmp(ln, CONTRANGE, sizeof CONTRANGE - 1) == 0) {
4583d2a8471SDag-Erling Smørgrav 	    p = ln + sizeof CONTRANGE - 1;
4593d2a8471SDag-Erling Smørgrav 	    while ((p < ln + len) && isspace(*p))
4603d2a8471SDag-Erling Smørgrav 		p++;
4613d2a8471SDag-Erling Smørgrav 	    if (strncasecmp(p, BYTES, sizeof BYTES - 1) != 0
4623d2a8471SDag-Erling Smørgrav 		|| (p += 6) >= ln + len)
4633d2a8471SDag-Erling Smørgrav 		goto fouch;
4643d2a8471SDag-Erling Smørgrav 	    while ((p < ln + len) && isdigit(*p))
4653d2a8471SDag-Erling Smørgrav 		pos = pos * 10 + (*p++ - '0');
4663d2a8471SDag-Erling Smørgrav 	    /* XXX wouldn't hurt to be slightly more paranoid here */
4673d2a8471SDag-Erling Smørgrav 	    DEBUG(fprintf(stderr, "contrange: [\033[1m%lld-\033[m]\n", pos));
4683d2a8471SDag-Erling Smørgrav 	    if (pos > URL->offset)
4693d2a8471SDag-Erling Smørgrav 		goto fouch;
4703d2a8471SDag-Erling Smørgrav #undef BYTES
4713d2a8471SDag-Erling Smørgrav #undef CONTRANGE
4724ca1ab94SDag-Erling Smørgrav 	}
4734ca1ab94SDag-Erling Smørgrav     }
4744ca1ab94SDag-Erling Smørgrav 
4754ca1ab94SDag-Erling Smørgrav     /* only body remains */
4764ca1ab94SDag-Erling Smørgrav     c->encoding = enc;
4774ca1ab94SDag-Erling Smørgrav     cf = funopen(c,
4784ca1ab94SDag-Erling Smørgrav 		 (int (*)(void *, char *, int))_http_readfn,
4794ca1ab94SDag-Erling Smørgrav 		 (int (*)(void *, const char *, int))_http_writefn,
4804ca1ab94SDag-Erling Smørgrav 		 (fpos_t (*)(void *, fpos_t, int))NULL,
4814ca1ab94SDag-Erling Smørgrav 		 (int (*)(void *))_http_closefn);
4824ca1ab94SDag-Erling Smørgrav     if (cf == NULL)
4834ca1ab94SDag-Erling Smørgrav 	goto fouch;
484e6182307SDag-Erling Smørgrav 
4853d2a8471SDag-Erling Smørgrav     while (pos < URL->offset)
4863d2a8471SDag-Erling Smørgrav 	if (fgetc(cf) == EOF)
4873d2a8471SDag-Erling Smørgrav 	    goto cfouch;
4883d2a8471SDag-Erling Smørgrav 
4894ca1ab94SDag-Erling Smørgrav     return cf;
4904ca1ab94SDag-Erling Smørgrav 
4914ca1ab94SDag-Erling Smørgrav ouch:
4928e3986eaSDag-Erling Smørgrav     if (sd >= 0)
4938e3986eaSDag-Erling Smørgrav 	close(sd);
4944ca1ab94SDag-Erling Smørgrav     free(c);
4950fba3a00SDag-Erling Smørgrav     _http_seterr(999); /* XXX do this properly RSN */
4964ca1ab94SDag-Erling Smørgrav     return NULL;
4974ca1ab94SDag-Erling Smørgrav fouch:
4984ca1ab94SDag-Erling Smørgrav     fclose(f);
4994ca1ab94SDag-Erling Smørgrav     free(c);
5000fba3a00SDag-Erling Smørgrav     _http_seterr(999); /* XXX do this properly RSN */
5014ca1ab94SDag-Erling Smørgrav     return NULL;
5023d2a8471SDag-Erling Smørgrav cfouch:
5033d2a8471SDag-Erling Smørgrav     fclose(cf);
5043d2a8471SDag-Erling Smørgrav     _http_seterr(999); /* XXX do this properly RSN */
5053d2a8471SDag-Erling Smørgrav     return NULL;
5064ca1ab94SDag-Erling Smørgrav }
5074ca1ab94SDag-Erling Smørgrav 
5084ca1ab94SDag-Erling Smørgrav FILE *
509d8acd8dcSDag-Erling Smørgrav fetchPutHTTP(struct url *URL, char *flags)
5104ca1ab94SDag-Erling Smørgrav {
5114ca1ab94SDag-Erling Smørgrav     warnx("fetchPutHTTP(): not implemented");
5124ca1ab94SDag-Erling Smørgrav     return NULL;
5134ca1ab94SDag-Erling Smørgrav }
514d8acd8dcSDag-Erling Smørgrav 
515d8acd8dcSDag-Erling Smørgrav /*
516d8acd8dcSDag-Erling Smørgrav  * Get an HTTP document's metadata
517d8acd8dcSDag-Erling Smørgrav  */
518d8acd8dcSDag-Erling Smørgrav int
519d8acd8dcSDag-Erling Smørgrav fetchStatHTTP(struct url *url, struct url_stat *us, char *flags)
520d8acd8dcSDag-Erling Smørgrav {
521d8acd8dcSDag-Erling Smørgrav     warnx("fetchStatHTTP(): not implemented");
522d8acd8dcSDag-Erling Smørgrav     return -1;
523d8acd8dcSDag-Erling Smørgrav }
524ce71b736SDag-Erling Smørgrav 
525ce71b736SDag-Erling Smørgrav /*
526ce71b736SDag-Erling Smørgrav  * List a directory
527ce71b736SDag-Erling Smørgrav  */
528ce71b736SDag-Erling Smørgrav struct url_ent *
529ce71b736SDag-Erling Smørgrav fetchListHTTP(struct url *url, char *flags)
530ce71b736SDag-Erling Smørgrav {
531ce71b736SDag-Erling Smørgrav     warnx("fetchListHTTP(): not implemented");
532ce71b736SDag-Erling Smørgrav     return NULL;
533ce71b736SDag-Erling Smørgrav }
534