14ca1ab94SDag-Erling Smørgrav /*- 2e4878e39SDag-Erling Smørgrav * Copyright (c) 2000 Dag-Erling Co�dan Sm�rgrav 34ca1ab94SDag-Erling Smørgrav * All rights reserved. 44ca1ab94SDag-Erling Smørgrav * 54ca1ab94SDag-Erling Smørgrav * Redistribution and use in source and binary forms, with or without 64ca1ab94SDag-Erling Smørgrav * modification, are permitted provided that the following conditions 74ca1ab94SDag-Erling Smørgrav * are met: 84ca1ab94SDag-Erling Smørgrav * 1. Redistributions of source code must retain the above copyright 94ca1ab94SDag-Erling Smørgrav * notice, this list of conditions and the following disclaimer 104ca1ab94SDag-Erling Smørgrav * in this position and unchanged. 114ca1ab94SDag-Erling Smørgrav * 2. Redistributions in binary form must reproduce the above copyright 124ca1ab94SDag-Erling Smørgrav * notice, this list of conditions and the following disclaimer in the 134ca1ab94SDag-Erling Smørgrav * documentation and/or other materials provided with the distribution. 144ca1ab94SDag-Erling Smørgrav * 3. The name of the author may not be used to endorse or promote products 15e4878e39SDag-Erling Smørgrav * derived from this software without specific prior written permission. 164ca1ab94SDag-Erling Smørgrav * 174ca1ab94SDag-Erling Smørgrav * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 184ca1ab94SDag-Erling Smørgrav * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 194ca1ab94SDag-Erling Smørgrav * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 204ca1ab94SDag-Erling Smørgrav * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 214ca1ab94SDag-Erling Smørgrav * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 224ca1ab94SDag-Erling Smørgrav * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 234ca1ab94SDag-Erling Smørgrav * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 244ca1ab94SDag-Erling Smørgrav * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 254ca1ab94SDag-Erling Smørgrav * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 264ca1ab94SDag-Erling Smørgrav * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 274ca1ab94SDag-Erling Smørgrav */ 284ca1ab94SDag-Erling Smørgrav 29cecb889fSMatthew Dillon #include <sys/cdefs.h> 30cecb889fSMatthew Dillon __FBSDID("$FreeBSD$"); 31cecb889fSMatthew Dillon 326290ee73SDag-Erling Smørgrav /* 336290ee73SDag-Erling Smørgrav * The following copyright applies to the base64 code: 346290ee73SDag-Erling Smørgrav * 356290ee73SDag-Erling Smørgrav *- 366290ee73SDag-Erling Smørgrav * Copyright 1997 Massachusetts Institute of Technology 376290ee73SDag-Erling Smørgrav * 386290ee73SDag-Erling Smørgrav * Permission to use, copy, modify, and distribute this software and 396290ee73SDag-Erling Smørgrav * its documentation for any purpose and without fee is hereby 406290ee73SDag-Erling Smørgrav * granted, provided that both the above copyright notice and this 416290ee73SDag-Erling Smørgrav * permission notice appear in all copies, that both the above 426290ee73SDag-Erling Smørgrav * copyright notice and this permission notice appear in all 436290ee73SDag-Erling Smørgrav * supporting documentation, and that the name of M.I.T. not be used 446290ee73SDag-Erling Smørgrav * in advertising or publicity pertaining to distribution of the 456290ee73SDag-Erling Smørgrav * software without specific, written prior permission. M.I.T. makes 466290ee73SDag-Erling Smørgrav * no representations about the suitability of this software for any 476290ee73SDag-Erling Smørgrav * purpose. It is provided "as is" without express or implied 486290ee73SDag-Erling Smørgrav * warranty. 496290ee73SDag-Erling Smørgrav * 506290ee73SDag-Erling Smørgrav * THIS SOFTWARE IS PROVIDED BY M.I.T. ``AS IS''. M.I.T. DISCLAIMS 516290ee73SDag-Erling Smørgrav * ALL EXPRESS OR IMPLIED WARRANTIES WITH REGARD TO THIS SOFTWARE, 526290ee73SDag-Erling Smørgrav * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF 536290ee73SDag-Erling Smørgrav * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT 546290ee73SDag-Erling Smørgrav * SHALL M.I.T. BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 556290ee73SDag-Erling Smørgrav * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 566290ee73SDag-Erling Smørgrav * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF 576290ee73SDag-Erling Smørgrav * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND 586290ee73SDag-Erling Smørgrav * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 596290ee73SDag-Erling Smørgrav * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT 606290ee73SDag-Erling Smørgrav * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 616290ee73SDag-Erling Smørgrav * SUCH DAMAGE. 626290ee73SDag-Erling Smørgrav */ 636290ee73SDag-Erling Smørgrav 644ca1ab94SDag-Erling Smørgrav #include <sys/param.h> 6528c645cfSHajimu UMEMOTO #include <sys/socket.h> 664ca1ab94SDag-Erling Smørgrav 674ca1ab94SDag-Erling Smørgrav #include <ctype.h> 68e4878e39SDag-Erling Smørgrav #include <err.h> 69e4878e39SDag-Erling Smørgrav #include <errno.h> 7060245e42SDag-Erling Smørgrav #include <locale.h> 71e6182307SDag-Erling Smørgrav #include <netdb.h> 72f62e5228SDag-Erling Smørgrav #include <stdarg.h> 734ca1ab94SDag-Erling Smørgrav #include <stdio.h> 744ca1ab94SDag-Erling Smørgrav #include <stdlib.h> 754ca1ab94SDag-Erling Smørgrav #include <string.h> 7660245e42SDag-Erling Smørgrav #include <time.h> 774ca1ab94SDag-Erling Smørgrav #include <unistd.h> 784ca1ab94SDag-Erling Smørgrav 794ca1ab94SDag-Erling Smørgrav #include "fetch.h" 80842a95ccSDag-Erling Smørgrav #include "common.h" 810fba3a00SDag-Erling Smørgrav #include "httperr.h" 824ca1ab94SDag-Erling Smørgrav 83e4878e39SDag-Erling Smørgrav /* Maximum number of redirects to follow */ 84e4878e39SDag-Erling Smørgrav #define MAX_REDIRECT 5 854ca1ab94SDag-Erling Smørgrav 86e4878e39SDag-Erling Smørgrav /* Symbolic names for reply codes we care about */ 873d2a8471SDag-Erling Smørgrav #define HTTP_OK 200 883d2a8471SDag-Erling Smørgrav #define HTTP_PARTIAL 206 89e4878e39SDag-Erling Smørgrav #define HTTP_MOVED_PERM 301 90e4878e39SDag-Erling Smørgrav #define HTTP_MOVED_TEMP 302 91e4878e39SDag-Erling Smørgrav #define HTTP_SEE_OTHER 303 92e4878e39SDag-Erling Smørgrav #define HTTP_NEED_AUTH 401 9365986545SDag-Erling Smørgrav #define HTTP_NEED_PROXY_AUTH 407 94e4878e39SDag-Erling Smørgrav #define HTTP_PROTOCOL_ERROR 999 95e4878e39SDag-Erling Smørgrav 96e4878e39SDag-Erling Smørgrav #define HTTP_REDIRECT(xyz) ((xyz) == HTTP_MOVED_PERM \ 97e4878e39SDag-Erling Smørgrav || (xyz) == HTTP_MOVED_TEMP \ 98e4878e39SDag-Erling Smørgrav || (xyz) == HTTP_SEE_OTHER) 99e4878e39SDag-Erling Smørgrav 100a8e9bd87SDag-Erling Smørgrav #define HTTP_ERROR(xyz) ((xyz) > 400 && (xyz) < 599) 101e4878e39SDag-Erling Smørgrav 102e19e6098SDag-Erling Smørgrav 103e4878e39SDag-Erling Smørgrav /***************************************************************************** 104e4878e39SDag-Erling Smørgrav * I/O functions for decoding chunked streams 105e4878e39SDag-Erling Smørgrav */ 1063d2a8471SDag-Erling Smørgrav 1074ca1ab94SDag-Erling Smørgrav struct cookie 1084ca1ab94SDag-Erling Smørgrav { 109dea29ca1SDag-Erling Smørgrav conn_t *conn; 1104ca1ab94SDag-Erling Smørgrav char *buf; 111e4878e39SDag-Erling Smørgrav size_t b_size; 112f573a5fcSDag-Erling Smørgrav ssize_t b_len; 113e4878e39SDag-Erling Smørgrav int b_pos; 114e4878e39SDag-Erling Smørgrav int eof; 115e4878e39SDag-Erling Smørgrav int error; 116f573a5fcSDag-Erling Smørgrav size_t chunksize; 117e66b3802SDag-Erling Smørgrav #ifndef NDEBUG 118f573a5fcSDag-Erling Smørgrav size_t total; 119e4878e39SDag-Erling Smørgrav #endif 1204ca1ab94SDag-Erling Smørgrav }; 1214ca1ab94SDag-Erling Smørgrav 122f62e5228SDag-Erling Smørgrav /* 123e4878e39SDag-Erling Smørgrav * Get next chunk header 124f62e5228SDag-Erling Smørgrav */ 125f62e5228SDag-Erling Smørgrav static int 126e4878e39SDag-Erling Smørgrav _http_new_chunk(struct cookie *c) 127f62e5228SDag-Erling Smørgrav { 128e4878e39SDag-Erling Smørgrav char *p; 129f62e5228SDag-Erling Smørgrav 130dea29ca1SDag-Erling Smørgrav if (_fetch_getln(c->conn) == -1) 131e19e6098SDag-Erling Smørgrav return (-1); 132f62e5228SDag-Erling Smørgrav 133dea29ca1SDag-Erling Smørgrav if (c->b_len < 2 || !ishexnumber(*c->conn->buf)) 134e19e6098SDag-Erling Smørgrav return (-1); 135e4878e39SDag-Erling Smørgrav 136dea29ca1SDag-Erling Smørgrav for (p = c->conn->buf; *p && !isspace(*p); ++p) { 137e19e6098SDag-Erling Smørgrav if (*p == ';') 138e19e6098SDag-Erling Smørgrav break; 139e4878e39SDag-Erling Smørgrav if (!ishexnumber(*p)) 140e19e6098SDag-Erling Smørgrav return (-1); 141e19e6098SDag-Erling Smørgrav if (isdigit(*p)) { 142e19e6098SDag-Erling Smørgrav c->chunksize = c->chunksize * 16 + 143e19e6098SDag-Erling Smørgrav *p - '0'; 144e19e6098SDag-Erling Smørgrav } else { 145e19e6098SDag-Erling Smørgrav c->chunksize = c->chunksize * 16 + 146e19e6098SDag-Erling Smørgrav 10 + tolower(*p) - 'a'; 147e19e6098SDag-Erling Smørgrav } 148e19e6098SDag-Erling Smørgrav } 149e4878e39SDag-Erling Smørgrav 150e66b3802SDag-Erling Smørgrav #ifndef NDEBUG 1517f807cb8SDag-Erling Smørgrav if (fetchDebug) { 152e4878e39SDag-Erling Smørgrav c->total += c->chunksize; 153e4878e39SDag-Erling Smørgrav if (c->chunksize == 0) 154f67efa37SDag-Erling Smørgrav fprintf(stderr, "_http_fillbuf(): " 155f67efa37SDag-Erling Smørgrav "end of last chunk\n"); 156e4878e39SDag-Erling Smørgrav else 157f67efa37SDag-Erling Smørgrav fprintf(stderr, "_http_fillbuf(): " 158f67efa37SDag-Erling Smørgrav "new chunk: %lu (%lu)\n", 159f573a5fcSDag-Erling Smørgrav (unsigned long)c->chunksize, (unsigned long)c->total); 1607f807cb8SDag-Erling Smørgrav } 161e4878e39SDag-Erling Smørgrav #endif 162e4878e39SDag-Erling Smørgrav 163e19e6098SDag-Erling Smørgrav return (c->chunksize); 164f62e5228SDag-Erling Smørgrav } 165f62e5228SDag-Erling Smørgrav 166f62e5228SDag-Erling Smørgrav /* 167f62e5228SDag-Erling Smørgrav * Fill the input buffer, do chunk decoding on the fly 168f62e5228SDag-Erling Smørgrav */ 169e4878e39SDag-Erling Smørgrav static int 1704ca1ab94SDag-Erling Smørgrav _http_fillbuf(struct cookie *c) 1714ca1ab94SDag-Erling Smørgrav { 172e4878e39SDag-Erling Smørgrav if (c->error) 173e19e6098SDag-Erling Smørgrav return (-1); 1744ca1ab94SDag-Erling Smørgrav if (c->eof) 175e19e6098SDag-Erling Smørgrav return (0); 1764ca1ab94SDag-Erling Smørgrav 1774ca1ab94SDag-Erling Smørgrav if (c->chunksize == 0) { 178e4878e39SDag-Erling Smørgrav switch (_http_new_chunk(c)) { 179e4878e39SDag-Erling Smørgrav case -1: 180e4878e39SDag-Erling Smørgrav c->error = 1; 181e19e6098SDag-Erling Smørgrav return (-1); 182e4878e39SDag-Erling Smørgrav case 0: 1834ca1ab94SDag-Erling Smørgrav c->eof = 1; 184e19e6098SDag-Erling Smørgrav return (0); 1854ca1ab94SDag-Erling Smørgrav } 1864ca1ab94SDag-Erling Smørgrav } 187e4878e39SDag-Erling Smørgrav 188e4878e39SDag-Erling Smørgrav if (c->b_size < c->chunksize) { 189e4878e39SDag-Erling Smørgrav char *tmp; 190e4878e39SDag-Erling Smørgrav 191e4878e39SDag-Erling Smørgrav if ((tmp = realloc(c->buf, c->chunksize)) == NULL) 192e19e6098SDag-Erling Smørgrav return (-1); 193e4878e39SDag-Erling Smørgrav c->buf = tmp; 194e4878e39SDag-Erling Smørgrav c->b_size = c->chunksize; 195e4878e39SDag-Erling Smørgrav } 196e4878e39SDag-Erling Smørgrav 197dea29ca1SDag-Erling Smørgrav if ((c->b_len = read(c->conn->sd, c->buf, c->chunksize)) == -1) 198e19e6098SDag-Erling Smørgrav return (-1); 1994ca1ab94SDag-Erling Smørgrav c->chunksize -= c->b_len; 200e4878e39SDag-Erling Smørgrav 201e4878e39SDag-Erling Smørgrav if (c->chunksize == 0) { 202dea29ca1SDag-Erling Smørgrav char endl[2]; 203dea29ca1SDag-Erling Smørgrav 204dea29ca1SDag-Erling Smørgrav if (read(c->conn->sd, &endl[0], 1) == -1 || 205dea29ca1SDag-Erling Smørgrav read(c->conn->sd, &endl[1], 1) == -1 || 206dea29ca1SDag-Erling Smørgrav endl[0] != '\r' || endl[1] != '\n') 207e19e6098SDag-Erling Smørgrav return (-1); 2084ca1ab94SDag-Erling Smørgrav } 209e4878e39SDag-Erling Smørgrav 210e4878e39SDag-Erling Smørgrav c->b_pos = 0; 211e4878e39SDag-Erling Smørgrav 212e19e6098SDag-Erling Smørgrav return (c->b_len); 2134ca1ab94SDag-Erling Smørgrav } 2144ca1ab94SDag-Erling Smørgrav 215f62e5228SDag-Erling Smørgrav /* 216f62e5228SDag-Erling Smørgrav * Read function 217f62e5228SDag-Erling Smørgrav */ 2184ca1ab94SDag-Erling Smørgrav static int 219e4878e39SDag-Erling Smørgrav _http_readfn(void *v, char *buf, int len) 2204ca1ab94SDag-Erling Smørgrav { 221e4878e39SDag-Erling Smørgrav struct cookie *c = (struct cookie *)v; 222e4878e39SDag-Erling Smørgrav int l, pos; 2234ca1ab94SDag-Erling Smørgrav 224e4878e39SDag-Erling Smørgrav if (c->error) 225e19e6098SDag-Erling Smørgrav return (-1); 226e4878e39SDag-Erling Smørgrav if (c->eof) 227e19e6098SDag-Erling Smørgrav return (0); 228e4878e39SDag-Erling Smørgrav 229e4878e39SDag-Erling Smørgrav for (pos = 0; len > 0; pos += l, len -= l) { 230e4878e39SDag-Erling Smørgrav /* empty buffer */ 231e4878e39SDag-Erling Smørgrav if (!c->buf || c->b_pos == c->b_len) 232e4878e39SDag-Erling Smørgrav if (_http_fillbuf(c) < 1) 233e4878e39SDag-Erling Smørgrav break; 234e4878e39SDag-Erling Smørgrav l = c->b_len - c->b_pos; 235e4878e39SDag-Erling Smørgrav if (len < l) 236e4878e39SDag-Erling Smørgrav l = len; 237e4878e39SDag-Erling Smørgrav bcopy(c->buf + c->b_pos, buf + pos, l); 238e4878e39SDag-Erling Smørgrav c->b_pos += l; 2394ca1ab94SDag-Erling Smørgrav } 2404ca1ab94SDag-Erling Smørgrav 241e4878e39SDag-Erling Smørgrav if (!pos && c->error) 242e19e6098SDag-Erling Smørgrav return (-1); 243e19e6098SDag-Erling Smørgrav return (pos); 2444ca1ab94SDag-Erling Smørgrav } 2454ca1ab94SDag-Erling Smørgrav 246f62e5228SDag-Erling Smørgrav /* 247f62e5228SDag-Erling Smørgrav * Write function 248f62e5228SDag-Erling Smørgrav */ 2494ca1ab94SDag-Erling Smørgrav static int 250e4878e39SDag-Erling Smørgrav _http_writefn(void *v, const char *buf, int len) 2514ca1ab94SDag-Erling Smørgrav { 252e4878e39SDag-Erling Smørgrav struct cookie *c = (struct cookie *)v; 253e4878e39SDag-Erling Smørgrav 254dea29ca1SDag-Erling Smørgrav return (write(c->conn->sd, buf, len)); 2554ca1ab94SDag-Erling Smørgrav } 2564ca1ab94SDag-Erling Smørgrav 257f62e5228SDag-Erling Smørgrav /* 258f62e5228SDag-Erling Smørgrav * Close function 259f62e5228SDag-Erling Smørgrav */ 2604ca1ab94SDag-Erling Smørgrav static int 261e4878e39SDag-Erling Smørgrav _http_closefn(void *v) 2624ca1ab94SDag-Erling Smørgrav { 263e4878e39SDag-Erling Smørgrav struct cookie *c = (struct cookie *)v; 264e4878e39SDag-Erling Smørgrav int r; 265e4878e39SDag-Erling Smørgrav 266dea29ca1SDag-Erling Smørgrav r = _fetch_close(c->conn); 267e4878e39SDag-Erling Smørgrav if (c->buf) 268e4878e39SDag-Erling Smørgrav free(c->buf); 2694ca1ab94SDag-Erling Smørgrav free(c); 270e19e6098SDag-Erling Smørgrav return (r); 2714ca1ab94SDag-Erling Smørgrav } 2724ca1ab94SDag-Erling Smørgrav 273f62e5228SDag-Erling Smørgrav /* 274e4878e39SDag-Erling Smørgrav * Wrap a file descriptor up 275f62e5228SDag-Erling Smørgrav */ 276e4878e39SDag-Erling Smørgrav static FILE * 277dea29ca1SDag-Erling Smørgrav _http_funopen(conn_t *conn) 2784ca1ab94SDag-Erling Smørgrav { 279e4878e39SDag-Erling Smørgrav struct cookie *c; 280e4878e39SDag-Erling Smørgrav FILE *f; 281e4878e39SDag-Erling Smørgrav 282e4878e39SDag-Erling Smørgrav if ((c = calloc(1, sizeof *c)) == NULL) { 283e4878e39SDag-Erling Smørgrav _fetch_syserr(); 284e19e6098SDag-Erling Smørgrav return (NULL); 2854ca1ab94SDag-Erling Smørgrav } 286dea29ca1SDag-Erling Smørgrav c->conn = conn; 287e19e6098SDag-Erling Smørgrav f = funopen(c, _http_readfn, _http_writefn, NULL, _http_closefn); 288e19e6098SDag-Erling Smørgrav if (f == NULL) { 289e4878e39SDag-Erling Smørgrav _fetch_syserr(); 290e4878e39SDag-Erling Smørgrav free(c); 291e19e6098SDag-Erling Smørgrav return (NULL); 292e4878e39SDag-Erling Smørgrav } 293e19e6098SDag-Erling Smørgrav return (f); 294e4878e39SDag-Erling Smørgrav } 295e4878e39SDag-Erling Smørgrav 296e19e6098SDag-Erling Smørgrav 297e4878e39SDag-Erling Smørgrav /***************************************************************************** 298e4878e39SDag-Erling Smørgrav * Helper functions for talking to the server and parsing its replies 299e4878e39SDag-Erling Smørgrav */ 300e4878e39SDag-Erling Smørgrav 301e4878e39SDag-Erling Smørgrav /* Header types */ 302e4878e39SDag-Erling Smørgrav typedef enum { 303e4878e39SDag-Erling Smørgrav hdr_syserror = -2, 304e4878e39SDag-Erling Smørgrav hdr_error = -1, 305e4878e39SDag-Erling Smørgrav hdr_end = 0, 306e4878e39SDag-Erling Smørgrav hdr_unknown = 1, 307e4878e39SDag-Erling Smørgrav hdr_content_length, 308e4878e39SDag-Erling Smørgrav hdr_content_range, 309e4878e39SDag-Erling Smørgrav hdr_last_modified, 310e4878e39SDag-Erling Smørgrav hdr_location, 3116490b215SDag-Erling Smørgrav hdr_transfer_encoding, 3126490b215SDag-Erling Smørgrav hdr_www_authenticate 313f573a5fcSDag-Erling Smørgrav } hdr_t; 314e4878e39SDag-Erling Smørgrav 315e4878e39SDag-Erling Smørgrav /* Names of interesting headers */ 316e4878e39SDag-Erling Smørgrav static struct { 317f573a5fcSDag-Erling Smørgrav hdr_t num; 31838c7e4a6SArchie Cobbs const char *name; 319e4878e39SDag-Erling Smørgrav } hdr_names[] = { 320e4878e39SDag-Erling Smørgrav { hdr_content_length, "Content-Length" }, 321e4878e39SDag-Erling Smørgrav { hdr_content_range, "Content-Range" }, 322e4878e39SDag-Erling Smørgrav { hdr_last_modified, "Last-Modified" }, 323e4878e39SDag-Erling Smørgrav { hdr_location, "Location" }, 324e4878e39SDag-Erling Smørgrav { hdr_transfer_encoding, "Transfer-Encoding" }, 3256490b215SDag-Erling Smørgrav { hdr_www_authenticate, "WWW-Authenticate" }, 326e4878e39SDag-Erling Smørgrav { hdr_unknown, NULL }, 327e4878e39SDag-Erling Smørgrav }; 328e4878e39SDag-Erling Smørgrav 329e4878e39SDag-Erling Smørgrav /* 330e4878e39SDag-Erling Smørgrav * Send a formatted line; optionally echo to terminal 331e4878e39SDag-Erling Smørgrav */ 332e4878e39SDag-Erling Smørgrav static int 333dea29ca1SDag-Erling Smørgrav _http_cmd(conn_t *conn, const char *fmt, ...) 334e4878e39SDag-Erling Smørgrav { 335e4878e39SDag-Erling Smørgrav va_list ap; 336e4878e39SDag-Erling Smørgrav size_t len; 337e4878e39SDag-Erling Smørgrav char *msg; 338e4878e39SDag-Erling Smørgrav int r; 339e4878e39SDag-Erling Smørgrav 340e4878e39SDag-Erling Smørgrav va_start(ap, fmt); 341e4878e39SDag-Erling Smørgrav len = vasprintf(&msg, fmt, ap); 342e4878e39SDag-Erling Smørgrav va_end(ap); 343e4878e39SDag-Erling Smørgrav 344e4878e39SDag-Erling Smørgrav if (msg == NULL) { 345e4878e39SDag-Erling Smørgrav errno = ENOMEM; 346e4878e39SDag-Erling Smørgrav _fetch_syserr(); 347e19e6098SDag-Erling Smørgrav return (-1); 348e4878e39SDag-Erling Smørgrav } 349e4878e39SDag-Erling Smørgrav 350dea29ca1SDag-Erling Smørgrav r = _fetch_putln(conn, msg, len); 351e4878e39SDag-Erling Smørgrav free(msg); 352e4878e39SDag-Erling Smørgrav 353e4878e39SDag-Erling Smørgrav if (r == -1) { 354e4878e39SDag-Erling Smørgrav _fetch_syserr(); 355e19e6098SDag-Erling Smørgrav return (-1); 356e4878e39SDag-Erling Smørgrav } 357e4878e39SDag-Erling Smørgrav 358e19e6098SDag-Erling Smørgrav return (0); 359e4878e39SDag-Erling Smørgrav } 360e4878e39SDag-Erling Smørgrav 361e4878e39SDag-Erling Smørgrav /* 362e4878e39SDag-Erling Smørgrav * Get and parse status line 363e4878e39SDag-Erling Smørgrav */ 364e4878e39SDag-Erling Smørgrav static int 365dea29ca1SDag-Erling Smørgrav _http_get_reply(conn_t *conn) 366e4878e39SDag-Erling Smørgrav { 367a898bb8dSDag-Erling Smørgrav char *p; 368a898bb8dSDag-Erling Smørgrav 369dea29ca1SDag-Erling Smørgrav if (_fetch_getln(conn) == -1) 370e19e6098SDag-Erling Smørgrav return (-1); 371e4878e39SDag-Erling Smørgrav /* 372e4878e39SDag-Erling Smørgrav * A valid status line looks like "HTTP/m.n xyz reason" where m 373e4878e39SDag-Erling Smørgrav * and n are the major and minor protocol version numbers and xyz 374e4878e39SDag-Erling Smørgrav * is the reply code. 375a898bb8dSDag-Erling Smørgrav * Unfortunately, there are servers out there (NCSA 1.5.1, to name 376a898bb8dSDag-Erling Smørgrav * just one) that do not send a version number, so we can't rely 377a898bb8dSDag-Erling Smørgrav * on finding one, but if we do, insist on it being 1.0 or 1.1. 378e4878e39SDag-Erling Smørgrav * We don't care about the reason phrase. 379e4878e39SDag-Erling Smørgrav */ 380dea29ca1SDag-Erling Smørgrav if (strncmp(conn->buf, "HTTP", 4) != 0) 381e19e6098SDag-Erling Smørgrav return (HTTP_PROTOCOL_ERROR); 382dea29ca1SDag-Erling Smørgrav p = conn->buf + 4; 383a898bb8dSDag-Erling Smørgrav if (*p == '/') { 384a898bb8dSDag-Erling Smørgrav if (p[1] != '1' || p[2] != '.' || (p[3] != '0' && p[3] != '1')) 385e19e6098SDag-Erling Smørgrav return (HTTP_PROTOCOL_ERROR); 386a898bb8dSDag-Erling Smørgrav p += 4; 387a898bb8dSDag-Erling Smørgrav } 388e19e6098SDag-Erling Smørgrav if (*p != ' ' || !isdigit(p[1]) || !isdigit(p[2]) || !isdigit(p[3])) 389e19e6098SDag-Erling Smørgrav return (HTTP_PROTOCOL_ERROR); 390e4878e39SDag-Erling Smørgrav 391dea29ca1SDag-Erling Smørgrav conn->err = (p[1] - '0') * 100 + (p[2] - '0') * 10 + (p[3] - '0'); 392dea29ca1SDag-Erling Smørgrav return (conn->err); 393e4878e39SDag-Erling Smørgrav } 394e4878e39SDag-Erling Smørgrav 395e4878e39SDag-Erling Smørgrav /* 396e19e6098SDag-Erling Smørgrav * Check a header; if the type matches the given string, return a pointer 397e19e6098SDag-Erling Smørgrav * to the beginning of the value. 398e4878e39SDag-Erling Smørgrav */ 39938c7e4a6SArchie Cobbs static const char * 40038c7e4a6SArchie Cobbs _http_match(const char *str, const char *hdr) 401e4878e39SDag-Erling Smørgrav { 402e4878e39SDag-Erling Smørgrav while (*str && *hdr && tolower(*str++) == tolower(*hdr++)) 403e4878e39SDag-Erling Smørgrav /* nothing */; 404e4878e39SDag-Erling Smørgrav if (*str || *hdr != ':') 405e19e6098SDag-Erling Smørgrav return (NULL); 406e4878e39SDag-Erling Smørgrav while (*hdr && isspace(*++hdr)) 407e4878e39SDag-Erling Smørgrav /* nothing */; 408e19e6098SDag-Erling Smørgrav return (hdr); 409e4878e39SDag-Erling Smørgrav } 410e4878e39SDag-Erling Smørgrav 411e4878e39SDag-Erling Smørgrav /* 412e4878e39SDag-Erling Smørgrav * Get the next header and return the appropriate symbolic code. 413e4878e39SDag-Erling Smørgrav */ 414f573a5fcSDag-Erling Smørgrav static hdr_t 415dea29ca1SDag-Erling Smørgrav _http_next_header(conn_t *conn, const char **p) 416e4878e39SDag-Erling Smørgrav { 417e4878e39SDag-Erling Smørgrav int i; 418e4878e39SDag-Erling Smørgrav 419dea29ca1SDag-Erling Smørgrav if (_fetch_getln(conn) == -1) 420e19e6098SDag-Erling Smørgrav return (hdr_syserror); 421dea29ca1SDag-Erling Smørgrav while (conn->buflen && isspace(conn->buf[conn->buflen - 1])) 422dea29ca1SDag-Erling Smørgrav conn->buflen--; 423dea29ca1SDag-Erling Smørgrav conn->buf[conn->buflen] = '\0'; 424dea29ca1SDag-Erling Smørgrav if (conn->buflen == 0) 425e19e6098SDag-Erling Smørgrav return (hdr_end); 426e4878e39SDag-Erling Smørgrav /* 427e4878e39SDag-Erling Smørgrav * We could check for malformed headers but we don't really care. 428e4878e39SDag-Erling Smørgrav * A valid header starts with a token immediately followed by a 429e4878e39SDag-Erling Smørgrav * colon; a token is any sequence of non-control, non-whitespace 430e4878e39SDag-Erling Smørgrav * characters except "()<>@,;:\\\"{}". 431e4878e39SDag-Erling Smørgrav */ 432e4878e39SDag-Erling Smørgrav for (i = 0; hdr_names[i].num != hdr_unknown; i++) 433dea29ca1SDag-Erling Smørgrav if ((*p = _http_match(hdr_names[i].name, conn->buf)) != NULL) 434e19e6098SDag-Erling Smørgrav return (hdr_names[i].num); 435e19e6098SDag-Erling Smørgrav return (hdr_unknown); 436e4878e39SDag-Erling Smørgrav } 437e4878e39SDag-Erling Smørgrav 438e4878e39SDag-Erling Smørgrav /* 439e4878e39SDag-Erling Smørgrav * Parse a last-modified header 440e4878e39SDag-Erling Smørgrav */ 441c78f1cc9SDag-Erling Smørgrav static int 44238c7e4a6SArchie Cobbs _http_parse_mtime(const char *p, time_t *mtime) 443e4878e39SDag-Erling Smørgrav { 444c78f1cc9SDag-Erling Smørgrav char locale[64], *r; 445e4878e39SDag-Erling Smørgrav struct tm tm; 446e4878e39SDag-Erling Smørgrav 447e4878e39SDag-Erling Smørgrav strncpy(locale, setlocale(LC_TIME, NULL), sizeof locale); 448e4878e39SDag-Erling Smørgrav setlocale(LC_TIME, "C"); 449c78f1cc9SDag-Erling Smørgrav r = strptime(p, "%a, %d %b %Y %H:%M:%S GMT", &tm); 450e4878e39SDag-Erling Smørgrav /* XXX should add support for date-2 and date-3 */ 451e4878e39SDag-Erling Smørgrav setlocale(LC_TIME, locale); 452c78f1cc9SDag-Erling Smørgrav if (r == NULL) 453e19e6098SDag-Erling Smørgrav return (-1); 454f67efa37SDag-Erling Smørgrav DEBUG(fprintf(stderr, "last modified: [%04d-%02d-%02d " 455f67efa37SDag-Erling Smørgrav "%02d:%02d:%02d]\n", 456e4878e39SDag-Erling Smørgrav tm.tm_year + 1900, tm.tm_mon + 1, tm.tm_mday, 457e4878e39SDag-Erling Smørgrav tm.tm_hour, tm.tm_min, tm.tm_sec)); 458c78f1cc9SDag-Erling Smørgrav *mtime = timegm(&tm); 459e19e6098SDag-Erling Smørgrav return (0); 460e4878e39SDag-Erling Smørgrav } 461e4878e39SDag-Erling Smørgrav 462e4878e39SDag-Erling Smørgrav /* 463e4878e39SDag-Erling Smørgrav * Parse a content-length header 464e4878e39SDag-Erling Smørgrav */ 465c78f1cc9SDag-Erling Smørgrav static int 46638c7e4a6SArchie Cobbs _http_parse_length(const char *p, off_t *length) 467e4878e39SDag-Erling Smørgrav { 468be6aff99SDag-Erling Smørgrav off_t len; 469e4878e39SDag-Erling Smørgrav 470e4878e39SDag-Erling Smørgrav for (len = 0; *p && isdigit(*p); ++p) 471e4878e39SDag-Erling Smørgrav len = len * 10 + (*p - '0'); 472f573a5fcSDag-Erling Smørgrav if (*p) 473e19e6098SDag-Erling Smørgrav return (-1); 474f67efa37SDag-Erling Smørgrav DEBUG(fprintf(stderr, "content length: [%lld]\n", 475f573a5fcSDag-Erling Smørgrav (long long)len)); 476c78f1cc9SDag-Erling Smørgrav *length = len; 477e19e6098SDag-Erling Smørgrav return (0); 478e4878e39SDag-Erling Smørgrav } 479e4878e39SDag-Erling Smørgrav 480e4878e39SDag-Erling Smørgrav /* 481e4878e39SDag-Erling Smørgrav * Parse a content-range header 482e4878e39SDag-Erling Smørgrav */ 483c78f1cc9SDag-Erling Smørgrav static int 48438c7e4a6SArchie Cobbs _http_parse_range(const char *p, off_t *offset, off_t *length, off_t *size) 485e4878e39SDag-Erling Smørgrav { 486f573a5fcSDag-Erling Smørgrav off_t first, last, len; 487e4878e39SDag-Erling Smørgrav 488e4878e39SDag-Erling Smørgrav if (strncasecmp(p, "bytes ", 6) != 0) 489e19e6098SDag-Erling Smørgrav return (-1); 490c78f1cc9SDag-Erling Smørgrav for (first = 0, p += 6; *p && isdigit(*p); ++p) 491c78f1cc9SDag-Erling Smørgrav first = first * 10 + *p - '0'; 492e4878e39SDag-Erling Smørgrav if (*p != '-') 493e19e6098SDag-Erling Smørgrav return (-1); 494c78f1cc9SDag-Erling Smørgrav for (last = 0, ++p; *p && isdigit(*p); ++p) 495c78f1cc9SDag-Erling Smørgrav last = last * 10 + *p - '0'; 496c78f1cc9SDag-Erling Smørgrav if (first > last || *p != '/') 497e19e6098SDag-Erling Smørgrav return (-1); 498c78f1cc9SDag-Erling Smørgrav for (len = 0, ++p; *p && isdigit(*p); ++p) 499c78f1cc9SDag-Erling Smørgrav len = len * 10 + *p - '0'; 500f573a5fcSDag-Erling Smørgrav if (*p || len < last - first + 1) 501e19e6098SDag-Erling Smørgrav return (-1); 502f67efa37SDag-Erling Smørgrav DEBUG(fprintf(stderr, "content range: [%lld-%lld/%lld]\n", 503f573a5fcSDag-Erling Smørgrav (long long)first, (long long)last, (long long)len)); 504c78f1cc9SDag-Erling Smørgrav *offset = first; 505c78f1cc9SDag-Erling Smørgrav *length = last - first + 1; 506c78f1cc9SDag-Erling Smørgrav *size = len; 507e19e6098SDag-Erling Smørgrav return (0); 508e4878e39SDag-Erling Smørgrav } 509e4878e39SDag-Erling Smørgrav 510e19e6098SDag-Erling Smørgrav 511e4878e39SDag-Erling Smørgrav /***************************************************************************** 512e4878e39SDag-Erling Smørgrav * Helper functions for authorization 513e4878e39SDag-Erling Smørgrav */ 5144ca1ab94SDag-Erling Smørgrav 515f62e5228SDag-Erling Smørgrav /* 516f62e5228SDag-Erling Smørgrav * Base64 encoding 517f62e5228SDag-Erling Smørgrav */ 51835f723dbSDag-Erling Smørgrav static char * 519e19e6098SDag-Erling Smørgrav _http_base64(const char *src) 520f62e5228SDag-Erling Smørgrav { 521f62e5228SDag-Erling Smørgrav static const char base64[] = 522f62e5228SDag-Erling Smørgrav "ABCDEFGHIJKLMNOPQRSTUVWXYZ" 523f62e5228SDag-Erling Smørgrav "abcdefghijklmnopqrstuvwxyz" 524f62e5228SDag-Erling Smørgrav "0123456789+/"; 52535f723dbSDag-Erling Smørgrav char *str, *dst; 52635f723dbSDag-Erling Smørgrav size_t l; 52735f723dbSDag-Erling Smørgrav int t, r; 52835f723dbSDag-Erling Smørgrav 52935f723dbSDag-Erling Smørgrav l = strlen(src); 53035f723dbSDag-Erling Smørgrav if ((str = malloc(((l + 2) / 3) * 4)) == NULL) 531e19e6098SDag-Erling Smørgrav return (NULL); 53235f723dbSDag-Erling Smørgrav dst = str; 53335f723dbSDag-Erling Smørgrav r = 0; 534f62e5228SDag-Erling Smørgrav 535f62e5228SDag-Erling Smørgrav while (l >= 3) { 536f62e5228SDag-Erling Smørgrav t = (src[0] << 16) | (src[1] << 8) | src[2]; 537f62e5228SDag-Erling Smørgrav dst[0] = base64[(t >> 18) & 0x3f]; 538f62e5228SDag-Erling Smørgrav dst[1] = base64[(t >> 12) & 0x3f]; 539f62e5228SDag-Erling Smørgrav dst[2] = base64[(t >> 6) & 0x3f]; 540f62e5228SDag-Erling Smørgrav dst[3] = base64[(t >> 0) & 0x3f]; 541f62e5228SDag-Erling Smørgrav src += 3; l -= 3; 542f62e5228SDag-Erling Smørgrav dst += 4; r += 4; 543f62e5228SDag-Erling Smørgrav } 544f62e5228SDag-Erling Smørgrav 545f62e5228SDag-Erling Smørgrav switch (l) { 546f62e5228SDag-Erling Smørgrav case 2: 547f62e5228SDag-Erling Smørgrav t = (src[0] << 16) | (src[1] << 8); 548f62e5228SDag-Erling Smørgrav dst[0] = base64[(t >> 18) & 0x3f]; 549f62e5228SDag-Erling Smørgrav dst[1] = base64[(t >> 12) & 0x3f]; 550f62e5228SDag-Erling Smørgrav dst[2] = base64[(t >> 6) & 0x3f]; 551f62e5228SDag-Erling Smørgrav dst[3] = '='; 552f62e5228SDag-Erling Smørgrav dst += 4; 553f62e5228SDag-Erling Smørgrav r += 4; 554f62e5228SDag-Erling Smørgrav break; 555f62e5228SDag-Erling Smørgrav case 1: 556f62e5228SDag-Erling Smørgrav t = src[0] << 16; 557f62e5228SDag-Erling Smørgrav dst[0] = base64[(t >> 18) & 0x3f]; 558f62e5228SDag-Erling Smørgrav dst[1] = base64[(t >> 12) & 0x3f]; 559f62e5228SDag-Erling Smørgrav dst[2] = dst[3] = '='; 560f62e5228SDag-Erling Smørgrav dst += 4; 561f62e5228SDag-Erling Smørgrav r += 4; 562f62e5228SDag-Erling Smørgrav break; 563f62e5228SDag-Erling Smørgrav case 0: 564f62e5228SDag-Erling Smørgrav break; 565f62e5228SDag-Erling Smørgrav } 566f62e5228SDag-Erling Smørgrav 567f62e5228SDag-Erling Smørgrav *dst = 0; 568e19e6098SDag-Erling Smørgrav return (str); 569f62e5228SDag-Erling Smørgrav } 570f62e5228SDag-Erling Smørgrav 571f62e5228SDag-Erling Smørgrav /* 572f62e5228SDag-Erling Smørgrav * Encode username and password 573f62e5228SDag-Erling Smørgrav */ 57435f723dbSDag-Erling Smørgrav static int 575dea29ca1SDag-Erling Smørgrav _http_basic_auth(conn_t *conn, const char *hdr, const char *usr, const char *pwd) 576f62e5228SDag-Erling Smørgrav { 57735f723dbSDag-Erling Smørgrav char *upw, *auth; 57835f723dbSDag-Erling Smørgrav int r; 579f62e5228SDag-Erling Smørgrav 580f67efa37SDag-Erling Smørgrav DEBUG(fprintf(stderr, "usr: [%s]\n", usr)); 581f67efa37SDag-Erling Smørgrav DEBUG(fprintf(stderr, "pwd: [%s]\n", pwd)); 58235f723dbSDag-Erling Smørgrav if (asprintf(&upw, "%s:%s", usr, pwd) == -1) 583e19e6098SDag-Erling Smørgrav return (-1); 58435f723dbSDag-Erling Smørgrav auth = _http_base64(upw); 58535f723dbSDag-Erling Smørgrav free(upw); 58635f723dbSDag-Erling Smørgrav if (auth == NULL) 587e19e6098SDag-Erling Smørgrav return (-1); 588dea29ca1SDag-Erling Smørgrav r = _http_cmd(conn, "%s: Basic %s", hdr, auth); 58935f723dbSDag-Erling Smørgrav free(auth); 590e19e6098SDag-Erling Smørgrav return (r); 5914d029f13SDag-Erling Smørgrav } 59235f723dbSDag-Erling Smørgrav 59335f723dbSDag-Erling Smørgrav /* 59435f723dbSDag-Erling Smørgrav * Send an authorization header 59535f723dbSDag-Erling Smørgrav */ 59635f723dbSDag-Erling Smørgrav static int 597dea29ca1SDag-Erling Smørgrav _http_authorize(conn_t *conn, const char *hdr, const char *p) 59835f723dbSDag-Erling Smørgrav { 59935f723dbSDag-Erling Smørgrav /* basic authorization */ 60035f723dbSDag-Erling Smørgrav if (strncasecmp(p, "basic:", 6) == 0) { 60135f723dbSDag-Erling Smørgrav char *user, *pwd, *str; 60235f723dbSDag-Erling Smørgrav int r; 60335f723dbSDag-Erling Smørgrav 60435f723dbSDag-Erling Smørgrav /* skip realm */ 60535f723dbSDag-Erling Smørgrav for (p += 6; *p && *p != ':'; ++p) 60635f723dbSDag-Erling Smørgrav /* nothing */ ; 60735f723dbSDag-Erling Smørgrav if (!*p || strchr(++p, ':') == NULL) 608e19e6098SDag-Erling Smørgrav return (-1); 60935f723dbSDag-Erling Smørgrav if ((str = strdup(p)) == NULL) 610e19e6098SDag-Erling Smørgrav return (-1); /* XXX */ 61135f723dbSDag-Erling Smørgrav user = str; 61235f723dbSDag-Erling Smørgrav pwd = strchr(str, ':'); 61335f723dbSDag-Erling Smørgrav *pwd++ = '\0'; 614dea29ca1SDag-Erling Smørgrav r = _http_basic_auth(conn, hdr, user, pwd); 61535f723dbSDag-Erling Smørgrav free(str); 616e19e6098SDag-Erling Smørgrav return (r); 6174d029f13SDag-Erling Smørgrav } 618e19e6098SDag-Erling Smørgrav return (-1); 619f62e5228SDag-Erling Smørgrav } 620f62e5228SDag-Erling Smørgrav 621e19e6098SDag-Erling Smørgrav 622e4878e39SDag-Erling Smørgrav /***************************************************************************** 623e4878e39SDag-Erling Smørgrav * Helper functions for connecting to a server or proxy 624f62e5228SDag-Erling Smørgrav */ 625e4878e39SDag-Erling Smørgrav 626e4878e39SDag-Erling Smørgrav /* 627e4878e39SDag-Erling Smørgrav * Connect to the correct HTTP server or proxy. 62860245e42SDag-Erling Smørgrav */ 629dea29ca1SDag-Erling Smørgrav static conn_t * 63038c7e4a6SArchie Cobbs _http_connect(struct url *URL, struct url *purl, const char *flags) 63160245e42SDag-Erling Smørgrav { 632dea29ca1SDag-Erling Smørgrav conn_t *conn; 6331a16ed4cSDag-Erling Smørgrav int verbose; 634dea29ca1SDag-Erling Smørgrav int af; 635e4878e39SDag-Erling Smørgrav 636e4878e39SDag-Erling Smørgrav #ifdef INET6 637e4878e39SDag-Erling Smørgrav af = AF_UNSPEC; 638e4878e39SDag-Erling Smørgrav #else 639e4878e39SDag-Erling Smørgrav af = AF_INET; 640e4878e39SDag-Erling Smørgrav #endif 641e4878e39SDag-Erling Smørgrav 642d74a913bSDag-Erling Smørgrav verbose = CHECK_FLAG('v'); 643d74a913bSDag-Erling Smørgrav if (CHECK_FLAG('4')) 644e4878e39SDag-Erling Smørgrav af = AF_INET; 6451a16ed4cSDag-Erling Smørgrav #ifdef INET6 646d74a913bSDag-Erling Smørgrav else if (CHECK_FLAG('6')) 647e4878e39SDag-Erling Smørgrav af = AF_INET6; 6481a16ed4cSDag-Erling Smørgrav #endif 649e4878e39SDag-Erling Smørgrav 6501a16ed4cSDag-Erling Smørgrav if (purl) { 6511a16ed4cSDag-Erling Smørgrav URL = purl; 6521a16ed4cSDag-Erling Smørgrav } else if (strcasecmp(URL->scheme, SCHEME_FTP) == 0) { 653e4878e39SDag-Erling Smørgrav /* can't talk http to an ftp server */ 654e4878e39SDag-Erling Smørgrav /* XXX should set an error code */ 655dea29ca1SDag-Erling Smørgrav return (NULL); 656e4878e39SDag-Erling Smørgrav } 6571a16ed4cSDag-Erling Smørgrav 658dea29ca1SDag-Erling Smørgrav if ((conn = _fetch_connect(URL->host, URL->port, af, verbose)) == NULL) 659e4878e39SDag-Erling Smørgrav /* _fetch_connect() has already set an error code */ 660dea29ca1SDag-Erling Smørgrav return (NULL); 661dea29ca1SDag-Erling Smørgrav return (conn); 662e4878e39SDag-Erling Smørgrav } 663e4878e39SDag-Erling Smørgrav 6641a16ed4cSDag-Erling Smørgrav static struct url * 66538c7e4a6SArchie Cobbs _http_get_proxy(void) 6661a16ed4cSDag-Erling Smørgrav { 6671a16ed4cSDag-Erling Smørgrav struct url *purl; 6681a16ed4cSDag-Erling Smørgrav char *p; 6691a16ed4cSDag-Erling Smørgrav 6704cee73c8SDag-Erling Smørgrav if (((p = getenv("HTTP_PROXY")) || (p = getenv("http_proxy"))) && 6714cee73c8SDag-Erling Smørgrav (purl = fetchParseURL(p))) { 6721a16ed4cSDag-Erling Smørgrav if (!*purl->scheme) 6731a16ed4cSDag-Erling Smørgrav strcpy(purl->scheme, SCHEME_HTTP); 6741a16ed4cSDag-Erling Smørgrav if (!purl->port) 675e828ada7SDag-Erling Smørgrav purl->port = _fetch_default_proxy_port(purl->scheme); 6761a16ed4cSDag-Erling Smørgrav if (strcasecmp(purl->scheme, SCHEME_HTTP) == 0) 677e19e6098SDag-Erling Smørgrav return (purl); 6781a16ed4cSDag-Erling Smørgrav fetchFreeURL(purl); 6791a16ed4cSDag-Erling Smørgrav } 680e19e6098SDag-Erling Smørgrav return (NULL); 681e4878e39SDag-Erling Smørgrav } 682e4878e39SDag-Erling Smørgrav 683a8e9bd87SDag-Erling Smørgrav static void 684a8e9bd87SDag-Erling Smørgrav _http_print_html(FILE *out, FILE *in) 685a8e9bd87SDag-Erling Smørgrav { 686a8e9bd87SDag-Erling Smørgrav size_t len; 687a8e9bd87SDag-Erling Smørgrav char *line, *p, *q; 688a8e9bd87SDag-Erling Smørgrav int comment, tag; 689a8e9bd87SDag-Erling Smørgrav 690a8e9bd87SDag-Erling Smørgrav comment = tag = 0; 691a8e9bd87SDag-Erling Smørgrav while ((line = fgetln(in, &len)) != NULL) { 692a8e9bd87SDag-Erling Smørgrav while (len && isspace(line[len - 1])) 693a8e9bd87SDag-Erling Smørgrav --len; 694a8e9bd87SDag-Erling Smørgrav for (p = q = line; q < line + len; ++q) { 695a8e9bd87SDag-Erling Smørgrav if (comment && *q == '-') { 696e19e6098SDag-Erling Smørgrav if (q + 2 < line + len && 697e19e6098SDag-Erling Smørgrav strcmp(q, "-->") == 0) { 698a8e9bd87SDag-Erling Smørgrav tag = comment = 0; 699a8e9bd87SDag-Erling Smørgrav q += 2; 700a8e9bd87SDag-Erling Smørgrav } 701e19e6098SDag-Erling Smørgrav } else if (tag && !comment && *q == '>') { 702a8e9bd87SDag-Erling Smørgrav p = q + 1; 703a8e9bd87SDag-Erling Smørgrav tag = 0; 704a8e9bd87SDag-Erling Smørgrav } else if (!tag && *q == '<') { 705a8e9bd87SDag-Erling Smørgrav if (q > p) 706a8e9bd87SDag-Erling Smørgrav fwrite(p, q - p, 1, out); 707a8e9bd87SDag-Erling Smørgrav tag = 1; 708e19e6098SDag-Erling Smørgrav if (q + 3 < line + len && 709e19e6098SDag-Erling Smørgrav strcmp(q, "<!--") == 0) { 710a8e9bd87SDag-Erling Smørgrav comment = 1; 711a8e9bd87SDag-Erling Smørgrav q += 3; 712a8e9bd87SDag-Erling Smørgrav } 713a8e9bd87SDag-Erling Smørgrav } 714a8e9bd87SDag-Erling Smørgrav } 715a8e9bd87SDag-Erling Smørgrav if (!tag && q > p) 716a8e9bd87SDag-Erling Smørgrav fwrite(p, q - p, 1, out); 717a8e9bd87SDag-Erling Smørgrav fputc('\n', out); 718a8e9bd87SDag-Erling Smørgrav } 719a8e9bd87SDag-Erling Smørgrav } 720a8e9bd87SDag-Erling Smørgrav 721e19e6098SDag-Erling Smørgrav 722e4878e39SDag-Erling Smørgrav /***************************************************************************** 723e4878e39SDag-Erling Smørgrav * Core 724e4878e39SDag-Erling Smørgrav */ 725e4878e39SDag-Erling Smørgrav 726e4878e39SDag-Erling Smørgrav /* 727e4878e39SDag-Erling Smørgrav * Send a request and process the reply 728e4878e39SDag-Erling Smørgrav */ 7291a16ed4cSDag-Erling Smørgrav FILE * 73038c7e4a6SArchie Cobbs _http_request(struct url *URL, const char *op, struct url_stat *us, 73138c7e4a6SArchie Cobbs struct url *purl, const char *flags) 732e4878e39SDag-Erling Smørgrav { 733dea29ca1SDag-Erling Smørgrav conn_t *conn; 734e4878e39SDag-Erling Smørgrav struct url *url, *new; 7351a16ed4cSDag-Erling Smørgrav int chunked, direct, need_auth, noredirect, verbose; 736dea29ca1SDag-Erling Smørgrav int i, n; 737be6aff99SDag-Erling Smørgrav off_t offset, clength, length, size; 738c78f1cc9SDag-Erling Smørgrav time_t mtime; 73938c7e4a6SArchie Cobbs const char *p; 740e4878e39SDag-Erling Smørgrav FILE *f; 741f573a5fcSDag-Erling Smørgrav hdr_t h; 74228c645cfSHajimu UMEMOTO char *host; 74328c645cfSHajimu UMEMOTO #ifdef INET6 74428c645cfSHajimu UMEMOTO char hbuf[MAXHOSTNAMELEN + 1]; 74528c645cfSHajimu UMEMOTO #endif 74660245e42SDag-Erling Smørgrav 747d74a913bSDag-Erling Smørgrav direct = CHECK_FLAG('d'); 748d74a913bSDag-Erling Smørgrav noredirect = CHECK_FLAG('A'); 749d74a913bSDag-Erling Smørgrav verbose = CHECK_FLAG('v'); 7504ca1ab94SDag-Erling Smørgrav 7511a16ed4cSDag-Erling Smørgrav if (direct && purl) { 7521a16ed4cSDag-Erling Smørgrav fetchFreeURL(purl); 7531a16ed4cSDag-Erling Smørgrav purl = NULL; 7541a16ed4cSDag-Erling Smørgrav } 7551a16ed4cSDag-Erling Smørgrav 756c78f1cc9SDag-Erling Smørgrav /* try the provided URL first */ 757c78f1cc9SDag-Erling Smørgrav url = URL; 758c78f1cc9SDag-Erling Smørgrav 759c78f1cc9SDag-Erling Smørgrav /* if the A flag is set, we only get one try */ 760e4878e39SDag-Erling Smørgrav n = noredirect ? 1 : MAX_REDIRECT; 761c78f1cc9SDag-Erling Smørgrav i = 0; 762e4878e39SDag-Erling Smørgrav 7636490b215SDag-Erling Smørgrav need_auth = 0; 764c78f1cc9SDag-Erling Smørgrav do { 765f4683775SDag-Erling Smørgrav new = NULL; 766f4683775SDag-Erling Smørgrav chunked = 0; 767f4683775SDag-Erling Smørgrav offset = 0; 768c78f1cc9SDag-Erling Smørgrav clength = -1; 769c78f1cc9SDag-Erling Smørgrav length = -1; 770c78f1cc9SDag-Erling Smørgrav size = -1; 771c78f1cc9SDag-Erling Smørgrav mtime = 0; 7726490b215SDag-Erling Smørgrav 7731a16ed4cSDag-Erling Smørgrav /* check port */ 7741a16ed4cSDag-Erling Smørgrav if (!url->port) 775e828ada7SDag-Erling Smørgrav url->port = _fetch_default_port(url->scheme); 7761a16ed4cSDag-Erling Smørgrav 77765986545SDag-Erling Smørgrav /* were we redirected to an FTP URL? */ 77865986545SDag-Erling Smørgrav if (purl == NULL && strcmp(url->scheme, SCHEME_FTP) == 0) { 77965986545SDag-Erling Smørgrav if (strcmp(op, "GET") == 0) 780e19e6098SDag-Erling Smørgrav return (_ftp_request(url, "RETR", us, purl, flags)); 78165986545SDag-Erling Smørgrav else if (strcmp(op, "HEAD") == 0) 782e19e6098SDag-Erling Smørgrav return (_ftp_request(url, "STAT", us, purl, flags)); 78365986545SDag-Erling Smørgrav } 78465986545SDag-Erling Smørgrav 785e4878e39SDag-Erling Smørgrav /* connect to server or proxy */ 786dea29ca1SDag-Erling Smørgrav if ((conn = _http_connect(url, purl, flags)) == NULL) 787e4878e39SDag-Erling Smørgrav goto ouch; 788e4878e39SDag-Erling Smørgrav 789e4878e39SDag-Erling Smørgrav host = url->host; 79028c645cfSHajimu UMEMOTO #ifdef INET6 791e4878e39SDag-Erling Smørgrav if (strchr(url->host, ':')) { 792e4878e39SDag-Erling Smørgrav snprintf(hbuf, sizeof(hbuf), "[%s]", url->host); 79328c645cfSHajimu UMEMOTO host = hbuf; 79428c645cfSHajimu UMEMOTO } 79528c645cfSHajimu UMEMOTO #endif 79628c645cfSHajimu UMEMOTO 797e4878e39SDag-Erling Smørgrav /* send request */ 7980fba3a00SDag-Erling Smørgrav if (verbose) 799c97925adSHajimu UMEMOTO _fetch_info("requesting %s://%s:%d%s", 800e4878e39SDag-Erling Smørgrav url->scheme, host, url->port, url->doc); 8011a16ed4cSDag-Erling Smørgrav if (purl) { 802dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "%s %s://%s:%d%s HTTP/1.1", 803e4878e39SDag-Erling Smørgrav op, url->scheme, host, url->port, url->doc); 804e4878e39SDag-Erling Smørgrav } else { 805dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "%s %s HTTP/1.1", 806e4878e39SDag-Erling Smørgrav op, url->doc); 80760245e42SDag-Erling Smørgrav } 80860245e42SDag-Erling Smørgrav 8096490b215SDag-Erling Smørgrav /* virtual host */ 8106490b215SDag-Erling Smørgrav if (url->port == _fetch_default_port(url->scheme)) 811dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "Host: %s", host); 8126490b215SDag-Erling Smørgrav else 813dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "Host: %s:%d", host, url->port); 8146490b215SDag-Erling Smørgrav 815e4878e39SDag-Erling Smørgrav /* proxy authorization */ 8161a16ed4cSDag-Erling Smørgrav if (purl) { 8171a16ed4cSDag-Erling Smørgrav if (*purl->user || *purl->pwd) 818dea29ca1SDag-Erling Smørgrav _http_basic_auth(conn, "Proxy-Authorization", 8191a16ed4cSDag-Erling Smørgrav purl->user, purl->pwd); 8201a16ed4cSDag-Erling Smørgrav else if ((p = getenv("HTTP_PROXY_AUTH")) != NULL && *p != '\0') 821dea29ca1SDag-Erling Smørgrav _http_authorize(conn, "Proxy-Authorization", p); 8221a16ed4cSDag-Erling Smørgrav } 823e4878e39SDag-Erling Smørgrav 824e4878e39SDag-Erling Smørgrav /* server authorization */ 8256490b215SDag-Erling Smørgrav if (need_auth || *url->user || *url->pwd) { 826e4878e39SDag-Erling Smørgrav if (*url->user || *url->pwd) 827dea29ca1SDag-Erling Smørgrav _http_basic_auth(conn, "Authorization", url->user, url->pwd); 828c78f1cc9SDag-Erling Smørgrav else if ((p = getenv("HTTP_AUTH")) != NULL && *p != '\0') 829dea29ca1SDag-Erling Smørgrav _http_authorize(conn, "Authorization", p); 8306490b215SDag-Erling Smørgrav else if (fetchAuthMethod && fetchAuthMethod(url) == 0) { 831dea29ca1SDag-Erling Smørgrav _http_basic_auth(conn, "Authorization", url->user, url->pwd); 8326490b215SDag-Erling Smørgrav } else { 833e4878e39SDag-Erling Smørgrav _http_seterr(HTTP_NEED_AUTH); 834e4878e39SDag-Erling Smørgrav goto ouch; 835e4878e39SDag-Erling Smørgrav } 836e4878e39SDag-Erling Smørgrav } 837e4878e39SDag-Erling Smørgrav 838e4878e39SDag-Erling Smørgrav /* other headers */ 8396a0cf64bSDag-Erling Smørgrav if ((p = getenv("HTTP_USER_AGENT")) != NULL && *p != '\0') 840dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "User-Agent: %s", p); 8416a0cf64bSDag-Erling Smørgrav else 842dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "User-Agent: %s " _LIBFETCH_VER, getprogname()); 84387b41116SDag-Erling Smørgrav if (url->offset) 844dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "Range: bytes=%lld-", (long long)url->offset); 845dea29ca1SDag-Erling Smørgrav _http_cmd(conn, "Connection: close"); 846dea29ca1SDag-Erling Smørgrav _http_cmd(conn, ""); 847e4878e39SDag-Erling Smørgrav 848e4878e39SDag-Erling Smørgrav /* get reply */ 849dea29ca1SDag-Erling Smørgrav switch (_http_get_reply(conn)) { 850e4878e39SDag-Erling Smørgrav case HTTP_OK: 851e4878e39SDag-Erling Smørgrav case HTTP_PARTIAL: 852e4878e39SDag-Erling Smørgrav /* fine */ 853e4878e39SDag-Erling Smørgrav break; 854e4878e39SDag-Erling Smørgrav case HTTP_MOVED_PERM: 855e4878e39SDag-Erling Smørgrav case HTTP_MOVED_TEMP: 85665986545SDag-Erling Smørgrav case HTTP_SEE_OTHER: 857e4878e39SDag-Erling Smørgrav /* 858e4878e39SDag-Erling Smørgrav * Not so fine, but we still have to read the headers to 859e4878e39SDag-Erling Smørgrav * get the new location. 860e4878e39SDag-Erling Smørgrav */ 861e4878e39SDag-Erling Smørgrav break; 862e4878e39SDag-Erling Smørgrav case HTTP_NEED_AUTH: 863e4878e39SDag-Erling Smørgrav if (need_auth) { 864e4878e39SDag-Erling Smørgrav /* 865e4878e39SDag-Erling Smørgrav * We already sent out authorization code, so there's 866e4878e39SDag-Erling Smørgrav * nothing more we can do. 867e4878e39SDag-Erling Smørgrav */ 868dea29ca1SDag-Erling Smørgrav _http_seterr(conn->err); 869e4878e39SDag-Erling Smørgrav goto ouch; 870e4878e39SDag-Erling Smørgrav } 871e4878e39SDag-Erling Smørgrav /* try again, but send the password this time */ 872e4878e39SDag-Erling Smørgrav if (verbose) 873e4878e39SDag-Erling Smørgrav _fetch_info("server requires authorization"); 8746490b215SDag-Erling Smørgrav break; 875e4878e39SDag-Erling Smørgrav case HTTP_NEED_PROXY_AUTH: 876e4878e39SDag-Erling Smørgrav /* 877e4878e39SDag-Erling Smørgrav * If we're talking to a proxy, we already sent our proxy 878e4878e39SDag-Erling Smørgrav * authorization code, so there's nothing more we can do. 879e4878e39SDag-Erling Smørgrav */ 880dea29ca1SDag-Erling Smørgrav _http_seterr(conn->err); 881e4878e39SDag-Erling Smørgrav goto ouch; 882e4878e39SDag-Erling Smørgrav case HTTP_PROTOCOL_ERROR: 883e4878e39SDag-Erling Smørgrav /* fall through */ 884e4878e39SDag-Erling Smørgrav case -1: 885e4878e39SDag-Erling Smørgrav _fetch_syserr(); 886e4878e39SDag-Erling Smørgrav goto ouch; 887e4878e39SDag-Erling Smørgrav default: 888dea29ca1SDag-Erling Smørgrav _http_seterr(conn->err); 889a8e9bd87SDag-Erling Smørgrav if (!verbose) 890e4878e39SDag-Erling Smørgrav goto ouch; 891a8e9bd87SDag-Erling Smørgrav /* fall through so we can get the full error message */ 892e4878e39SDag-Erling Smørgrav } 893e4878e39SDag-Erling Smørgrav 894e4878e39SDag-Erling Smørgrav /* get headers */ 895e4878e39SDag-Erling Smørgrav do { 896dea29ca1SDag-Erling Smørgrav switch ((h = _http_next_header(conn, &p))) { 897e4878e39SDag-Erling Smørgrav case hdr_syserror: 898e4878e39SDag-Erling Smørgrav _fetch_syserr(); 899e4878e39SDag-Erling Smørgrav goto ouch; 900e4878e39SDag-Erling Smørgrav case hdr_error: 901e4878e39SDag-Erling Smørgrav _http_seterr(HTTP_PROTOCOL_ERROR); 902e4878e39SDag-Erling Smørgrav goto ouch; 903e4878e39SDag-Erling Smørgrav case hdr_content_length: 904c78f1cc9SDag-Erling Smørgrav _http_parse_length(p, &clength); 905e4878e39SDag-Erling Smørgrav break; 906e4878e39SDag-Erling Smørgrav case hdr_content_range: 907c78f1cc9SDag-Erling Smørgrav _http_parse_range(p, &offset, &length, &size); 908e4878e39SDag-Erling Smørgrav break; 909e4878e39SDag-Erling Smørgrav case hdr_last_modified: 910c78f1cc9SDag-Erling Smørgrav _http_parse_mtime(p, &mtime); 911e4878e39SDag-Erling Smørgrav break; 912e4878e39SDag-Erling Smørgrav case hdr_location: 913dea29ca1SDag-Erling Smørgrav if (!HTTP_REDIRECT(conn->err)) 914e4878e39SDag-Erling Smørgrav break; 915f4683775SDag-Erling Smørgrav if (new) 916f4683775SDag-Erling Smørgrav free(new); 917e4878e39SDag-Erling Smørgrav if (verbose) 918dea29ca1SDag-Erling Smørgrav _fetch_info("%d redirect to %s", conn->err, p); 919f4683775SDag-Erling Smørgrav if (*p == '/') 920f4683775SDag-Erling Smørgrav /* absolute path */ 921f4683775SDag-Erling Smørgrav new = fetchMakeURL(url->scheme, url->host, url->port, p, 922f4683775SDag-Erling Smørgrav url->user, url->pwd); 923f4683775SDag-Erling Smørgrav else 924f4683775SDag-Erling Smørgrav new = fetchParseURL(p); 925f4683775SDag-Erling Smørgrav if (new == NULL) { 926f4683775SDag-Erling Smørgrav /* XXX should set an error code */ 927f4683775SDag-Erling Smørgrav DEBUG(fprintf(stderr, "failed to parse new URL\n")); 928e4878e39SDag-Erling Smørgrav goto ouch; 929f4683775SDag-Erling Smørgrav } 930e4878e39SDag-Erling Smørgrav if (!*new->user && !*new->pwd) { 931e4878e39SDag-Erling Smørgrav strcpy(new->user, url->user); 932e4878e39SDag-Erling Smørgrav strcpy(new->pwd, url->pwd); 933e4878e39SDag-Erling Smørgrav } 934e4878e39SDag-Erling Smørgrav new->offset = url->offset; 935e4878e39SDag-Erling Smørgrav new->length = url->length; 936f4683775SDag-Erling Smørgrav break; 937e4878e39SDag-Erling Smørgrav case hdr_transfer_encoding: 938e4878e39SDag-Erling Smørgrav /* XXX weak test*/ 939e4878e39SDag-Erling Smørgrav chunked = (strcasecmp(p, "chunked") == 0); 940e4878e39SDag-Erling Smørgrav break; 9416490b215SDag-Erling Smørgrav case hdr_www_authenticate: 942dea29ca1SDag-Erling Smørgrav if (conn->err != HTTP_NEED_AUTH) 9436490b215SDag-Erling Smørgrav break; 9446490b215SDag-Erling Smørgrav /* if we were smarter, we'd check the method and realm */ 9456490b215SDag-Erling Smørgrav break; 946e4878e39SDag-Erling Smørgrav case hdr_end: 947e4878e39SDag-Erling Smørgrav /* fall through */ 948e4878e39SDag-Erling Smørgrav case hdr_unknown: 949e4878e39SDag-Erling Smørgrav /* ignore */ 950e4878e39SDag-Erling Smørgrav break; 951e4878e39SDag-Erling Smørgrav } 952e4878e39SDag-Erling Smørgrav } while (h > hdr_end); 953e4878e39SDag-Erling Smørgrav 954a8e9bd87SDag-Erling Smørgrav /* we have a hit or an error */ 955dea29ca1SDag-Erling Smørgrav if (conn->err == HTTP_OK || conn->err == HTTP_PARTIAL || HTTP_ERROR(conn->err)) 956e4878e39SDag-Erling Smørgrav break; 957f4683775SDag-Erling Smørgrav 9586490b215SDag-Erling Smørgrav /* we need to provide authentication */ 959dea29ca1SDag-Erling Smørgrav if (conn->err == HTTP_NEED_AUTH) { 9606490b215SDag-Erling Smørgrav need_auth = 1; 961dea29ca1SDag-Erling Smørgrav _fetch_close(conn); 962dea29ca1SDag-Erling Smørgrav conn = NULL; 9636490b215SDag-Erling Smørgrav continue; 9646490b215SDag-Erling Smørgrav } 9656490b215SDag-Erling Smørgrav 9666490b215SDag-Erling Smørgrav /* all other cases: we got a redirect */ 9676490b215SDag-Erling Smørgrav need_auth = 0; 968dea29ca1SDag-Erling Smørgrav _fetch_close(conn); 969dea29ca1SDag-Erling Smørgrav conn = NULL; 9706490b215SDag-Erling Smørgrav if (!new) { 9716490b215SDag-Erling Smørgrav DEBUG(fprintf(stderr, "redirect with no new location\n")); 9726490b215SDag-Erling Smørgrav break; 9736490b215SDag-Erling Smørgrav } 974f4683775SDag-Erling Smørgrav if (url != URL) 975f4683775SDag-Erling Smørgrav fetchFreeURL(url); 976f4683775SDag-Erling Smørgrav url = new; 977c78f1cc9SDag-Erling Smørgrav } while (++i < n); 978e4878e39SDag-Erling Smørgrav 9796490b215SDag-Erling Smørgrav /* we failed, or ran out of retries */ 980dea29ca1SDag-Erling Smørgrav if (conn == NULL) { 981dea29ca1SDag-Erling Smørgrav _http_seterr(conn->err); 982e4878e39SDag-Erling Smørgrav goto ouch; 983e4878e39SDag-Erling Smørgrav } 984e4878e39SDag-Erling Smørgrav 985f573a5fcSDag-Erling Smørgrav DEBUG(fprintf(stderr, "offset %lld, length %lld," 986f573a5fcSDag-Erling Smørgrav " size %lld, clength %lld\n", 987f573a5fcSDag-Erling Smørgrav (long long)offset, (long long)length, 988f573a5fcSDag-Erling Smørgrav (long long)size, (long long)clength)); 989c78f1cc9SDag-Erling Smørgrav 990c78f1cc9SDag-Erling Smørgrav /* check for inconsistencies */ 991c78f1cc9SDag-Erling Smørgrav if (clength != -1 && length != -1 && clength != length) { 992c78f1cc9SDag-Erling Smørgrav _http_seterr(HTTP_PROTOCOL_ERROR); 993c78f1cc9SDag-Erling Smørgrav goto ouch; 994c78f1cc9SDag-Erling Smørgrav } 995c78f1cc9SDag-Erling Smørgrav if (clength == -1) 996c78f1cc9SDag-Erling Smørgrav clength = length; 997c78f1cc9SDag-Erling Smørgrav if (clength != -1) 998c78f1cc9SDag-Erling Smørgrav length = offset + clength; 999c78f1cc9SDag-Erling Smørgrav if (length != -1 && size != -1 && length != size) { 1000c78f1cc9SDag-Erling Smørgrav _http_seterr(HTTP_PROTOCOL_ERROR); 1001c78f1cc9SDag-Erling Smørgrav goto ouch; 1002c78f1cc9SDag-Erling Smørgrav } 1003c78f1cc9SDag-Erling Smørgrav if (size == -1) 1004c78f1cc9SDag-Erling Smørgrav size = length; 1005c78f1cc9SDag-Erling Smørgrav 1006c78f1cc9SDag-Erling Smørgrav /* fill in stats */ 1007c78f1cc9SDag-Erling Smørgrav if (us) { 1008c78f1cc9SDag-Erling Smørgrav us->size = size; 1009c78f1cc9SDag-Erling Smørgrav us->atime = us->mtime = mtime; 1010c78f1cc9SDag-Erling Smørgrav } 1011c78f1cc9SDag-Erling Smørgrav 101287b41116SDag-Erling Smørgrav /* too far? */ 1013c78f1cc9SDag-Erling Smørgrav if (offset > URL->offset) { 101487b41116SDag-Erling Smørgrav _http_seterr(HTTP_PROTOCOL_ERROR); 101587b41116SDag-Erling Smørgrav goto ouch; 101687b41116SDag-Erling Smørgrav } 101787b41116SDag-Erling Smørgrav 1018c78f1cc9SDag-Erling Smørgrav /* report back real offset and size */ 101987b41116SDag-Erling Smørgrav URL->offset = offset; 1020c78f1cc9SDag-Erling Smørgrav URL->length = clength; 102187b41116SDag-Erling Smørgrav 1022e4878e39SDag-Erling Smørgrav /* wrap it up in a FILE */ 1023dea29ca1SDag-Erling Smørgrav if (chunked) { 1024dea29ca1SDag-Erling Smørgrav f = _http_funopen(conn); 1025dea29ca1SDag-Erling Smørgrav } else { 1026dea29ca1SDag-Erling Smørgrav f = fdopen(dup(conn->sd), "r"); 1027dea29ca1SDag-Erling Smørgrav _fetch_close(conn); 1028dea29ca1SDag-Erling Smørgrav } 1029dea29ca1SDag-Erling Smørgrav if (f == NULL) { 1030e4878e39SDag-Erling Smørgrav _fetch_syserr(); 1031e4878e39SDag-Erling Smørgrav goto ouch; 1032e4878e39SDag-Erling Smørgrav } 1033e4878e39SDag-Erling Smørgrav 1034e4878e39SDag-Erling Smørgrav if (url != URL) 1035e4878e39SDag-Erling Smørgrav fetchFreeURL(url); 10361a16ed4cSDag-Erling Smørgrav if (purl) 10371a16ed4cSDag-Erling Smørgrav fetchFreeURL(purl); 1038e4878e39SDag-Erling Smørgrav 1039dea29ca1SDag-Erling Smørgrav if (HTTP_ERROR(conn->err)) { 1040a8e9bd87SDag-Erling Smørgrav _http_print_html(stderr, f); 1041a8e9bd87SDag-Erling Smørgrav fclose(f); 1042a8e9bd87SDag-Erling Smørgrav f = NULL; 1043a8e9bd87SDag-Erling Smørgrav } 1044a8e9bd87SDag-Erling Smørgrav 1045e19e6098SDag-Erling Smørgrav return (f); 1046e4878e39SDag-Erling Smørgrav 1047e4878e39SDag-Erling Smørgrav ouch: 1048e4878e39SDag-Erling Smørgrav if (url != URL) 1049e4878e39SDag-Erling Smørgrav fetchFreeURL(url); 10501a16ed4cSDag-Erling Smørgrav if (purl) 10511a16ed4cSDag-Erling Smørgrav fetchFreeURL(purl); 1052dea29ca1SDag-Erling Smørgrav if (conn != NULL) 1053dea29ca1SDag-Erling Smørgrav _fetch_close(conn); 1054e19e6098SDag-Erling Smørgrav return (NULL); 1055e4878e39SDag-Erling Smørgrav } 1056e4878e39SDag-Erling Smørgrav 1057e19e6098SDag-Erling Smørgrav 1058e4878e39SDag-Erling Smørgrav /***************************************************************************** 1059e4878e39SDag-Erling Smørgrav * Entry points 1060e4878e39SDag-Erling Smørgrav */ 1061e4878e39SDag-Erling Smørgrav 106260245e42SDag-Erling Smørgrav /* 10631a5faa10SDag-Erling Smørgrav * Retrieve and stat a file by HTTP 10641a5faa10SDag-Erling Smørgrav */ 10651a5faa10SDag-Erling Smørgrav FILE * 106638c7e4a6SArchie Cobbs fetchXGetHTTP(struct url *URL, struct url_stat *us, const char *flags) 10671a5faa10SDag-Erling Smørgrav { 1068e19e6098SDag-Erling Smørgrav return (_http_request(URL, "GET", us, _http_get_proxy(), flags)); 10691a5faa10SDag-Erling Smørgrav } 10701a5faa10SDag-Erling Smørgrav 10711a5faa10SDag-Erling Smørgrav /* 107260245e42SDag-Erling Smørgrav * Retrieve a file by HTTP 107360245e42SDag-Erling Smørgrav */ 107460245e42SDag-Erling Smørgrav FILE * 107538c7e4a6SArchie Cobbs fetchGetHTTP(struct url *URL, const char *flags) 107660245e42SDag-Erling Smørgrav { 1077e19e6098SDag-Erling Smørgrav return (fetchXGetHTTP(URL, NULL, flags)); 10784ca1ab94SDag-Erling Smørgrav } 10794ca1ab94SDag-Erling Smørgrav 10801a5faa10SDag-Erling Smørgrav /* 10811a5faa10SDag-Erling Smørgrav * Store a file by HTTP 10821a5faa10SDag-Erling Smørgrav */ 10834ca1ab94SDag-Erling Smørgrav FILE * 1084f573a5fcSDag-Erling Smørgrav fetchPutHTTP(struct url *URL __unused, const char *flags __unused) 10854ca1ab94SDag-Erling Smørgrav { 10864ca1ab94SDag-Erling Smørgrav warnx("fetchPutHTTP(): not implemented"); 1087e19e6098SDag-Erling Smørgrav return (NULL); 10884ca1ab94SDag-Erling Smørgrav } 1089d8acd8dcSDag-Erling Smørgrav 1090d8acd8dcSDag-Erling Smørgrav /* 1091d8acd8dcSDag-Erling Smørgrav * Get an HTTP document's metadata 1092d8acd8dcSDag-Erling Smørgrav */ 1093d8acd8dcSDag-Erling Smørgrav int 109438c7e4a6SArchie Cobbs fetchStatHTTP(struct url *URL, struct url_stat *us, const char *flags) 1095d8acd8dcSDag-Erling Smørgrav { 109660245e42SDag-Erling Smørgrav FILE *f; 109760245e42SDag-Erling Smørgrav 10981a16ed4cSDag-Erling Smørgrav if ((f = _http_request(URL, "HEAD", us, _http_get_proxy(), flags)) == NULL) 1099e19e6098SDag-Erling Smørgrav return (-1); 1100f8f4130bSDag-Erling Smørgrav fclose(f); 1101e19e6098SDag-Erling Smørgrav return (0); 1102d8acd8dcSDag-Erling Smørgrav } 1103ce71b736SDag-Erling Smørgrav 1104ce71b736SDag-Erling Smørgrav /* 1105ce71b736SDag-Erling Smørgrav * List a directory 1106ce71b736SDag-Erling Smørgrav */ 1107ce71b736SDag-Erling Smørgrav struct url_ent * 1108f573a5fcSDag-Erling Smørgrav fetchListHTTP(struct url *url __unused, const char *flags __unused) 1109ce71b736SDag-Erling Smørgrav { 1110ce71b736SDag-Erling Smørgrav warnx("fetchListHTTP(): not implemented"); 1111e19e6098SDag-Erling Smørgrav return (NULL); 1112ce71b736SDag-Erling Smørgrav } 1113