// The contents of this file are subject to the Mozilla Public License // Version 1.0 (the "License"); you may not use this file except in // compliance with the License. You may obtain a copy of the License at // http://www.mozilla.org/MPL/ // // Software distributed under the License is distributed on an "AS IS" // basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See the // License for the specific language governing rights and limitations // under the License. // // The Original Code is the Berkeley Open Infrastructure for Network Computing. // // The Initial Developer of the Original Code is the SETI@home project. // Portions created by the SETI@home project are Copyright (C) 2002 // University of California at Berkeley. All Rights Reserved. // // Contributor(s): // #include "windows_cpp.h" #include #ifdef _WIN32 #include "winsock.h" #endif #if HAVE_SYS_STAT_H #include #endif #if HAVE_SYS_SOCKET_H #include #endif #if HAVE_UNISTD_H #include #endif #include "error_numbers.h" #include "filesys.h" #include "log_flags.h" #include "http.h" #define HTTP_BLOCKSIZE 4096 // Breaks a url down into its server and file path components // TODO: deal with alternate protocols (ftp, gopher, etc) or disallow // them and parse accordingly // static void parse_url(char* url, char* host, char* file) { char* p; char buf[256]; if(url==NULL) { fprintf(stderr, "error: parse_url: unexpected NULL pointer url\n"); } if(host==NULL) { fprintf(stderr, "error: parse_url: unexpected NULL pointer host\n"); } if(file==NULL) { fprintf(stderr, "error: parse_url: unexpected NULL pointer file\n"); } if (strncmp(url, "http://", 7) == 0) strcpy(buf, url+7); else strcpy(buf, url); p = strchr(buf, '/'); if (p) { strcpy(file, p+1); *p = 0; } else { strcpy(file, ""); } strcpy(host, buf); } // Note: HTTP 1.1 keeps connection open. // We use 1.0 so we don't have to count bytes. // // Prints an HTTP 1.0 GET request header into buf // static void http_get_request_header( char* buf, char* host, char* file, double offset ) { if(buf==NULL) { fprintf(stderr, "error: http_get_request_header: unexpected NULL pointer buf\n"); } if(host==NULL) { fprintf(stderr, "error: http_get_request_header: unexpected NULL pointer host\n"); } if(file==NULL) { fprintf(stderr, "error: http_get_request_header: unexpected NULL pointer file\n"); } if(offset<0) { fprintf(stderr, "error: http_get_request_header: negative offset\n"); } if (offset) { sprintf(buf, "GET /%s;byte-range %12.0f- HTTP/1.0\015\012" "User-Agent: BOINC client\015\012" "Host: %s:80\015\012" "Accept: */*\015\012" "\015\012", file, offset, host ); } else { sprintf(buf, "GET /%s HTTP/1.0\015\012" "User-Agent: BOINC client\015\012" "Host: %s:80\015\012" "Accept: */*\015\012" "\015\012", file, host ); } } // Prints an HTTP 1.0 HEAD request header into buf // static void http_head_request_header(char* buf, char* host, char* file) { if(buf==NULL) { fprintf(stderr, "error: http_head_request_header: unexpected NULL pointer buf\n"); } if(host==NULL) { fprintf(stderr, "error: http_head_request_header: unexpected NULL pointer host\n"); } if(file==NULL) { fprintf(stderr, "error: http_head_request_header: unexpected NULL pointer file\n"); } sprintf(buf, "HEAD /%s HTTP/1.0\015\012" "User-Agent: BOINC client\015\012" "Host: %s:80\015\012" "Accept: */*\015\012" "\015\012", file, host ); } // Prints an HTTP 1.0 POST request header into buf // static void http_post_request_header( char* buf, char* host, char* file, int size ) { if(buf==NULL) { fprintf(stderr, "error: http_post_request_header: unexpected NULL pointer buf\n"); } if(host==NULL) { fprintf(stderr, "error: http_post_request_header: unexpected NULL pointer host\n"); } if(file==NULL) { fprintf(stderr, "error: http_post_request_header: unexpected NULL pointer file\n"); } if(size<0) { fprintf(stderr, "error: http_post_request_header: negative size\n"); } sprintf(buf, "POST /%s HTTP/1.0\015\012" "Pragma: no-cache\015\012" "Cache-Control: no-cache\015\012" "Host: %s:80\015\012" "Content-Type: application/octet-stream\015\012" "Content-Length: %d\015\012" "\015\012", file, host, size ); } #if 0 // Do we still need this? // void http_put_request_header( char* buf, char* host, char* file, int size, int offset ) { if(buf==NULL) { fprintf(stderr, "error: http_put_request_header: unexpected NULL pointer buf\n"); } if(host==NULL) { fprintf(stderr, "error: http_put_request_header: unexpected NULL pointer host\n"); } if(file==NULL) { fprintf(stderr, "error: http_put_request_header: unexpected NULL pointer file\n"); } if(size<0) { fprintf(stderr, "error: http_put_request_header: negative size\n"); } if(offset<0) { fprintf(stderr, "error: http_put_request_header: negative offset\n"); } if (offset) { sprintf(buf, "PUT /%s;byte-range %d- HTTP/1.0\015\012" "Pragma: no-cache\015\012" "Cache-Control: no-cache\015\012" "Host: %s:80\015\012" "Content-Type: application/octet-stream\015\012" "Content-Length: %d\015\012" "\015\012", file, offset, host, size ); } else { sprintf(buf, "PUT /%s HTTP/1.0\015\012" "Pragma: no-cache\015\012" "Cache-Control: no-cache\015\012" "Host: %s:80\015\012" "Content-Type: application/octet-stream\015\012" "Content-Length: %d\015\012" "\015\012", file, host, size ); } } #endif // Parse an http reply header into the header struct // int read_http_reply_header(int socket, HTTP_REPLY_HEADER& header) { int i, n; char buf[1024], *p; if(socket<0) { fprintf(stderr, "error: read_http_reply_header: negative socket\n"); return ERR_NEG; } memset(buf, 0, sizeof(buf)); header.content_length = 0; header.status = 404; // default to failure for (i=0; i<1024; i++) { n = recv(socket, buf+i, 1, 0); if (strstr(buf, "\r\n\r\n") || strstr(buf, "\n\n")) { if (log_flags.http_debug) printf("reply header:\n%s", buf); p = strchr(buf, ' '); if (p) { header.status = atoi(p+1); } p = strstr(buf, "Content-Length: "); if (p) { header.content_length = atoi(p+strlen("Content-Length: ")); } p = strstr(buf, "Location: "); if (p) { // TODO: Is there a better way to do this? n = 0; p += strlen( "Location: " ); while (p[n] != '\n' && p[n] != '\r') { header.redirect_location[n] = p[n]; n++; } p[n] = '\0'; } return 0; } } return 1; } // Read the contents of the socket into buf // static int read_reply(int socket, char* buf, int len) { int i, n; if(socket<0) { fprintf(stderr, "error: read_reply: negative socket\n"); return ERR_NEG; } if(buf==NULL) { fprintf(stderr, "error: read_reply: unexpected NULL pointer buf\n"); return ERR_NULL; } if(len<0) { fprintf(stderr, "error: read_reply: negative len\n"); return ERR_NEG; } for (i=0; iinsert(ho); if (retval) return retval; http_ops.push_back(ho); return 0; } // Runs through the set of HTTP_OP objects in the set and decides // what operation is appropriate for each. This section needs more // thorough documentation, as it is fairly complex // bool HTTP_OP_SET::poll() { unsigned int i; HTTP_OP* htp; int n; bool action = false; for (i=0; ihttp_op_state) { case HTTP_STATE_CONNECTING: // If the op is in the connecting state, and we notice it is done // connecting, move it to the HTTP_STATE_REQUEST_HEADER state if (htp->is_connected) { htp->http_op_state = HTTP_STATE_REQUEST_HEADER; htp->want_upload = true; action = true; } break; case HTTP_STATE_REQUEST_HEADER: if (htp->io_ready) { action = true; n = send(htp->socket, htp->request_header, strlen(htp->request_header), 0); if (log_flags.http_debug) { printf("wrote HTTP header: %d bytes\n", n); } htp->io_ready = false; switch(htp->http_op_type) { case HTTP_OP_POST: //case HTTP_OP_PUT: htp->http_op_state = HTTP_STATE_REQUEST_BODY; htp->file = fopen(htp->infile, "r"); if (!htp->file) { fprintf(stderr, "HTTP_OP: no input file %s\n", htp->infile); htp->io_done = true; htp->http_op_retval = ERR_FOPEN; htp->http_op_state = HTTP_STATE_DONE; break; } htp->do_file_io = true; break; case HTTP_OP_GET: case HTTP_OP_HEAD: htp->http_op_state = HTTP_STATE_REPLY_HEADER; htp->want_upload = false; htp->want_download = true; break; case HTTP_OP_POST2: htp->http_op_state = HTTP_STATE_REQUEST_BODY1; break; } } break; case HTTP_STATE_REQUEST_BODY1: if (htp->io_ready) { action = true; n = send(htp->socket, htp->req1, strlen(htp->req1), 0); htp->http_op_state = HTTP_STATE_REQUEST_BODY; htp->file = fopen(htp->infile, "r"); if (!htp->file) { fprintf(stderr, "HTTP_OP: no input file %s\n", htp->infile); htp->io_done = true; htp->http_op_retval = ERR_FOPEN; htp->http_op_state = HTTP_STATE_DONE; break; } fseek(htp->file, (long)htp->file_offset, SEEK_SET); htp->io_ready = false; htp->do_file_io = true; } break; case HTTP_STATE_REQUEST_BODY: if (htp->io_done) { action = true; if (log_flags.http_debug) { printf("finished sending request body\n"); } htp->http_op_state = HTTP_STATE_REPLY_HEADER; fclose(htp->file); htp->file = 0; htp->do_file_io = false; htp->want_upload = false; htp->want_download = true; htp->io_ready = false; } case HTTP_STATE_REPLY_HEADER: if (htp->io_ready) { action = true; if (log_flags.http_debug) printf("got reply header\n"); read_http_reply_header(htp->socket, htp->hrh); // TODO: handle all kinds of redirects here if (htp->hrh.status == 301 || htp->hrh.status == 302) { fprintf( stderr, "Redirect to %s\n", htp->hrh.redirect_location ); // Close the old socket htp->close_socket(); switch (htp->http_op_type) { case HTTP_OP_HEAD: htp->init_head( htp->hrh.redirect_location ); break; case HTTP_OP_GET: // *** Not sure if delete_old_file should be true htp->init_get( htp->hrh.redirect_location, htp->outfile, true ); break; case HTTP_OP_POST: htp->init_post( htp->hrh.redirect_location, htp->infile, htp->outfile ); break; case HTTP_OP_POST2: // TODO: Change offset to correct value htp->init_post2( htp->hrh.redirect_location, htp->req1, htp->infile,0 ); break; } // Open connection to the redirected server htp->open_server(); break; } if (htp->hrh.status/100 != 2) { htp->http_op_state = HTTP_STATE_DONE; htp->http_op_retval = htp->hrh.status; break; } switch (htp->http_op_type) { case HTTP_OP_HEAD: htp->http_op_state = HTTP_STATE_DONE; htp->http_op_retval = 0; break; case HTTP_OP_POST: unlink(htp->outfile); case HTTP_OP_GET: htp->http_op_state = HTTP_STATE_REPLY_BODY; // TODO: // Append to a file if it already exists, otherwise // create a new one. init_get should have already // deleted the file if necessary htp->file = fopen(htp->outfile, "w"); if (!htp->file) { fprintf(stderr, "HTTP_OP: can't open output file %s\n", htp->outfile ); htp->io_done = true; htp->http_op_state = HTTP_STATE_DONE; htp->http_op_retval = ERR_FOPEN; break; } htp->do_file_io = true; break; case HTTP_OP_POST2: htp->http_op_state = HTTP_STATE_REPLY_BODY; htp->io_ready = false; break; #if 0 case HTTP_OP_PUT: htp->http_op_state = HTTP_STATE_DONE; htp->http_op_retval = 0; #endif } } break; case HTTP_STATE_REPLY_BODY: if (htp->io_done) { switch(htp->http_op_type) { case HTTP_OP_POST2: read_reply(htp->socket, htp->req1, 256); break; default: action = true; fclose(htp->file); htp->file = 0; break; } if (log_flags.http_debug) printf("got reply body\n"); htp->http_op_state = HTTP_STATE_DONE; htp->http_op_retval = 0; } break; } } return action; } // Remove an HTTP_OP from the set // int HTTP_OP_SET::remove(HTTP_OP* p) { vector::iterator iter; if(p==NULL) { fprintf(stderr, "error: HTTP_OP_SET.remove: unexpected NULL pointer p\n"); return ERR_NULL; } net_xfers->remove(p); iter = http_ops.begin(); while (iter != http_ops.end()) { if (*iter == p) { http_ops.erase(iter); return 0; } iter++; } fprintf(stderr, "HTTP_OP_SET::remove(): not found\n"); return 1; } // Returns the size of the set of HTTP_OP objects // int HTTP_OP_SET::size() { return http_ops.size(); }