2002-09-03 13:52:59 +02:00
|
|
|
/***************************************************************************
|
1999-12-29 15:20:26 +01:00
|
|
|
* _ _ ____ _
|
|
|
|
* Project ___| | | | _ \| |
|
|
|
|
* / __| | | | |_) | |
|
|
|
|
* | (__| |_| | _ <| |___
|
|
|
|
* \___|\___/|_| \_\_____|
|
|
|
|
*
|
2004-01-07 10:19:33 +01:00
|
|
|
* Copyright (C) 1998 - 2004, Daniel Stenberg, <daniel@haxx.se>, et al.
|
1999-12-29 15:20:26 +01:00
|
|
|
*
|
2002-09-03 13:52:59 +02:00
|
|
|
* This software is licensed as described in the file COPYING, which
|
|
|
|
* you should have received as part of this distribution. The terms
|
|
|
|
* are also available at http://curl.haxx.se/docs/copyright.html.
|
|
|
|
*
|
2001-01-03 10:29:33 +01:00
|
|
|
* You may opt to use, copy, modify, merge, publish, distribute and/or sell
|
|
|
|
* copies of the Software, and permit persons to whom the Software is
|
2002-09-03 13:52:59 +02:00
|
|
|
* furnished to do so, under the terms of the COPYING file.
|
1999-12-29 15:20:26 +01:00
|
|
|
*
|
2001-01-03 10:29:33 +01:00
|
|
|
* This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
|
|
|
|
* KIND, either express or implied.
|
1999-12-29 15:20:26 +01:00
|
|
|
*
|
2001-01-03 10:29:33 +01:00
|
|
|
* $Id$
|
2002-09-03 13:52:59 +02:00
|
|
|
***************************************************************************/
|
1999-12-29 15:20:26 +01:00
|
|
|
|
2000-08-24 16:26:33 +02:00
|
|
|
#include "setup.h"
|
|
|
|
|
2002-06-11 13:13:01 +02:00
|
|
|
#ifndef CURL_DISABLE_FILE
|
1999-12-29 15:20:26 +01:00
|
|
|
/* -- WIN32 approved -- */
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <stdarg.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <ctype.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
|
|
|
|
#include <errno.h>
|
|
|
|
|
|
|
|
#if defined(WIN32) && !defined(__GNUC__) || defined(__MINGW32__)
|
|
|
|
#include <time.h>
|
|
|
|
#include <io.h>
|
|
|
|
#include <fcntl.h>
|
|
|
|
#else
|
|
|
|
#ifdef HAVE_SYS_SOCKET_H
|
|
|
|
#include <sys/socket.h>
|
|
|
|
#endif
|
2000-08-23 09:23:42 +02:00
|
|
|
#ifdef HAVE_NETINET_IN_H
|
1999-12-29 15:20:26 +01:00
|
|
|
#include <netinet/in.h>
|
2000-08-23 09:23:42 +02:00
|
|
|
#endif
|
1999-12-29 15:20:26 +01:00
|
|
|
#include <sys/time.h>
|
|
|
|
#ifdef HAVE_UNISTD_H
|
|
|
|
#include <unistd.h>
|
|
|
|
#endif
|
2000-08-23 09:23:42 +02:00
|
|
|
#ifdef HAVE_NETDB_H
|
1999-12-29 15:20:26 +01:00
|
|
|
#include <netdb.h>
|
2000-08-23 09:23:42 +02:00
|
|
|
#endif
|
1999-12-29 15:20:26 +01:00
|
|
|
#ifdef HAVE_ARPA_INET_H
|
|
|
|
#include <arpa/inet.h>
|
|
|
|
#endif
|
|
|
|
#ifdef HAVE_NET_IF_H
|
|
|
|
#include <net/if.h>
|
|
|
|
#endif
|
|
|
|
#include <sys/ioctl.h>
|
|
|
|
#include <signal.h>
|
|
|
|
|
|
|
|
#ifdef HAVE_SYS_PARAM_H
|
|
|
|
#include <sys/param.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifdef HAVE_SYS_STAT_H
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#endif
|
|
|
|
#ifdef HAVE_FCNTL_H
|
|
|
|
#include <fcntl.h>
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "urldata.h"
|
|
|
|
#include <curl/curl.h>
|
|
|
|
#include "progress.h"
|
|
|
|
#include "sendf.h"
|
|
|
|
#include "escape.h"
|
2004-01-29 14:56:45 +01:00
|
|
|
#include "file.h"
|
2004-03-04 16:23:57 +01:00
|
|
|
#include "speedcheck.h"
|
2004-03-05 10:40:16 +01:00
|
|
|
#include "getinfo.h"
|
2004-03-05 12:39:19 +01:00
|
|
|
#include "transfer.h" /* for Curl_readwrite_init() */
|
1999-12-29 15:20:26 +01:00
|
|
|
|
|
|
|
#define _MPRINTF_REPLACE /* use our functions only */
|
|
|
|
#include <curl/mprintf.h>
|
|
|
|
|
2000-11-27 13:04:51 +01:00
|
|
|
/* The last #include file should be: */
|
2003-06-26 13:16:37 +02:00
|
|
|
#ifdef CURLDEBUG
|
2000-11-27 13:04:51 +01:00
|
|
|
#include "memdebug.h"
|
|
|
|
#endif
|
1999-12-29 15:20:26 +01:00
|
|
|
|
2001-03-05 14:39:01 +01:00
|
|
|
/* Emulate a connect-then-transfer protocol. We connect to the file here */
|
|
|
|
CURLcode Curl_file_connect(struct connectdata *conn)
|
1999-12-29 15:20:26 +01:00
|
|
|
{
|
2003-08-08 19:12:04 +02:00
|
|
|
char *real_path = curl_unescape(conn->path, 0);
|
2004-03-03 10:25:59 +01:00
|
|
|
struct FILEPROTO *file;
|
1999-12-29 15:20:26 +01:00
|
|
|
int fd;
|
2001-03-14 09:28:19 +01:00
|
|
|
#if defined(WIN32) || defined(__EMX__)
|
|
|
|
int i;
|
2003-08-08 19:12:04 +02:00
|
|
|
char *actual_path;
|
2001-03-14 09:28:19 +01:00
|
|
|
#endif
|
2001-03-05 14:39:01 +01:00
|
|
|
|
2004-03-03 10:25:59 +01:00
|
|
|
file = (struct FILEPROTO *)calloc(sizeof(struct FILEPROTO), 1);
|
2001-03-05 14:39:01 +01:00
|
|
|
if(!file)
|
|
|
|
return CURLE_OUT_OF_MEMORY;
|
|
|
|
|
|
|
|
conn->proto.file = file;
|
1999-12-29 15:20:26 +01:00
|
|
|
|
2000-03-19 20:54:13 +01:00
|
|
|
#if defined(WIN32) || defined(__EMX__)
|
2003-08-08 19:12:04 +02:00
|
|
|
/* If the first character is a slash, and there's
|
|
|
|
something that looks like a drive at the beginning of
|
|
|
|
the path, skip the slash. If we remove the initial
|
|
|
|
slash in all cases, paths without drive letters end up
|
|
|
|
relative to the current directory which isn't how
|
|
|
|
browsers work.
|
|
|
|
|
|
|
|
Some browsers accept | instead of : as the drive letter
|
|
|
|
separator, so we do too.
|
|
|
|
|
|
|
|
On other platforms, we need the slash to indicate an
|
|
|
|
absolute pathname. On Windows, absolute paths start
|
|
|
|
with a drive letter.
|
|
|
|
*/
|
|
|
|
actual_path = real_path;
|
2003-08-08 19:56:47 +02:00
|
|
|
if ((actual_path[0] == '/') &&
|
|
|
|
actual_path[1] &&
|
2003-08-08 19:12:04 +02:00
|
|
|
(actual_path[2] == ':' || actual_path[2] == '|'))
|
|
|
|
{
|
|
|
|
actual_path[2] = ':';
|
|
|
|
actual_path++;
|
|
|
|
}
|
|
|
|
|
2000-03-19 20:54:13 +01:00
|
|
|
/* change path separators from '/' to '\\' for Windows and OS/2 */
|
1999-12-29 15:20:26 +01:00
|
|
|
for (i=0; actual_path[i] != '\0'; ++i)
|
|
|
|
if (actual_path[i] == '/')
|
|
|
|
actual_path[i] = '\\';
|
|
|
|
|
|
|
|
fd = open(actual_path, O_RDONLY | O_BINARY); /* no CR/LF translation! */
|
|
|
|
#else
|
2003-08-08 19:12:04 +02:00
|
|
|
fd = open(real_path, O_RDONLY);
|
1999-12-29 15:20:26 +01:00
|
|
|
#endif
|
2003-08-08 19:12:04 +02:00
|
|
|
free(real_path);
|
1999-12-29 15:20:26 +01:00
|
|
|
|
|
|
|
if(fd == -1) {
|
2001-03-05 14:39:01 +01:00
|
|
|
failf(conn->data, "Couldn't open file %s", conn->path);
|
2000-05-22 16:12:12 +02:00
|
|
|
return CURLE_FILE_COULDNT_READ_FILE;
|
1999-12-29 15:20:26 +01:00
|
|
|
}
|
2001-03-05 14:39:01 +01:00
|
|
|
file->fd = fd;
|
|
|
|
|
|
|
|
return CURLE_OK;
|
|
|
|
}
|
|
|
|
|
2004-01-22 14:11:35 +01:00
|
|
|
#if defined(WIN32) && (SIZEOF_CURL_OFF_T > 4)
|
|
|
|
#define lseek(x,y,z) _lseeki64(x, y, z)
|
|
|
|
#endif
|
|
|
|
|
2001-03-05 14:39:01 +01:00
|
|
|
/* This is the do-phase, separated from the connect-phase above */
|
|
|
|
|
|
|
|
CURLcode Curl_file(struct connectdata *conn)
|
|
|
|
{
|
|
|
|
/* This implementation ignores the host name in conformance with
|
|
|
|
RFC 1738. Only local files (reachable via the standard file system)
|
|
|
|
are supported. This means that files on remotely mounted directories
|
|
|
|
(via NFS, Samba, NT sharing) can be accessed through a file:// URL
|
|
|
|
*/
|
|
|
|
CURLcode res = CURLE_OK;
|
|
|
|
struct stat statbuf;
|
2004-01-22 13:45:50 +01:00
|
|
|
curl_off_t expected_size=0;
|
2003-10-30 10:08:16 +01:00
|
|
|
bool fstated=FALSE;
|
2001-08-14 10:22:27 +02:00
|
|
|
ssize_t nread;
|
2001-08-31 00:48:34 +02:00
|
|
|
struct SessionHandle *data = conn->data;
|
|
|
|
char *buf = data->state.buffer;
|
2004-01-22 13:45:50 +01:00
|
|
|
curl_off_t bytecount = 0;
|
2001-03-05 14:39:01 +01:00
|
|
|
int fd;
|
2004-03-04 16:12:12 +01:00
|
|
|
struct timeval now = Curl_tvnow();
|
2001-03-05 14:39:01 +01:00
|
|
|
|
2004-03-05 10:40:16 +01:00
|
|
|
Curl_readwrite_init(conn);
|
|
|
|
Curl_initinfo(data);
|
|
|
|
Curl_pgrsStartNow(data);
|
|
|
|
|
2001-03-05 14:39:01 +01:00
|
|
|
/* get the fd from the connection phase */
|
|
|
|
fd = conn->proto.file->fd;
|
|
|
|
|
2004-03-05 10:40:16 +01:00
|
|
|
/* VMS: This only works reliable for STREAMLF files */
|
1999-12-29 15:20:26 +01:00
|
|
|
if( -1 != fstat(fd, &statbuf)) {
|
|
|
|
/* we could stat it, then read out the size */
|
2003-10-30 10:08:16 +01:00
|
|
|
expected_size = statbuf.st_size;
|
|
|
|
fstated = TRUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* If we have selected NOBODY and HEADER, it means that we only want file
|
|
|
|
information. Which for FILE can't be much more than the file size and
|
|
|
|
date. */
|
|
|
|
if(data->set.no_body && data->set.include_header && fstated) {
|
|
|
|
CURLcode result;
|
2004-03-02 10:31:18 +01:00
|
|
|
sprintf(buf, "Content-Length: %" FORMAT_OFF_T "\r\n", expected_size);
|
2003-10-30 10:08:16 +01:00
|
|
|
result = Curl_client_write(data, CLIENTWRITE_BOTH, buf, 0);
|
|
|
|
if(result)
|
|
|
|
return result;
|
|
|
|
|
|
|
|
sprintf(buf, "Accept-ranges: bytes\r\n");
|
|
|
|
result = Curl_client_write(data, CLIENTWRITE_BOTH, buf, 0);
|
|
|
|
if(result)
|
|
|
|
return result;
|
|
|
|
|
|
|
|
#ifdef HAVE_STRFTIME
|
|
|
|
if(fstated) {
|
|
|
|
struct tm *tm;
|
2004-02-13 08:03:03 +01:00
|
|
|
time_t clock = (time_t)statbuf.st_mtime;
|
2003-10-30 10:13:04 +01:00
|
|
|
#ifdef HAVE_GMTIME_R
|
2003-10-30 10:08:16 +01:00
|
|
|
struct tm buffer;
|
2004-02-13 08:03:03 +01:00
|
|
|
tm = (struct tm *)gmtime_r(&clock, &buffer);
|
2003-10-30 10:08:16 +01:00
|
|
|
#else
|
2004-02-13 08:03:03 +01:00
|
|
|
tm = gmtime(&clock);
|
2003-10-30 10:08:16 +01:00
|
|
|
#endif
|
|
|
|
/* format: "Tue, 15 Nov 1994 12:45:26 GMT" */
|
|
|
|
strftime(buf, BUFSIZE-1, "Last-Modified: %a, %d %b %Y %H:%M:%S GMT\r\n",
|
|
|
|
tm);
|
|
|
|
result = Curl_client_write(data, CLIENTWRITE_BOTH, buf, 0);
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
return result;
|
1999-12-29 15:20:26 +01:00
|
|
|
}
|
|
|
|
|
2002-09-23 14:46:23 +02:00
|
|
|
/* Added by Dolbneff A.V & Spiridonoff A.V */
|
2004-01-05 23:29:29 +01:00
|
|
|
if (conn->resume_from <= expected_size)
|
2002-09-23 14:46:23 +02:00
|
|
|
expected_size -= conn->resume_from;
|
|
|
|
else
|
|
|
|
/* Is this error code suitable in such situation? */
|
|
|
|
return CURLE_FTP_BAD_DOWNLOAD_RESUME;
|
|
|
|
|
2003-10-30 10:08:16 +01:00
|
|
|
if (fstated && (expected_size == 0))
|
2002-09-23 14:46:23 +02:00
|
|
|
return CURLE_OK;
|
|
|
|
|
1999-12-29 15:20:26 +01:00
|
|
|
/* The following is a shortcut implementation of file reading
|
|
|
|
this is both more efficient than the former call to download() and
|
|
|
|
it avoids problems with select() and recv() on file descriptors
|
|
|
|
in Winsock */
|
2003-10-30 10:08:16 +01:00
|
|
|
if(fstated)
|
|
|
|
Curl_pgrsSetDownloadSize(data, (double)expected_size);
|
2000-02-14 23:57:42 +01:00
|
|
|
|
2002-09-23 14:46:23 +02:00
|
|
|
if(conn->resume_from)
|
|
|
|
lseek(fd, conn->resume_from, SEEK_SET);
|
|
|
|
|
2004-03-04 16:12:12 +01:00
|
|
|
Curl_pgrsTime(data, TIMER_STARTTRANSFER);
|
|
|
|
|
2000-05-22 16:12:12 +02:00
|
|
|
while (res == CURLE_OK) {
|
1999-12-29 15:20:26 +01:00
|
|
|
nread = read(fd, buf, BUFSIZE-1);
|
|
|
|
|
2001-08-06 14:17:43 +02:00
|
|
|
if ( nread > 0)
|
1999-12-29 15:20:26 +01:00
|
|
|
buf[nread] = 0;
|
|
|
|
|
|
|
|
if (nread <= 0)
|
|
|
|
break;
|
2001-08-14 10:22:27 +02:00
|
|
|
|
1999-12-29 15:20:26 +01:00
|
|
|
bytecount += nread;
|
|
|
|
/* NOTE: The following call to fwrite does CR/LF translation on
|
|
|
|
Windows systems if the target is stdout. Use -O or -o parameters
|
|
|
|
to prevent CR/LF translation (this then goes to a binary mode
|
|
|
|
file descriptor). */
|
2000-11-22 13:51:18 +01:00
|
|
|
|
2001-01-05 11:11:41 +01:00
|
|
|
res = Curl_client_write(data, CLIENTWRITE_BODY, buf, nread);
|
2000-11-22 13:51:18 +01:00
|
|
|
if(res)
|
|
|
|
return res;
|
|
|
|
|
2004-03-04 16:12:12 +01:00
|
|
|
Curl_pgrsSetDownloadCounter(data, (double)bytecount);
|
|
|
|
|
2001-04-18 09:25:11 +02:00
|
|
|
if(Curl_pgrsUpdate(conn))
|
2000-05-22 16:12:12 +02:00
|
|
|
res = CURLE_ABORTED_BY_CALLBACK;
|
2004-03-04 16:12:12 +01:00
|
|
|
else
|
|
|
|
res = Curl_speedcheck (data, now);
|
1999-12-29 15:20:26 +01:00
|
|
|
}
|
2001-04-18 09:25:11 +02:00
|
|
|
if(Curl_pgrsUpdate(conn))
|
2000-05-22 16:12:12 +02:00
|
|
|
res = CURLE_ABORTED_BY_CALLBACK;
|
1999-12-29 15:20:26 +01:00
|
|
|
|
|
|
|
close(fd);
|
|
|
|
|
2000-05-22 16:12:12 +02:00
|
|
|
return res;
|
1999-12-29 15:20:26 +01:00
|
|
|
}
|
2002-06-11 13:13:01 +02:00
|
|
|
#endif
|