curl/lib/file.c

272 lines
7.2 KiB
C
Raw Normal View History

2002-09-03 13:52:59 +02:00
/***************************************************************************
 *                                  _   _ ____  _
 *  Project                     ___| | | |  _ \| |
 *                             / __| | | | |_) | |
 *                            | (__| |_| |  _ <| |___
 *                             \___|\___/|_| \_\_____|
 *
 * Copyright (C) 1998 - 2003, Daniel Stenberg, <daniel@haxx.se>, et al.
 *
 * This software is licensed as described in the file COPYING, which
 * you should have received as part of this distribution. The terms
 * are also available at http://curl.haxx.se/docs/copyright.html.
 *
 * You may opt to use, copy, modify, merge, publish, distribute and/or sell
 * copies of the Software, and permit persons to whom the Software is
 * furnished to do so, under the terms of the COPYING file.
 *
 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
 * KIND, either express or implied.
 *
 * $Id$
 ***************************************************************************/
1999-12-29 15:20:26 +01:00
#include "setup.h"
#ifndef CURL_DISABLE_FILE
1999-12-29 15:20:26 +01:00
/* -- WIN32 approved -- */
#include <stdio.h>
#include <string.h>
#include <stdarg.h>
#include <stdlib.h>
#include <ctype.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <errno.h>
#if defined(WIN32) && !defined(__GNUC__) || defined(__MINGW32__)
#include <time.h>
#include <io.h>
#include <fcntl.h>
#else
#ifdef HAVE_SYS_SOCKET_H
#include <sys/socket.h>
#endif
2000-08-23 09:23:42 +02:00
#ifdef HAVE_NETINET_IN_H
1999-12-29 15:20:26 +01:00
#include <netinet/in.h>
2000-08-23 09:23:42 +02:00
#endif
1999-12-29 15:20:26 +01:00
#include <sys/time.h>
#ifdef HAVE_UNISTD_H
#include <unistd.h>
#endif
2000-08-23 09:23:42 +02:00
#ifdef HAVE_NETDB_H
1999-12-29 15:20:26 +01:00
#include <netdb.h>
2000-08-23 09:23:42 +02:00
#endif
1999-12-29 15:20:26 +01:00
#ifdef HAVE_ARPA_INET_H
#include <arpa/inet.h>
#endif
#ifdef HAVE_NET_IF_H
#include <net/if.h>
#endif
#include <sys/ioctl.h>
#include <signal.h>
#ifdef HAVE_SYS_PARAM_H
#include <sys/param.h>
#endif
#ifdef HAVE_SYS_STAT_H
#include <sys/stat.h>
#endif
#ifdef HAVE_FCNTL_H
#include <fcntl.h>
#endif
#endif
#include "urldata.h"
#include <curl/curl.h>
#include "progress.h"
#include "sendf.h"
#include "escape.h"
#define _MPRINTF_REPLACE /* use our functions only */
#include <curl/mprintf.h>
2000-11-27 13:04:51 +01:00
/* The last #include file should be: */
2003-06-26 13:16:37 +02:00
#ifdef CURLDEBUG
2000-11-27 13:04:51 +01:00
#include "memdebug.h"
#endif
1999-12-29 15:20:26 +01:00
/* Emulate a connect-then-transfer protocol. We connect to the file here */
CURLcode Curl_file_connect(struct connectdata *conn)
1999-12-29 15:20:26 +01:00
{
char *real_path = curl_unescape(conn->path, 0);
struct FILE *file;
1999-12-29 15:20:26 +01:00
int fd;
2001-03-14 09:28:19 +01:00
#if defined(WIN32) || defined(__EMX__)
int i;
char *actual_path;
2001-03-14 09:28:19 +01:00
#endif
file = (struct FILE *)malloc(sizeof(struct FILE));
if(!file)
return CURLE_OUT_OF_MEMORY;
memset(file, 0, sizeof(struct FILE));
conn->proto.file = file;
1999-12-29 15:20:26 +01:00
2000-03-19 20:54:13 +01:00
#if defined(WIN32) || defined(__EMX__)
/* If the first character is a slash, and there's
something that looks like a drive at the beginning of
the path, skip the slash. If we remove the initial
slash in all cases, paths without drive letters end up
relative to the current directory which isn't how
browsers work.
Some browsers accept | instead of : as the drive letter
separator, so we do too.
On other platforms, we need the slash to indicate an
absolute pathname. On Windows, absolute paths start
with a drive letter.
*/
actual_path = real_path;
2003-08-08 19:56:47 +02:00
if ((actual_path[0] == '/') &&
actual_path[1] &&
(actual_path[2] == ':' || actual_path[2] == '|'))
{
actual_path[2] = ':';
actual_path++;
}
2000-03-19 20:54:13 +01:00
/* change path separators from '/' to '\\' for Windows and OS/2 */
1999-12-29 15:20:26 +01:00
for (i=0; actual_path[i] != '\0'; ++i)
if (actual_path[i] == '/')
actual_path[i] = '\\';
fd = open(actual_path, O_RDONLY | O_BINARY); /* no CR/LF translation! */
#else
fd = open(real_path, O_RDONLY);
1999-12-29 15:20:26 +01:00
#endif
free(real_path);
1999-12-29 15:20:26 +01:00
if(fd == -1) {
failf(conn->data, "Couldn't open file %s", conn->path);
2000-05-22 16:12:12 +02:00
return CURLE_FILE_COULDNT_READ_FILE;
1999-12-29 15:20:26 +01:00
}
file->fd = fd;
return CURLE_OK;
}
/* This is the do-phase, separated from the connect-phase above */
CURLcode Curl_file(struct connectdata *conn)
{
/* This implementation ignores the host name in conformance with
RFC 1738. Only local files (reachable via the standard file system)
are supported. This means that files on remotely mounted directories
(via NFS, Samba, NT sharing) can be accessed through a file:// URL
*/
CURLcode res = CURLE_OK;
struct stat statbuf;
unsigned long expected_size=0;
bool fstated=FALSE;
ssize_t nread;
struct SessionHandle *data = conn->data;
char *buf = data->state.buffer;
int bytecount = 0;
struct timeval start = Curl_tvnow();
struct timeval now = start;
int fd;
/* get the fd from the connection phase */
fd = conn->proto.file->fd;
/*VMS?? -- This only works reliable for STREAMLF files */
1999-12-29 15:20:26 +01:00
if( -1 != fstat(fd, &statbuf)) {
/* we could stat it, then read out the size */
expected_size = statbuf.st_size;
fstated = TRUE;
}
/* If we have selected NOBODY and HEADER, it means that we only want file
information. Which for FILE can't be much more than the file size and
date. */
if(data->set.no_body && data->set.include_header && fstated) {
CURLcode result;
sprintf(buf, "Content-Length: %lu\r\n", expected_size);
result = Curl_client_write(data, CLIENTWRITE_BOTH, buf, 0);
if(result)
return result;
sprintf(buf, "Accept-ranges: bytes\r\n");
result = Curl_client_write(data, CLIENTWRITE_BOTH, buf, 0);
if(result)
return result;
#ifdef HAVE_STRFTIME
if(fstated) {
struct tm *tm;
#ifdef HAVE_GMTIME_R
struct tm buffer;
tm = (struct tm *)gmtime_r((time_t *)&statbuf.st_mtime, &buffer);
#else
tm = gmtime((time_t *)&statbuf.st_mtime);
#endif
/* format: "Tue, 15 Nov 1994 12:45:26 GMT" */
strftime(buf, BUFSIZE-1, "Last-Modified: %a, %d %b %Y %H:%M:%S GMT\r\n",
tm);
result = Curl_client_write(data, CLIENTWRITE_BOTH, buf, 0);
}
#endif
return result;
1999-12-29 15:20:26 +01:00
}
/* Added by Dolbneff A.V & Spiridonoff A.V */
if (conn->resume_from <= (long)expected_size)
expected_size -= conn->resume_from;
else
/* Is this error code suitable in such situation? */
return CURLE_FTP_BAD_DOWNLOAD_RESUME;
if (fstated && (expected_size == 0))
return CURLE_OK;
1999-12-29 15:20:26 +01:00
/* The following is a shortcut implementation of file reading
this is both more efficient than the former call to download() and
it avoids problems with select() and recv() on file descriptors
in Winsock */
if(fstated)
Curl_pgrsSetDownloadSize(data, (double)expected_size);
if(conn->resume_from)
/* Added by Dolbneff A.V & Spiridonoff A.V */
lseek(fd, conn->resume_from, SEEK_SET);
2000-05-22 16:12:12 +02:00
while (res == CURLE_OK) {
1999-12-29 15:20:26 +01:00
nread = read(fd, buf, BUFSIZE-1);
if ( nread > 0)
1999-12-29 15:20:26 +01:00
buf[nread] = 0;
if (nread <= 0)
break;
1999-12-29 15:20:26 +01:00
bytecount += nread;
/* NOTE: The following call to fwrite does CR/LF translation on
Windows systems if the target is stdout. Use -O or -o parameters
to prevent CR/LF translation (this then goes to a binary mode
file descriptor). */
2000-11-22 13:51:18 +01:00
res = Curl_client_write(data, CLIENTWRITE_BODY, buf, nread);
2000-11-22 13:51:18 +01:00
if(res)
return res;
now = Curl_tvnow();
if(Curl_pgrsUpdate(conn))
2000-05-22 16:12:12 +02:00
res = CURLE_ABORTED_BY_CALLBACK;
1999-12-29 15:20:26 +01:00
}
now = Curl_tvnow();
if(Curl_pgrsUpdate(conn))
2000-05-22 16:12:12 +02:00
res = CURLE_ABORTED_BY_CALLBACK;
1999-12-29 15:20:26 +01:00
close(fd);
2000-05-22 16:12:12 +02:00
return res;
1999-12-29 15:20:26 +01:00
}
#endif