| /*- |
| * Copyright (c) 2003-2007 Tim Kientzle |
| * All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * 1. Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * 2. Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in the |
| * documentation and/or other materials provided with the distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR |
| * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES |
| * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. |
| * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT, |
| * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT |
| * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF |
| * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #include "archive_platform.h" |
| __FBSDID("$FreeBSD: head/lib/libarchive/archive_read_open_filename.c 201093 2009-12-28 02:28:44Z kientzle $"); |
| |
| #ifdef HAVE_SYS_STAT_H |
| #include <sys/stat.h> |
| #endif |
| #ifdef HAVE_ERRNO_H |
| #include <errno.h> |
| #endif |
| #ifdef HAVE_FCNTL_H |
| #include <fcntl.h> |
| #endif |
| #ifdef HAVE_IO_H |
| #include <io.h> |
| #endif |
| #ifdef HAVE_STDLIB_H |
| #include <stdlib.h> |
| #endif |
| #ifdef HAVE_STRING_H |
| #include <string.h> |
| #endif |
| #ifdef HAVE_UNISTD_H |
| #include <unistd.h> |
| #endif |
| |
| #include "archive.h" |
| |
/*
 * Not every platform's headers provide O_BINARY.  Where it is missing,
 * define it as 0 so it can be OR-ed into open() flags with no effect.
 */
#if !defined(O_BINARY)
#define O_BINARY 0
#endif
| |
/*
 * Client state carried between the read/skip/close callbacks.
 *
 * The structure is allocated with extra space past its end so that
 * `filename` can hold the complete NUL-terminated name; for that reason
 * `filename` has to remain the final member.
 */
struct read_file_data {
	int	 fd;		/* Descriptor being read (0 for stdin). */
	size_t	 block_size;	/* Size of `buffer` and of each read(). */
	void	*buffer;	/* Buffer that read() fills. */
	mode_t	 st_mode;	/* Mode bits reported by fstat(). */
	char	 can_skip;	/* Nonzero while lseek() skipping is enabled. */
	char	 filename[1];	/* Name ("" for stdin).  Must be last! */
};
| |
/*
 * Callbacks passed to archive_read_open2().  The skip callback's
 * signature depends on the archive API version being built.
 */
static ssize_t	file_read(struct archive *, void *, const void **buff);
#if ARCHIVE_API_VERSION < 2
static ssize_t	file_skip(struct archive *, void *, size_t request);
#else
static off_t	file_skip(struct archive *, void *, off_t request);
#endif
static int	file_close(struct archive *, void *);
| |
/*
 * Alias for archive_read_open_filename(): forwards every argument
 * unchanged and returns that function's result.
 */
int
archive_read_open_file(struct archive *a, const char *filename,
    size_t block_size)
{
	int status;

	status = archive_read_open_filename(a, filename, block_size);
	return (status);
}
| |
| int |
| archive_read_open_filename(struct archive *a, const char *filename, |
| size_t block_size) |
| { |
| struct stat st; |
| struct read_file_data *mine; |
| void *b; |
| int fd; |
| |
| archive_clear_error(a); |
| if (filename == NULL || filename[0] == '\0') { |
| /* We used to invoke archive_read_open_fd(a,0,block_size) |
| * here, but that doesn't (and shouldn't) handle the |
| * end-of-file flush when reading stdout from a pipe. |
| * Basically, read_open_fd() is intended for folks who |
| * are willing to handle such details themselves. This |
| * API is intended to be a little smarter for folks who |
| * want easy handling of the common case. |
| */ |
| filename = ""; /* Normalize NULL to "" */ |
| fd = 0; |
| #if defined(__CYGWIN__) || defined(_WIN32) |
| setmode(0, O_BINARY); |
| #endif |
| } else { |
| fd = open(filename, O_RDONLY | O_BINARY); |
| if (fd < 0) { |
| archive_set_error(a, errno, |
| "Failed to open '%s'", filename); |
| return (ARCHIVE_FATAL); |
| } |
| } |
| if (fstat(fd, &st) != 0) { |
| archive_set_error(a, errno, "Can't stat '%s'", filename); |
| return (ARCHIVE_FATAL); |
| } |
| |
| mine = (struct read_file_data *)calloc(1, |
| sizeof(*mine) + strlen(filename)); |
| b = malloc(block_size); |
| if (mine == NULL || b == NULL) { |
| archive_set_error(a, ENOMEM, "No memory"); |
| free(mine); |
| free(b); |
| return (ARCHIVE_FATAL); |
| } |
| strcpy(mine->filename, filename); |
| mine->block_size = block_size; |
| mine->buffer = b; |
| mine->fd = fd; |
| /* Remember mode so close can decide whether to flush. */ |
| mine->st_mode = st.st_mode; |
| /* If we're reading a file from disk, ensure that we don't |
| overwrite it with an extracted file. */ |
| if (S_ISREG(st.st_mode)) { |
| archive_read_extract_set_skip_file(a, st.st_dev, st.st_ino); |
| /* |
| * Enabling skip here is a performance optimization |
| * for anything that supports lseek(). On FreeBSD |
| * (and probably many other systems), only regular |
| * files and raw disk devices support lseek() (on |
| * other input types, lseek() returns success but |
| * doesn't actually change the file pointer, which |
| * just completely screws up the position-tracking |
| * logic). In addition, I've yet to find a portable |
| * way to determine if a device is a raw disk device. |
| * So I don't see a way to do much better than to only |
| * enable this optimization for regular files. |
| */ |
| mine->can_skip = 1; |
| } |
| return (archive_read_open2(a, mine, |
| NULL, file_read, file_skip, file_close)); |
| } |
| |
| static ssize_t |
| file_read(struct archive *a, void *client_data, const void **buff) |
| { |
| struct read_file_data *mine = (struct read_file_data *)client_data; |
| ssize_t bytes_read; |
| |
| *buff = mine->buffer; |
| bytes_read = read(mine->fd, mine->buffer, mine->block_size); |
| if (bytes_read < 0) { |
| if (mine->filename[0] == '\0') |
| archive_set_error(a, errno, "Error reading stdin"); |
| else |
| archive_set_error(a, errno, "Error reading '%s'", |
| mine->filename); |
| } |
| return (bytes_read); |
| } |
| |
| #if ARCHIVE_API_VERSION < 2 |
| static ssize_t |
| file_skip(struct archive *a, void *client_data, size_t request) |
| #else |
| static off_t |
| file_skip(struct archive *a, void *client_data, off_t request) |
| #endif |
| { |
| struct read_file_data *mine = (struct read_file_data *)client_data; |
| off_t old_offset, new_offset; |
| |
| if (!mine->can_skip) /* We can't skip, so ... */ |
| return (0); /* ... skip zero bytes. */ |
| |
| /* Reduce request to the next smallest multiple of block_size */ |
| request = (request / mine->block_size) * mine->block_size; |
| if (request == 0) |
| return (0); |
| |
| /* |
| * Hurray for lazy evaluation: if the first lseek fails, the second |
| * one will not be executed. |
| */ |
| if (((old_offset = lseek(mine->fd, 0, SEEK_CUR)) < 0) || |
| ((new_offset = lseek(mine->fd, request, SEEK_CUR)) < 0)) |
| { |
| /* If skip failed once, it will probably fail again. */ |
| mine->can_skip = 0; |
| |
| if (errno == ESPIPE) |
| { |
| /* |
| * Failure to lseek() can be caused by the file |
| * descriptor pointing to a pipe, socket or FIFO. |
| * Return 0 here, so the compression layer will use |
| * read()s instead to advance the file descriptor. |
| * It's slower of course, but works as well. |
| */ |
| return (0); |
| } |
| /* |
| * There's been an error other than ESPIPE. This is most |
| * likely caused by a programmer error (too large request) |
| * or a corrupted archive file. |
| */ |
| if (mine->filename[0] == '\0') |
| /* |
| * Should never get here, since lseek() on stdin ought |
| * to return an ESPIPE error. |
| */ |
| archive_set_error(a, errno, "Error seeking in stdin"); |
| else |
| archive_set_error(a, errno, "Error seeking in '%s'", |
| mine->filename); |
| return (-1); |
| } |
| return (new_offset - old_offset); |
| } |
| |
| static int |
| file_close(struct archive *a, void *client_data) |
| { |
| struct read_file_data *mine = (struct read_file_data *)client_data; |
| |
| (void)a; /* UNUSED */ |
| |
| /* Only flush and close if open succeeded. */ |
| if (mine->fd >= 0) { |
| /* |
| * Sometimes, we should flush the input before closing. |
| * Regular files: faster to just close without flush. |
| * Devices: must not flush (user might need to |
| * read the "next" item on a non-rewind device). |
| * Pipes and sockets: must flush (otherwise, the |
| * program feeding the pipe or socket may complain). |
| * Here, I flush everything except for regular files and |
| * device nodes. |
| */ |
| if (!S_ISREG(mine->st_mode) |
| && !S_ISCHR(mine->st_mode) |
| && !S_ISBLK(mine->st_mode)) { |
| ssize_t bytesRead; |
| do { |
| bytesRead = read(mine->fd, mine->buffer, |
| mine->block_size); |
| } while (bytesRead > 0); |
| } |
| /* If a named file was opened, then it needs to be closed. */ |
| if (mine->filename[0] != '\0') |
| close(mine->fd); |
| } |
| free(mine->buffer); |
| free(mine); |
| return (ARCHIVE_OK); |
| } |