create a compressed tar file with a file index

pull/2/head
Dave Vasilevsky 15 years ago
parent 62443a29fe
commit ba095bb055

@ -4,7 +4,7 @@ CFLAGS = -I/Library/Fink/sl64/include -g -O0 -std=c99 -Wall
CC = gcc $(CFLAGS) -c -o
LD = gcc $(LDFLAGS) -o
all: pixz pixzlist pixztar
all: pixz pixzlist pixztar write
%.o: %.c pixz.h

@ -6,6 +6,7 @@
#include <sys/errno.h>
#define CHUNKSIZE 4096
#define INDEXFILE "index.xz"
typedef struct {
FILE *file;

@ -2,11 +2,14 @@
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <archive.h>
#include <archive_entry.h>
#include <lzma.h>
#include <libkern/OSByteOrder.h>
#pragma mark DEFINES
@ -16,23 +19,54 @@
#define CHECK LZMA_CHECK_CRC32
#pragma mark TYPES
struct file_index_t {
char *name;
off_t offset;
struct file_index_t *next;
};
typedef struct file_index_t file_index_t;
#pragma mark GLOBALS
FILE *gInFile = NULL, *gOutFile = NULL;
off_t gTotalRead = 0;
uint8_t gBlockBuf[BLOCKSIZE];
size_t gBlockSize = 0;
lzma_filter gFilters[LZMA_FILTERS_MAX + 1];
lzma_stream gStream = LZMA_STREAM_INIT;
lzma_index *gIndex = NULL;
file_index_t *gFileIndex = NULL;
file_index_t *gLastFile = NULL;
off_t gMultiHeaderStart = 0;
bool gMultiHeader = false;
uint8_t gFileIndexBuf[CHUNKSIZE];
size_t gFileIndexBufPos = 0;
#pragma mark FUNCTION DECLARATIONS
void die(const char *fmt, ...);
void stream_edge(lzma_vli backward_size);
void write_block(void);
void write_block_header(lzma_block *block);
void encode_index(void);
bool is_multi_header(const char *name);
void add_file(off_t offset, const char *name);
void dump_file_index(void);
void free_file_index(void);
void write_file_index(void);
void write_file_index_bytes(size_t size, uint8_t *buf);
void write_file_index_buf(lzma_action action);
archive_read_callback tar_read;
archive_open_callback tar_ok;
archive_close_callback tar_ok;
@ -78,13 +112,18 @@ int main(int argc, char **argv) {
die("Error reading archive entry");
}
printf("%s\n", archive_entry_pathname(entry));
add_file(archive_read_header_position(ar),
archive_entry_pathname(entry));
}
archive_read_finish(ar);
fclose(gInFile);
// xz cleanup (index, footer)
write_block(); // write last block, if necessary
add_file(gTotalRead, NULL);
write_file_index();
// xz cleanup (index, footer)
encode_index();
stream_edge(lzma_index_size(gIndex));
lzma_index_end(gIndex, NULL);
@ -113,6 +152,7 @@ ssize_t tar_read(struct archive *ar, void *ref, const void **bufp) {
if (rd == 0 && feof(gInFile))
die("Error reading input file");
gBlockSize += rd;
gTotalRead += rd;
*bufp = buf;
return rd;
}
@ -137,29 +177,34 @@ void stream_edge(lzma_vli backward_size) {
die("Error writing stream edge");
}
void write_block(void) {
if (gBlockSize == 0)
return;
void write_block_header(lzma_block *block) {
block->version = 0;
block->check = CHECK;
block->filters = gFilters;
block->compressed_size = block->uncompressed_size = LZMA_VLI_UNKNOWN;
lzma_block block = { .version = 0, .check = CHECK, .filters = gFilters };
block.compressed_size = block.uncompressed_size = LZMA_VLI_UNKNOWN;
uint8_t obuf[CHUNKSIZE];
// header
if (lzma_block_header_size(&block) != LZMA_OK)
if (lzma_block_header_size(block) != LZMA_OK)
die("Error getting block header size");
if (block.header_size > CHUNKSIZE)
die("Block header too big"); // can this really happen!?
if (lzma_block_header_encode(&block, obuf) != LZMA_OK)
uint8_t buf[block->header_size];
if (lzma_block_header_encode(block, buf) != LZMA_OK)
die("Error encoding block header");
if (fwrite(obuf, block.header_size, 1, gOutFile) != 1)
if (fwrite(buf, block->header_size, 1, gOutFile) != 1)
die("Error writing block header");
}
void write_block(void) {
if (gBlockSize == 0)
return;
lzma_block block;
write_block_header(&block);
// encode
if (lzma_block_encoder(&gStream, &block) != LZMA_OK)
die("Error creating block encoder");
gStream.next_in = gBlockBuf;
gStream.avail_in = gBlockSize;
uint8_t obuf[CHUNKSIZE];
lzma_ret err = LZMA_OK;
while (err != LZMA_STREAM_END) {
gStream.next_out = obuf;
@ -169,11 +214,12 @@ void write_block(void) {
if (err != LZMA_OK && err != LZMA_STREAM_END)
die("Error encoding block");
if (fwrite(obuf, CHUNKSIZE - gStream.avail_out, 1, gOutFile) != 1)
die("Error writing block data");
if (gStream.avail_out != CHUNKSIZE) {
if (fwrite(obuf, CHUNKSIZE - gStream.avail_out, 1, gOutFile) != 1)
die("Error writing block data");
}
}
// index
if (lzma_index_append(gIndex, NULL, lzma_block_unpadded_size(&block),
block.uncompressed_size) != LZMA_OK)
die("Error adding to index");
@ -192,7 +238,116 @@ void encode_index(void) {
err = lzma_code(&gStream, LZMA_RUN);
if (err != LZMA_OK && err != LZMA_STREAM_END)
die("Error encoding index");
if (fwrite(obuf, CHUNKSIZE - gStream.avail_out, 1, gOutFile) != 1)
die("Error writing index data");
if (gStream.avail_out != CHUNKSIZE) {
if (fwrite(obuf, CHUNKSIZE - gStream.avail_out, 1, gOutFile) != 1)
die("Error writing index data");
}
}
}
void add_file(off_t offset, const char *name) {
if (name && is_multi_header(name)) {
if (!gMultiHeader)
gMultiHeaderStart = offset;
gMultiHeader = true;
return;
}
file_index_t *f = malloc(sizeof(file_index_t));
f->offset = gMultiHeader ? gMultiHeaderStart : offset;
gMultiHeader = false;
f->name = name ? strdup(name) : NULL;
f->next = NULL;
if (gLastFile) {
gLastFile->next = f;
} else { // new index
gFileIndex = f;
}
gLastFile = f;
}
void dump_file_index(void) {
for (file_index_t *f = gFileIndex; f != NULL; f = f->next) {
printf("%s\n", f->name ? f->name : "");
}
}
void free_file_index(void) {
for (file_index_t *f = gFileIndex; f != NULL; ) {
file_index_t *next = f->next;
free(f->name);
free(f);
f = next;
}
gFileIndex = gLastFile = NULL;
}
bool is_multi_header(const char *name) {
size_t i = strlen(name);
while (i != 0 && name[i - 1] != '/')
--i;
return strncmp(name + i, "._", 2) == 0;
}
void write_file_index(void) {
lzma_block block;
write_block_header(&block);
if (lzma_block_encoder(&gStream, &block) != LZMA_OK)
die("Error creating file index encoder");
uint8_t offbuf[sizeof(uint64_t)];
for (file_index_t *f = gFileIndex; f != NULL; f = f->next) {
char *name = f->name ? f->name : "";
printf("%s\n", name);
size_t len = strlen(name);
write_file_index_bytes(len + 1, (uint8_t*)name);
OSWriteLittleInt64(offbuf, 0, f->offset);
write_file_index_bytes(sizeof(offbuf), offbuf);
}
write_file_index_buf(LZMA_FINISH);
if (lzma_index_append(gIndex, NULL, lzma_block_unpadded_size(&block),
block.uncompressed_size) != LZMA_OK)
die("Error adding file-index to index");
}
void write_file_index_bytes(size_t size, uint8_t *buf) {
size_t bufpos = 0;
while (bufpos < size) {
size_t len = size - bufpos;
size_t space = CHUNKSIZE - gFileIndexBufPos;
if (len > space)
len = space;
memcpy(gFileIndexBuf + gFileIndexBufPos, buf + bufpos, len);
gFileIndexBufPos += len;
bufpos += len;
if (gFileIndexBufPos == CHUNKSIZE) {
write_file_index_buf(LZMA_RUN);
gFileIndexBufPos = 0;
}
}
}
void write_file_index_buf(lzma_action action) {
printf("%ld\n", gFileIndexBufPos);
uint8_t obuf[CHUNKSIZE];
gStream.avail_in = gFileIndexBufPos;
gStream.next_in = gFileIndexBuf;
lzma_ret err = LZMA_OK;
while (err != LZMA_STREAM_END && (action == LZMA_FINISH || gStream.avail_in)) {
gStream.avail_out = CHUNKSIZE;
gStream.next_out = obuf;
err = lzma_code(&gStream, action);
if (err != LZMA_OK && err != LZMA_STREAM_END)
die("Error encoding file index");
if (gStream.avail_out != CHUNKSIZE) {
if (fwrite(obuf, CHUNKSIZE - gStream.avail_out, 1, gOutFile) != 1)
die("Error writing file index");
}
}
gFileIndexBufPos = 0;
}

Loading…
Cancel
Save