Never send a monster to do the work of an evil scientist...

This commit is contained in:
Aaron Giles 2009-07-16 07:10:16 +00:00
parent 7254c65d28
commit d879a67a4a
2 changed files with 442 additions and 0 deletions

1
.gitattributes vendored
View File

@ -3673,6 +3673,7 @@ src/tools/ldverify.c svneol=native#text/plain
src/tools/regrep.c svneol=native#text/plain
src/tools/romcmp.c svneol=native#text/plain
src/tools/runtest.cmd svneol=CRLF#text/plain eol=crlf
src/tools/split.c svneol=native#text/plain
src/tools/src2html.c svneol=native#text/plain
src/tools/srcclean.c svneol=native#text/plain
src/tools/tools.mak svneol=native#text/plain

441
src/tools/split.c Normal file
View File

@ -0,0 +1,441 @@
/***************************************************************************
split.c
Simple file splitter/joiner with hashes.
Copyright Aaron Giles. Released under the MAME license.
Visit http://mamedev.org for licensing and usage restrictions.
***************************************************************************/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include "astring.h"
#include "corefile.h"
#include "sha1.h"
#define DEFAULT_SPLIT_SIZE 100
#define MAX_PARTS 1000
/***************************************************************************
CORE IMPLEMENTATION
***************************************************************************/
/*-------------------------------------------------
compute_hash_as_string - compute an SHA1
hash over a buffer and return a string
-------------------------------------------------*/
static void compute_hash_as_string(astring *buffer, void *data, UINT32 length)
{
char expanded[SHA1_DIGEST_SIZE * 2];
UINT8 sha1digest[SHA1_DIGEST_SIZE];
struct sha1_ctx sha1;
int ch;
// compute the SHA1
sha1_init(&sha1);
sha1_update(&sha1, length, data);
sha1_final(&sha1);
sha1_digest(&sha1, sizeof(sha1digest), sha1digest);
// expand the digest to a string
for (ch = 0; ch < SHA1_DIGEST_SIZE; ch++)
{
expanded[ch * 2 + 0] = "0123456789ABCDEF"[sha1digest[ch] >> 4];
expanded[ch * 2 + 1] = "0123456789ABCDEF"[sha1digest[ch] & 15];
}
// copy it to the buffer
astring_cpych(buffer, expanded, sizeof(expanded));
}
/*-------------------------------------------------
split_file - split a file into multiple parts
-------------------------------------------------*/
static int split_file(const char *filename, const char *basename, UINT32 splitsize)
{
astring *outfilename = astring_alloc(), *basefilename = astring_alloc(), *splitfilename = astring_alloc();
core_file *outfile = NULL, *infile = NULL, *splitfile = NULL;
astring *computedhash = astring_alloc();
void *splitbuffer = NULL;
int index, partnum;
UINT64 totallength;
UINT32 totalparts;
file_error filerr;
int error = 1;
// convert split size to MB
if (splitsize > 500)
{
fprintf(stderr, "Fatal error: maximum split size is 500MB (even that is way huge!)\n");
goto cleanup;
}
splitsize *= 1024 * 1024;
// open the file for read
filerr = core_fopen(filename, OPEN_FLAG_READ, &infile);
if (filerr != FILERR_NONE)
{
fprintf(stderr, "Fatal error: unable to open file '%s'\n", filename);
goto cleanup;
}
// get the total length
totallength = core_fsize(infile);
if (totallength < splitsize)
{
fprintf(stderr, "Fatal error: file is smaller than the split size\n");
goto cleanup;
}
if ((UINT64)splitsize * MAX_PARTS < totallength)
{
fprintf(stderr, "Fatal error: too many splits (maximum is %d)\n", MAX_PARTS);
goto cleanup;
}
totalparts = totallength / splitsize;
// allocate a buffer for reading
splitbuffer = malloc(splitsize);
if (splitbuffer == NULL)
{
fprintf(stderr, "Fatal error: unable to allocate memory for the split\n");
goto cleanup;
}
// find the base name of the file
astring_cpyc(basefilename, basename);
index = astring_rchr(basefilename, 0, PATH_SEPARATOR[0]);
if (index != -1)
astring_del(basefilename, 0, index + 1);
// compute the split filename
astring_cpyc(splitfilename, basename);
astring_catc(splitfilename, ".split");
// create the split file
filerr = core_fopen(astring_c(splitfilename), OPEN_FLAG_WRITE | OPEN_FLAG_CREATE | OPEN_FLAG_NO_BOM, &splitfile);
if (filerr != FILERR_NONE)
{
fprintf(stderr, "Fatal error: unable to create split file '%s'\n", astring_c(splitfilename));
goto cleanup;
}
// write the basics out
core_fprintf(splitfile, "splitfile=%s\n", astring_c(basefilename));
core_fprintf(splitfile, "splitsize=%d\n", splitsize);
printf("Split file is '%s'\n", astring_c(splitfilename));
printf("Splitting file %s into chunks of %dMB...\n", astring_c(basefilename), splitsize / (1024 * 1024));
// now iterate until done
for (partnum = 0; partnum < 1000; partnum++)
{
UINT32 actual, length;
printf("Reading part %d...", partnum);
// read as much as we can from the file
length = core_fread(infile, splitbuffer, splitsize);
if (length == 0)
break;
// hash what we have
compute_hash_as_string(computedhash, splitbuffer, length);
// write that info to the split file
core_fprintf(splitfile, "hash=%s file=%s.%03d\n", astring_c(computedhash), astring_c(basefilename), partnum);
// compute the full filename for this guy
astring_printf(outfilename, "%s.%03d", basename, partnum);
// create it
filerr = core_fopen(astring_c(outfilename), OPEN_FLAG_WRITE | OPEN_FLAG_CREATE, &outfile);
if (filerr != FILERR_NONE)
{
printf("\n");
fprintf(stderr, "Fatal error: unable to create output file '%s'\n", astring_c(outfilename));
goto cleanup;
}
printf(" writing %s.%03d...", astring_c(basefilename), partnum);
// write the data
actual = core_fwrite(outfile, splitbuffer, length);
if (actual != length)
{
printf("\n");
fprintf(stderr, "Fatal error: Error writing output file (out of space?)\n");
goto cleanup;
}
core_fclose(outfile);
outfile = NULL;
printf(" done\n");
// stop if this is the end
if (length < splitsize)
break;
}
printf("File split successfully\n");
// if we get here, clear the errors
error = 0;
cleanup:
if (splitfile != NULL)
{
core_fclose(splitfile);
if (error != 0)
remove(astring_c(splitfilename));
}
if (infile != NULL)
core_fclose(infile);
if (outfile != NULL)
{
core_fclose(outfile);
if (error != 0)
remove(astring_c(outfilename));
}
if (splitbuffer != NULL)
free(splitbuffer);
astring_free(splitfilename);
astring_free(basefilename);
astring_free(outfilename);
astring_free(computedhash);
return error;
}
/*-------------------------------------------------
join_file - rejoin a file from its split
parts
-------------------------------------------------*/
static int join_file(const char *filename, const char *outname, int write_output)
{
astring *expectedhash = astring_alloc(), *computedhash = astring_alloc();
astring *outfilename = astring_alloc(), *infilename = astring_alloc();
astring *basepath = astring_alloc();
core_file *outfile = NULL, *infile = NULL, *splitfile = NULL;
void *splitbuffer = NULL;
file_error filerr;
UINT32 splitsize;
char buffer[256];
int error = 1;
int index;
// open the file for read
filerr = core_fopen(filename, OPEN_FLAG_READ, &splitfile);
if (filerr != FILERR_NONE)
{
fprintf(stderr, "Fatal error: unable to open file '%s'\n", filename);
goto cleanup;
}
// read the first line and verify this is a split file
if (!core_fgets(buffer, sizeof(buffer), splitfile) || strncmp(buffer, "splitfile=", 10) != 0)
{
fprintf(stderr, "Fatal error: corrupt or incomplete split file at line:\n%s\n", buffer);
goto cleanup;
}
astring_trimspace(astring_cpyc(outfilename, buffer + 10));
// compute the base path
astring_cpyc(basepath, filename);
index = astring_rchr(basepath, 0, PATH_SEPARATOR[0]);
if (index != -1)
astring_del(basepath, index + 1, -1);
else
astring_reset(basepath);
// override the output filename if specified, otherwise prepend the path
if (outname != NULL)
astring_cpyc(outfilename, outname);
else
astring_ins(outfilename, 0, basepath);
// read the split size
if (!core_fgets(buffer, sizeof(buffer), splitfile) || sscanf(buffer, "splitsize=%d", &splitsize) != 1)
{
fprintf(stderr, "Fatal error: corrupt or incomplete split file at line:\n%s\n", buffer);
goto cleanup;
}
// attempt to open the new file
if (write_output)
{
// don't overwrite the original!
filerr = core_fopen(astring_c(outfilename), OPEN_FLAG_READ, &outfile);
if (filerr == FILERR_NONE)
{
core_fclose(outfile);
outfile = NULL;
fprintf(stderr, "Fatal error: output file '%s' already exists\n", astring_c(outfilename));
goto cleanup;
}
// open the output for write
filerr = core_fopen(astring_c(outfilename), OPEN_FLAG_WRITE | OPEN_FLAG_CREATE, &outfile);
if (filerr != FILERR_NONE)
{
fprintf(stderr, "Fatal error: unable to create file '%s'\n", astring_c(outfilename));
goto cleanup;
}
}
printf("%s file '%s'...\n", write_output ? "Joining" : "Verifying", astring_c(outfilename));
// now iterate through each file
while (core_fgets(buffer, sizeof(buffer), splitfile))
{
UINT32 length, actual;
// make sure the hash and filename are in the right place
if (strncmp(buffer, "hash=", 5) != 0 || strncmp(buffer + 5 + SHA1_DIGEST_SIZE * 2, " file=", 6) != 0)
{
fprintf(stderr, "Fatal error: corrupt or incomplete split file at line:\n%s\n", buffer);
goto cleanup;
}
astring_cpych(expectedhash, buffer + 5, SHA1_DIGEST_SIZE * 2);
astring_trimspace(astring_cpyc(infilename, buffer + 5 + SHA1_DIGEST_SIZE * 2 + 6));
printf(" Reading file '%s'...", astring_c(infilename));
// read the file's contents
astring_ins(infilename, 0, basepath);
filerr = core_fload(astring_c(infilename), &splitbuffer, &length);
if (filerr != FILERR_NONE)
{
printf("\n");
fprintf(stderr, "Fatal error: unable to load file '%s'\n", astring_c(infilename));
goto cleanup;
}
// hash the contents
compute_hash_as_string(computedhash, splitbuffer, length);
// compare
if (astring_cmp(computedhash, expectedhash) != 0)
{
printf("\n");
fprintf(stderr, "Fatal error: file '%s' has incorrect hash\n Expected: %s\n Computed: %s\n", astring_c(infilename), astring_c(expectedhash), astring_c(computedhash));
goto cleanup;
}
// append to the file
if (write_output)
{
printf(" writing...");
actual = core_fwrite(outfile, splitbuffer, length);
if (actual != length)
{
printf("\n");
fprintf(stderr, "Fatal error: Error writing output file (out of space?)\n");
goto cleanup;
}
printf(" done\n");
}
else
printf(" verified\n");
// release allocated memory
free(splitbuffer);
splitbuffer = NULL;
}
if (write_output)
printf("File re-created successfully\n");
else
printf("File verified successfully\n");
// if we get here, clear the errors
error = 0;
cleanup:
if (splitfile != NULL)
core_fclose(splitfile);
if (infile != NULL)
core_fclose(infile);
if (outfile != NULL)
{
core_fclose(outfile);
if (error != 0)
remove(astring_c(outfilename));
}
if (splitbuffer != NULL)
free(splitbuffer);
astring_free(outfilename);
astring_free(infilename);
astring_free(basepath);
astring_free(expectedhash);
astring_free(computedhash);
return error;
}
/*-------------------------------------------------
main - primary entry point
-------------------------------------------------*/
int main(int argc, char *argv[])
{
int result;
/* skip if no command */
if (argc < 2)
goto usage;
/* split command */
if (stricmp(argv[1], "-split") == 0)
{
if (argc != 4 && argc != 5)
goto usage;
result = split_file(argv[2], argv[3], (argc < 5) ? DEFAULT_SPLIT_SIZE : atoi(argv[4]));
}
/* join command */
else if (stricmp(argv[1], "-join") == 0)
{
if (argc != 3 && argc != 4)
goto usage;
result = join_file(argv[2], (argc >= 4) ? argv[3] : NULL, TRUE);
}
/* verify command */
else if (stricmp(argv[1], "-verify") == 0)
{
if (argc != 3)
goto usage;
result = join_file(argv[2], NULL, FALSE);
}
else
goto usage;
return 0;
usage:
fprintf(stderr,
"Usage:\n"
" split -split <bigfile> <basename> [<size>] -- split file into parts\n"
" split -join <splitfile> [<outputfile>] -- join file parts into original file\n"
" split -verify <splitfile> -- verify a split file\n"
"\n"
"Where:\n"
" <bigfile> is the large file you wish to split\n"
" <basename> is the base path and name to assign to the split files\n"
" <size> is the optional split size, in MB (100MB is the default)\n"
" <splitfile> is the name of the <basename>.split generated with -split\n"
" <outputfile> is the name of the file to output (defaults to original name)\n"
);
return 0;
}