mdbtools/src/libmdb/file.c

526 lines
13 KiB
C
Raw Normal View History

2000-02-13 07:51:37 +08:00
/* MDB Tools - A library for reading MS Access database files
* Copyright (C) 2000 Brian Bruns
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Library General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Library General Public License for more details.
*
* You should have received a copy of the GNU Library General Public
2011-08-29 07:53:29 +08:00
* License along with this library; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
2000-02-13 07:51:37 +08:00
*/
#include <inttypes.h>
2020-08-21 09:57:25 +08:00
#include <stddef.h>
#include "mdbtools.h"
2000-02-13 07:51:37 +08:00
/*
typedef struct {
int pg_size;
guint16 row_count_offset;
guint16 tab_num_rows_offset;
guint16 tab_num_cols_offset;
guint16 tab_num_idxs_offset;
guint16 tab_num_ridxs_offset;
guint16 tab_usage_map_offset;
guint16 tab_first_dpg_offset;
guint16 tab_cols_start_offset;
guint16 tab_ridx_entry_size;
guint16 col_flags_offset;
guint16 col_size_offset;
guint16 col_num_offset;
guint16 tab_col_entry_size;
guint16 tab_free_map_offset;
guint16 tab_col_offset_var;
guint16 tab_col_offset_fixed;
guint16 tab_row_col_num_offset;
} MdbFormatConstants;
*/
2003-01-02 06:29:39 +08:00
/* Format constants used for Jet4 and ACCDB files.  Field labels follow the
 * commented-out MdbFormatConstants layout above -- confirm against the real
 * declaration in mdbtools.h. */
MdbFormatConstants MdbJet4Constants = {
    4096,   /* pg_size */
    0x0c,   /* row_count_offset */
    16,     /* tab_num_rows_offset */
    45,     /* tab_num_cols_offset */
    47,     /* tab_num_idxs_offset */
    51,     /* tab_num_ridxs_offset */
    55,     /* tab_usage_map_offset */
    56,     /* tab_first_dpg_offset */
    63,     /* tab_cols_start_offset */
    12,     /* tab_ridx_entry_size */
    15,     /* col_flags_offset */
    23,     /* col_size_offset */
    5,      /* col_num_offset */
    25,     /* tab_col_entry_size */
    59,     /* tab_free_map_offset */
    7,      /* tab_col_offset_var */
    21,     /* tab_col_offset_fixed */
    9       /* tab_row_col_num_offset */
};
/* Format constants used for Jet3 files (also the bootstrap format while
 * page 0 is being read).  Field labels follow the commented-out
 * MdbFormatConstants layout above -- confirm against the real declaration
 * in mdbtools.h. */
MdbFormatConstants MdbJet3Constants = {
    2048,   /* pg_size */
    0x08,   /* row_count_offset */
    12,     /* tab_num_rows_offset */
    25,     /* tab_num_cols_offset */
    27,     /* tab_num_idxs_offset */
    31,     /* tab_num_ridxs_offset */
    35,     /* tab_usage_map_offset */
    36,     /* tab_first_dpg_offset */
    43,     /* tab_cols_start_offset */
    8,      /* tab_ridx_entry_size */
    13,     /* col_flags_offset */
    16,     /* col_size_offset */
    1,      /* col_num_offset */
    18,     /* tab_col_entry_size */
    39,     /* tab_free_map_offset */
    3,      /* tab_col_offset_var */
    14,     /* tab_col_offset_fixed */
    5       /* tab_row_col_num_offset */
};
2010-06-18 10:23:45 +08:00
/* RC4 cipher context: the 256-byte permutation table plus the two stream
 * indices that RC4() loads on entry and stores back on exit. */
typedef struct _RC4_KEY {
    unsigned char state[256];   /* permutation table, set up by RC4_set_key() */
    unsigned char x;            /* first stream index */
    unsigned char y;            /* second stream index */
} RC4_KEY;
/* Exchange the bytes pointed to by x and y.  The caller must have an
 * `unsigned char t` scratch variable in scope.  The do/while(0) wrapper
 * makes the expansion a single statement, so the macro stays correct when
 * used as the unbraced body of an if/else or loop. */
#define swap_byte(x,y) do { t = *(x); *(x) = *(y); *(y) = t; } while (0)
static ssize_t _mdb_read_pg(MdbHandle *mdb, void *pg_buf, unsigned long pg);
2004-06-01 02:21:43 +08:00
2010-06-18 10:23:45 +08:00
/*
 * RC4 key schedule.
 *
 * Resets key->state to the identity permutation and both stream indices to
 * zero, then mixes key_data_len bytes from key_data_ptr into the table
 * (the key bytes are reused cyclically over the 256 mixing rounds).
 *
 * If key_data_len is not positive or key_data_ptr is NULL there is nothing
 * to mix in; the context is left in the reset state instead of performing
 * a modulo by zero.
 */
static void RC4_set_key(RC4_KEY *key, int key_data_len, const unsigned char *key_data_ptr)
{
    unsigned char t;            /* scratch byte required by swap_byte() */
    unsigned char *state = key->state;
    unsigned char index2 = 0;
    int index1 = 0;
    int counter;

    for (counter = 0; counter < 256; counter++)
        state[counter] = (unsigned char)counter;
    key->x = 0;
    key->y = 0;

    /* Guard: "% key_data_len" below is undefined for a zero-length key. */
    if (key_data_len <= 0 || key_data_ptr == NULL)
        return;

    for (counter = 0; counter < 256; counter++) {
        /* The unsigned char conversion performs the "mod 256". */
        index2 = (unsigned char)(key_data_ptr[index1] + state[counter] + index2);
        swap_byte(&state[counter], &state[index2]);
        index1 = (index1 + 1) % key_data_len;
    }
}
/*
 * RC4 stream transform, applied in place to buff[0 .. buffer_len-1].
 *
 * Encryption and decryption are the same operation.  The stream indices
 * are loaded from `key` on entry and written back on exit, and the
 * permutation table in `key` is modified as the stream advances.
 *
 * The loop counter is an int to match buffer_len; a short counter would
 * overflow for buffers longer than SHRT_MAX bytes.
 *
 * implementation supplied by (Adam Back) at <adam at cypherspace dot org>
 */
static void RC4(RC4_KEY *key, int buffer_len, unsigned char * buff)
{
    unsigned char t;            /* scratch byte required by swap_byte() */
    unsigned char x = key->x;
    unsigned char y = key->y;
    unsigned char *state = key->state;
    int counter;

    for (counter = 0; counter < buffer_len; counter++) {
        /* unsigned char conversions perform the "mod 256" */
        x = (unsigned char)(x + 1);
        y = (unsigned char)(state[x] + y);
        swap_byte(&state[x], &state[y]);
        buff[counter] ^= state[(unsigned char)(state[x] + state[y])];
    }

    key->x = x;
    key->y = y;
}
/**
* mdb_find_file:
* @filename: path to MDB (database) file
*
2004-06-22 12:27:42 +08:00
* Finds and returns the absolute path to an MDB file. Function will first try
* to fstat file as passed, then search through the $MDBPATH if not found.
*
* Return value: gchar pointer to absolute path. Caller is responsible for
* freeing.
**/
static char *mdb_find_file(const char *file_name)
{
2004-06-01 02:21:43 +08:00
struct stat status;
gchar *mdbpath, **dir, *tmpfname;
unsigned int i = 0;
/* try the provided file name first */
if (!stat(file_name, &status)) {
char *result;
result = g_strdup(file_name);
if (!result)
fprintf(stderr, "Can't alloc filename\n");
return result;
}
/* Now pull apart $MDBPATH and try those */
2004-06-01 02:21:43 +08:00
mdbpath = (gchar *) getenv("MDBPATH");
/* no path, can't find file */
if (!mdbpath || !strlen(mdbpath)) return NULL;
2004-06-01 02:21:43 +08:00
dir = g_strsplit(mdbpath, ":", 0);
while (dir[i]) {
if (!strlen(dir[i])) continue;
tmpfname = g_strconcat(dir[i++], "/", file_name, NULL);
if (!stat(tmpfname, &status)) {
2004-06-01 02:21:43 +08:00
g_strfreev(dir);
return tmpfname;
}
g_free(tmpfname);
2004-06-01 02:21:43 +08:00
}
g_strfreev(dir);
return NULL;
}
2004-04-14 04:06:04 +08:00
/**
 * mdb_handle_from_stream:
 * @stream: An open file stream
 * @flags: MDB_NOFLAGS for read-only, MDB_WRITABLE for read/write
 *
 * Allocates, initializes, and returns an MDB handle for a file stream
 * pointing to an MDB file.  The stream is stored in the handle; on every
 * failure path the handle is released with mdb_close(), which also closes
 * the stream.
 *
 * Return value: The handle on success, NULL on failure
 */
static MdbHandle *mdb_handle_from_stream(FILE *stream, MdbFileFlags flags) {
    /* per-byte XOR mask applied to the stored database password */
    static const int key[] = {
        0x86, 0xfb, 0xec, 0x37, 0x5d, 0x44, 0x9c,
        0xfa, 0xc6, 0x5e, 0x28, 0xe6, 0x13, 0xb6
    };
    int pos;
    MdbHandle *mdb = (MdbHandle *) g_malloc0(sizeof(MdbHandle));

    mdb_set_default_backend(mdb, "access");
    mdb_set_date_fmt(mdb, "%x %X");
    mdb_set_shortdate_fmt(mdb, "%x");
    mdb_set_bind_size(mdb, MDB_BIND_SIZE);
    mdb_set_boolean_fmt_numbers(mdb);
#ifdef HAVE_ICONV
    mdb->iconv_in = (iconv_t)-1;
    mdb->iconv_out = (iconv_t)-1;
#endif

    /* need something to bootstrap with, reassign after page 0 is read */
    mdb->fmt = &MdbJet3Constants;

    mdb->f = (MdbFile *) g_malloc0(sizeof(MdbFile));
    mdb->f->refs = 1;
    mdb->f->stream = stream;
    if (flags & MDB_WRITABLE)
        mdb->f->writable = TRUE;

    /* page 0 must be readable and must start with a zero byte */
    if (!mdb_read_pg(mdb, 0))
        goto fail;
    if (mdb->pg_buf[0] != 0)
        goto fail;

    /* the byte at 0x14 of page 0 selects the format constants */
    mdb->f->jet_version = mdb_get_byte(mdb->pg_buf, 0x14);
    switch (mdb->f->jet_version) {
    case MDB_VER_JET3:
        mdb->fmt = &MdbJet3Constants;
        break;
    case MDB_VER_JET4:
    case MDB_VER_ACCDB_2007:
    case MDB_VER_ACCDB_2010:
    case MDB_VER_ACCDB_2013:
    case MDB_VER_ACCDB_2016:
        mdb->fmt = &MdbJet4Constants;
        break;
    default:
        fprintf(stderr,"Unknown Jet version: %x\n", mdb->f->jet_version);
        goto fail;
    }

    mdb->f->db_key = mdb_get_int32(mdb->pg_buf, 0x3e);
    /* I don't know if this value is valid for some versions?
     * it doesn't seem to be valid for the databases I have
     *
     * f->db_key ^= 0xe15e01b9;
     */
    mdb->f->db_key ^= 0x4ebc8afb;

    /* write is not supported for encrypted files yet */
    mdb->f->writable = mdb->f->writable && !mdb->f->db_key;

    /* get the db password located at 0x42 bytes into the file */
    for (pos = 0; pos < 14; pos++) {
        int j = mdb_get_int32(mdb->pg_buf, 0x42+pos);
        j ^= key[pos];
        mdb->f->db_passwd[pos] = (j != 0) ? j : '\0';
    }

    mdb_iconv_init(mdb);

    return mdb;

fail:
    mdb_close(mdb);
    return NULL;
}
2004-04-14 04:06:04 +08:00
/**
 * mdb_open_buffer:
 * @buffer: A memory buffer containing an MDB file
 * @len: Length of the buffer
 * @flags: MDB_NOFLAGS for read-only, MDB_WRITABLE for read/write
 *
 * Opens an MDB file held in memory and returns an MdbHandle to it.  The
 * buffer is wrapped with fmemopen(3); when the build lacks HAVE_FMEMOPEN
 * the call always fails.
 *
 * Return value: pointer to MdbHandle structure, or NULL on failure.
 */
MdbHandle *mdb_open_buffer(void *buffer, size_t len, MdbFileFlags flags) {
#ifdef HAVE_FMEMOPEN
    FILE *file = fmemopen(buffer, len, (flags & MDB_WRITABLE) ? "r+" : "r");
#else
    FILE *file = NULL;
    fprintf(stderr, "mdb_open_buffer requires a platform with support for fmemopen(3)\n");
#endif

    if (!file) {
        fprintf(stderr, "Couldn't open memory buffer\n");
        return NULL;
    }

    return mdb_handle_from_stream(file, flags);
}
/**
 * mdb_open:
 * @filename: path to MDB (database) file
 * @flags: MDB_NOFLAGS for read-only, MDB_WRITABLE for read/write
 *
 * Opens an MDB file and returns an MdbHandle to it.  MDB File may be relative
 * to the current directory, a full path to the file, or relative to a
 * component of $MDBPATH.
 *
 * Return value: pointer to MdbHandle structure, or NULL if the file cannot
 * be found, opened, or turned into a handle.
 **/
MdbHandle *mdb_open(const char *filename, MdbFileFlags flags)
{
    FILE *file;
    const char *mode;
    char *filepath = mdb_find_file(filename);

    if (filepath == NULL) {
        fprintf(stderr, "File not found\n");
        return NULL;
    }

    /* Windows needs the explicit binary flag */
#ifdef _WIN32
    mode = (flags & MDB_WRITABLE) ? "rb+" : "rb";
#else
    mode = (flags & MDB_WRITABLE) ? "r+" : "r";
#endif

    file = fopen(filepath, mode);
    if (file == NULL) {
        fprintf(stderr,"Couldn't open file %s\n",filepath);
        g_free(filepath);
        return NULL;
    }

    /* the resolved path is only needed for fopen() and its error message */
    g_free(filepath);

    return mdb_handle_from_stream(file, flags);
}
2004-04-13 08:39:12 +08:00
/**
 * mdb_close:
 * @mdb: Handle to open MDB database file (NULL is accepted and ignored)
 *
 * Drops this handle's reference on the shared MdbFile: if other references
 * remain the count is decremented, otherwise the stream is closed and the
 * MdbFile freed.  The handle itself is always destroyed.
 *
 **/
void
mdb_close(MdbHandle *mdb)
{
    MdbFile *file;

    if (mdb == NULL)
        return;

    mdb_free_catalog(mdb);
    g_free(mdb->stats);
    g_free(mdb->backend_name);

    file = mdb->f;
    if (file != NULL) {
        if (file->refs > 1) {
            /* still shared with another handle */
            file->refs--;
        } else {
            if (file->stream)
                fclose(file->stream);
            g_free(file);
        }
    }

    mdb_iconv_close(mdb);
    mdb_remove_backends(mdb);

    g_free(mdb);
}
2004-04-14 04:06:04 +08:00
/**
 * mdb_clone_handle:
 * @mdb: Handle to open MDB database file
 *
 * Clones an existing database handle.  The clone starts as a byte copy of
 * @mdb; every member from `catalog` to the end of MdbHandle is then zeroed
 * and rebuilt: a new catalog array with shallow copies of the catalog
 * entries (re-pointed at the clone, props cleared), fresh iconv state, and
 * the same default backend.  The underlying MdbFile is shared and its
 * reference count is incremented.
 *
 * Return value: new handle to the database.
 */
MdbHandle *mdb_clone_handle(MdbHandle *mdb)
{
    unsigned int idx;
    MdbHandle *clone = (MdbHandle *) g_memdup(mdb, sizeof(MdbHandle));

    /* wipe everything from `catalog` onward so no per-handle state is shared */
    memset(&clone->catalog, 0, sizeof(MdbHandle) - offsetof(MdbHandle, catalog));

    clone->catalog = g_ptr_array_new();
    for (idx = 0; idx < mdb->num_catalog; idx++) {
        MdbCatalogEntry *src = g_ptr_array_index(mdb->catalog, idx);
        MdbCatalogEntry *copy = g_memdup(src, sizeof(MdbCatalogEntry));

        copy->mdb = clone;
        copy->props = NULL;
        g_ptr_array_add(clone->catalog, copy);
    }

    mdb_iconv_init(clone);
    mdb_set_default_backend(clone, mdb->backend_name);

    if (mdb->f)
        mdb->f->refs++;

    return clone;
}
2000-02-13 07:51:37 +08:00
/*
** mdb_read_pg: load page `pg` into mdb->pg_buf.
**
** A non-zero page that is already the current page is not re-read; the
** page size is returned immediately.  Otherwise the page is read, the
** current page number is set to `pg` and the position within the page is
** reset to 0.  Returns whatever the low-level reader returned (the page
** size on success, 0 on failure).
**
** NOTE(review): cur_pg is updated even when the read fails, so a later
** request for the same page is answered by the early return above --
** confirm this is intended.
*/
ssize_t mdb_read_pg(MdbHandle *mdb, unsigned long pg)
{
    ssize_t nread;

    if (pg != 0 && pg == mdb->cur_pg)
        return mdb->fmt->pg_size;

    nread = _mdb_read_pg(mdb, mdb->pg_buf, pg);
    //fprintf(stderr, "read page %ld type %02x\n", pg, mdb->pg_buf[0]);

    /* kan - reset the cur_pos on a new page read */
    mdb->cur_pos = 0;
    mdb->cur_pg = pg;

    return nread;
}
/* Read page `pg` into the alternate page buffer.  The current page number
 * and position of the handle are not touched.  Returns the low-level
 * reader's result. */
ssize_t mdb_read_alt_pg(MdbHandle *mdb, unsigned long pg)
{
    ssize_t nread = _mdb_read_pg(mdb, mdb->alt_pg_buf, pg);

    return nread;
}
/*
 * Read page number `pg` of the file into pg_buf (which must hold at least
 * mdb->fmt->pg_size bytes) and decrypt it if the file has a non-zero key.
 *
 * Returns the page size on success.  Returns 0 if seeking fails, if the
 * page offset lies beyond end of file, or if the stream reports an error.
 * A short read is not an error: the remainder of the buffer is zero-filled.
 */
static ssize_t _mdb_read_pg(MdbHandle *mdb, void *pg_buf, unsigned long pg)
{
    ssize_t len;
    /* widen before multiplying so the product is computed in off_t */
    off_t offset = (off_t)pg * mdb->fmt->pg_size;

    if (fseeko(mdb->f->stream, 0, SEEK_END) == -1) {
        fprintf(stderr, "Unable to seek to end of file\n");
        return 0;
    }
    if (ftello(mdb->f->stream) < offset) {
        fprintf(stderr,"offset %" PRIu64 " is beyond EOF\n",(uint64_t)offset);
        return 0;
    }
    if (mdb->stats && mdb->stats->collect)
        mdb->stats->pg_reads++;

    if (fseeko(mdb->f->stream, offset, SEEK_SET) == -1) {
        fprintf(stderr, "Unable to seek to page %lu\n", pg);
        return 0;
    }
    len = fread(pg_buf, 1, mdb->fmt->pg_size, mdb->f->stream);
    if (ferror(mdb->f->stream)) {
        perror("read");
        return 0;
    }
    /* Zero the tail after a short read.  The cast is required: pointer
     * arithmetic on void * is a compiler extension, not standard C. */
    memset((unsigned char *)pg_buf + len, 0, mdb->fmt->pg_size - len);

    /*
     * unencrypt the page if necessary.
     * it might make sense to cache the unencrypted data blocks?
     */
    if (pg != 0 && mdb->f->db_key != 0)
    {
        RC4_KEY rc4_key;
        unsigned int tmp_key = mdb->f->db_key ^ pg;
        unsigned char key_bytes[4];

        /* Serialize the page key least-significant byte first.  This is
         * what reading the integer's memory yields on little-endian hosts
         * and keeps the key identical on big-endian ones. */
        key_bytes[0] = (unsigned char)(tmp_key & 0xff);
        key_bytes[1] = (unsigned char)((tmp_key >> 8) & 0xff);
        key_bytes[2] = (unsigned char)((tmp_key >> 16) & 0xff);
        key_bytes[3] = (unsigned char)((tmp_key >> 24) & 0xff);

        RC4_set_key(&rc4_key, 4, key_bytes);
        RC4(&rc4_key, mdb->fmt->pg_size, pg_buf);
    }

    return mdb->fmt->pg_size;
}
2002-12-11 07:35:24 +08:00
/* Exchange the first MDB_PGSIZE bytes of the primary and alternate page
 * buffers, going through a stack scratch buffer of the same size. */
void mdb_swap_pgbuf(MdbHandle *mdb)
{
    char scratch[MDB_PGSIZE];

    memcpy(scratch, mdb->pg_buf, sizeof(scratch));
    memcpy(mdb->pg_buf, mdb->alt_pg_buf, sizeof(scratch));
    memcpy(mdb->alt_pg_buf, scratch, sizeof(scratch));
}
2004-08-20 10:43:21 +08:00
2005-05-02 20:46:33 +08:00
/* Return the byte at `offset` within `buf`.  No bounds checking is done. */
unsigned char mdb_get_byte(void *buf, int offset)
{
    const unsigned char *bytes = buf;

    return bytes[offset];
}
/* Return the byte at `offset` of the current page buffer and advance the
 * handle's position by one.  For an offset outside the page, -1 is
 * returned; because the return type is unsigned char the caller sees that
 * as the maximum unsigned char value, and the position is not advanced. */
unsigned char mdb_pg_get_byte(MdbHandle *mdb, int offset)
{
    if (offset >= 0 && offset+1 <= mdb->fmt->pg_size) {
        mdb->cur_pos++;
        return mdb->pg_buf[offset];
    }
    return -1;
}
2004-08-20 10:43:21 +08:00
2005-05-02 20:46:33 +08:00
/* Decode the two bytes at buf+offset as an unsigned little-endian 16-bit
 * integer and return it as an int (range 0..65535).  No bounds checking. */
int mdb_get_int16(void *buf, int offset)
{
    const unsigned char *p = (const unsigned char *)buf + offset;

    return (int)(p[0] | (p[1] << 8));
}
2004-08-20 10:43:21 +08:00
/* Read a little-endian 16-bit value at `offset` of the current page buffer
 * and advance the handle's position by two.  Returns -1, without advancing,
 * if the two bytes do not lie inside the page. */
int mdb_pg_get_int16(MdbHandle *mdb, int offset)
{
    if (offset >= 0 && offset+2 <= mdb->fmt->pg_size) {
        mdb->cur_pos += 2;
        return mdb_get_int16(mdb->pg_buf, offset);
    }
    return -1;
}
2005-06-23 15:04:17 +08:00
/* Decode the four bytes at buf+offset as a signed big-endian (most
 * significant byte first) 32-bit integer.  No bounds checking. */
long mdb_get_int32_msb(void *buf, int offset)
{
    const unsigned char *p = (const unsigned char *)buf + offset;
    uint32_t bits = ((uint32_t)p[0] << 24) | ((uint32_t)p[1] << 16)
                  | ((uint32_t)p[2] << 8)  |  (uint32_t)p[3];
    int32_t value;

    /* reinterpret the bit pattern as signed */
    memcpy(&value, &bits, sizeof(value));
    return (long)value;
}
2005-05-02 20:46:33 +08:00
/* Decode the four bytes at buf+offset as a signed little-endian 32-bit
 * integer.  No bounds checking. */
long mdb_get_int32(void *buf, int offset)
{
    const unsigned char *p = (const unsigned char *)buf + offset;
    uint32_t bits = (uint32_t)p[0]         | ((uint32_t)p[1] << 8)
                  | ((uint32_t)p[2] << 16) | ((uint32_t)p[3] << 24);
    int32_t value;

    /* reinterpret the bit pattern as signed */
    memcpy(&value, &bits, sizeof(value));
    return (long)value;
}
/* Read a little-endian 32-bit value at `offset` of the current page buffer
 * and advance the handle's position by four.  Returns -1, without
 * advancing, if the four bytes do not lie inside the page. */
long mdb_pg_get_int32(MdbHandle *mdb, int offset)
{
    if (offset >= 0 && offset+4 <= mdb->fmt->pg_size) {
        mdb->cur_pos += 4;
        return mdb_get_int32(mdb->pg_buf, offset);
    }
    return -1;
}
2005-05-02 20:46:33 +08:00
/* Decode the four bytes at buf+offset, stored least significant byte
 * first, as a float: the bytes are assembled into a 32-bit pattern which
 * is then reinterpreted as a float.  No bounds checking. */
float mdb_get_single(void *buf, int offset)
{
    const unsigned char *p = (const unsigned char *)buf + offset;
    uint32_t bits = (uint32_t)p[0]         | ((uint32_t)p[1] << 8)
                  | ((uint32_t)p[2] << 16) | ((uint32_t)p[3] << 24);
    float value;

    memcpy(&value, &bits, sizeof(value));
    return value;
}
2004-08-20 10:43:21 +08:00
/* Read a float at `offset` of the current page buffer and advance the
 * handle's position by four.  Returns -1, without advancing, if the four
 * bytes do not lie inside the page. */
float mdb_pg_get_single(MdbHandle *mdb, int offset)
{
    if (offset >= 0 && offset+4 <= mdb->fmt->pg_size) {
        mdb->cur_pos += 4;
        return mdb_get_single(mdb->pg_buf, offset);
    }
    return -1;
}
2005-05-02 20:46:33 +08:00
/* Decode the eight bytes at buf+offset, stored least significant byte
 * first, as a double: the bytes are assembled into a 64-bit pattern which
 * is then reinterpreted as a double.  No bounds checking. */
double mdb_get_double(void *buf, int offset)
{
    const unsigned char *p = (const unsigned char *)buf + offset;
    uint64_t bits = 0;
    double value;
    int i;

    /* fold from the most significant (last) byte down to the first */
    for (i = 7; i >= 0; i--)
        bits = (bits << 8) | p[i];

    memcpy(&value, &bits, sizeof(value));
    return value;
}
2004-08-20 10:43:21 +08:00
/* Read a double at `offset` of the current page buffer and advance the
 * handle's position by eight.  Returns -1, without advancing, if the eight
 * bytes do not lie inside the page. */
double mdb_pg_get_double(MdbHandle *mdb, int offset)
{
    if (offset >= 0 && offset+8 <= mdb->fmt->pg_size) {
        mdb->cur_pos += 8;
        return mdb_get_double(mdb->pg_buf, offset);
    }
    return -1;
}
2004-08-20 10:43:21 +08:00
/* Set the handle's position within the current page.  Returns the new
 * position, or 0 (leaving the position unchanged) when `pos` is negative
 * or not smaller than the page size.  Note that a successful move to
 * position 0 also returns 0. */
int
mdb_set_pos(MdbHandle *mdb, int pos)
{
    if (pos >= 0 && pos < mdb->fmt->pg_size) {
        mdb->cur_pos = pos;
        return pos;
    }
    return 0;
}
2000-02-28 03:24:44 +08:00
/* Return the handle's current position within the page buffer. */
int mdb_get_pos(MdbHandle *mdb)
{
    int pos = mdb->cur_pos;

    return pos;
}