mdbtools/src/libmdb/table.c

337 lines
8.9 KiB
C
Raw Normal View History

/* MDB Tools - A library for reading MS Access database files
* Copyright (C) 2000 Brian Bruns
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Library General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Library General Public License for more details.
*
* You should have received a copy of the GNU Library General Public
* License along with this library; if not, write to the
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
* Boston, MA 02111-1307, USA.
*/
#include "mdbtools.h"
#ifdef DMALLOC
#include "dmalloc.h"
#endif
#define MDB_DEBUG_USAGE 0
2002-02-03 10:49:08 +08:00
/*
** Three-way comparison of two columns on their col_num field.
** Returns 0 when the numbers are equal, -1 when a's is smaller and
** 1 when a's is larger, i.e. an ascending order.
*/
static gint mdb_col_comparer(MdbColumn *a, MdbColumn *b)
{
	if (a->col_num == b->col_num)
		return 0;
	return (a->col_num < b->col_num) ? -1 : 1;
}
/*
** Tell whether a column type is one that needs a size.
** Returns TRUE for MDB_TEXT and FALSE for every other col_type value.
*/
unsigned char mdb_col_needs_size(int col_type)
{
	return (col_type == MDB_TEXT) ? TRUE : FALSE;
}
2000-03-05 01:31:07 +08:00
MdbTableDef *mdb_read_table(MdbCatalogEntry *entry)
{
MdbTableDef *table;
MdbHandle *mdb = entry->mdb;
2003-01-02 06:29:39 +08:00
MdbFormatConstants *fmt = mdb->fmt;
int len;
2002-12-20 14:17:41 +08:00
int rownum, row_start, row_end;
2000-03-05 01:31:07 +08:00
table = mdb_alloc_tabledef(entry);
mdb_read_pg(mdb, entry->table_pg);
len = mdb_get_int16(mdb,8);
2003-01-02 06:29:39 +08:00
table->num_rows = mdb_get_int32(mdb, fmt->tab_num_rows_offset);
table->num_cols = mdb_get_int16(mdb, fmt->tab_num_cols_offset);
table->num_idxs = mdb_get_int32(mdb, fmt->tab_num_idxs_offset);
table->num_real_idxs = mdb_get_int32(mdb, fmt->tab_num_ridxs_offset);
2002-12-20 14:17:41 +08:00
/* grab a copy of the usage map */
2003-01-02 06:29:39 +08:00
rownum = mdb->pg_buf[fmt->tab_usage_map_offset];
mdb_read_alt_pg(mdb, mdb_get_int24(mdb, fmt->tab_usage_map_offset + 1));
2002-12-20 14:17:41 +08:00
mdb_swap_pgbuf(mdb);
2003-01-02 06:29:39 +08:00
row_start = mdb_get_int16(mdb, (fmt->row_count_offset + 2) + (rownum*2));
2003-02-10 07:19:21 +08:00
row_end = mdb_find_end_of_row(mdb, rownum);
table->map_sz = row_end - row_start + 1;
2002-12-20 14:17:41 +08:00
table->usage_map = malloc(table->map_sz);
memcpy(table->usage_map, &mdb->pg_buf[row_start], table->map_sz);
#if MDB_DEBUG_USAGE
2002-12-20 14:17:41 +08:00
buffer_dump(mdb->pg_buf, row_start, row_end);
#endif
2002-12-20 14:17:41 +08:00
/* swap back */
mdb_swap_pgbuf(mdb);
#if MDB_DEBUG_USAGE
2003-01-02 06:29:39 +08:00
printf ("usage map found on page %ld start %d end %d\n", mdb_get_int24(mdb, fmt->tab_usage_map_offset + 1), row_start, row_end);
#endif
2002-12-20 14:17:41 +08:00
2003-02-10 07:19:21 +08:00
/* now grab the free space page map */
mdb_swap_pgbuf(mdb);
rownum = mdb->pg_buf[fmt->tab_free_map_offset];
mdb_read_alt_pg(mdb, mdb_get_int24(mdb, fmt->tab_free_map_offset + 1));
mdb_swap_pgbuf(mdb);
row_start = mdb_get_int16(mdb, (fmt->row_count_offset + 2) + (rownum*2));
row_end = mdb_find_end_of_row(mdb, rownum);
table->freemap_sz = row_end - row_start + 1;
table->free_usage_map = malloc(table->freemap_sz);
memcpy(table->free_usage_map, &mdb->pg_buf[row_start], table->freemap_sz);
2003-01-02 06:29:39 +08:00
table->first_data_pg = mdb_get_int16(mdb, fmt->tab_first_dpg_offset);
2000-03-05 01:31:07 +08:00
return table;
}
/*
** Move on to the next page when *cur_pos + offset reaches or passes the
** page size.  The page to load is the number mdb_get_int32(mdb, 4)
** yields, and *cur_pos is rebased to 8 - (pg_size - *cur_pos) so that
** *cur_pos + offset addresses the new page.
** Returns 1 if a page was read, 0 if nothing was done.
*/
int
read_pg_if(MdbHandle *mdb, int *cur_pos, int offset)
{
	if (*cur_pos + offset < mdb->fmt->pg_size)
		return 0;

	mdb_read_pg(mdb, mdb_get_int32(mdb,4));
	*cur_pos = 8 - (mdb->fmt->pg_size - (*cur_pos));
	return 1;
}
/*
** Collect the four bytes at *cur_pos .. *cur_pos + 3, calling
** read_pg_if() ahead of each byte so a page boundary inside the value is
** followed, and hand them to _mdb_get_int32() for decoding.
** *cur_pos is only changed by read_pg_if(); it is not advanced past the
** value.
*/
guint32
read_pg_if_32(MdbHandle *mdb, int *cur_pos)
{
	unsigned char bytes[4];
	int idx = 0;

	while (idx < 4) {
		read_pg_if(mdb, cur_pos, idx);
		bytes[idx] = mdb->pg_buf[(*cur_pos) + idx];
		idx++;
	}
	return _mdb_get_int32(bytes, 0);
}
/*
** Read a 16-bit value, low byte first, from *cur_pos and *cur_pos + 1.
** read_pg_if() is called ahead of each byte so a page boundary between
** the two bytes is followed.  *cur_pos is only changed by read_pg_if().
*/
guint16
read_pg_if_16(MdbHandle *mdb, int *cur_pos)
{
	unsigned char lo, hi;

	read_pg_if(mdb, cur_pos, 0);
	lo = mdb->pg_buf[*cur_pos];

	read_pg_if(mdb, cur_pos, 1);
	hi = mdb->pg_buf[(*cur_pos) + 1];

	return (hi << 8) | lo;
}
/*
** Copy len bytes starting at *cur_pos into buf, continuing on the next
** page when the request reaches the end of the current one.
**
** mdb      handle whose pg_buf is read (and replaced on a page change).
** buf      destination, at least len bytes.
** cur_pos  in: start position on the current page; out: on a page
**          change, rebased to 8 - (pg_size - *cur_pos) like read_pg_if().
** len      number of bytes wanted; at most one page boundary is followed.
**
** Returns 0 when everything came from the current page, 1 when the next
** page had to be read.
*/
guint16
read_pg_if_n(MdbHandle *mdb, unsigned char *buf, int *cur_pos, int len)
{
	int avail;	/* bytes from *cur_pos to the end of this page */
	int head;	/* bytes of the request taken from this page */

	if (*cur_pos + len < mdb->fmt->pg_size) {
		memcpy(buf, &mdb->pg_buf[*cur_pos], len);
		return 0;
	}

	avail = mdb->fmt->pg_size - *cur_pos;
	/* *cur_pos may already lie past the page; nothing to take then */
	head = (avail > 0) ? avail : 0;
	if (head)
		memcpy(buf, &mdb->pg_buf[*cur_pos], head);

	mdb_read_pg(mdb, mdb_get_int32(mdb,4));
	*cur_pos = 8 - avail;

	/* the remainder goes after the first part, not on top of it */
	memcpy(buf + head, &mdb->pg_buf[*cur_pos + head], len - head);
	return 1;
}
GPtrArray *mdb_read_columns(MdbTableDef *table)
{
2000-03-09 12:48:59 +08:00
MdbHandle *mdb = table->entry->mdb;
2003-01-02 06:29:39 +08:00
MdbFormatConstants *fmt = mdb->fmt;
MdbColumn col, *pcol;
2002-02-03 10:49:08 +08:00
int len, i,j;
unsigned char low_byte, high_byte;
int cur_col, cur_name;
int name_sz;
2002-02-03 10:49:08 +08:00
GSList *slist = NULL;
2000-03-05 21:10:42 +08:00
table->columns = g_ptr_array_new();
2000-03-05 01:31:07 +08:00
2003-01-02 06:29:39 +08:00
cur_col = fmt->tab_cols_start_offset +
(table->num_real_idxs * fmt->tab_ridx_entry_size);
/* new code based on patch submitted by Tim Nelson 2000.09.27 */
/*
** column attributes
*/
2002-02-03 10:49:08 +08:00
for (i=0;i<table->num_cols;i++) {
2002-12-11 07:35:24 +08:00
#ifdef MDB_DEBUG
/* printf("column %d\n", i);
buffer_dump(mdb->pg_buf, cur_col ,cur_col + 18); */
#endif
2002-02-03 10:49:08 +08:00
memset(&col, 0, sizeof(col));
2003-01-02 06:29:39 +08:00
col.col_num = mdb->pg_buf[cur_col + fmt->col_num_offset];
2000-03-05 21:10:42 +08:00
read_pg_if(mdb, &cur_col, 0);
2000-03-05 21:10:42 +08:00
col.col_type = mdb->pg_buf[cur_col];
2002-12-11 07:35:24 +08:00
if (col.col_type == MDB_NUMERIC) {
col.col_prec = mdb->pg_buf[cur_col + 11];
col.col_scale = mdb->pg_buf[cur_col + 12];
}
2002-02-03 10:49:08 +08:00
read_pg_if(mdb, &cur_col, 13);
2003-01-02 06:29:39 +08:00
col.is_fixed = mdb->pg_buf[cur_col + fmt->col_fixed_offset] &
2002-02-03 10:49:08 +08:00
0x01 ? 1 : 0;
2002-03-16 10:24:53 +08:00
if (col.col_type != MDB_BOOL) {
read_pg_if(mdb, &cur_col, 17);
2003-01-02 06:29:39 +08:00
low_byte = mdb->pg_buf[cur_col + fmt->col_size_offset];
2002-03-16 10:24:53 +08:00
read_pg_if(mdb, &cur_col, 18);
2003-01-02 06:29:39 +08:00
high_byte = mdb->pg_buf[cur_col + fmt->col_size_offset + 1];
2002-03-16 10:24:53 +08:00
col.col_size += high_byte * 256 + low_byte;
} else
col.col_size=0;
2002-02-03 10:49:08 +08:00
pcol = g_memdup(&col, sizeof(MdbColumn));
slist = g_slist_insert_sorted(slist,pcol,(GCompareFunc)mdb_col_comparer);
2003-01-02 06:29:39 +08:00
cur_col += fmt->tab_col_entry_size;
2000-03-05 21:10:42 +08:00
}
cur_name = cur_col;
/*
** column names
*/
for (i=0;i<table->num_cols;i++) {
/* fetch the column */
2002-02-03 10:49:08 +08:00
pcol = g_slist_nth_data (slist, i);
/* we have reached the end of page */
read_pg_if(mdb, &cur_name, 0);
name_sz = mdb->pg_buf[cur_name];
2003-01-02 06:29:39 +08:00
if (IS_JET4(mdb)) {
2002-02-03 10:49:08 +08:00
/* FIX ME - for now just skip the high order byte */
cur_name += 2;
/* determine amount of name on this page */
2003-01-02 06:29:39 +08:00
len = ((cur_name + name_sz) > fmt->pg_size) ?
fmt->pg_size - cur_name :
2002-02-03 10:49:08 +08:00
name_sz;
/* strip high order (second) byte from unicode string */
for (j=0;j<len;j+=2) {
pcol->name[j/2] = mdb->pg_buf[cur_name + j];
}
/* name wrapped over page */
if (len < name_sz) {
/* read the next pg */
mdb_read_pg(mdb, mdb_get_int32(mdb,4));
2003-01-02 06:29:39 +08:00
cur_name = 8 - (fmt->pg_size - cur_name);
2002-02-03 10:49:08 +08:00
if (len % 2) cur_name++;
/* get the rest of the name */
for (j=0;j<len;j+=2) {
}
memcpy(&pcol->name[len], &mdb->pg_buf[cur_name], name_sz - len);
}
pcol->name[name_sz]='\0';
cur_name += name_sz;
2003-01-02 06:29:39 +08:00
} else if (IS_JET3(mdb)) {
2002-02-03 10:49:08 +08:00
/* determine amount of name on this page */
2003-01-02 06:29:39 +08:00
len = ((cur_name + name_sz) > fmt->pg_size) ?
fmt->pg_size - cur_name :
2002-02-03 10:49:08 +08:00
name_sz;
if (len) {
memcpy(pcol->name, &mdb->pg_buf[cur_name+1], len);
}
/* name wrapped over page */
if (len < name_sz) {
/* read the next pg */
mdb_read_pg(mdb, mdb_get_int32(mdb,4));
2003-01-02 06:29:39 +08:00
cur_name = 8 - (fmt->pg_size - cur_name);
2002-02-03 10:49:08 +08:00
/* get the rest of the name */
memcpy(&pcol->name[len], &mdb->pg_buf[cur_name], name_sz - len);
}
pcol->name[name_sz]='\0';
cur_name += name_sz + 1;
} else {
fprintf(stderr,"Unknown MDB version\n");
}
}
2002-02-03 10:49:08 +08:00
/* turn this list into an array */
for (i=0;i<table->num_cols;i++) {
pcol = g_slist_nth_data (slist, i);
g_ptr_array_add(table->columns, pcol);
}
g_slist_free(slist);
2001-04-02 06:10:15 +08:00
table->index_start = cur_name;
2000-03-05 21:10:42 +08:00
return table->columns;
}
/*
** Print a description of a table to stdout.
**
** Reads the table definition, its columns and its indices for the given
** catalog entry, then prints the definition page number, the row, column
** and index counts, one line per column, each index through
** mdb_index_dump(), and, when a usage map is present, the page numbers
** whose bits are set in it, ten per line.
*/
void mdb_table_dump(MdbCatalogEntry *entry)
{
	MdbHandle *mdb = entry->mdb;
	MdbTableDef *table;
	MdbColumn *col;
	MdbIndex *idx;
	guint32 pgnum;
	int i, bitn;
	int on_line;

	table = mdb_read_table(entry);
	fprintf(stdout,"definition page = %lu\n",entry->table_pg);
	fprintf(stdout,"number of datarows = %d\n",table->num_rows);
	fprintf(stdout,"number of columns = %d\n",table->num_cols);
	fprintf(stdout,"number of indices = %d\n",table->num_real_idxs);

	mdb_read_columns(table);
	mdb_read_indices(table);

	i = 0;
	while (i < table->num_cols) {
		col = g_ptr_array_index(table->columns,i);
		fprintf(stdout,"column %d Name: %-20s Type: %s(%d)\n",
			i, col->name,
			mdb_get_coltype_string(mdb->default_backend, col->col_type),
			col->col_size);
		i++;
	}

	i = 0;
	while (i < table->num_idxs) {
		idx = g_ptr_array_index (table->indices, i);
		mdb_index_dump(table, idx);
		i++;
	}

	if (!table->usage_map)
		return;

	printf("pages reserved by this object\n");
	pgnum = _mdb_get_int32(table->usage_map,1);
	/* the first 5 bytes of the usage map mean something */
	on_line = 0;
	for (i = 5; i < table->map_sz; i++) {
		/* one bit per page, lowest bit first; pgnum moves on every bit */
		for (bitn = 0; bitn < 8; bitn++, pgnum++) {
			if (!(table->usage_map[i] & (1 << bitn)))
				continue;
			printf("%6lu ",(long unsigned) pgnum);
			if (++on_line == 10) {
				printf("\n");
				on_line = 0;
			}
		}
	}
}