|
DataMuseum.dkPresents historical artifacts from the history of: DKUUG/EUUG Conference tapes |
This is an automatic "excavation" of a thematic subset of
See our Wiki for more about DKUUG/EUUG Conference tapes Excavated with: AutoArchaeologist - Free & Open Source Software. |
top - metrics - downloadIndex: T g
Length: 17675 (0x450b) Types: TextFile Names: »gdbmopen.c«
└─⟦a05ed705a⟧ Bits:30007078 DKUUG GNU 2/12/89 └─⟦0befd2614⟧ »./gdbm-0.8.tar.Z« └─⟦b993d2893⟧ └─⟦this⟧ »gdbm/gdbmopen.c«
/* gdbmopen.c - Open the dbm file and initialize data structures for use. */ /* GNU DBM - DataBase Manager (database subroutines) by Philip A. Nelson Copyright (C) 1989 Free Software Foundation, Inc. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. You may contact the author by: e-mail: phil@wwu.edu us-mail: Philip A. Nelson Computer Science Department Western Washington University Bellingham, WA 98226 phone: (206) 676-3035 *************************************************************************/ #include <stdio.h> #include <sys/file.h> #include <sys/types.h> #include <sys/stat.h> #include "gdbm.h" #include "gdbmerrno.h" extern gdbm_error gdbm_errno; #ifdef RANDOM_HASH #include "extern.h" #endif /* RANDOM_HASH */ /* Initialize dbm system. FILE is a pointer to the file name. If the file has a size of zero bytes, a file initialization procedure is performed, setting up the initial structure in the file. BLOCK_SIZE is used during initialization to determine the size of various constructs. If the value is less than 512, the file system blocksize is used, otherwise the value of BLOCK_SIZE is used. BLOCK_SIZE is ignored if the file has previously initialized. If READ_WRITE is set to DBM_READ the user wants to just read the database and any call to dbm_store or dbm_delete will fail. Many readers can access the database at the same time. If READ_WRITE is set to DBM_WRITE, the user wants both read and write access to the database and requires exclusive access. Any error detected will cause a return value of null and an approprate value will be in gdbm_errno. If no errors occur, a pointer to the "dbm file descriptor" will be returned. */ dbm_file_info * gdbm_open (file, block_size, read_write, fatal_func) char *file; int block_size; int read_write; void (*fatal_func) (); { dbm_file_info *dbf; /* The record to return. */ struct stat file_stat; /* Space for the stat information. */ int len; /* Length of the file name. */ int num_bytes; /* Used in reading and writing. */ int lock_val; /* Returned by the flock call. */ /* Allocate new info structure. */ dbf = (dbm_file_info *) malloc (sizeof (dbm_file_info)); if (dbf == NULL) { gdbm_errno = MALLOC_ERROR; return NULL; } /* Initialize some fields for known values. This is done so dbmclose will work if called before allocating some structures. */ dbf->dir = NULL; dbf->bucket = NULL; dbf->avail = NULL; /* Save name of file. */ len = strlen (file); dbf->name = (char *) malloc (len + 1); if (dbf->name == NULL) { free (dbf); gdbm_errno = MALLOC_ERROR; return NULL; } strcpy (dbf->name, file); /* Initialize the fatal error routine. */ dbf->fatal_err = fatal_func; /* Open the file. */ dbf->desc = open (dbf->name, O_RDWR, 0); if (dbf->desc < 0) { free (dbf->name); free (dbf); gdbm_errno = FILE_OPEN_ERROR; return NULL; } /* Get the status of the file. */ fstat (dbf->desc, &file_stat); /* Lock the file in the approprate way. */ if (read_write == DBM_READER) { if (file_stat.st_size == 0) { close (dbf->desc); free (dbf->name); free (dbf); gdbm_errno = EMPTY_DATABASE; return NULL; } lock_val = flock (dbf->desc, LOCK_SH + LOCK_NB); } else { lock_val = flock (dbf->desc, LOCK_EX + LOCK_NB); } if (lock_val != 0) { close (dbf->desc); free (dbf->name); free (dbf); if (read_write == DBM_READER) gdbm_errno = CANT_BE_READER; else gdbm_errno = CANT_BE_WRITER; return NULL; } #ifdef RANDOM_HASH /* Set up the random number generator used by the hash function. */ setstate (initstate (567943, _dbm_hash_state, 64)); #endif /* RANDOM_HASH */ /* Record the kind of user. */ dbf->read_write = read_write; /* Decide if this is a new file or an old file. */ if (file_stat.st_size == 0) { int index; /* This is a new file. Create an empty database. */ /* Start with the blocksize. */ if (block_size < 512) dbf->header.block_size = file_stat.st_blksize; else dbf->header.block_size = block_size; /* Create the initial hash table directory. */ dbf->header.dir_size = 8 * sizeof (int); dbf->header.dir_bits = 3; while (dbf->header.dir_size < dbf->header.block_size /2) { dbf->header.dir_size <<= 1; dbf->header.dir_bits += 1; } dbf->dir = (int *) malloc (dbf->header.dir_size); if (dbf->dir == NULL) { gdbm_close (dbf); gdbm_errno = MALLOC_ERROR; return NULL; } dbf->header.dir = sizeof (dbf->header); /* Create the first and only hash bucket. */ dbf->header.bucket_elems = (dbf->header.block_size - 2 * sizeof (int)) / sizeof (bucket_element); dbf->header.bucket_size = dbf->header.bucket_elems * sizeof (bucket_element) + 2 * sizeof (int); dbf->bucket_adr = dbf->header.block_size; dbf->bucket_dir = 0; dbf->bucket = (hash_bucket *) (malloc(dbf->header.bucket_size)); if (dbf->bucket == NULL) { gdbm_close (dbf); gdbm_errno = MALLOC_ERROR; return NULL; } _dbm_new_bucket (dbf, dbf->bucket, 0); /* Set table entries to point to hash buckets. */ for (index = 0; index <= dbf->header.dir_size / sizeof (int); index++) dbf->dir[index] = dbf->bucket_adr; /* Make the initial avail block. */ dbf->avail = (avail_block *) malloc (dbf->header.block_size); if (dbf->avail == NULL) { gdbm_close (dbf); gdbm_errno = MALLOC_ERROR; return NULL; } dbf->avail_adr = 2*dbf->header.block_size; for (index = 0; index < AVAIL_SIZE; index++) dbf->header.avail_list[index] = dbf->avail_adr; dbf->avail->size = ((dbf->header.block_size - sizeof (avail_block)) / sizeof (avail_elem)) + 1; dbf->avail->count = 0; dbf->avail->next_block = 0; dbf->avail->prev_block = 0; /* Other fields in the file header. */ dbf->header.file_size = 3*dbf->header.block_size; dbf->header.header_magic = 0x13579ace; /* Set this field so we do crash detection and recovery. */ dbf->header.update_state = 0; /* Write initial configuration to the file. */ num_bytes = write (dbf->desc, &dbf->header, sizeof(dbf->header)); if (num_bytes != sizeof(dbf->header)) { gdbm_close (dbf); gdbm_errno = FILE_WRITE_ERROR; return NULL; } num_bytes = write (dbf->desc, dbf->dir, dbf->header.dir_size); if (num_bytes != dbf->header.dir_size) { gdbm_close (dbf); gdbm_errno = FILE_WRITE_ERROR; return NULL; } num_bytes = lseek (dbf->desc, dbf->header.block_size, L_SET); if (num_bytes != dbf->header.block_size) { gdbm_close (dbf); gdbm_errno = FILE_SEEK_ERROR; return NULL; } num_bytes = write (dbf->desc, dbf->bucket, dbf->header.bucket_size); if (num_bytes != dbf->header.bucket_size) { gdbm_close (dbf); gdbm_errno = FILE_WRITE_ERROR; return NULL; } num_bytes = lseek (dbf->desc, 2 * dbf->header.block_size, L_SET); if (num_bytes != 2 * dbf->header.block_size) { gdbm_close (dbf); gdbm_errno = FILE_SEEK_ERROR; return NULL; } num_bytes = write (dbf->desc, dbf->avail, dbf->header.block_size); if (num_bytes != dbf->header.block_size) { gdbm_close (dbf); gdbm_errno = FILE_WRITE_ERROR; return NULL; } fsync (dbf->desc); /* Finally, "free" the unused space in the initial file. */ index = sizeof (dbf->header) + dbf->header.dir_size; _dbm_free (dbf, index, dbf->header.block_size - index); _dbm_free (dbf, dbf->bucket_adr + dbf->header.bucket_size, dbf->header.block_size - dbf->header.bucket_size); _dbm_end_update (dbf); } else { /* This is an old database. Read in the information from the file header and initialize the hash directory. */ /* Read the file header. */ num_bytes = read (dbf->desc, &dbf->header, sizeof(dbf->header)); if (num_bytes != sizeof(dbf->header)) { gdbm_close (dbf); gdbm_errno = FILE_READ_ERROR; return NULL; } /* Is the magic number good? */ if (dbf->header.header_magic != 0x13579ace) { gdbm_close (dbf); gdbm_errno = BAD_MAGIC_NUMBER; return NULL; } /* Is the database consistent? */ if (dbf->header.update_state != 0 && dbf->header.update_state != -1) /* If it is not in the middle of an update or we are a reader we can not continue. */ if ((dbf->header.update_state & 0xffffff00) != 0x77777700 || read_write == DBM_READER) { gdbm_close (dbf); gdbm_errno = READER_CANT_RECOVER; return NULL; } /* Allocate space for the hash table directory. */ dbf->dir = (int *) malloc (dbf->header.dir_size); if (dbf->dir == NULL) { gdbm_close (dbf); gdbm_errno = MALLOC_ERROR; return NULL; } /* Read the hash table directory. */ num_bytes = lseek (dbf->desc, dbf->header.dir, L_SET); if (num_bytes != dbf->header.dir) { gdbm_close (dbf); gdbm_errno = FILE_SEEK_ERROR; return NULL; } num_bytes = read (dbf->desc, dbf->dir, dbf->header.dir_size); if (num_bytes != dbf->header.dir_size) { gdbm_close (dbf); gdbm_errno = FILE_READ_ERROR; return NULL; } /* Initialize the hash bucket buffer. */ dbf->bucket = (hash_bucket *) malloc (dbf->header.bucket_size); if (dbf->bucket == NULL) { gdbm_close (dbf); gdbm_errno = MALLOC_ERROR; return NULL; } dbf->bucket_adr = 0; /* Initialize the avail block buffer. */ dbf->avail = (avail_block *) malloc (dbf->header.block_size); if (dbf->avail == NULL) { gdbm_close (dbf); gdbm_errno = MALLOC_ERROR; return NULL; } dbf->avail_adr = 0; /* Now that everything has been read and initialized, if we were in an update, it is now time to fix the database. */ if ((dbf->header.update_state & 0xffffff00) == 0x77777700) { int update_code; int param1; int param2; int param3; int param4; /* Crash recovery! Save the information from the header in local variables so that the information is not lost. */ update_code = dbf->header.update_state & 0xff; param1 = dbf->header.upd_param1; param2 = dbf->header.upd_param2; param3 = dbf->header.upd_param3; param4 = dbf->header.upd_param4; switch (update_code) { case 1: /* _file_alloc - updating current avail block. param1 = address of new allocation. param2 = size of new allocation. param3 = size of unused portion. param4 = address of avail block. */ case 2: /* _file_alloc - allocating at the end of the file. param1 = address of new allocation. param2 = size of new allocation. param3 = address of unused portion of previous block. param4 = size of unused portion. */ case 3: /* _dbm_free - updating current avail block. param1 = address of new available block. param2 = size of new avaliable block. param3 = address of the avail block. param4 = size of avail block. */ case 4: /* _dbm_free - splitting current avail block. Sharing with the previous block. param1 = address of current block. param2 = size of current block before split. param3 = address of previous block. param4 = size of previous block before split. */ case 5: /* _dbm_free - splitting current avail block. Sharing with the next block. param1 = address of current block. param2 = size of current block before split. param3 = address of next param4 = size of unused portion before split. */ case 6: /* _dbm_free - splitting current avail block. Creating a new block. param1 = address of current block. param2 = size of current block before the split. param3 = address of new block. param4 = address of the next block. */ /* Cases 1 to 6 call a repair routine in falloc.c. */ _dbm_alloc_repair (dbf, update_code, param1, param2, param3, param4); break; case 7: /* gdbm_store - writing the data to the file. param1 = data pointer param2 = total size (key and data) param3 = current bucket address param4 = element location in the current bucket */ /* Read the bucket to figure out what to do. */ dbf->bucket_adr = param3; num_bytes = lseek (dbf->desc, dbf->bucket_adr, L_SET); if (num_bytes != dbf->bucket_adr) { gdbm_close (dbf); gdbm_errno = FILE_SEEK_ERROR; return NULL; }; num_bytes = read (dbf->desc, dbf->bucket, dbf->header.bucket_size); if (num_bytes != dbf->header.bucket_size) { gdbm_close (dbf); gdbm_errno = FILE_READ_ERROR; return NULL; }; /* Check to see if bucket was updated. -1 => no update wrong address => no update In both cases, we don't need to touch the bucket, we just free the space allocated for the new item. If it was updated, we don't need to do anything. */ if (dbf->bucket->h_table[param4].hash_value == -1 || dbf->bucket->h_table[param4].data_pointer != param1) { /* We need to free the allocated space. */ _dbm_free (dbf, param1, param2); } break; case 8: /* split_current - splitting a bucket. param1 = new bucket address param2 = old bucket size param3 = old bucket address param4 = old bucket directory entry */ /* Read the bucket to figure out what to do. */ dbf->bucket_adr = param3; num_bytes = lseek (dbf->desc, dbf->bucket_adr, L_SET); if (num_bytes != dbf->bucket_adr) { gdbm_close (dbf); gdbm_errno = FILE_SEEK_ERROR; return NULL; }; num_bytes = read (dbf->desc, dbf->bucket, dbf->header.bucket_size); if (num_bytes != dbf->header.bucket_size) { gdbm_close (dbf); gdbm_errno = FILE_READ_ERROR; return NULL; }; if (dbf->bucket->count == param3) { /* The old bucket was not saved. Toss the new bucket! */ _dbm_free (dbf, param1, dbf->header.bucket_size); } else { /* The old bucket was saved. Make sure the table is correct. */ int dir_start, dir_end, index, new_bits; new_bits = dbf->bucket->bucket_bits; dir_start = (param4 >> (dbf->header.dir_bits - new_bits)) | 1; dir_end = (dir_start + 1) << (dbf->header.dir_bits - new_bits); dir_start = dir_start << (dbf->header.dir_bits - new_bits); if (dbf->dir[dir_start] != param1) { for (index = dir_start; index < dir_end; index++) dbf->dir[index] = param1; num_bytes = lseek (dbf->desc, dbf->header.dir, L_SET); if (num_bytes != dbf->header.dir) _dbm_fatal (dbf, "lseek error"); num_bytes = write (dbf->desc, dbf->dir, dbf->header.dir_size); if (num_bytes != dbf->header.dir_size) _dbm_fatal (dbf, "write error"); } } break; case 9: /* gdbm_delete - updating the current bucket. param1 = data pointer param2 = total size (key and data) param3 = bucket address param4 = bucket count after delete */ /* Read the bucket to figure out what to do. */ dbf->bucket_adr = param3; num_bytes = lseek (dbf->desc, dbf->bucket_adr, L_SET); if (num_bytes != dbf->bucket_adr) { gdbm_close (dbf); gdbm_errno = FILE_SEEK_ERROR; return NULL; }; num_bytes = read (dbf->desc, dbf->bucket, dbf->header.bucket_size); if (num_bytes != dbf->header.bucket_size) { gdbm_close (dbf); gdbm_errno = FILE_READ_ERROR; return NULL; }; if (dbf->bucket->count == param4) { /* It was written out, just free the space. */ _dbm_free (dbf, param1, param2); } else { /* It was not written out, must delete the element. */ datum key; int index, num_bytes; index = 0; while (dbf->bucket->h_table[index].data_pointer != param3) index++; /* Delete the index item. */ key.dsize = dbf->bucket->h_table[index].key_size; key.dptr = (char *) alloca (key.dsize); num_bytes = lseek (dbf->desc, param3, L_SET); if (num_bytes != param3) { gdbm_close (dbf); gdbm_errno = FILE_SEEK_ERROR; return NULL; }; num_bytes = read (dbf->desc, key.dptr, key.dsize); if (num_bytes != key.dsize) { gdbm_close (dbf); gdbm_errno = FILE_READ_ERROR; return NULL; }; gdbm_delete (dbf, key); } break; default: /* Unknow update code! */ gdbm_close (dbf); gdbm_errno = UNKNOWN_UPDATE; return NULL; } /* The correction was completed correctly. */ _dbm_end_update (dbf); } } /* Everything is fine, return the pointer to the file information structure. */ return dbf; }