📄 os_rw.c
字号:
/*- * See the file LICENSE for redistribution information. * * Copyright (c) 1997-2002 * Sleepycat Software. All rights reserved. */#include "db_config.h"#ifndef lintstatic const char revid[] = "$Id: os_rw.c,v 1.1.1.1 2004/08/19 23:53:56 gopalan Exp $";#endif /* not lint */#ifndef __KERNEL__#ifndef NO_SYSTEM_INCLUDES#include <sys/types.h>#include <sys/stat.h>#include <string.h>#include <unistd.h>#endif#else#include <linux/types.h>#include <linux/string.h>#include <asm/uaccess.h>#endif /* __KERNEL__ */#include "db_int.h"#ifdef HAVE_FILESYSTEM_NOTZEROstatic int __os_zerofill __P((DB_ENV *, DB_FH *));#endifstatic int __os_physwrite __P((DB_ENV *, DB_FH *, void *, size_t, size_t *));#ifdef __KERNEL__ssize_t read(struct file * fd, char * buf, size_t count){ int ret; struct file * file; mm_segment_t oldfs; oldfs = get_fs(); set_fs(KERNEL_DS); ret = -EBADF; file = fd; if (file) { if (fd->f_mode & FMODE_READ) { ssize_t (*read)(struct file *, char *, size_t, loff_t *); ret = -EINVAL; if (file->f_op && (read = file->f_op->read) != NULL) ret = read(file, buf, count, &file->f_pos); } } set_fs(oldfs); return ret;}ssize_t write(struct file * fd, const char * buf, size_t count){ ssize_t ret; struct file * file; mm_segment_t oldfs; oldfs = get_fs(); set_fs(KERNEL_DS); ret = -EBADF; file = fd; if (file) { if (file->f_mode & FMODE_WRITE) { ssize_t (*write)(struct file *, const char *, size_t, loff_t *); ret = -EINVAL; if (file->f_op && (write = file->f_op->write) != NULL) ret = write(file, buf, count, &file->f_pos); } } set_fs(oldfs); return ret;}#endif/* * __os_io -- * Do an I/O. * * PUBLIC: int __os_io __P((DB_ENV *, DB_IO *, int, size_t *)); */int__os_io(dbenv, db_iop, op, niop) DB_ENV *dbenv; DB_IO *db_iop; int op; size_t *niop;{ int ret; print_entry_location();#ifndef __KERNEL__ /* Check for illegal usage. */ DB_ASSERT(F_ISSET(db_iop->fhp, DB_FH_VALID) && db_iop->fhp->fd != -1);#else /* Check for illegal usage. */ DB_ASSERT(F_ISSET(db_iop->fhp, DB_FH_VALID) && !IS_ERR(db_iop->fhp->fd));#endif #if defined(HAVE_PREAD) && defined(HAVE_PWRITE) switch (op) { case DB_IO_READ: if (DB_GLOBAL(j_read) != NULL) goto slow; *niop = pread(db_iop->fhp->fd, db_iop->buf, db_iop->bytes, (off_t)db_iop->pgno * db_iop->pagesize); break; case DB_IO_WRITE: if (DB_GLOBAL(j_write) != NULL) goto slow;#ifdef HAVE_FILESYSTEM_NOTZERO if (__os_fs_notzero()) goto slow;#endif *niop = pwrite(db_iop->fhp->fd, db_iop->buf, db_iop->bytes, (off_t)db_iop->pgno * db_iop->pagesize); break; } if (*niop == (size_t)db_iop->bytes) { print_exit_location(0); return (0); }slow:#endif MUTEX_THREAD_LOCK(dbenv, db_iop->mutexp); if ((ret = __os_seek(dbenv, db_iop->fhp, db_iop->pagesize, db_iop->pgno, 0, 0, DB_OS_SEEK_SET)) != 0) goto err; switch (op) { case DB_IO_READ: ret = __os_read(dbenv, db_iop->fhp, db_iop->buf, db_iop->bytes, niop); break; case DB_IO_WRITE: ret = __os_write(dbenv, db_iop->fhp, db_iop->buf, db_iop->bytes, niop); break; }err: MUTEX_THREAD_UNLOCK(dbenv, db_iop->mutexp); print_exit_location(ret); return (ret);}/* * __os_read -- * Read from a file handle. * * PUBLIC: int __os_read __P((DB_ENV *, DB_FH *, void *, size_t, size_t *)); */int__os_read(dbenv, fhp, addr, len, nrp)DB_ENV *dbenv;DB_FH *fhp;void *addr;size_t len;size_t *nrp;{ size_t offset; ssize_t nr = 0; int ret = 0; u_int8_t *taddr; print_entry_location(); /* Check for illegal usage. */ DB_ASSERT(F_ISSET(fhp, DB_FH_VALID) && !IS_ERR(fhp->fd)); if (fhp->fd == NULL) printk("fd is NULL\n"); for (taddr = addr, offset = 0; offset < len; taddr += nr, offset += nr) {retry: if ((nr = DB_GLOBAL(j_read) != NULL ? DB_GLOBAL(j_read)(fhp->fd, taddr, len - offset) : read(fhp->fd, taddr, len - offset)) < 0) { if ((ret = __os_get_errno()) == EINTR) goto retry; __db_err(dbenv, "read: 0x%x, %lu: %d", taddr, (u_long)len-offset, ret); print_exit_location(ret); return (ret); } if (nr == 0) break; } *nrp = taddr - (u_int8_t *)addr; print_exit_location(ret); return (0);}/* * __os_write -- * Write to a file handle. * * PUBLIC: int __os_write __P((DB_ENV *, DB_FH *, void *, size_t, size_t *)); */int__os_write(dbenv, fhp, addr, len, nwp) DB_ENV *dbenv; DB_FH *fhp; void *addr; size_t len; size_t *nwp;{#ifdef __KERNEL__ int ret = 0;#endif print_entry_location(); /* Check for illegal usage. */ DB_ASSERT(F_ISSET(fhp, DB_FH_VALID) && fhp->fd != -1); /* Check for illegal usage. */ DB_ASSERT(F_ISSET(fhp, DB_FH_VALID) && fhp->fd != -1);#ifdef HAVE_FILESYSTEM_NOTZERO /* Zero-fill as necessary. */ if (__os_fs_notzero()) { int ret; if ((ret = __os_zerofill(dbenv, fhp)) != 0) { print_exit_location(ret); return (ret); } }#endif ret = __os_physwrite(dbenv, fhp, addr, len, nwp); print_exit_location(ret); return (ret);}/* * __os_physwrite -- * Physical write to a file handle. */static int__os_physwrite(dbenv, fhp, addr, len, nwp) DB_ENV *dbenv; DB_FH *fhp; void *addr; size_t len; size_t *nwp;{ size_t offset; ssize_t nw; int ret = 0; u_int8_t *taddr; print_entry_location(); #if defined(HAVE_FILESYSTEM_NOTZERO) && defined(DIAGNOSTIC) if (__os_fs_notzero()) { struct stat sb; off_t cur_off; DB_ASSERT(fstat(fhp->fd, &sb) != -1 && (cur_off = lseek(fhp->fd, (off_t)0, SEEK_CUR)) != -1 && cur_off <= sb.st_size); }#endif for (taddr = addr, offset = 0; offset < len; taddr += nw, offset += nw) retry: if ((nw = DB_GLOBAL(j_write) != NULL ? DB_GLOBAL(j_write)(fhp->fd, taddr, len - offset) : write(fhp->fd, taddr, len - offset)) < 0) { if ((ret = __os_get_errno()) == EINTR) goto retry; __db_err(dbenv, "write: 0x%x, %lu: ret=%d", taddr, (u_long)len-offset, ret); print_exit_location(ret); return (ret);}*nwp = len;print_exit_location(0);return (0);}#ifdef HAVE_FILESYSTEM_NOTZERO/* * __os_zerofill -- * Zero out bytes in the file. * * Pages allocated by writing pages past end-of-file are not zeroed, * on some systems. Recovery could theoretically be fooled by a page * showing up that contained garbage. In order to avoid this, we * have to write the pages out to disk, and flush them. The reason * for the flush is because if we don't sync, the allocation of another * page subsequent to this one might reach the disk first, and if we * crashed at the right moment, leave us with this page as the one * allocated by writing a page past it in the file. */static int__os_zerofill(dbenv, fhp) DB_ENV *dbenv; DB_FH *fhp;{ off_t stat_offset, write_offset; size_t blen, nw; u_int32_t bytes, mbytes; int group_sync, need_free, ret; u_int8_t buf[8 * 1024], *bp; print_entry_location(); /* Calculate the byte offset of the next write. */ write_offset = (off_t)fhp->pgno * fhp->pgsize + fhp->offset; /* Stat the file. */ if ((ret = __os_ioinfo(dbenv, NULL, fhp, &mbytes, &bytes, NULL)) != 0) { print_exit_location(ret); return (ret); } stat_offset = (off_t)mbytes * MEGABYTE + bytes; /* Check if the file is large enough. */ if (stat_offset >= write_offset) { print_exit_location(0); return (0); } /* Get a large buffer if we're writing lots of data. */#undef ZF_LARGE_WRITE#define ZF_LARGE_WRITE (64 * 1024) if (write_offset - stat_offset > ZF_LARGE_WRITE) { if ((ret = __os_calloc(dbenv, 1, ZF_LARGE_WRITE, &bp)) != 0) { print_exit_location(ret); return (ret); } blen = ZF_LARGE_WRITE; need_free = 1; } else { bp = buf; blen = sizeof(buf); need_free = 0; memset(buf, 0, sizeof(buf)); } /* Seek to the current end of the file. */ if ((ret = __os_seek( dbenv, fhp, MEGABYTE, mbytes, bytes, 0, DB_OS_SEEK_SET)) != 0) goto err; /* * Hash is the only access method that allocates groups of pages. Hash * uses the existence of the last page in a group to signify the entire * group is OK; so, write all the pages but the last one in the group, * flush them to disk, then write the last one to disk and flush it. */ for (group_sync = 0; stat_offset < write_offset; group_sync = 1) { if (write_offset - stat_offset <= blen) { blen = (size_t)(write_offset - stat_offset); if (group_sync && (ret = __os_fsync(dbenv, fhp)) != 0) goto err; } if ((ret = __os_physwrite(dbenv, fhp, bp, blen, &nw)) != 0) goto err; stat_offset += blen; } if ((ret = __os_fsync(dbenv, fhp)) != 0) goto err; /* Seek back to where we started. */ mbytes = (u_int32_t)(write_offset / MEGABYTE); bytes = (u_int32_t)(write_offset % MEGABYTE); ret = __os_seek(dbenv, fhp, MEGABYTE, mbytes, bytes, 0, DB_OS_SEEK_SET);err: if (need_free) __os_free(dbenv, bp); print_exit_location(ret); return (ret);}#endif
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -