Blame gfs2/libgfs2/super.c

Packit 6ef888
#include "clusterautoconfig.h"
Packit 6ef888
Packit 6ef888
#include <unistd.h>
Packit 6ef888
#include <inttypes.h>
Packit 6ef888
#include <stdio.h>
Packit 6ef888
#include <stdint.h>
Packit 6ef888
#include <stdlib.h>
Packit 6ef888
#include <string.h>
Packit 6ef888
#include <errno.h>
Packit 6ef888
#include <fcntl.h>
Packit 6ef888
Packit 6ef888
#include "libgfs2.h"
Packit 6ef888
#include "osi_list.h"
Packit 6ef888
Packit 6ef888
/**
Packit 6ef888
 * check_sb - Check superblock
Packit 6ef888
 * @sb: The superblock
Packit 6ef888
 *
Packit 6ef888
 * Checks the version code of the FS is one that we understand how to
Packit 6ef888
 * read and that the sizes of the various on-disk structures have not
Packit 6ef888
 * changed.
Packit 6ef888
 *
Packit 6ef888
 * Returns: -1 on failure, 1 if this is gfs (gfs1), 2 if this is gfs2
Packit 6ef888
 */
Packit 6ef888
int check_sb(struct gfs2_sb *sb)
Packit 6ef888
{
Packit 6ef888
	if (sb->sb_header.mh_magic != GFS2_MAGIC ||
Packit 6ef888
	    sb->sb_header.mh_type != GFS2_METATYPE_SB) {
Packit 6ef888
		errno = EIO;
Packit 6ef888
		return -1;
Packit 6ef888
	}
Packit Service 786bf1
	/* Check for gfs1 */
Packit 6ef888
	if (sb->sb_fs_format == GFS_FORMAT_FS &&
Packit 6ef888
	    sb->sb_header.mh_format == GFS_FORMAT_SB &&
Packit 6ef888
	    sb->sb_multihost_format == GFS_FORMAT_MULTI) {
Packit 6ef888
		return 1;
Packit 6ef888
	}
Packit Service 786bf1
	/* It's gfs2. Check format number is in a sensible range. */
Packit Service 786bf1
	if (sb->sb_fs_format < GFS2_FORMAT_FS ||
Packit Service 786bf1
	    sb->sb_fs_format > 1899) {
Packit Service 786bf1
		errno = EINVAL;
Packit Service 786bf1
		return -1;
Packit Service 786bf1
	}
Packit 6ef888
	return 2;
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
Packit 6ef888
/*
Packit 6ef888
 * read_sb: read the super block from disk
Packit 6ef888
 * sdp: in-core super block
Packit 6ef888
 *
Packit 6ef888
 * This function reads in the super block from disk and
Packit 6ef888
 * initializes various constants maintained in the super
Packit 6ef888
 * block
Packit 6ef888
 *
Packit 6ef888
 * Returns: 0 on success, -1 on failure
Packit 6ef888
 * sdp->gfs1 will be set if this is gfs (gfs1)
Packit 6ef888
 */
Packit 6ef888
int read_sb(struct gfs2_sbd *sdp)
Packit 6ef888
{
Packit 6ef888
	struct gfs2_buffer_head *bh;
Packit 6ef888
	uint64_t space = 0;
Packit 6ef888
	unsigned int x;
Packit 6ef888
	int ret;
Packit 6ef888
Packit 6ef888
	bh = bread(sdp, GFS2_SB_ADDR >> sdp->sd_fsb2bb_shift);
Packit 6ef888
	gfs2_sb_in(&sdp->sd_sb, bh->b_data);
Packit 6ef888
	brelse(bh);
Packit 6ef888
Packit 6ef888
	ret = check_sb(&sdp->sd_sb);
Packit 6ef888
	if (ret < 0)
Packit 6ef888
		return ret;
Packit 6ef888
	if (ret == 1)
Packit 6ef888
		sdp->gfs1 = 1;
Packit 6ef888
	sdp->sd_fsb2bb_shift = sdp->sd_sb.sb_bsize_shift - GFS2_BASIC_BLOCK_SHIFT;
Packit 6ef888
	sdp->bsize = sdp->sd_sb.sb_bsize;
Packit 6ef888
	if (sdp->bsize < 512 || sdp->bsize != (sdp->bsize & -sdp->bsize)) {
Packit 6ef888
		return -1;
Packit 6ef888
	}
Packit 6ef888
	if (sdp->gfs1) {
Packit 6ef888
		sdp->sd_diptrs = (sdp->sd_sb.sb_bsize -
Packit 6ef888
				  sizeof(struct gfs_dinode)) /
Packit 6ef888
			sizeof(uint64_t);
Packit 6ef888
		sdp->sd_inptrs = (sdp->sd_sb.sb_bsize -
Packit 6ef888
				  sizeof(struct gfs_indirect)) /
Packit 6ef888
			sizeof(uint64_t);
Packit 6ef888
	} else {
Packit 6ef888
		sdp->sd_diptrs = (sdp->sd_sb.sb_bsize -
Packit 6ef888
				  sizeof(struct gfs2_dinode)) /
Packit 6ef888
			sizeof(uint64_t);
Packit 6ef888
		sdp->sd_inptrs = (sdp->sd_sb.sb_bsize -
Packit 6ef888
				  sizeof(struct gfs2_meta_header)) /
Packit 6ef888
			sizeof(uint64_t);
Packit 6ef888
	}
Packit 6ef888
	sdp->sd_jbsize = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_meta_header);
Packit 6ef888
	sdp->sd_hash_bsize = sdp->bsize / 2;
Packit 6ef888
	sdp->sd_hash_bsize_shift = sdp->sd_sb.sb_bsize_shift - 1;
Packit 6ef888
	sdp->sd_hash_ptrs = sdp->sd_hash_bsize / sizeof(uint64_t);
Packit 6ef888
	sdp->sd_heightsize[0] = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode);
Packit 6ef888
	sdp->sd_heightsize[1] = sdp->sd_sb.sb_bsize * sdp->sd_diptrs;
Packit 6ef888
	for (x = 2; x < GFS2_MAX_META_HEIGHT; x++){
Packit 6ef888
		space = sdp->sd_heightsize[x - 1] * sdp->sd_inptrs;
Packit 6ef888
		/* FIXME: Do we really need this first check?? */
Packit 6ef888
		if (space / sdp->sd_inptrs != sdp->sd_heightsize[x - 1] ||
Packit 6ef888
		    space % sdp->sd_inptrs != 0)
Packit 6ef888
			break;
Packit 6ef888
		sdp->sd_heightsize[x] = space;
Packit 6ef888
	}
Packit 6ef888
	if (x > GFS2_MAX_META_HEIGHT){
Packit 6ef888
		errno = E2BIG;
Packit 6ef888
		return -1;
Packit 6ef888
	}
Packit 6ef888
Packit 6ef888
	sdp->sd_jheightsize[0] = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode);
Packit 6ef888
	sdp->sd_jheightsize[1] = sdp->sd_jbsize * sdp->sd_diptrs;
Packit 6ef888
	for (x = 2; ; x++){
Packit 6ef888
		space = sdp->sd_jheightsize[x - 1] * sdp->sd_inptrs;
Packit 6ef888
		if (space / sdp->sd_inptrs != sdp->sd_jheightsize[x - 1] ||
Packit 6ef888
			space % sdp->sd_inptrs != 0)
Packit 6ef888
			break;
Packit 6ef888
		sdp->sd_jheightsize[x] = space;
Packit 6ef888
	}
Packit 6ef888
	sdp->sd_max_jheight = x;
Packit 6ef888
	if(sdp->sd_max_jheight > GFS2_MAX_META_HEIGHT) {
Packit 6ef888
		errno = E2BIG;
Packit 6ef888
		return -1;
Packit 6ef888
	}
Packit 6ef888
	sdp->fssize = lseek(sdp->device_fd, 0, SEEK_END) / sdp->sd_sb.sb_bsize;
Packit 6ef888
	sdp->sd_blocks_per_bitmap = (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_meta_header))
Packit 6ef888
	                             * GFS2_NBBY;
Packit 6ef888
	sdp->qcsize = GFS2_DEFAULT_QCSIZE;
Packit 6ef888
Packit 6ef888
	return 0;
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
/* rgd_seems_sane - check some general things about the rindex entry
Packit 6ef888
 *
Packit 6ef888
 * If rg lengths are not consistent, it's not sane (or it's converted from
Packit 6ef888
 * gfs1). The first RG will be a different length due to space reserved for
Packit 6ef888
 * the superblock, so we can't detect this until we check rgrp 3, when we
Packit 6ef888
 * can compare the distance between rgrp 1 and rgrp 2.
Packit 6ef888
 *
Packit 6ef888
 * Returns: 1 if the rgd seems relatively sane
Packit 6ef888
 */
Packit 6ef888
static int rgd_seems_sane(struct gfs2_sbd *sdp, struct rgrp_tree *rgd)
Packit 6ef888
{
Packit 6ef888
	uint32_t most_bitmaps_possible;
Packit 6ef888
Packit 6ef888
	/* rg length must be at least 1 */
Packit 6ef888
	if (rgd->ri.ri_length == 0)
Packit 6ef888
		return 0;
Packit 6ef888
Packit 6ef888
	/* A max rgrp, 2GB, divided into blocksize, divided by blocks/byte
Packit 6ef888
	   represented in the bitmap, NBBY. Rough approximation only, due to
Packit 6ef888
	   metadata headers. I'm doing the math this way to avoid overflow. */
Packit 6ef888
	most_bitmaps_possible = (GFS2_MAX_RGSIZE * 1024 * 256) / sdp->bsize;
Packit 6ef888
	if (rgd->ri.ri_length > most_bitmaps_possible)
Packit 6ef888
		return 0;
Packit 6ef888
Packit 6ef888
	if (rgd->ri.ri_data0 != rgd->ri.ri_addr + rgd->ri.ri_length)
Packit 6ef888
		return 0;
Packit 6ef888
Packit 6ef888
	if (rgd->ri.ri_bitbytes != rgd->ri.ri_data / GFS2_NBBY)
Packit 6ef888
		return 0;
Packit 6ef888
Packit 6ef888
	return 1;
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
/* good_on_disk - check if the rindex points to what looks like an rgrp on disk
Packit 6ef888
 *
Packit 6ef888
 * This is only called when the rindex pointers aren't spaced evenly, which
Packit 6ef888
 * isn't often. The rindex is pointing to an unexpected location, so we
Packit 6ef888
 * check if the block it is pointing to is really an rgrp. If so, we count the
Packit 6ef888
 * rindex entry as "sane" (after all, it did pass the previous checks above.)
Packit 6ef888
 * If not, we count it as not sane, and therefore, the whole rindex is not to
Packit 6ef888
 * be trusted by fsck.gfs2.
Packit 6ef888
 */
Packit 6ef888
static int good_on_disk(struct gfs2_sbd *sdp, struct rgrp_tree *rgd)
Packit 6ef888
{
Packit 6ef888
	struct gfs2_buffer_head *bh;
Packit 6ef888
	int is_rgrp;
Packit 6ef888
Packit 6ef888
	bh = bread(sdp, rgd->ri.ri_addr);
Packit 6ef888
	is_rgrp = (gfs2_check_meta(bh, GFS2_METATYPE_RG) == 0);
Packit 6ef888
	brelse(bh);
Packit 6ef888
	return is_rgrp;
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
/**
Packit 6ef888
 * rindex_read - read in the rg index file
Packit 6ef888
 * @sdp: the incore superblock pointer
Packit 6ef888
 * fd: optional file handle for rindex file (if meta_fs file system is mounted)
Packit 6ef888
 *     (if fd is <= zero, it will read from raw device)
Packit 6ef888
 * @count1: return count of the rgs.
Packit 6ef888
 * @sane: return whether rindex is consistent
Packit 6ef888
 *
Packit 6ef888
 * Returns: 0 on success, -1 on failure
Packit 6ef888
 */
Packit 6ef888
int rindex_read(struct gfs2_sbd *sdp, int fd, uint64_t *count1, int *sane)
Packit 6ef888
{
Packit 6ef888
	unsigned int rg;
Packit 6ef888
	int error;
Packit 6ef888
	union {
Packit 6ef888
		struct gfs2_rindex bufgfs2;
Packit 6ef888
	} buf;
Packit 6ef888
	struct gfs2_rindex ri;
Packit 6ef888
	struct rgrp_tree *rgd = NULL, *prev_rgd = NULL;
Packit 6ef888
	uint64_t prev_length = 0;
Packit 6ef888
Packit 6ef888
	*sane = 1;
Packit 6ef888
	*count1 = 0;
Packit 6ef888
	if (!fd && sdp->md.riinode->i_di.di_size % sizeof(struct gfs2_rindex))
Packit 6ef888
		*sane = 0; /* rindex file size must be a multiple of 96 */
Packit 6ef888
	for (rg = 0; ; rg++) {
Packit 6ef888
		if (fd > 0)
Packit 6ef888
			error = read(fd, &buf, sizeof(struct gfs2_rindex));
Packit 6ef888
		else
Packit 6ef888
			error = gfs2_readi(sdp->md.riinode,
Packit 6ef888
					   (char *)&buf.bufgfs2,
Packit 6ef888
					   rg * sizeof(struct gfs2_rindex),
Packit 6ef888
					   sizeof(struct gfs2_rindex));
Packit 6ef888
		if (!error)
Packit 6ef888
			break;
Packit 6ef888
		if (error != sizeof(struct gfs2_rindex))
Packit 6ef888
			return -1;
Packit 6ef888
Packit 6ef888
		gfs2_rindex_in(&ri, (char *)&buf.bufgfs2);
Packit 6ef888
		if (gfs2_check_range(sdp, ri.ri_addr) != 0) {
Packit 6ef888
			*sane = 0;
Packit 6ef888
			if (prev_rgd == NULL)
Packit 6ef888
				continue;
Packit 6ef888
			ri.ri_addr = prev_rgd->ri.ri_addr + prev_rgd->length;
Packit 6ef888
		}
Packit 6ef888
		rgd = rgrp_insert(&sdp->rgtree, ri.ri_addr);
Packit 6ef888
		memcpy(&rgd->ri, &ri, sizeof(struct gfs2_rindex));
Packit 6ef888
Packit 6ef888
		rgd->start = rgd->ri.ri_addr;
Packit 6ef888
		if (prev_rgd) {
Packit 6ef888
			/* If rg addresses go backwards, it's not sane
Packit 6ef888
			   (or it's converted from gfs1). */
Packit 6ef888
			if (!sdp->gfs1) {
Packit 6ef888
				if (prev_rgd->start >= rgd->start)
Packit 6ef888
					*sane = 0;
Packit 6ef888
				else if (!rgd_seems_sane(sdp, rgd))
Packit 6ef888
					*sane = 0;
Packit 6ef888
				else if (*sane && rg > 2 && prev_length &&
Packit 6ef888
				    prev_length != rgd->start -
Packit 6ef888
				    prev_rgd->start)
Packit 6ef888
					*sane = good_on_disk(sdp, rgd);
Packit 6ef888
			}
Packit 6ef888
			prev_length = rgd->start - prev_rgd->start;
Packit 6ef888
			prev_rgd->length = rgrp_size(prev_rgd);
Packit 6ef888
		}
Packit 6ef888
Packit 6ef888
		if(gfs2_compute_bitstructs(sdp->sd_sb.sb_bsize, rgd))
Packit 6ef888
			*sane = 0;
Packit 6ef888
Packit 6ef888
		(*count1)++;
Packit 6ef888
		prev_rgd = rgd;
Packit 6ef888
	}
Packit 6ef888
	if (prev_rgd)
Packit 6ef888
		prev_rgd->length = rgrp_size(prev_rgd);
Packit 6ef888
	if (*count1 == 0)
Packit 6ef888
		return -1;
Packit 6ef888
	return 0;
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
#define RA_WINDOW 32
Packit 6ef888
Packit 6ef888
static unsigned gfs2_rgrp_reada(struct gfs2_sbd *sdp, unsigned cur_window,
Packit 6ef888
				struct osi_node *n)
Packit 6ef888
{
Packit 6ef888
	struct rgrp_tree *rgd;
Packit 6ef888
	unsigned i;
Packit 6ef888
	off_t start, len;
Packit 6ef888
Packit 6ef888
	for (i = 0; i < RA_WINDOW; i++, n = osi_next(n)) {
Packit 6ef888
		if (n == NULL)
Packit 6ef888
			return i;
Packit 6ef888
		if (i < cur_window)
Packit 6ef888
			continue;
Packit 6ef888
		rgd = (struct rgrp_tree *)n;
Packit 6ef888
		start = rgd->ri.ri_addr * sdp->bsize;
Packit 6ef888
		len = rgd->ri.ri_length * sdp->bsize;
Packit 6ef888
		posix_fadvise(sdp->device_fd, start, len, POSIX_FADV_WILLNEED);
Packit 6ef888
	}
Packit 6ef888
Packit 6ef888
	return i;
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
/**
Packit 6ef888
 * ri_update - attach rgrps to the super block
Packit 6ef888
 * @sdp: incore superblock data
Packit 6ef888
 * fd: optional file handle for rindex (through the meta_fs)
Packit 6ef888
 * @rgcount: returned count of rgs
Packit 6ef888
 *
Packit 6ef888
 * Given the rgrp index inode, link in all rgrps into the super block
Packit 6ef888
 * and be sure that they can be read.
Packit 6ef888
 *
Packit 6ef888
 * Returns: 0 on success, -1 on failure.
Packit 6ef888
 */
Packit 6ef888
static int __ri_update(struct gfs2_sbd *sdp, int fd, int *rgcount, int *sane,
Packit 6ef888
		       int quiet)
Packit 6ef888
{
Packit 6ef888
	struct rgrp_tree *rgd;
Packit 6ef888
	struct gfs2_rindex *ri;
Packit 6ef888
	uint64_t count1 = 0, count2 = 0;
Packit 6ef888
	uint64_t errblock = 0;
Packit 6ef888
	uint64_t rmax = 0;
Packit 6ef888
	struct osi_node *n, *next = NULL;
Packit 6ef888
	unsigned ra_window = 0;
Packit 6ef888
Packit 6ef888
	/* Turn off generic readhead */
Packit 6ef888
	posix_fadvise(sdp->device_fd, 0, 0, POSIX_FADV_RANDOM);
Packit 6ef888
Packit 6ef888
	if (rindex_read(sdp, fd, &count1, sane))
Packit 6ef888
		goto fail;
Packit 6ef888
	for (n = osi_first(&sdp->rgtree); n; n = next) {
Packit 6ef888
		next = osi_next(n);
Packit 6ef888
		rgd = (struct rgrp_tree *)n;
Packit 6ef888
		/* Readahead resource group headers */
Packit 6ef888
		if (ra_window < RA_WINDOW/2)
Packit 6ef888
			ra_window = gfs2_rgrp_reada(sdp, ra_window, n);
Packit 6ef888
		/* Read resource group header */
Packit 6ef888
		errblock = gfs2_rgrp_read(sdp, rgd);
Packit 6ef888
		if (errblock)
Packit 6ef888
			return errblock;
Packit 6ef888
		ra_window--;
Packit 6ef888
		count2++;
Packit 6ef888
		if (!quiet && count2 % 100 == 0) {
Packit 6ef888
			printf(".");
Packit 6ef888
			fflush(stdout);
Packit 6ef888
		}
Packit 6ef888
		ri = &rgd->ri;
Packit 6ef888
		if (ri->ri_data0 + ri->ri_data - 1 > rmax)
Packit 6ef888
			rmax = ri->ri_data0 + ri->ri_data - 1;
Packit 6ef888
	}
Packit 6ef888
Packit 6ef888
	sdp->fssize = rmax;
Packit 6ef888
	*rgcount = count1;
Packit 6ef888
	if (count1 != count2)
Packit 6ef888
		goto fail;
Packit 6ef888
Packit 6ef888
	posix_fadvise(sdp->device_fd, 0, 0, POSIX_FADV_NORMAL);
Packit 6ef888
	return 0;
Packit 6ef888
Packit 6ef888
 fail:
Packit 6ef888
	posix_fadvise(sdp->device_fd, 0, 0, POSIX_FADV_NORMAL);
Packit 6ef888
	gfs2_rgrp_free(&sdp->rgtree);
Packit 6ef888
	return -1;
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
int ri_update(struct gfs2_sbd *sdp, int fd, int *rgcount, int *sane)
Packit 6ef888
{
Packit 6ef888
	return __ri_update(sdp, fd, rgcount, sane, 1);
Packit 6ef888
}
Packit 6ef888
Packit 6ef888
/**
Packit 6ef888
 * gfs1_ri_update - attach rgrps to the super block
Packit 6ef888
 *                  Stolen from libgfs2/super.c, but modified to handle gfs1.
Packit 6ef888
 * @sdp:
Packit 6ef888
 *
Packit 6ef888
 * Given the rgrp index inode, link in all rgrps into the super block
Packit 6ef888
 * and be sure that they can be read.
Packit 6ef888
 *
Packit 6ef888
 * Returns: 0 on success, -1 on failure.
Packit 6ef888
 */
Packit 6ef888
int gfs1_ri_update(struct gfs2_sbd *sdp, int fd, int *rgcount, int quiet)
Packit 6ef888
{
Packit 6ef888
	int sane;
Packit 6ef888
Packit 6ef888
	return __ri_update(sdp, fd, rgcount, &sane, quiet);
Packit 6ef888
}