/* * Copyright (C) 2001-2004 Sistina Software, Inc. All rights reserved. * Copyright (C) 2004 Red Hat, Inc. All rights reserved. * * This file is part of LVM2. * * This copyrighted material is made available to anyone wishing to use, * modify, copy, or redistribute it subject to the terms and conditions * of the GNU General Public License v.2. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software Foundation, * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ #include "lib.h" #include "disk-rep.h" #include "pool.h" #include "hash.h" #include "limits.h" #include "list.h" #include "display.h" #include "toolcontext.h" #include "lvmcache.h" #include "lvm1-label.h" #include "format1.h" #include "segtype.h" #define FMT_LVM1_NAME "lvm1" /* VG consistency checks */ static int _check_vgs(struct list *pvs, int *partial) { struct list *pvh, *t; struct disk_list *dl = NULL; struct disk_list *first = NULL; uint32_t pv_count = 0; uint32_t exported = 0; int first_time = 1; *partial = 0; /* * If there are exported and unexported PVs, ignore exported ones. * This means an active VG won't be affected if disks are inserted * bearing an exported VG with the same name. */ list_iterate(pvh, pvs) { dl = list_item(pvh, struct disk_list); if (first_time) { exported = dl->pvd.pv_status & VG_EXPORTED; first_time = 0; continue; } if (exported != (dl->pvd.pv_status & VG_EXPORTED)) { /* Remove exported PVs */ list_iterate_safe(pvh, t, pvs) { dl = list_item(pvh, struct disk_list); if (dl->pvd.pv_status & VG_EXPORTED) list_del(pvh); } break; } } /* Remove any PVs with VG structs that differ from the first */ list_iterate_safe(pvh, t, pvs) { dl = list_item(pvh, struct disk_list); if (!first) first = dl; else if (memcmp(&first->vgd, &dl->vgd, sizeof(first->vgd))) { log_error("VG data differs between PVs %s and %s", dev_name(first->dev), dev_name(dl->dev)); log_debug("VG data on %s: %s %s %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32, dev_name(first->dev), first->vgd.vg_uuid, first->vgd.vg_name_dummy, first->vgd.vg_number, first->vgd.vg_access, first->vgd.vg_status, first->vgd.lv_max, first->vgd.lv_cur, first->vgd.lv_open, first->vgd.pv_max, first->vgd.pv_cur, first->vgd.pv_act, first->vgd.dummy, first->vgd.vgda, first->vgd.pe_size, first->vgd.pe_total, first->vgd.pe_allocated, first->vgd.pvg_total); log_debug("VG data on %s: %s %s %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32 " %" PRIu32, dev_name(dl->dev), dl->vgd.vg_uuid, dl->vgd.vg_name_dummy, dl->vgd.vg_number, dl->vgd.vg_access, dl->vgd.vg_status, dl->vgd.lv_max, dl->vgd.lv_cur, dl->vgd.lv_open, dl->vgd.pv_max, dl->vgd.pv_cur, dl->vgd.pv_act, dl->vgd.dummy, dl->vgd.vgda, dl->vgd.pe_size, dl->vgd.pe_total, dl->vgd.pe_allocated, dl->vgd.pvg_total); list_del(pvh); if (partial_mode()) { *partial = 1; continue; } return 0; } pv_count++; } /* On entry to fn, list known to be non-empty */ if (pv_count != first->vgd.pv_cur) { log_error("%d PV(s) found for VG %s: expected %d", pv_count, first->pvd.vg_name, first->vgd.pv_cur); if (!partial_mode()) return 0; *partial = 1; } return 1; } static struct volume_group *_build_vg(struct format_instance *fid, struct list *pvs) { struct pool *mem = fid->fmt->cmd->mem; struct volume_group *vg = pool_alloc(mem, sizeof(*vg)); struct disk_list *dl; int partial; if (!vg) goto bad; if (list_empty(pvs)) goto bad; memset(vg, 0, sizeof(*vg)); vg->cmd = fid->fmt->cmd; vg->fid = fid; vg->seqno = 0; list_init(&vg->pvs); list_init(&vg->lvs); list_init(&vg->tags); if (!_check_vgs(pvs, &partial)) goto bad; dl = list_item(pvs->n, struct disk_list); if (!import_vg(mem, vg, dl, partial)) goto bad; if (!import_pvs(fid->fmt, mem, vg, pvs, &vg->pvs, &vg->pv_count)) goto bad; if (!import_lvs(mem, vg, pvs)) goto bad; if (!import_extents(fid->fmt->cmd, vg, pvs)) goto bad; if (!import_snapshots(mem, vg, pvs)) goto bad; return vg; bad: stack; pool_free(mem, vg); return NULL; } static struct volume_group *_vg_read(struct format_instance *fid, const char *vg_name, struct metadata_area *mda) { struct pool *mem = pool_create("lvm1 vg_read", 1024 * 10); struct list pvs; struct volume_group *vg = NULL; list_init(&pvs); if (!mem) { stack; return NULL; } /* Strip dev_dir if present */ vg_name = strip_dir(vg_name, fid->fmt->cmd->dev_dir); if (!read_pvs_in_vg (fid->fmt, vg_name, fid->fmt->cmd->filter, mem, &pvs)) { stack; goto bad; } if (!(vg = _build_vg(fid, &pvs))) { stack; goto bad; } bad: pool_destroy(mem); return vg; } static struct disk_list *_flatten_pv(struct format_instance *fid, struct pool *mem, struct volume_group *vg, struct physical_volume *pv, const char *dev_dir) { struct disk_list *dl = pool_alloc(mem, sizeof(*dl)); if (!dl) { stack; return NULL; } dl->mem = mem; dl->dev = pv->dev; list_init(&dl->uuids); list_init(&dl->lvds); if (!export_pv(fid->fmt->cmd, mem, vg, &dl->pvd, pv) || !export_vg(&dl->vgd, vg) || !export_uuids(dl, vg) || !export_lvs(dl, vg, pv, dev_dir) || !calculate_layout(dl)) { stack; pool_free(mem, dl); return NULL; } return dl; } static int _flatten_vg(struct format_instance *fid, struct pool *mem, struct volume_group *vg, struct list *pvds, const char *dev_dir, struct dev_filter *filter) { struct list *pvh; struct pv_list *pvl; struct disk_list *data; list_iterate(pvh, &vg->pvs) { pvl = list_item(pvh, struct pv_list); if (!(data = _flatten_pv(fid, mem, vg, pvl->pv, dev_dir))) { stack; return 0; } list_add(pvds, &data->list); } export_numbers(pvds, vg); export_pv_act(pvds); if (!export_vg_number(fid, pvds, vg->name, filter)) { stack; return 0; } return 1; } static int _vg_write(struct format_instance *fid, struct volume_group *vg, struct metadata_area *mda) { struct pool *mem = pool_create("lvm1 vg_write", 1024 * 10); struct list pvds; int r = 0; if (!mem) { stack; return 0; } list_init(&pvds); r = (_flatten_vg(fid, mem, vg, &pvds, fid->fmt->cmd->dev_dir, fid->fmt->cmd->filter) && write_disks(fid->fmt, &pvds)); lvmcache_update_vg(vg); pool_destroy(mem); return r; } static int _pv_read(const struct format_type *fmt, const char *pv_name, struct physical_volume *pv, struct list *mdas) { struct pool *mem = pool_create("lvm1 pv_read", 1024); struct disk_list *dl; struct device *dev; int r = 0; log_very_verbose("Reading physical volume data %s from disk", pv_name); if (!mem) { stack; return 0; } if (!(dev = dev_cache_get(pv_name, fmt->cmd->filter))) { stack; goto out; } if (!(dl = read_disk(fmt, dev, mem, NULL))) { stack; goto out; } if (!import_pv(fmt->cmd->mem, dl->dev, NULL, pv, &dl->pvd)) { stack; goto out; } pv->fmt = fmt; r = 1; out: pool_destroy(mem); return r; } static int _pv_setup(const struct format_type *fmt, uint64_t pe_start, uint32_t extent_count, uint32_t extent_size, int pvmetadatacopies, uint64_t pvmetadatasize, struct list *mdas, struct physical_volume *pv, struct volume_group *vg) { if (pv->size > MAX_PV_SIZE) pv->size--; if (pv->size > MAX_PV_SIZE) { log_error("Physical volumes cannot be bigger than %s", display_size(fmt->cmd, (uint64_t) MAX_PV_SIZE, SIZE_SHORT)); return 0; } /* Nothing more to do if extent size isn't provided */ if (!extent_size) return 1; /* * This works out pe_start and pe_count. */ if (!calculate_extent_count(pv, extent_size, extent_count, pe_start)) { stack; return 0; } /* Retain existing extent locations exactly */ if (((pe_start || extent_count) && (pe_start != pv->pe_start)) || (extent_count && (extent_count != pv->pe_count))) { log_error("Metadata would overwrite physical extents"); return 0; } return 1; } static int _lv_setup(struct format_instance *fid, struct logical_volume *lv) { uint64_t max_size = UINT_MAX; if (!*lv->lvid.s) lvid_from_lvnum(&lv->lvid, &lv->vg->id, find_free_lvnum(lv)); if (lv->le_count > MAX_LE_TOTAL) { log_error("logical volumes cannot contain more than " "%d extents.", MAX_LE_TOTAL); return 0; } if (lv->size > max_size) { log_error("logical volumes cannot be larger than %s", display_size(fid->fmt->cmd, max_size, SIZE_SHORT)); return 0; } return 1; } static int _pv_write(const struct format_type *fmt, struct physical_volume *pv, struct list *mdas, int64_t sector) { struct pool *mem; struct disk_list *dl; struct list pvs; struct label *label; struct lvmcache_info *info; if (!(info = lvmcache_add(fmt->labeller, (char *) &pv->id, pv->dev, pv->vg_name, NULL))) { stack; return 0; } label = info->label; info->device_size = pv->size << SECTOR_SHIFT; info->fmt = fmt; list_init(&info->mdas); list_init(&pvs); /* Ensure any residual PE structure is gone */ pv->pe_size = pv->pe_count = 0; pv->pe_start = PE_ALIGN; if (!(mem = pool_create("lvm1 pv_write", 1024))) { stack; return 0; } if (!(dl = pool_alloc(mem, sizeof(*dl)))) { stack; goto bad; } dl->mem = mem; dl->dev = pv->dev; if (!export_pv(fmt->cmd, mem, NULL, &dl->pvd, pv)) { stack; goto bad; } /* must be set to be able to zero gap after PV structure in dev_write in order to make other disk tools happy */ dl->pvd.pv_on_disk.base = METADATA_BASE; dl->pvd.pv_on_disk.size = PV_SIZE; dl->pvd.pe_on_disk.base = PE_ALIGN << SECTOR_SHIFT; list_add(&pvs, &dl->list); if (!write_disks(fmt, &pvs)) { stack; goto bad; } pool_destroy(mem); return 1; bad: pool_destroy(mem); return 0; } static int _vg_setup(struct format_instance *fid, struct volume_group *vg) { /* just check max_pv and max_lv */ if (!vg->max_lv || vg->max_lv >= MAX_LV) vg->max_lv = MAX_LV - 1; if (!vg->max_pv || vg->max_pv >= MAX_PV) vg->max_pv = MAX_PV - 1; if (vg->extent_size > MAX_PE_SIZE || vg->extent_size < MIN_PE_SIZE) { log_error("Extent size must be between %s and %s", display_size(fid->fmt->cmd, (uint64_t) MIN_PE_SIZE, SIZE_SHORT), display_size(fid->fmt->cmd, (uint64_t) MAX_PE_SIZE, SIZE_SHORT)); return 0; } if (vg->extent_size % MIN_PE_SIZE) { log_error("Extent size must be multiple of %s", display_size(fid->fmt->cmd, (uint64_t) MIN_PE_SIZE, SIZE_SHORT)); return 0; } /* Redundant? */ if (vg->extent_size & (vg->extent_size - 1)) { log_error("Extent size must be power of 2"); return 0; } return 1; } static int _segtype_supported (struct format_instance *fid, struct segment_type *segtype) { if (!(segtype->flags & SEG_FORMAT1_SUPPORT)) { stack; return 0; } return 1; } static struct metadata_area_ops _metadata_format1_ops = { vg_read:_vg_read, vg_write:_vg_write, }; static struct format_instance *_create_instance(const struct format_type *fmt, const char *vgname, void *private) { struct format_instance *fid; struct metadata_area *mda; if (!(fid = pool_alloc(fmt->cmd->mem, sizeof(*fid)))) { stack; return NULL; } fid->fmt = fmt; list_init(&fid->metadata_areas); /* Define a NULL metadata area */ if (!(mda = pool_alloc(fmt->cmd->mem, sizeof(*mda)))) { stack; pool_free(fmt->cmd->mem, fid); return NULL; } mda->ops = &_metadata_format1_ops; mda->metadata_locn = NULL; list_add(&fid->metadata_areas, &mda->list); return fid; } static void _destroy_instance(struct format_instance *fid) { return; } static void _destroy(const struct format_type *fmt) { dbg_free((void *) fmt); } static struct format_handler _format1_ops = { pv_read:_pv_read, pv_setup:_pv_setup, pv_write:_pv_write, lv_setup:_lv_setup, vg_setup:_vg_setup, segtype_supported:_segtype_supported, create_instance:_create_instance, destroy_instance:_destroy_instance, destroy:_destroy, }; #ifdef LVM1_INTERNAL struct format_type *init_lvm1_format(struct cmd_context *cmd) #else /* Shared */ struct format_type *init_format(struct cmd_context *cmd); struct format_type *init_format(struct cmd_context *cmd) #endif { struct format_type *fmt = dbg_malloc(sizeof(*fmt)); if (!fmt) { stack; return NULL; } fmt->cmd = cmd; fmt->ops = &_format1_ops; fmt->name = FMT_LVM1_NAME; fmt->alias = NULL; fmt->features = FMT_RESTRICTED_LVIDS | FMT_ORPHAN_ALLOCATABLE; fmt->private = NULL; if (!(fmt->labeller = lvm1_labeller_create(fmt))) { log_error("Couldn't create lvm1 label handler."); return NULL; } if (!(label_register_handler(FMT_LVM1_NAME, fmt->labeller))) { log_error("Couldn't register lvm1 label handler."); return NULL; } log_very_verbose("Initialised format: %s", fmt->name); return fmt; }