/* * Copyright (C) 2001 Sistina Software * * This file is released under the LGPL. */ #include "lib.h" #include "metadata.h" #include "locking.h" #include "pv_map.h" #include "lvm-string.h" #include "toolcontext.h" #include "lv_alloc.h" /* * These functions adjust the pe counts in pv's * after we've added or removed segments. */ static void _get_extents(struct lv_segment *seg) { unsigned int s, count; struct physical_volume *pv; for (s = 0; s < seg->area_count; s++) { if (seg->area[s].type != AREA_PV) continue; pv = seg->area[s].u.pv.pv; count = seg->area_len; pv->pe_alloc_count += count; } } static void _put_extents(struct lv_segment *seg) { unsigned int s, count; struct physical_volume *pv; for (s = 0; s < seg->area_count; s++) { if (seg->area[s].type != AREA_PV) continue; pv = seg->area[s].u.pv.pv; if (pv) { count = seg->area_len; assert(pv->pe_alloc_count >= count); pv->pe_alloc_count -= count; } } } struct lv_segment *alloc_lv_segment(struct pool *mem, uint32_t stripes) { struct lv_segment *seg; uint32_t len = sizeof(*seg) + (stripes * sizeof(seg->area[0])); if (!(seg = pool_zalloc(mem, len))) { stack; return NULL; } return seg; } static int _alloc_stripe_area(struct logical_volume *lv, uint32_t stripes, uint32_t stripe_size, struct pv_area **areas, uint32_t *ix) { uint32_t count = lv->le_count - *ix; uint32_t area_len = count / stripes; uint32_t smallest = areas[stripes - 1]->count; uint32_t s; struct lv_segment *seg; if (smallest < area_len) area_len = smallest; if (!(seg = alloc_lv_segment(lv->vg->cmd->mem, stripes))) { log_err("Couldn't allocate new stripe segment."); return 0; } seg->lv = lv; seg->type = SEG_STRIPED; seg->le = *ix; seg->len = area_len * stripes; seg->area_len = area_len; seg->area_count = stripes; seg->stripe_size = stripe_size; for (s = 0; s < stripes; s++) { struct pv_area *pva = areas[s]; seg->area[s].type = AREA_PV; seg->area[s].u.pv.pv = pva->map->pvl->pv; seg->area[s].u.pv.pe = pva->start; consume_pv_area(pva, area_len); } list_add(&lv->segments, &seg->list); *ix += seg->len; return 1; } static int _comp_area(const void *l, const void *r) { const struct pv_area *lhs = *((const struct pv_area **) l); const struct pv_area *rhs = *((const struct pv_area **) r); if (lhs->count < rhs->count) return 1; else if (lhs->count > rhs->count) return -1; return 0; } static int _alloc_striped(struct logical_volume *lv, struct list *pvms, uint32_t allocated, uint32_t stripes, uint32_t stripe_size) { int r = 0; struct list *pvmh; struct pv_area **areas; unsigned int pv_count = 0, ix; struct pv_map *pvm; size_t len; list_iterate(pvmh, pvms) pv_count++; /* allocate an array of pv_areas, one candidate per pv */ len = sizeof(*areas) * pv_count; if (!(areas = dbg_malloc(sizeof(*areas) * pv_count))) { log_err("Couldn't allocate areas array."); return 0; } while (allocated != lv->le_count) { ix = 0; list_iterate(pvmh, pvms) { pvm = list_item(pvmh, struct pv_map); if (list_empty(&pvm->areas)) continue; areas[ix++] = list_item(pvm->areas.n, struct pv_area); } if (ix < stripes) { log_error("Insufficient allocatable extents suitable " "for striping for logical volume " "%s: %u required", lv->name, lv->le_count); goto out; } /* sort the areas so we allocate from the biggest */ qsort(areas, ix, sizeof(*areas), _comp_area); if (!_alloc_stripe_area(lv, stripes, stripe_size, areas, &allocated)) { stack; goto out; } } r = 1; out: dbg_free(areas); return r; } /* * The heart of the allocation code. This function takes a * pv_area and allocates it to the lv. If the lv doesn't need * the complete area then the area is split, otherwise the area * is unlinked from the pv_map. */ static int _alloc_linear_area(struct logical_volume *lv, uint32_t *ix, struct pv_map *map, struct pv_area *pva) { uint32_t count, remaining; struct lv_segment *seg; count = pva->count; remaining = lv->le_count - *ix; if (count > remaining) count = remaining; if (!(seg = alloc_lv_segment(lv->vg->cmd->mem, 1))) { log_err("Couldn't allocate new stripe segment."); return 0; } seg->lv = lv; seg->type = SEG_STRIPED; seg->le = *ix; seg->len = count; seg->area_len = count; seg->stripe_size = 0; seg->area_count = 1; seg->area[0].type = AREA_PV; seg->area[0].u.pv.pv = map->pvl->pv; seg->area[0].u.pv.pe = pva->start; list_add(&lv->segments, &seg->list); consume_pv_area(pva, count); *ix += count; return 1; } static int _alloc_mirrored_area(struct logical_volume *lv, uint32_t *ix, struct pv_map *map, struct pv_area *pva, struct physical_volume *mirrored_pv, uint32_t mirrored_pe) { uint32_t count, remaining; struct lv_segment *seg; count = pva->count; remaining = lv->le_count - *ix; if (count > remaining) count = remaining; if (!(seg = alloc_lv_segment(lv->vg->cmd->mem, 2))) { log_err("Couldn't allocate new mirrored segment."); return 0; } seg->lv = lv; seg->type = SEG_MIRRORED; seg->status = 0u; seg->le = *ix; seg->len = count; seg->area_len = count; seg->stripe_size = 0; seg->area_count = 2; seg->extents_moved = 0u; /* FIXME Remove AREA_PV restriction here? */ seg->area[0].type = AREA_PV; seg->area[0].u.pv.pv = mirrored_pv; seg->area[0].u.pv.pe = mirrored_pe; seg->area[1].type = AREA_PV; seg->area[1].u.pv.pv = map->pvl->pv; seg->area[1].u.pv.pe = pva->start; list_add(&lv->segments, &seg->list); consume_pv_area(pva, count); *ix += count; return 1; } /* * Only one area per pv is allowed, so we search * for the biggest area, or the first area that * can complete the allocation. */ /* * FIXME: subsequent lvextends may not be contiguous. */ static int _alloc_contiguous(struct logical_volume *lv, struct list *pvms, uint32_t allocated) { struct list *tmp1; struct pv_map *pvm; struct pv_area *pva; list_iterate(tmp1, pvms) { pvm = list_item(tmp1, struct pv_map); if (list_empty(&pvm->areas)) continue; /* first item in the list is the biggest */ pva = list_item(pvm->areas.n, struct pv_area); if (pva->count < lv->le_count) continue; if (!_alloc_linear_area(lv, &allocated, pvm, pva)) { stack; return 0; } break; } if (allocated != lv->le_count) { log_error("Insufficient allocatable extents (%u) " "for logical volume %s: %u required", allocated, lv->name, lv->le_count); return 0; } return 1; } /* FIXME Contiguous depends on *segment* (i.e. stripe) not LV */ static int _alloc_mirrored(struct logical_volume *lv, struct list *pvms, uint32_t allocated, struct physical_volume *mirrored_pv, uint32_t mirrored_pe) { struct list *tmp1; struct pv_map *pvm; struct pv_area *pva; uint32_t max_found = 0; /* Try each PV in turn */ list_iterate(tmp1, pvms) { pvm = list_item(tmp1, struct pv_map); if (list_empty(&pvm->areas)) continue; /* first item in the list is the biggest */ pva = list_item(pvm->areas.n, struct pv_area); if (pva->count < lv->le_count - allocated) { max_found = pva->count; continue; } if (!_alloc_mirrored_area(lv, &allocated, pvm, pva, mirrored_pv, mirrored_pe)) { stack; return 0; } break; } if (allocated != lv->le_count) { log_error("Insufficient contiguous allocatable extents (%u) " "for logical volume %s: %u required", allocated + max_found, lv->name, lv->le_count); return 0; } return 1; } /* * Areas just get allocated in order until the lv * is full. */ static int _alloc_next_free(struct logical_volume *lv, struct list *pvms, uint32_t allocated) { struct list *tmp1, *tmp2; struct pv_map *pvm; struct pv_area *pva; list_iterate(tmp1, pvms) { pvm = list_item(tmp1, struct pv_map); list_iterate(tmp2, &pvm->areas) { pva = list_item(tmp2, struct pv_area); if (!_alloc_linear_area(lv, &allocated, pvm, pva) || (allocated == lv->le_count)) goto done; } } done: if (allocated != lv->le_count) { log_error("Insufficient allocatable logical extents (%u) " "for logical volume %s: %u required", allocated, lv->name, lv->le_count); return 0; } return 1; } /* * Chooses a correct allocation policy. */ static int _allocate(struct volume_group *vg, struct logical_volume *lv, struct list *allocatable_pvs, uint32_t allocated, uint32_t stripes, uint32_t stripe_size, struct physical_volume *mirrored_pv, uint32_t mirrored_pe, uint32_t status) { int r = 0; struct pool *scratch; struct list *pvms, *old_tail = lv->segments.p, *segh; struct lv_segment *seg; if (!(scratch = pool_create(1024))) { stack; return 0; } /* * Build the sets of available areas on the pv's. */ if (!(pvms = create_pv_maps(scratch, vg, allocatable_pvs))) goto out; if (stripes > 1) r = _alloc_striped(lv, pvms, allocated, stripes, stripe_size); else if (mirrored_pv) r = _alloc_mirrored(lv, pvms, allocated, mirrored_pv, mirrored_pe); else if (lv->alloc == ALLOC_CONTIGUOUS) r = _alloc_contiguous(lv, pvms, allocated); else if (lv->alloc == ALLOC_NEXT_FREE || lv->alloc == ALLOC_DEFAULT) r = _alloc_next_free(lv, pvms, allocated); else { log_error("Unknown allocation policy: " "unable to setup logical volume."); goto out; } if (r) { vg->free_count -= lv->le_count - allocated; /* * Iterate through the new segments, updating pe * counts in pv's. */ for (segh = lv->segments.p; segh != old_tail; segh = segh->p) { seg = list_item(segh, struct lv_segment); _get_extents(seg); seg->status = status; } } else { /* * Put the segment list back how we found it. */ old_tail->n = &lv->segments; lv->segments.p = old_tail; } out: pool_destroy(scratch); return r; } static char *_generate_lv_name(struct volume_group *vg, const char *format, char *buffer, size_t len) { struct list *lvh; struct logical_volume *lv; int high = -1, i; list_iterate(lvh, &vg->lvs) { lv = (list_item(lvh, struct lv_list)->lv); if (sscanf(lv->name, format, &i) != 1) continue; if (i > high) high = i; } if (lvm_snprintf(buffer, len, format, high + 1) < 0) return NULL; return buffer; } struct logical_volume *lv_create_empty(struct format_instance *fi, const char *name, const char *name_format, uint32_t status, alloc_policy_t alloc, struct volume_group *vg) { struct cmd_context *cmd = vg->cmd; struct lv_list *ll = NULL; struct logical_volume *lv; char dname[32]; if (vg->max_lv && (vg->max_lv == vg->lv_count)) { log_error("Maximum number of logical volumes (%u) reached " "in volume group %s", vg->max_lv, vg->name); return NULL; } if (!name && !(name = _generate_lv_name(vg, name_format, dname, sizeof(dname)))) { log_error("Failed to generate unique name for the new " "logical volume"); return NULL; } log_verbose("Creating logical volume %s", name); if (!(ll = pool_zalloc(cmd->mem, sizeof(*ll))) || !(ll->lv = pool_zalloc(cmd->mem, sizeof(*ll->lv)))) { log_error("lv_list allocation failed"); if (ll) pool_free(cmd->mem, ll); return NULL; } lv = ll->lv; lv->vg = vg; if (!(lv->name = pool_strdup(cmd->mem, name))) { log_error("lv name strdup failed"); if (ll) pool_free(cmd->mem, ll); return NULL; } lv->status = status; lv->alloc = alloc; lv->read_ahead = 0; lv->major = -1; lv->minor = -1; lv->size = UINT64_C(0); lv->le_count = 0; list_init(&lv->segments); if (fi->fmt->ops->lv_setup && !fi->fmt->ops->lv_setup(fi, lv)) { stack; if (ll) pool_free(cmd->mem, ll); return NULL; } vg->lv_count++; list_add(&vg->lvs, &ll->list); return lv; } struct logical_volume *lv_create(struct format_instance *fi, const char *name, uint32_t status, alloc_policy_t alloc, uint32_t stripes, uint32_t stripe_size, uint32_t extents, struct volume_group *vg, struct list *allocatable_pvs) { struct logical_volume *lv; if (!extents) { log_error("Unable to create logical volume %s with no extents", name); return NULL; } if (vg->free_count < extents) { log_error("Insufficient free extents (%u) in volume group %s: " "%u required", vg->free_count, vg->name, extents); return NULL; } if (stripes > list_size(allocatable_pvs)) { log_error("Number of stripes (%u) must not exceed " "number of physical volumes (%d)", stripes, list_size(allocatable_pvs)); return NULL; } if (!(lv = lv_create_empty(fi, name, "lvol%d", status, alloc, vg))) { stack; return NULL; } lv->size = (uint64_t) extents *vg->extent_size; lv->le_count = extents; if (!_allocate(vg, lv, allocatable_pvs, 0u, stripes, stripe_size, NULL, 0u, 0u)) { stack; return NULL; } if (fi->fmt->ops->lv_setup && !fi->fmt->ops->lv_setup(fi, lv)) { stack; return NULL; } return lv; } int lv_reduce(struct format_instance *fi, struct logical_volume *lv, uint32_t extents) { struct list *segh; struct lv_segment *seg; uint32_t count = extents; for (segh = lv->segments.p; (segh != &lv->segments) && count; segh = segh->p) { seg = list_item(segh, struct lv_segment); if (seg->len <= count) { /* remove this segment completely */ count -= seg->len; _put_extents(seg); list_del(segh); } else { /* reduce this segment */ _put_extents(seg); seg->len -= count; _get_extents(seg); count = 0; } } lv->le_count -= extents; lv->size = (uint64_t) lv->le_count * lv->vg->extent_size; lv->vg->free_count += extents; if (fi->fmt->ops->lv_setup && !fi->fmt->ops->lv_setup(fi, lv)) { stack; return 0; } return 1; } int lv_extend(struct format_instance *fi, struct logical_volume *lv, uint32_t stripes, uint32_t stripe_size, uint32_t extents, struct list *allocatable_pvs) { uint32_t old_le_count = lv->le_count; uint64_t old_size = lv->size; lv->le_count += extents; lv->size += (uint64_t) extents *lv->vg->extent_size; if (!_allocate(lv->vg, lv, allocatable_pvs, old_le_count, stripes, stripe_size, NULL, 0u, 0u)) { lv->le_count = old_le_count; lv->size = old_size; stack; return 0; } if (!lv_merge_segments(lv)) { log_err("Couldn't merge segments after extending " "logical volume."); return 0; } if (fi->fmt->ops->lv_setup && !fi->fmt->ops->lv_setup(fi, lv)) { stack; return 0; } return 1; } int lv_extend_mirror(struct format_instance *fid, struct logical_volume *lv, struct physical_volume *mirrored_pv, uint32_t mirrored_pe, uint32_t extents, struct list *allocatable_pvs, uint32_t status) { uint32_t old_le_count = lv->le_count; uint64_t old_size = lv->size; lv->le_count += extents; lv->size += (uint64_t) extents *lv->vg->extent_size; if (!_allocate(lv->vg, lv, allocatable_pvs, old_le_count, 1, extents, mirrored_pv, mirrored_pe, status)) { lv->le_count = old_le_count; lv->size = old_size; stack; return 0; } if (fid->fmt->ops->lv_setup && !fid->fmt->ops->lv_setup(fid, lv)) { stack; return 0; } return 1; } int lv_remove(struct volume_group *vg, struct logical_volume *lv) { struct list *segh; struct lv_list *lvl; /* find the lv list */ if (!(lvl = find_lv_in_vg(vg, lv->name))) { stack; return 0; } /* iterate through the lv's segments freeing off the pe's */ list_iterate(segh, &lv->segments) _put_extents(list_item(segh, struct lv_segment)); vg->lv_count--; vg->free_count += lv->le_count; list_del(&lvl->list); return 1; } /* Unlock list of LVs */ int unlock_lvs(struct cmd_context *cmd, struct list *lvs) { struct list *lvh; struct logical_volume *lv; list_iterate(lvh, lvs) { lv = list_item(lvh, struct lv_list)->lv; unlock_lv(cmd, lv->lvid.s); } return 1; } /* Lock a list of LVs */ int lock_lvs(struct cmd_context *cmd, struct list *lvs, int flags) { struct list *lvh; struct logical_volume *lv; list_iterate(lvh, lvs) { lv = list_item(lvh, struct lv_list)->lv; if (!lock_vol(cmd, lv->lvid.s, flags)) { log_error("Failed to lock %s", lv->name); list_uniterate(lvh, lvs, lvh) { lv = list_item(lvh, struct lv_list)->lv; unlock_lv(cmd, lv->lvid.s); } return 0; } } return 1; } uint32_t find_free_lvnum(struct logical_volume *lv) { int lvnum_used[MAX_RESTRICTED_LVS + 1]; uint32_t i = 0; struct list *lvh; struct lv_list *lvl; int lvnum; memset(&lvnum_used, 0, sizeof(lvnum_used)); list_iterate(lvh, &lv->vg->lvs) { lvl = list_item(lvh, struct lv_list); lvnum = lvnum_from_lvid(&lvl->lv->lvid); if (lvnum <= MAX_RESTRICTED_LVS) lvnum_used[lvnum] = 1; } while (lvnum_used[i]) i++; return i; }