> Alexandre Derumier via pve-devel <pve-devel@lists.proxmox.com> hat am > 11.03.2025 11:28 CET geschrieben:
same here - please add some description about why things are implemented how they are.. else we have to dive through multiple threads of review discussions in 2 years when we want to find out ;) > Signed-off-by: Alexandre Derumier <alexandre.derum...@groupe-cyllene.com> > --- > src/PVE/Storage/LVMPlugin.pm | 228 ++++++++++++++++++++++++++++++++--- > 1 file changed, 210 insertions(+), 18 deletions(-) > > diff --git a/src/PVE/Storage/LVMPlugin.pm b/src/PVE/Storage/LVMPlugin.pm > index 38f7fa1..19dbd7e 100644 > --- a/src/PVE/Storage/LVMPlugin.pm > +++ b/src/PVE/Storage/LVMPlugin.pm > @@ -4,6 +4,7 @@ use strict; > use warnings; > > use IO::File; > +use POSIX qw/ceil/; > > use PVE::Tools qw(run_command trim); > use PVE::Storage::Plugin; > @@ -218,6 +219,7 @@ sub type { > sub plugindata { > return { > content => [ {images => 1, rootdir => 1}, { images => 1 }], > + format => [ { raw => 1, qcow2 => 1 } , 'raw' ], > }; > } > > @@ -293,7 +295,10 @@ sub parse_volname { > PVE::Storage::Plugin::parse_lvm_name($volname); > > if ($volname =~ m/^(vm-(\d+)-\S+)$/) { > - return ('images', $1, $2, undef, undef, undef, 'raw'); > + my $name = $1; > + my $vmid = $2; > + my $format = $volname =~ m/\.qcow2$/ ? 'qcow2' : 'raw'; this is really tricky and I am afraid there are still pitfalls/bugs here unless we add additional checks in places that a requested $format and the one in the name match.. > + return ('images', $name, $vmid, undef, undef, undef, $format); > } > > die "unable to parse lvm volume name '$volname'\n"; > @@ -302,11 +307,13 @@ sub parse_volname { > sub filesystem_path { > my ($class, $scfg, $volname, $snapname) = @_; > > - die "lvm snapshot is not implemented"if defined($snapname); > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > + $class->parse_volname($volname); > > - my ($vtype, $name, $vmid) = $class->parse_volname($volname); > + die "snapshot is working with qcow2 format only" if defined($snapname) > && $format ne 'qcow2'; > > my $vg = $scfg->{vgname}; > + $name = $class->get_snap_volname($volname, $snapname) if $snapname; > > my $path = "/dev/$vg/$name"; > > @@ -334,7 +341,9 @@ sub find_free_diskname { > > my $disk_list = [ keys %{$lvs->{$vg}} ]; > > - return PVE::Storage::Plugin::get_next_vm_diskname($disk_list, $storeid, > $vmid, undef, $scfg); > + $add_fmt_suffix = $fmt eq 'qcow2' ? 1 : undef; > + > + return PVE::Storage::Plugin::get_next_vm_diskname($disk_list, $storeid, > $vmid, $fmt, $scfg, $add_fmt_suffix); > } > > sub lvcreate { > @@ -363,9 +372,9 @@ sub lvrename { > } > > sub alloc_image { > - my ($class, $storeid, $scfg, $vmid, $fmt, $name, $size) = @_; > + my ($class, $storeid, $scfg, $vmid, $fmt, $name, $size, $backing) = @_; same as for the dir-based one - $backing as arbitrary path is not a good idea.. this should either be a snapshot $volname, or just the $snapname itself? > > - die "unsupported format '$fmt'" if $fmt ne 'raw'; > + die "unsupported format '$fmt'" if $fmt !~ m/(raw|qcow2)/; > > die "illegal name '$name' - should be 'vm-$vmid-*'\n" > if $name && $name !~ m/^vm-$vmid-/; > @@ -378,12 +387,36 @@ sub alloc_image { > > my $free = int($vgs->{$vg}->{free}); > > + > + #add extra space for qcow2 metadatas > + #without sub-allocated clusters : For 1TB storage : l2_size = disk_size > × 8 / cluster_size > + #with sub-allocated clusters : For 1TB storage : l2_size = disk_size × 8 > / cluster_size / 16 are these formulas valid for all disk sizes, or just for 1TB? > + #4MB overhead for 1TB with extented l2 > clustersize=128k so this means 1TB x 8 / 128K / 16 = 1GB / 256 = 4MB if the formula is generic, that means 1 GB of storage == 4KB of overhead, or 1MB of storage == 4 bytes of overhead? > + > + #can't use qemu-img measure, because it's not possible to define options > like clustersize && extended_l2 > + #verification has been done with : qemu-img create -f qcow2 -o > extended_l2=on,cluster_size=128k test.img 1G > + > + my $qcow2_overhead = ceil($size/1024/1024/1024) * 4096; above you say 4MB for 1TB, but here you go down to KB and then multiply by 4K? why not go down to MB and multiply by 4? > + > + my $lvmsize = $size; > + $lvmsize += $qcow2_overhead if $fmt eq 'qcow2'; > + > die "not enough free space ($free < $size)\n" if $free < $size; > > - $name = $class->find_free_diskname($storeid, $scfg, $vmid) > + $name = $class->find_free_diskname($storeid, $scfg, $vmid, $fmt) > if !$name; > > - lvcreate($vg, $name, $size, ["pve-vm-$vmid"]); > + my $tags = ["pve-vm-$vmid"]; > + #tags all snapshots volumes with the main volume tag for easier > activation of the whole group > + push @$tags, "\@pve-$name" if $fmt eq 'qcow2'; > + lvcreate($vg, $name, $lvmsize, $tags); > + > + if ($fmt eq 'qcow2') { > + #format the lvm volume with qcow2 format > + $class->activate_volume($storeid, $scfg, $name, undef, {}); the last two parameters are not needed.. > + my $path = $class->path($scfg, $name, $storeid); > + PVE::Storage::Plugin::qemu_img_create($scfg, $fmt, $size, $path, > $backing); > + } > > return $name; > } > @@ -538,6 +571,12 @@ sub activate_volume { > > my $lvm_activate_mode = 'ey'; > > + #activate volume && all snapshots volumes by tag > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > + $class->parse_volname($volname); > + > + $path = "\@pve-$name" if $format eq 'qcow2'; > + > my $cmd = ['/sbin/lvchange', "-a$lvm_activate_mode", $path]; > run_command($cmd, errmsg => "can't activate LV '$path'"); > $cmd = ['/sbin/lvchange', '--refresh', $path]; > @@ -550,6 +589,10 @@ sub deactivate_volume { > my $path = $class->path($scfg, $volname, $storeid, $snapname); > return if ! -b $path; > > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > + $class->parse_volname($volname); > + $path = "\@pve-$name" if $format eq 'qcow2'; > + > my $cmd = ['/sbin/lvchange', '-aln', $path]; > run_command($cmd, errmsg => "can't deactivate LV '$path'"); > } > @@ -557,15 +600,27 @@ sub deactivate_volume { > sub volume_resize { > my ($class, $scfg, $storeid, $volname, $size, $running) = @_; > > - $size = ($size/1024/1024) . "M"; > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > + $class->parse_volname($volname); > + > + my $lvmsize = $size / 1024; I don't really get this, see comments above for alloc_image > + my $qcow2_overhead = ceil($size/1024/1024/1024/1024) * 4096; > + $lvmsize += $qcow2_overhead if $format eq 'qcow2'; we definitely don't want to have this twice.. > + $lvmsize = "${lvmsize}k"; > > my $path = $class->path($scfg, $volname); > - my $cmd = ['/sbin/lvextend', '-L', $size, $path]; > + my $cmd = ['/sbin/lvextend', '-L', $lvmsize, $path]; > > $class->cluster_lock_storage($storeid, $scfg->{shared}, undef, sub { > run_command($cmd, errmsg => "error resizing volume '$path'"); > }); > > + if(!$running && $format eq 'qcow2') { > + my $prealloc_opt = > PVE::Storage::Plugin::preallocation_cmd_option($scfg, $format); > + my $cmd = ['/usr/bin/qemu-img', 'resize', "--$prealloc_opt", '-f', > $format, $path , $size]; > + run_command($cmd, timeout => 10); > + } > + > return 1; > } > > @@ -587,30 +642,159 @@ sub volume_size_info { > sub volume_snapshot { > my ($class, $scfg, $storeid, $volname, $snap) = @_; > > - die "lvm snapshot is not implemented"; > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > + $class->parse_volname($volname); > + > + die "can't snapshot this image format\n" if $format ne 'qcow2'; > + > + $class->activate_volume($storeid, $scfg, $volname, undef, {}); last two not needed > + > + my $snap_volname = $class->get_snap_volname($volname, $snap); > + my $snap_path = $class->path($scfg, $volname, $storeid, $snap); see above.. > + > + my $size = $class->volume_size_info($scfg, $storeid, $volname, 5); > + > + #rename current lvm volume to snap volume > + my $vg = $scfg->{vgname}; > + print"rename $volname to $snap_volname\n"; > + eval { lvrename($vg, $volname, $snap_volname); }; > + if ($@) { > + die "can't rename lvm volume from $volname to $snap_volname: $@ \n"; > + } > + > + eval { $class->alloc_image($storeid, $scfg, $vmid, 'qcow2', $volname, > $size/1024, $snap_path); }; > + if ($@) { > + eval { $class->free_image($storeid, $scfg, $volname, 0) }; missing error handling, this needs to rename back? also, this might return a code-reference that needs to be executed.. > + warn $@ if $@; > + } > } > > +sub volume_rollback_is_possible { > + my ($class, $scfg, $storeid, $volname, $snap, $blockers) = @_; > + > + my $snap_path = $class->path($scfg, $volname, $storeid, $snap); > + > + $class->activate_volume($storeid, $scfg, $volname, undef, {}); > + my $snapshots = $class->volume_snapshot_info($scfg, $storeid, $volname); > + my $parent_snap = $snapshots->{current}->{parent}; wouldn't it be enough to check that this equals $snap? > + > + return 1 if $snapshots->{$parent_snap}->{file} eq $snap_path; > + die "can't rollback, '$snap' is not most recent snapshot on > '$volname'\n"; > + > + return 1; > +} > + > + > sub volume_snapshot_rollback { > my ($class, $scfg, $storeid, $volname, $snap) = @_; > > - die "lvm snapshot rollback is not implemented"; > + die "can't rollback snapshot for this image format\n" if $volname !~ > m/\.(qcow2)$/; this should go below parse_volname and use the format it returns.. > + > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > + $class->parse_volname($volname); > + > + $class->activate_volume($storeid, $scfg, $volname, undef, {}); two unneeded parameters > + my $size = $class->volume_size_info($scfg, $storeid, $volname, 5); > + my $snap_path = $class->path($scfg, $volname, $storeid, $snap); > + > + #simply delete the current snapshot and recreate it > + eval { $class->free_image($storeid, $scfg, $volname, 0) }; might return a code reference that needs to be executed.. > + if ($@) { > + die "can't delete old volume $volname: $@\n"; > + } > + > + eval { $class->alloc_image($storeid, $scfg, $vmid, 'qcow2', $volname, > $size/1024, $snap_path) }; > + if ($@) { > + die "can't allocate new volume $volname: $@\n"; > + } > + > + return undef; > } > > sub volume_snapshot_delete { > - my ($class, $scfg, $storeid, $volname, $snap) = @_; > + my ($class, $scfg, $storeid, $volname, $snap, $running) = @_; > + > + die "can't delete snapshot for this image format\n" if $volname !~ > m/\.(qcow2)$/; this should parse the volname and use the returned format! > + > + return 1 if $running; > + > + my $cmd = ""; > + my $path = $class->filesystem_path($scfg, $volname); > + > + my $snapshots = $class->volume_snapshot_info($scfg, $storeid, $volname); > + my $snap_path = $snapshots->{$snap}->{file}; > + my $snap_volname = $snapshots->{$snap}->{volname}; > + die "volume $snap_path is missing" if !-e $snap_path; > > - die "lvm snapshot delete is not implemented"; > + my $parent_snap = $snapshots->{$snap}->{parent}; > + my $child_snap = $snapshots->{$snap}->{child}; > + > + my $parent_path = $snapshots->{$parent_snap}->{file} if $parent_snap; > + my $child_path = $snapshots->{$child_snap}->{file} if $child_snap; > + my $child_volname = $snapshots->{$child_snap}->{volname} if $child_snap; same as in the Plugin.pm patch, this is not allowed code style! > + > + #if first snapshot,as it should be bigger, we merge child, and rename > the snapshot to child > + if(!$parent_snap) { > + print"commit $child_path\n"; > + $cmd = ['/usr/bin/qemu-img', 'commit', $child_path]; could use `-d`, since we don't use $child_path afterwards anyway > + eval { run_command($cmd) }; > + if ($@) { > + die "error commiting $child_path to $parent_path: $@\n"; > + } > + print"delete $child_volname\n"; > + eval { $class->free_image($storeid, $scfg, $child_volname, 0) }; might return a code reference that needs to be executed.. > + if ($@) { > + die "error delete old snapshot volume $child_volname: $@\n"; > + } > + print"rename $snap_volname to $child_volname\n"; > + my $vg = $scfg->{vgname}; > + eval { lvrename($vg, $snap_volname, $child_volname) }; > + if ($@) { > + die "error renaming snapshot: $@\n"; > + } > + } else { > + #we rebase the child image on the parent as new backing image > + die "missing parentsnap snapshot to rebase child $child_path\n" if > !$parent_path; how would this happen? > + print "link $child_snap to $parent_snap\n"; > + $cmd = ['/usr/bin/qemu-img', 'rebase', '-b', $parent_path, '-F', > 'qcow2', '-f', 'qcow2', $child_path]; > + eval { run_command($cmd) }; > + if ($@) { > + die "error rebase $child_path with $parent_path; $@\n"; > + } > + #delete the snapshot > + eval { $class->free_image($storeid, $scfg, $snap_volname, 0); }; might return a code reference that needs to be executed.. > + if ($@) { > + die "error delete old snapshot volume $snap_volname: $@\n"; > + } > + } > } > > sub volume_has_feature { > my ($class, $scfg, $feature, $storeid, $volname, $snapname, $running) = > @_; > > my $features = { > - copy => { base => 1, current => 1}, > - rename => {current => 1}, > + copy => { > + base => { qcow2 => 1, raw => 1}, > + current => { qcow2 => 1, raw => 1}, > + snap => { qcow2 => 1 }, did you actually test this? AFAICT this would still fall back to internal qcow2 snapshots? > + }, > + 'rename' => { > + current => { qcow2 => 1, raw => 1}, how does this interact with snapshots? > + }, > + snapshot => { > + current => { qcow2 => 1 }, > + snap => { qcow2 => 1 }, > + }, > + template => { > + current => { qcow2 => 1, raw => 1}, see below.. > + }, > + clone => { > + base => { qcow2 => 1, raw => 1 }, how can we do linked clones of raw volumes? how can we do linked clones of qcow2 volumes if we don't allow creating base volumes? > + }, > }; > > - my ($vtype, $name, $vmid, $basename, $basevmid, $isBase) = > + > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > $class->parse_volname($volname); > > my $key = undef; > @@ -619,7 +803,7 @@ sub volume_has_feature { > }else{ > $key = $isBase ? 'base' : 'current'; > } > - return 1 if $features->{$feature}->{$key}; > + return 1 if defined($features->{$feature}->{$key}->{$format}); why the defined? > > return undef; > } > @@ -740,4 +924,12 @@ sub rename_volume { > return "${storeid}:${target_volname}"; > } > > +sub get_snap_volname { > + my ($class, $volname, $snapname) = @_; > + > + my ($vtype, $name, $vmid, $basename, $basevmid, $isBase, $format) = > $class->parse_volname($volname); > + $name = !$snapname || $snapname eq 'current' ? $volname : > "snap-$snapname-$name"; see above.. > + return $name; > +} > + > 1; > -- > 2.39.5 _______________________________________________ pve-devel mailing list pve-devel@lists.proxmox.com https://lists.proxmox.com/cgi-bin/mailman/listinfo/pve-devel