[pve-devel] [PATCH pve-manager 11/18] pvesr prepare-local-job: new helper
Fabian Grünbichler
f.gruenbichler at proxmox.com
Mon May 29 08:07:46 CEST 2017
On Tue, May 23, 2017 at 09:08:50AM +0200, Dietmar Maurer wrote:
> Prepare for starting a replication job. This is called on the target
> node before replication starts. This call is for internal use, and
> return a JSON object on stdout. The method first test if VM <vmid>
> reside on the local node. If so, stop immediately. After that the
> method scans all volume IDs for snapshots, and removes all replications
> snapshots with timestamps different than <last_sync>. It also removes
> any unused volumes.
>
> Returns a hash with boolean markers for all volumes with existing
> replication snapshots.
>
> Signed-off-by: Dietmar Maurer <dietmar at proxmox.com>
> ---
> PVE/CLI/pvesr.pm | 98 +++++++++++++++++++++++++++++++++++++++++++++++++++++-
> PVE/Replication.pm | 30 +++++++++++++++++
> 2 files changed, 127 insertions(+), 1 deletion(-)
>
> diff --git a/PVE/CLI/pvesr.pm b/PVE/CLI/pvesr.pm
> index dee002ee..78d69747 100644
> --- a/PVE/CLI/pvesr.pm
> +++ b/PVE/CLI/pvesr.pm
> @@ -4,6 +4,7 @@ use strict;
> use warnings;
> use POSIX qw(strftime);
> use Time::Local;
> +use Data::Dumper;
not used?
> use JSON;
>
> use PVE::JSONSchema qw(get_standard_option);
> @@ -13,6 +14,7 @@ use PVE::Tools qw(extract_param);
> use PVE::SafeSyslog;
> use PVE::CLIHandler;
>
> +use PVE::Cluster;
> use PVE::Replication;
> use PVE::API2::ReplicationConfig;
> use PVE::API2::Replication;
> @@ -26,6 +28,98 @@ sub setup_environment {
> }
>
> __PACKAGE__->register_method ({
> + name => 'prepare_local_job',
> + path => 'prepare_local_job',
> + method => 'POST',
> + description => "Prepare for starting a replication job. This is called on the target node before replication starts. This call is for internal use, and return a JSON object on stdout. The method first test if VM <vmid> reside on the local node. If so, stop immediately. After that the method scans all volume IDs for snapshots, and removes all replications snapshots with timestamps different than <last_sync>. It also removes any unused volumes. Returns a hash with boolean markers for all volumes with existing replication snapshots.",
> + parameters => {
> + additionalProperties => 0,
> + properties => {
> + id => get_standard_option('pve-replication-id'),
> + vmid => get_standard_option('pve-vmid', { completion => \&PVE::Cluster::complete_vmid }),
> + 'extra-args' => get_standard_option('extra-args', {
> + description => "The list of volume IDs to consider." }),
> + last_sync => {
> + description => "Time (UNIX epoch) of last successful sync. If not specified, all replication snapshots gets removed.",
s/gets/get/
> + type => 'integer',
> + minimum => 0,
> + optional => 1,
> + },
> + },
> + },
> + returns => { type => 'null' },
> + code => sub {
> + my ($param) = @_;
> +
> + my $jobid = $param->{id};
> + my $vmid = $param->{vmid};
> + my $last_sync = $param->{last_sync} // 0;
> +
> + my $local_node = PVE::INotify::nodename();
> +
> + my $vms = PVE::Cluster::get_vmlist();
> + die "guest '$vmid' is on local node\n"
> + if $vms->{ids}->{$vmid} && $vms->{ids}->{$vmid}->{node} eq $local_node;
> +
> + my $storecfg = PVE::Storage::config();
> +
> + my $dl = PVE::Storage::vdisk_list($storecfg, undef, $vmid);
I really, really dislike this. AFAICT it is the only time we do a full
scan of all storages in the replication code path, instead of iterating
over the disks referenced in the guest config. This is a potentially very
expensive operation (e.g., on storages like Ceph or NFS), and should not
be done on every job run.
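An untested sketch of what I mean, limiting the listing to the storages
that actually back the passed-in volume IDs (same variable names as in
the patch):

    my $storeids = {};
    foreach my $volid (@{$param->{'extra-args'}}) {
        my ($storeid) = PVE::Storage::parse_volume_id($volid);
        $storeids->{$storeid} = 1;
    }

    # only query the storages we actually need
    my $dl = {};
    foreach my $storeid (sort keys %$storeids) {
        my $list = PVE::Storage::vdisk_list($storecfg, $storeid, $vmid);
        $dl->{$storeid} = $list->{$storeid};
    }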
> +
> + my $volids = [];
> +
> + die "no volumes specified\n" if !scalar(@{$param->{'extra-args'}});
> +
> + foreach my $volid (@{$param->{'extra-args'}}) {
> +
> + my ($storeid, $volname) = PVE::Storage::parse_volume_id($volid);
> + my $scfg = PVE::Storage::storage_check_enabled($storecfg, $storeid, $local_node);
> + die "storage '$storeid' is a shared storage\n" if $scfg->{shared};
> +
> + my ($vtype, undef, $ownervm) = PVE::Storage::parse_volname($storecfg, $volid);
> + die "volume '$volid' has wrong vtype ($vtype != 'images')\n"
> + if $vtype ne 'images';
> + die "volume '$volid' has wrong owner\n"
> + if !$ownervm || $vmid != $ownervm;
> +
> + my $found = 0;
> + foreach my $info (@{$dl->{$storeid}}) {
> + if ($info->{volid} eq $volid) {
> + $found = 1;
> + last;
> + }
> + }
> +
> + push @$volids, $volid if $found;
> + }
> +
> + $volids = [ sort @$volids ];
> +
> + my $logfunc = sub {
> + my ($start_time, $msg) = @_;
> + print STDERR "$msg\n";
> + };
> +
> + # remove stale volumes
> + foreach my $storeid (keys %$dl) {
> + my $scfg = PVE::Storage::storage_check_enabled($storecfg, $storeid, $local_node, 1);
> + next if !$scfg || $scfg->{shared};
> + foreach my $info (@{$dl->{$storeid}}) {
> + my $volid = $info->{volid};
> + next if grep { $_ eq $volid } @$volids;
> + $logfunc->(undef, "$jobid: delete stale volume '$volid'");
> + PVE::Storage::vdisk_free($storecfg, $volid);
And now we not only clean up stale volumes which were replicated but no
longer exist on the source, but also remove all other orphan disks of
that guest... intentionally?
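If that is not intended, something along these lines (untested, reusing
the snapshot prefix from replication_snapshot_name) would restrict the
cleanup to volumes that actually carry a replication snapshot of this
job:

    foreach my $info (@{$dl->{$storeid}}) {
        my $volid = $info->{volid};
        next if grep { $_ eq $volid } @$volids;
        # skip volumes without any replication snapshot of this job
        my $snaps = PVE::Storage::volume_snapshot_list(
            $storecfg, $volid, "replicate_${jobid}_");
        next if !scalar(@$snaps);
        $logfunc->(undef, "$jobid: delete stale volume '$volid'");
        PVE::Storage::vdisk_free($storecfg, $volid);
    }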
> + }
> + }
> +
> + my $last_snapshots = PVE::Replication::prepare(
> + $storecfg, $volids, $jobid, $last_sync, undef, $logfunc);
> +
> + print to_json($last_snapshots) . "\n";
> +
> + return undef;
> + }});
> +
> +__PACKAGE__->register_method ({
> name => 'run',
> path => 'run',
> method => 'POST',
> @@ -148,7 +242,7 @@ my $print_job_status = sub {
> if ($next > $now) {
> $nextstr = strftime("%Y-%m-%d_%H:%M:%S", localtime($job->{next_sync}));
> } else {
> - $nextstr = 'now'
> + $nextstr = 'now';
should be rebased into the proper commit
> }
> }
>
> @@ -174,6 +268,8 @@ our $cmddef = {
> enable => [ __PACKAGE__, 'enable', ['id'], {}],
> disable => [ __PACKAGE__, 'disable', ['id'], {}],
>
> + 'prepare-local-job' => [ __PACKAGE__, 'prepare_local_job', ['id', 'vmid', 'extra-args'], {} ],
> +
> run => [ __PACKAGE__ , 'run'],
> };
>
> diff --git a/PVE/Replication.pm b/PVE/Replication.pm
> index 7bfdeb7d..0a0ed436 100644
> --- a/PVE/Replication.pm
> +++ b/PVE/Replication.pm
> @@ -156,6 +156,36 @@ my $get_next_job = sub {
> return $jobcfg;
> };
>
> +sub replication_snapshot_name {
> + my ($jobid, $last_sync) = @_;
> +
> + my $prefix = "replicate_${jobid}_";
> + my $snapname = "$prefix${last_sync}_snap";
I'd prefer ${...}${...} for readability ;)
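i.e. something like:

    my $snapname = "${prefix}${last_sync}_snap";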
> +
> + wantarray ? ($prefix, $snapname) : $snapname;
> +}
> +
> +sub prepare {
> + my ($storecfg, $volids, $jobid, $last_sync, $start_time, $logfunc) = @_;
> +
> + my ($prefix, $snapname) = replication_snapshot_name($jobid, $last_sync);
> +
> + my $last_snapshots = {};
> + foreach my $volid (@$volids) {
> + my $list = PVE::Storage::volume_snapshot_list($storecfg, $volid, $prefix);
> + my $found = 0;
> + foreach my $snap (@$list) {
> + if ($snap eq $snapname) {
> + $last_snapshots->{$volid} = 1;
> + } else {
> + $logfunc->($start_time, "$jobid: delete stale snapshot '$snap' on $volid");
> + PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap);
> + }
> + }
This loop looks dangerous to me as well... shouldn't we only delete
intermediate snapshots if we know there is a correct later one? What if
there is no snapshot "$snapname" (because we are in some kind of
partially failed but recoverable state)? Instead of a simple "sync last
delta again (manually)" we are now in "full resync" territory.
Something along these lines instead (untested):
    # only delete stale snapshots if the expected one actually exists
    my $found = grep { $_ eq $snapname } @$list;
    if ($found) {
        $last_snapshots->{$volid} = 1;
        foreach my $snap (@$list) {
            next if $snap eq $snapname;
            $logfunc->($start_time, "$jobid: delete stale snapshot '$snap' on $volid");
            PVE::Storage::volume_snapshot_delete($storecfg, $volid, $snap);
        }
    } else {
        # big fat warning
    }
> + }
> +
> + return $last_snapshots;
> +}
>
> sub replicate {
> my ($jobcfg, $start_time, $logfunc) = @_;
> --
> 2.11.0
>
> _______________________________________________
> pve-devel mailing list
> pve-devel at pve.proxmox.com
> https://pve.proxmox.com/cgi-bin/mailman/listinfo/pve-devel