From: Alan J. Pippin <>
Date: Fri, 16 Jan 2009 06:57:18 +0000 (-0700)
Subject: Created the zfs-replicate-wrapper script that factors in duration to

Created the zfs-replicate-wrapper script, which tracks its elapsed run
time and stops replicating once that exceeds the configured maximum.
Updated zfs-log-parser to parse the stats from the replicate jobs properly.

diff --git a/zfs-log-parser b/zfs-log-parser
index 4ecca3c..94e4490 100755
--- a/zfs-log-parser
+++ b/zfs-log-parser
@@ -52,14 +52,14 @@ sub parse_replicate_logfile {
 	if(($in_replicate == 0) && ("$startdate" ne "") && ($line !~ /$startdate/)) { next; }
 	if($line =~ /(\S+)\s+(\S+)\s+(\d+)\s+(\d+):(\d+):(\d+)\s+(\S+)\s+(\S+)/) {
 	    $dayname=$1; $month=$2; $daynum=$3; $hour=$4; $minute=$5; $sec=$6; $year=$8;
-	    if(($in_replicate == 0) && ($line =~ /lock obtained/)) {
+	    if(($in_replicate == 0) && ($line =~ /replicate started/)) {
 		$in_replicate = 1;
 		$date="$dayname $month $daynum $hour:$minute:$sec $year";
 		$totals{$date}{data} = 0;
 		$totals{$date}{transfertime} = 0;
 		$totals{$date}{duration} = time_to_seconds($hour,$minute,$sec);
-	    elsif(($in_replicate == 1) && ($line=~ /lock released/)) {
+	    elsif(($in_replicate == 1) && ($line=~ /replicate complete/)) {
 		$in_replicate = 0;
 		$totals{$date}{duration} = time_to_seconds($hour,$minute,$sec) - $totals{$date}{duration};
diff --git a/zfs-replicate b/zfs-replicate
index dc6dab2..09cb3ba 100755
--- a/zfs-replicate
+++ b/zfs-replicate
@@ -10,7 +10,7 @@ remote_lockdir="/tmp/zfs-admin-lock"
 # Set the email address to send notification to
 # When this variable is set, local filesystems will be destroyed 
 # before receiving a full streams into them from the remote source.
@@ -19,6 +19,14 @@ destroy_local_filesystem_on_full_replicate=0
 # The ssh connection doesn't find zfs without this.
+# Setup our cleanup and exit trap
+cleanup() {
+  ssh $remote rm -rf "$remote_lockdir"
+  exit
+trap cleanup INT
+trap cleanup EXIT
 # Make sure we have valid arguments
 if [[ -z "$remote" ]] || [[ -z "$remote_fs" ]]; then
   echo "Usage: $0 <hostname> <zfs filesystem>"
@@ -78,10 +86,6 @@ while true; do
-# Declare a cleanup() method to remove the remote lockdir
-cleanup() { ssh $remote rm -rf "$remote_lockdir"; }
-trap cleanup EXIT
 # Setup our backup marker names
diff --git a/zfs-replicate-wrapper b/zfs-replicate-wrapper
new file mode 100755
index 0000000..d699c79
--- /dev/null
+++ b/zfs-replicate-wrapper
@@ -0,0 +1,110 @@
+# Author: Alan J. Pippin
+# Description: This script calls zfs-replicate for each filesystem needing
+#              to be backed up, or replicated, to another ZFS pool.
+# Setup some default values
+starttime=`date +%s`
+# Specify the list of filesystems to replicate
+# Specify the maximum run time in minutes that this script can run
+# This function checks to see if our runtime has exceeded our stoptime
+timeexceeded() { 
+  currenttime=`date +%s`  
+  elapsedtime=$(($currenttime - $starttime))
+  stoptime=$(($maxruntime*60))
+  if [[ $elapsedtime -gt $stoptime ]]; then
+    #echo "$elapsedtime > $stoptime"
+    return 1
+  fi
+  #echo "$elapsedtime < $stoptime"
+  return 0
+# This function is the cleanup and exit trap handler
+cleanup_and_exit() { 
+  #echo "cleanup and exit"
+  rm -rf "$lockdir"
+  exit 0
+trap cleanup_and_exit INT
+# This function executes the replicate command and checks the stoptime
+replicate() { 
+  $zfsreplicate $*  >> $logfile 2>&1
+  timeexceeded
+  if [ $? == 1 ]; then
+    cleanup_and_exit
+  fi
+# This function obtains the date a given snapshot was created in epoch seconds
+snapshot_age() {
+  snapshot=${local_pool}/${1}${previous_backup_marker}
+  $zfs list -t snapshot ${snapshot} > /dev/null 2>&1
+  if [ $? == 0 ]; then
+    $zfs get creation ${snapshot} > /dev/null 2>&1
+    if [ $? == 0 ]; then
+      snap_creation=`$zfs get creation ${snapshot} | grep $1 | awk '{ print $3" "$4" "$5" "$6" "$7 }'`
+      snap_age=`date -d "$snap_creation" +%s` 
+      echo "$snap_age"
+    else
+      echo "0"
+    fi
+  else
+    echo "0"
+  fi
+# Obtain the zpool guid for the local pool
+local_pool_guid=`zpool get guid $local_pool 2>&1 | grep $local_pool | awk '{ print $3 }'`
+zpool get guid $local_pool > /dev/null 2>&1
+if [ $? != 0 ]; then
+  echo >&2 "-E- Unable to extract the guid for the local pool: $local_pool"
+  exit 1
+# Setup our backup marker names
+# Auto snapshot every zfs filesystem on the system specified below
+echo "$date ZFS replicate started" >> $logfile
+# Sort the filesystems to replicate by the oldest backup first
+for filesystem in $filesystems_to_replicate; do
+  age=`snapshot_age $filesystem`
+  echo $filesystem $age >> $tmpfile
+sorted_filesystems=`cat $tmpfile | sort -n -k 2 | awk '{ print $1 }'`
+rm -f $tmpfile
+# Replicate the sorted filesystems
+for filesystem in $sorted_filesystems; do
+  echo "-> Replicating $remote:$filesystem to ${local_pool}/${filesystem}"
+  replicate $remote $filesystem
+# All done
+echo `date` ZFS replicate complete >> $logfile
+# Parse the log file and extract our backup stats
+$logfile_parser "$logfile" "$date" >> $logfile