From e2cc1e337cc5461d93a94931097ceb34e325c7ac Mon Sep 17 00:00:00 2001
From: Carl N Baldwin <cnb@plane.(none)>
Date: Wed, 19 Oct 2005 21:17:23 -0600
Subject: [PATCH] Regular commit

---
 filedata.cpp |  2 +-
 filedata.hpp | 28 +++++++++++++-----
 main.cc      | 84 +++++++++++++++++++++++++++++++++++-----------------
 3 files changed, 78 insertions(+), 36 deletions(-)

diff --git a/filedata.cpp b/filedata.cpp
index c66dadc..cd82b54 100644
--- a/filedata.cpp
+++ b/filedata.cpp
@@ -8,7 +8,7 @@ FileData::FileData( char               _type,
                     string             _permissions,
                     string             _user,
                     string             _group,
-                    unsigned long      _size,
+                    unsigned long long _size,
                     unsigned long long _modified_date,
                     string             _name,
                     unsigned long long _last_backup )
diff --git a/filedata.hpp b/filedata.hpp
index 8c2951b..3df81d9 100644
--- a/filedata.hpp
+++ b/filedata.hpp
@@ -3,6 +3,7 @@
 
 #include <string>
 #include <set>
+#include <vector>
 
 class FileData {
   public:
@@ -11,7 +12,7 @@ class FileData {
               std::string,
               std::string,
               std::string,
-              unsigned long,
+              unsigned long long,
               unsigned long long,
               std::string,
               unsigned long long = 0
@@ -21,7 +22,7 @@ class FileData {
     const std::string &getPermissions()    const { return permissions; }
     const std::string &getUserName()       const { return username; }
     const std::string &getGroupName()      const { return groupname; }
-    unsigned long      getFileSize()       const { return filesize; }
+    unsigned long long getFileSize()       const { return filesize; }
     unsigned long long getModifiedDate()   const { return modified_date; }
     const std::string &getFileName()       const { return filename; }
     unsigned long long getLastBackupDate() const { return last_backup_date; }
@@ -30,7 +31,7 @@ class FileData {
     void setPermissions(    const std::string &arg ) { permissions      = arg; }
     void setUserName(       const std::string &arg ) { username         = arg; }
     void setGroupName(      const std::string &arg ) { groupname        = arg; }
-    void setFileSize(       unsigned long      arg ) { filesize         = arg; }
+    void setFileSize(       unsigned long long arg ) { filesize         = arg; }
     void setModifiedDate(   unsigned long long arg ) { modified_date    = arg; }
     void setFileName(       const std::string &arg ) { filename         = arg; }
     void setLastBackupDate( unsigned long long arg ) { last_backup_date = arg; }
@@ -43,23 +44,34 @@ class FileData {
     std::string        permissions;
     std::string        username;
     std::string        groupname;
-    unsigned long      filesize;
+    unsigned long long filesize;
     unsigned long long modified_date;
     std::string        filename;
 
     unsigned long long last_backup_date;
 };
 
-class FileDataPtrCmp {
-  public:
+struct FileDataLastBackupCmp {  // orders FileData pointers by ascending last backup date
+  bool operator()( const FileData *a, const FileData *b ) const {  // const: callable through a const comparator
+    return a->getLastBackupDate() < b->getLastBackupDate();
+  }
+};
+
+struct FileDataSizeCmp {  // orders FileData pointers by ascending file size
+  bool operator()( const FileData *a, const FileData *b ) const {  // const: callable through a const comparator
+    return a->getFileSize() < b->getFileSize();
+  }
+};
 
+struct FileDataNameCmp {  // orders FileData pointers by file name; this is the ordering used by file_set
   bool operator()( const FileData *a, const FileData *b ) {
     return cmp( a->getFileName(), b->getFileName() );
   }
   private:
-  std::less<std::string> cmp;
+    std::less<std::string> cmp;  // string ordering that operator() delegates to
 };
 
-typedef std::set<FileData*,FileDataPtrCmp> file_set;
+typedef std::set<FileData*,FileDataNameCmp> file_set;  // FileData pointers kept sorted and unique by file name
+typedef std::vector<FileData*> file_vector;  // FileData pointers in a sequence that can be re-sorted by other keys
 
 #endif
diff --git a/main.cc b/main.cc
index 407d572..1a1b9e7 100644
--- a/main.cc
+++ b/main.cc
@@ -1,6 +1,5 @@
 #include <iostream>
 #include <iterator>
-#include <vector>
 #include <algorithm>
 #include <cassert>
 
@@ -84,7 +83,7 @@ int main() {
   assert( SQLITE_OK == rc );
 
   // Now divide the two sets into three sets (new, deleted and updated )
-  FileDataPtrCmp cmp;
+  FileDataNameCmp cmp;
 
   file_set added;
   set_difference( current.begin(),   current.end(),
@@ -119,48 +118,79 @@ int main() {
   }
 
   // Now find the list of files to backup.
-  file_set backup_list;
+  file_set backup_set;
 
   // backup all new files
-  copy( added.begin(), added.end(), inserter( backup_list, backup_list.begin() ) );
+  copy( added.begin(), added.end(), inserter( backup_set, backup_set.begin() ) );
 
   // backup already backed-up files that have changed since the last backup date.
   for( file_set::iterator i = updated.begin(); i != updated.end(); ++i ) {
     if( (*i)->getLastBackupDate() < (*i)->getModifiedDate() ) {
-      backup_list.insert( *i );
+      backup_set.insert( *i );
     }
   }
 
-  // Now, sort the backup_list by filesize and build a list of up to SIZE
-
-  // Now, sort the non-backed-up list my last_backup_date and back-fill
+  // Now, sort the backup_set by filesize and fill final_set, largest files first, up to bytes_available
+  file_vector backups_bysize;
+  copy( backup_set.begin(), backup_set.end(), back_inserter( backups_bysize ) );
+  FileDataSizeCmp sizecmp;
+  sort( backups_bysize.begin(), backups_bysize.end(), sizecmp );
+
+  file_set final_set;
+  unsigned long long bytes_available = 4700000000ULL;  // 4.7e9 bytes (4.7 GB decimal, about 4.38 GiB)
+
+  unsigned long long block_size = 512ULL;
+
+  // Copy files over until full or out of files
+  file_vector::reverse_iterator i = backups_bysize.rbegin();
+  while( 0 != bytes_available && i != backups_bysize.rend() ) {
+    unsigned long long size = (*i)->getFileSize();
+    unsigned long long blocks = size & ( ~(block_size-1) );
+    if( blocks < size ) blocks += block_size;
+    if( blocks <= bytes_available ) {
+      bytes_available -= blocks;
+      final_set.insert( *i );
+    }
+    ++i;
+  }
 
-  // Remove deleted files from the database.
-  // TODO CNB You were working in here.  Actually, just delete all records in
-  // the database and re-populate with the current list.
-  const char *delete_sql = "delete from filedata where filename = :filename";
-  sqlite3_stmt *ppStmt;
+  // Now, sort the non-backed-up list by last_backup_date and back-fill
+  if( 0 != bytes_available ) {
+    file_vector leftovers;
+    set_difference( current.begin(),   current.end(),
+                    final_set.begin(), final_set.end(),
+                    back_inserter( leftovers ),
+                    cmp );
 
-  sqlite3_prepare( db, delete_sql, -1, &ppStmt, NULL );
-  assert( NULL != ppStmt );
+    FileDataLastBackupCmp lastbackupcmp;
+    sort( leftovers.begin(), leftovers.end(), lastbackupcmp );
 
-  for( file_set::iterator i = deleted.begin(); i != deleted.end(); ++i ) {
-    const string &name = (*i)->getFileName();
+    // Copy files over until full or out of files
+    file_vector::const_iterator j = leftovers.begin();
+    while( 0 != bytes_available && j != leftovers.end() ) {
+      unsigned long long size   = (*j)->getFileSize();
+      unsigned long long blocks = size & ( ~(block_size-1) );
 
-    rc = sqlite3_bind_text( ppStmt, 1, name.data(), name.size(), SQLITE_TRANSIENT );
-    assert( SQLITE_OK == rc );
+      if( blocks < size ) blocks += block_size;
 
-    rc = sqlite3_step( ppStmt );
-    assert( SQLITE_OK == rc );
+      if( blocks <= bytes_available ) {
+        bytes_available -= blocks;
+        final_set.insert( *j );
+      }
+      ++j;
+    }
   }
-  rc = sqlite3_finalize( ppStmt );
-  assert( SQLITE_OK == rc );
 
-  // Now, use the current set to update values in the database.  You should copy
-  // last_backup_date dates from the backed_up set first.  This will get all of
-  // the latest permissions but include the last_backup_date.
+  unsigned long long now = 20051019211200ULL;
+  for( file_set::iterator k = final_set.begin(); k != final_set.end(); ++k ) {
+    (*k)->setLastBackupDate( now );
+  }
 
-  // Now, update the last_backup_date for all of the files that are in the list
+  // Clean out the database
+  rc = sqlite3_exec( db, "delete from filedata;", NULL, NULL, &sqliteErrMsg );
+  assert( SQLITE_OK == rc );
+  rc = sqlite3_exec( db, "vacuum;", NULL, NULL, &sqliteErrMsg );
+  assert( SQLITE_OK == rc );
 
   // Clean-up
   for( file_set::iterator i = backed_up.begin(); i != backed_up.end(); ++i ) { delete *i; }
-- 
2.34.1