Mainly changes in style:

cyrusgeyer · cyrusgeyer · commit b355b386db72 · 2018-06-14T18:03:38.000+02:00
correcting typos, enforcing conventions.
diff --git a/DiffPrivate_FedLearning.py b/DiffPrivate_FedLearning.py
@@ -13,7 +13,7 @@ def run_differentially_private_federated_averaging(loss, train_op, eval_correct,
                                                    label_placeholder, privacy_agent=None, b=10, e=4,
                                                    record_privacy=True, m=0, sigma=0, eps=8, save_dir=None,
                                                    log_dir=None, max_comm_rounds=3000, gm=True,
-                                                   saver_func=create_save_dir):
+                                                   saver_func=create_save_dir, save_params=False):
 
     """
     This function will simulate a federated learning setting and enable differential privacy tracking. It will detect
@@ -65,6 +65,7 @@ def run_differentially_private_federated_averaging(loss, train_op, eval_correct,
     :param gm:                  Whether to use a Gaussian Mechanism or not.
     :param saver_func:          A function that specifies where and how to save progress: Note that the usual tensorflow
                                 tracking will not work
+    :param save_params:         Whether to save all weights throughout training.
 
     :return:
 
@@ -277,4 +278,7 @@ def run_differentially_private_federated_averaging(loss, train_op, eval_correct,
         # PRINT the progress and stage of affairs.
         print(' - Epsilon-Delta Privacy:' + str([FLAGS.eps, delta]))
 
+        if save_params:
+            weights_accountant.save_params(save_dir)
+
     return [], [], []
diff --git a/Helper_Functions.py b/Helper_Functions.py
@@ -76,6 +76,11 @@ def __init__(self,sess,model,Sigma, real_round):
         self.num_weights = len(self.Weights)
         self.round = real_round
 
+    def save_params(self,save_dir):
+        """Pickle this accountant into save_dir; str() is needed because self.round may be a number."""
+        with open(save_dir + '/Wweights_accountant_round_' + str(self.round) + '.pkl', "wb") as filehandler:
+            pickle.dump(self, filehandler)
+
     def allocate(self, sess):
 
         self.Weights = [np.concatenate((self.Weights[i], np.expand_dims(sess.run(tf.trainable_variables()[i]), -1)), -1)
@@ -146,7 +151,6 @@ def Update_via_GaussianMechanism(self, sess, Acc, FLAGS, Computed_deltas):
                 delta = Computed_deltas[self.round]
         return New_model, delta
 
-
 def create_save_dir(FLAGS):
     '''
     :return: Returns a path that is used to store training progress; the path also identifies the chosen setup uniquely.
diff --git a/MNIST_reader.py b/MNIST_reader.py
@@ -19,6 +19,8 @@ def read(dataset = "training", path = "."):
     else:
         raise ValueError, "dataset must be 'testing' or 'training'"
 
+    print(fname_lbl)
+
     # Load everything in some numpy arrays
     with open(fname_lbl, 'rb') as flbl:
         magic, num = struct.unpack(">II", flbl.read(8))
@@ -36,10 +38,10 @@ def read(dataset = "training", path = "."):
     return img, lbl
 
 
-def get_data():
+def get_data(d):
     # load the data
-    x_train, y_train = read('training', os.getcwd() + '/MNIST_original')
-    x_test, y_test = read('testing', os.getcwd() + '/MNIST_original')
+    x_train, y_train = read('training', d + '/MNIST_original')
+    x_test, y_test = read('testing', d + '/MNIST_original')
 
     # create validation set
     x_vali = list(x_train[50000:].astype(float))
@@ -63,6 +65,6 @@ def get_data():
 
 class Data:
     def __init__(self, save_dir, n):
-        raw_directory = save_dir + '/DATA/'
-        self.client_set = pickle.load(open(raw_directory + 'clients/' + str(n) + '_clients.pkl', 'rb'))
-        self.sorted_x_train, self.sorted_y_train, self.x_vali, self.y_vali, self.x_test, self.y_test = get_data()
+        raw_directory = save_dir + '/DATA'
+        self.client_set = pickle.load(open(raw_directory + '/clients/' + str(n) + '_clients.pkl', 'rb'))
+        self.sorted_x_train, self.sorted_y_train, self.x_vali, self.y_vali, self.x_test, self.y_test = get_data(save_dir)
diff --git a/RUNME.sh b/RUNME.sh
@@ -0,0 +1,22 @@
+#!/bin/sh
+# Download and unpack the MNIST files, then run Create_clients.py.
+set -e  # stop at the first failing step rather than continuing in the wrong directory
+echo "Downloading the MNIST-data set and creating clients"
+cd DiffPrivate_FedLearning
+mkdir -p MNIST_original  # -p: do not fail when the directory is left over from an earlier run
+cd MNIST_original
+# Fetch the four MNIST archives.
+curl -O "http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz"
+curl -O "http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz"
+curl -O "http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz"
+curl -O "http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz"
+gunzip -f train-images-idx3-ubyte.gz  # -f: overwrite files left by an earlier run
+gunzip -f train-labels-idx1-ubyte.gz
+gunzip -f t10k-images-idx3-ubyte.gz
+gunzip -f t10k-labels-idx1-ubyte.gz
+cd ..
+# Create_clients.py is run from DiffPrivate_FedLearning, the parent of MNIST_original.
+python Create_clients.py
+echo "You can now run differentially private federated learning on the MNIST data set. Type python sample.py --help for help"
+echo "An example: 'python sample.py --N 100' would run differentially private federated learning on 100 clients for a privacy budget of (epsilon = 8, delta = 0.001)"
+echo "For more information on how to use the functions please refer to their documentation"
diff --git a/sample.py b/sample.py
@@ -3,71 +3,48 @@
 import os
 from DiffPrivate_FedLearning import run_differentially_private_federated_averaging
 from MNIST_reader import Data
+import argparse
+import sys
 
-# Specs for the model that we would like to train in differentially private federated fashion:
-hidden1 = 600
-hidden2 = 100
 
-# Specs for the differentially private federated fashion learning process.
-N = 100
-Batches = 10
-save_dir = os.getcwd()
+def sample(N, b,e,m, sigma, eps, save_dir, log_dir):
 
-# A data object that already satisfies client structure and has the following attributes:
-# DATA.data_set : A list of labeld training examples.
-# DATA.client_set : A
-DATA = Data(save_dir, N)
+    # Specs for the model that we would like to train in differentially private federated fashion:
+    hidden1 = 600
+    hidden2 = 100
 
-with tf.Graph().as_default():
+    # Specs for the differentially private federated fashion learning process.
 
-    # Building the model that we would like to train in differentially private federated fashion.
-    # We will need the tensorflow training operation for that model, its loss and an evaluation method:
+    # A data object that already satisfies client structure and has the following attributes:
+    # DATA.data_set : A list of labeled training examples.
+    # DATA.client_set : A
+    DATA = Data(save_dir, N)
 
-    train_op, eval_correct, loss, data_placeholder, labels_placeholder = mnist.mnist_fully_connected_model(Batches, hidden1, hidden2)
+    with tf.Graph().as_default():
 
-    Accuracy_accountant, Delta_accountant, model = \
-        run_differentially_private_federated_averaging(loss, train_op, eval_correct, DATA, data_placeholder, labels_placeholder)
-
-'''
-def main(_):
-    data = Data(FLAGS.save_dir, FLAGS.n)
-    train_op, eval_correct, loss = mnist_inference.mnist_fully_connected_model()
-    run_differentially_private_federated_averaging(loss, train_op, eval_correct, data)
+        # Building the model that we would like to train in differentially private federated fashion.
+        # We will need the tensorflow training operation for that model, its loss and an evaluation method:
 
+        train_op, eval_correct, loss, data_placeholder, labels_placeholder = mnist.mnist_fully_connected_model(b, hidden1, hidden2)
 
-class Flag:
-    def __init__(self, n, b, e, record_privacy, m, sigma, eps, save_dir, log_dir, max_comm_rounds, gm, PrivAgent):
-        if not save_dir:
-            save_dir = os.getcwd()
-        if not log_dir:
-            log_dir = os.path.join(os.getenv('TEST_TMPDIR', '/tmp'), 'tensorflow/mnist/logs/fully_connected_feed')
-        if tf.gfile.Exists(log_dir):
-            tf.gfile.DeleteRecursively(log_dir)
-        tf.gfile.MakeDirs(log_dir)
-        self.n = n
-        self.sigma = sigma
-        self.eps = eps
-        self.m = m
-        self.b = b
-        self.e = e
-        self.record_privacy = record_privacy
-        self.save_dir = save_dir
-        self.log_dir = log_dir
-        self.max_comm_rounds = max_comm_rounds
-        self.gm = gm
-        self.PrivAgentName = PrivAgent.Name
+        Accuracy_accountant, Delta_accountant, model = \
+            run_differentially_private_federated_averaging(loss, train_op, eval_correct, DATA, data_placeholder,
+                                                           labels_placeholder, b=b, e=e,m=m, sigma=sigma, eps=eps,
+                                                           save_dir=save_dir, log_dir=log_dir)
 
+def main(_):  # tf.app.run passes the leftover argv here; it is not used
+    sample(N=FLAGS.N, b=FLAGS.b, e=FLAGS.e, m=FLAGS.m, sigma=FLAGS.sigma, eps=FLAGS.eps, save_dir=FLAGS.save_dir, log_dir=FLAGS.log_dir)
 
 if __name__ == '__main__':
     parser = argparse.ArgumentParser()
     parser.add_argument(
-        '--PrivAgentName',
+        '--save_dir',
         type=str,
-        default='default_Priv_Agent',
-        help='Sets the name of the used Privacy agent'
+        default=os.getcwd(),
+        help='directory to store progress'
     )
     parser.add_argument(
-        '--n',
+        '--N',
         type=int,
         default=100,
         help='Total Number of clients participating'
@@ -102,12 +79,6 @@ def __init__(self, n, b, e, record_privacy, m, sigma, eps, save_dir, log_dir, ma
         default=4,
         help='Epochs per client'
     )
-    parser.add_argument(
-        '--record_privacy',
-        type=bool,
-        default=True,
-        help='Epochs per client'
-    )
     parser.add_argument(
         '--save_dir',
         type=str,
@@ -121,12 +92,6 @@ def __init__(self, n, b, e, record_privacy, m, sigma, eps, save_dir, log_dir, ma
                              'tensorflow/mnist/logs/fully_connected_feed'),
         help='Directory to put the log data.'
     )
-    parser.add_argument(
-        '--max_comm_rounds',
-        type=int,
-        default=3000,
-        help='Maximum number of communication rounds'
-    )
     FLAGS, unparsed = parser.parse_known_args()
     tf.app.run(main=main, argv=[sys.argv[0]] + unparsed)
-'''
+