From 70a65e43d6ff15fe55248d47382184507adb47dd Mon Sep 17 00:00:00 2001
From: DM <d.manousakas@gmail.com>
Date: Thu, 5 Nov 2020 12:54:45 +0200
Subject: [PATCH] Remove DiffPrivBatchPSVICoreset (delete coreset/dpbpsvi.py)

---
 bayesiancoresets/coreset/dpbpsvi.py | 87 -----------------------------
 1 file changed, 87 deletions(-)
 delete mode 100644 bayesiancoresets/coreset/dpbpsvi.py

diff --git a/bayesiancoresets/coreset/dpbpsvi.py b/bayesiancoresets/coreset/dpbpsvi.py
deleted file mode 100644
index e219a29..0000000
--- a/bayesiancoresets/coreset/dpbpsvi.py
+++ /dev/null
@@ -1,87 +0,0 @@
-import numpy as np
-from ..util.errors import NumericalPrecisionError
-from ..util.opt import partial_nn_opt
-from .coreset import Coreset
-from ..privacy import *
-np.set_printoptions(precision=6)
-
-def clip(x, c, axis=None):
-  return (x/(np.linalg.norm(x, axis=axis)+1e-15)*np.clip(np.linalg.norm(x, axis=axis), 0., c)).T
-
-class DiffPrivBatchPSVICoreset(Coreset):
-  def __init__(self, data, ll_projector, opt_itrs=500, n_subsample_opt=128, step_sched=lambda m: lambda i: 1./(1.+i), 
-               noise_multiplier=1.1, delta=None, init_sampler=None, gen_inits=None, l2normclip=100., down=1., **kw): 
-    self.data = data
-    self.ll_projector = ll_projector
-    self.opt_itrs = opt_itrs
-    self.n_subsample_opt = None if n_subsample_opt is None else min(data.shape[0], n_subsample_opt)
-    self.step_sched = step_sched
-    self.delta = 1./self.data.shape[0] if delta is None else delta
-    self.gradclip = l2normclip 
-    self.noise_mul = noise_multiplier
-    self.init_sampler = init_sampler
-    self.gen_inits = gen_inits
-    self.dp = (analysis.epsilon(self.data.shape[0], self.n_subsample_opt, self.noise_mul, self.opt_itrs, self.delta), self.delta)
-    print('dp guarantee : ', self.data.shape[0], self.n_subsample_opt, self.noise_mul, self.opt_itrs, self.dp)
-    self.down = down # multiply locations gradient with a constant to vary the lrs between weights and locations
-    super().__init__(**kw)
-
-  def get_privacy_params(self):
-    return self.dp
-
-  def _build(self, itrs, sz):
-    # privately initialize points
-    self._initialize(sz)
-    # run gradient optimization for opt_itrs steps
-    self._optimize()
-  
-  def _initialize(self, sz):
-    # implemented ONLY for Bayesian logistic regression 
-    # sample model parameters from pseudocoreset posterior (i.e. prior when pseudocoreset is empty)
-    self.wts = self.data.shape[0]/sz*np.ones(sz)
-    th0 = self.init_sampler(self.wts.shape[0], None, np.random.randint(self.data.shape[0], size=0)) # dummy init to empty set, which samples from the prior 
-    self.pts = self.gen_inits(self.wts.shape[0], th0)
-    self.idcs = -1*np.ones(sz)
-    return
-    
-  def _optimize(self):
-    sz = self.wts.shape[0]
-    N, d = self.data.shape[0], self.data.shape[1]
-    def grd(x): 
-      w = x[:sz]
-      p = x[sz:].reshape((sz, d))
-      vecs, sum_scaling, sub_idcs, corevecs, pgrads = self._get_projection(self.n_subsample_opt, w, p)
-      clip_value = np.median(np.linalg.norm(corevecs.T, axis=0))
-      clipped_vecs = clip(vecs.T, clip_value, axis=0)
-      gauss = clip_value*self.noise_mul*np.random.randn(clipped_vecs.shape[1])
-      priv_suffstats = clipped_vecs.sum(axis=0) + gauss
-      resid = sum_scaling*priv_suffstats - w.dot(corevecs)
-      wgrad = -corevecs.dot(resid) / corevecs.shape[1]
-      ugrad = -self.down*(w[:, np.newaxis, np.newaxis]*pgrads*resid[np.newaxis, :, np.newaxis]).sum(axis=1)/corevecs.shape[1]
-      grad = np.hstack((wgrad, ugrad.reshape(sz*d)))       
-      return grad
-    x0 = np.hstack((self.wts, self.pts.reshape(sz*d)))
-    xf = partial_nn_opt(x0, grd, np.arange(sz), self.opt_itrs, step_sched = self.step_sched(sz))
-    self.wts = xf[:sz]
-    self.pts = xf[sz:].reshape((sz, d))
-    return 
-    
-  def _get_projection(self, n_subsample, w, p):
-    #update the projector
-    self.ll_projector.update(w, p)
-
-    #construct a tangent space
-    if n_subsample is None:
-      sub_idcs = None
-      vecs = self.ll_projector.project(self.data)
-      sum_scaling = 1.
-    else:
-      sub_idcs = np.random.randint(self.data.shape[0], size=n_subsample)
-      vecs = self.ll_projector.project(self.data[sub_idcs])
-      sum_scaling = self.data.shape[0]/n_subsample
-
-    if p.size > 0:
-      corevecs, pgrads = self.ll_projector.project(p, grad=True)
-    else:
-      corevecs, pgrads = np.zeros((0, vecs.shape[1])), np.zeros((0, vecs.shape[1], p.shape[1]))
-    return vecs, sum_scaling, sub_idcs, corevecs, pgrads