HSJA_rb.py

#==================================================================================
# HopSkipJump 
#==================================================================================
import numpy as np
import torch

class HSJA(object):
    def __init__(self,model,constraint='l2',num_iterations=50,gamma=1.0,stepsize_search='geometric_progression',
        max_num_evals=1e4,init_num_evals=100, verbose=True,delta=2,len_T=2000):
        self.model = model
        self.constraint = constraint
        self.num_iterations = num_iterations
        self.gamma = gamma
        self.stepsize_search = stepsize_search
        self.max_num_evals = max_num_evals
        self.init_num_evals = init_num_evals
        self.verbose = verbose
        self.delta = delta
        self.len_T = len_T

    def hsja(self,input_xi,label_or_target,initial_xi,TARGETED,query_limit,auto_terminate=True):
        # Set parameters
        # original_label = np.argmax(self.model.predict_label(input_xi))
        d = int(np.prod(input_xi.shape))
        
        # =====================================================
        D = np.zeros(query_limit+1000)
        nq = 0
        DL = np.inf
        DR = 0
        accu_evals = 0
        # =====================================================

        # Set binary search threshold.
        if self.constraint == 'l2':
            theta = self.gamma / (np.sqrt(d) * d)
        else:
            theta = self.gamma / (d ** 2)

        
        # Initialize.
        perturbed = self.initialize(input_xi, label_or_target, initial_xi, TARGETED)
        

        # Project the initialization to the boundary.
        perturbed, dist_post_update = self.binary_search_batch(input_xi, perturbed, label_or_target, theta, TARGETED)
        dist = self.compute_distance(perturbed, input_xi)

        # =====================================================
        D[nq: self.model.num_queries]= dist
        nq = self.model.num_queries
        # =====================================================

        #for j in np.arange(self.num_iterations):
        j = 0
        terminate = False
        while not terminate:
            # Choose delta.
            if j==1:
                delta = 0.1 * (self.model.bounds[1] - self.model.bounds[0])
            else:
                if self.constraint == 'l2':
                    delta = np.sqrt(d) * theta * dist_post_update
                elif self.constraint == 'linf':
                    delta = d * theta * dist_post_update        


            # Choose number of evaluations.
            num_evals = int(self.init_num_evals * np.sqrt(j+1))
            num_evals = int(min([num_evals, self.max_num_evals]))

            # approximate gradient.
            gradf = self.approximate_gradient(perturbed, label_or_target, num_evals, 
                        delta, TARGETED)
            if self.constraint == 'linf':
                update = np.sign(gradf)
            else:
                update = gradf

            # search step size.
            if self.stepsize_search == 'geometric_progression':
                # find step size.
                epsilon = self.geometric_progression_for_stepsize(perturbed, label_or_target, 
                                update, dist, j+1, TARGETED)

                # Update the sample. 
                perturbed = self.clip_image(perturbed + epsilon * update, 
                                self.model.bounds[0], self.model.bounds[1])

                # Binary search to return to the boundary. 
                perturbed, dist_post_update = self.binary_search_batch(input_xi, 
                                perturbed[None], label_or_target, theta, TARGETED)

            elif params['stepsize_search'] == 'grid_search':
                # Grid search for stepsize.
                epsilons = np.logspace(-4, 0, num=20, endpoint = True) * dist
                epsilons_shape = [20] + len(input_xi.shape) * [1]
                perturbeds = perturbed + epsilons.reshape(epsilons_shape) * update
                perturbeds = self.clip_image(perturbeds, self.model.bounds[0], self.model.bounds[1])
                idx_perturbed = self.decision_function(perturbeds, label_or_target, TARGETED)

                if np.sum(idx_perturbed) > 0:
                    # Select the perturbation that yields the minimum distance # after binary search.
                    perturbed, dist_post_update = self.binary_search_batch(input_xi, 
                                        perturbeds[idx_perturbed], label_or_target, theta, TARGETED)

            # compute new distance.
            dist = self.compute_distance(perturbed, input_xi)
            #if self.verbose:
            #    print('iteration: {:d}, {:s} distance {:.4E}'.format(j+1, self.constraint, dist))

            #===============================================
            if j%10==0:
                print('iteration: {:d}, {:s} distance {:.4E} - nqry:{:d}'.format(j+1, self.constraint, dist, self.model.num_queries))            

            D[nq: self.model.num_queries]= dist
            
            nq = self.model.num_queries
            accu_evals += num_evals

            if auto_terminate:
                if accu_evals > self.len_T:
                    DR = dist
                    if ((DL-DR) < self.delta):
                        terminate = True
                        print('\nBreak due to slow convergence!\n')
                    DL = DR
                    accu_evals = 0
            else:
                if nq>query_limit:
                    terminate = True
                    print('\nBreak due to over query limit!\n')
            j += 1
            if (j>self.num_iterations):
                terminate = True
            #================================================

        return perturbed, nq, D[:nq]

    #=================================================================================================================================

    def decision_function(self, images, label, TARGETED):
            """
            Decision function output 1 on the desired side of the boundary,
            0 otherwise.
            """
            images = torch.from_numpy(images).float().cuda()
            la = self.model.predict_label(images,batch=True)
            #print(la,label)
            la = la.cpu().numpy()

            if TARGETED:
                return (la==label)
            else:
                return (la!=label)

    def decision_function_4_apprx(self,images, label, TARGETED):

        '''
        Decision function output 1 on the desired side of the boundary,
        0 otherwise.
        '''

        batch_size = len(images)
        la = np.zeros(batch_size,dtype = int)
        group = 128 # control memory consumption 
        i = 0
        while i<batch_size:
            imgs = torch.from_numpy(images[i:i+group]).float().cuda()
            la[i:i+group] = self.model.predict_label(imgs,batch=True).cpu().numpy()
            i += group
            if i+group> batch_size:
                group = batch_size - i

        if TARGETED:
            return (la==label)
        else:
            return (la!=label)

    def clip_image(self, image, clip_min, clip_max):
            # Clip an image, or an image batch, with upper and lower threshold.
            return np.minimum(np.maximum(clip_min, image), clip_max) 


    def compute_distance(self, x_ori, x_pert):
            # Compute the distance between two images.
            if self.constraint == 'l2':
                    return np.linalg.norm(x_ori - x_pert)
            elif self.constraint == 'linf':
                    return np.max(abs(x_ori - x_pert))


    def approximate_gradient(self, sample, label_or_target, num_evals, delta, TARGETED):

            # Generate random vectors.
            noise_shape = [num_evals] + list(sample.shape)
            if self.constraint == 'l2':
                    rv = np.random.randn(*noise_shape)
            elif self.constraint == 'linf':
                    rv = np.random.uniform(low = -1, high = 1, size = noise_shape)

            rv = rv / np.sqrt(np.sum(rv ** 2, axis = (1,2,3), keepdims = True))
            perturbed = sample + delta * rv
            perturbed = self.clip_image(perturbed, self.model.bounds[0], self.model.bounds[1])
            rv = (perturbed - sample) / delta

            # query the model.
            #decisions = self.decision_function(perturbed, label_or_target, TARGETED)
            decisions = self.decision_function_4_apprx(perturbed, label_or_target, TARGETED)
            decision_shape = [len(decisions)] + [1] * len(sample.shape)
            fval = 2 * decisions.astype(float).reshape(decision_shape) - 1.0

            # Baseline subtraction (when fval differs)
            if np.mean(fval) == 1.0: # label changes. 
                    gradf = np.mean(rv, axis = 0)
            elif np.mean(fval) == -1.0: # label not change.
                    gradf = - np.mean(rv, axis = 0)
            else:
                    fval -= np.mean(fval)
                    gradf = np.mean(fval * rv, axis = 0) 

            # Get the gradient direction.
            gradf = gradf / np.linalg.norm(gradf)

            return gradf


    def project(self, original_image, perturbed_images, alphas):
            alphas_shape = [1] * len(original_image.shape)
            alphas = alphas.reshape(alphas_shape)
            if self.constraint == 'l2':
                    #print(alphas.shape,original_image.shape, perturbed_images.shape)
                    return (1-alphas) * original_image + alphas * perturbed_images
            elif self.constraint == 'linf':
                    out_images = self.clip_image(
                            perturbed_images, 
                            original_image - alphas, 
                            original_image + alphas
                            )
                    return out_images


    def binary_search_batch(self, original_image, perturbed_images, label_or_target, theta, TARGETED):
            """ Binary search to approach the boundar. """

            # Compute distance between each of perturbed image and original image.
            dists_post_update = np.array([
                            self.compute_distance(
                                    original_image, 
                                    perturbed_image 
                            ) 
                            for perturbed_image in perturbed_images])
            #print(dists_post_update)
            # Choose upper thresholds in binary searchs based on constraint.
            if self.constraint == 'linf':
                    highs = dists_post_update
                    # Stopping criteria.
                    thresholds = np.minimum(dists_post_update * theta, theta)
            else:
                    highs = np.ones(len(perturbed_images))
                    thresholds = theta

            lows = np.zeros(len(perturbed_images))

            
            # Call recursive function. 
            while np.max((highs - lows) / thresholds) > 1:
                    # projection to mids.
                    mids = (highs + lows) / 2.0
                    mid_images = self.project(original_image, perturbed_images, mids)
           #         print(mid_images.shape)
                    # Update highs and lows based on model decisions.
                    decisions = self.decision_function(mid_images, label_or_target, TARGETED)
                    lows = np.where(decisions == 0, mids, lows)
                    highs = np.where(decisions == 1, mids, highs)

            out_images = self.project(original_image, perturbed_images, highs)

            # Compute distance of the output image to select the best choice. 
            # (only used when stepsize_search is grid_search.)
            dists = np.array([
                    self.compute_distance(
                            original_image, 
                            out_image 
                    ) 
                    for out_image in out_images])
            idx = np.argmin(dists)

            dist = dists_post_update[idx]
            out_image = out_images[idx]
            return out_image, dist


    def initialize(self, input_xi, label_or_target, initial_xi, TARGETED):
            """ 
            Efficient Implementation of BlendedUniformNoiseAttack in Foolbox.
            """
            success = 0
            num_evals = 0
            
            if initial_xi is None:
                    # Find a misclassified random noise.
                    while True:
                            random_noise = np.random.uniform(*self.model.bounds, size = input_xi.shape)
                            #print(random_noise[None].shape)
                            success = self.decision_function(random_noise, label_or_target, TARGETED)[0]
                            self.model.num_queries += 1
                            if success:
                                    break
                            assert num_evals < 1e4,"Initialization failed! "
                            "Use a misclassified image as `target_image`" 


                    # Binary search to minimize l2 distance to original image.
                    low = 0.0
                    high = 1.0
                    while high - low > 0.001:
                            mid = (high + low) / 2.0
                            blended = (1 - mid) * input_xi + mid * random_noise 
                            success = self.decision_function(blended, label_or_target, TARGETED)
                            if success:
                                    high = mid
                            else:
                                    low = mid

                    initialization = (1 - high) * input_xi + high * random_noise 

            else:
                    initialization = initial_xi

            return initialization


    def geometric_progression_for_stepsize(self, x, label_or_target, update, dist, j, TARGETED):
            """
            Geometric progression to search for stepsize.
            Keep decreasing stepsize by half until reaching 
            the desired side of the boundary,
            """
            epsilon = dist / np.sqrt(j) 

            def phi(epsilon):
                    new = x + epsilon * update
                    success = self.decision_function(new, label_or_target, TARGETED)
                    return success

            while not phi(epsilon):
                    epsilon /= 2.0

            return epsilon

    def __call__(self, input_xi, label_or_target, initial_xi=None, TARGETED=False):
        if initial_xi is not None:
            initial_xi = initial_xi.cpu().numpy()
        adv,nqry, Dt  = self.hsja(input_xi.cpu().numpy(), label_or_target, initial_xi, TARGETED)
        adv = torch.from_numpy(adv).float().cuda()
        return adv