xmutly
/

robustvlm-object-centric

Model card Files Files and versions

robustvlm-object-centric / autoattack /fab_tf.py

xmutly's picture

Upload 294 files

e1aaaac verified over 1 year ago

history blame contribute delete

2.6 kB

	# Copyright (c) 2019-present, Francesco Croce
	# All rights reserved.
	#
	# This source code is licensed under the license found in the
	# LICENSE file in the root directory of this source tree.
	#

	from __future__ import absolute_import
	from __future__ import division
	from __future__ import print_function
	from __future__ import unicode_literals

	import torch
	from autoattack.fab_base import FABAttack


	class FABAttack_TF(FABAttack):
	    """
	    Fast Adaptive Boundary Attack (Linf, L2, L1)
	    https://arxiv.org/abs/1907.02044

	    Variant of ``FABAttack`` in which predictions and gradients are obtained
	    by delegating to a wrapped model object rather than computed locally.

	    :param model: TF_model; the only calls made on it are ``predict``,
	        ``grad_logits`` and ``get_grad_diff_logits_target``
	    :param norm: Lp-norm to minimize ('Linf', 'L2', 'L1' supported)
	    :param n_restarts: number of random restarts
	    :param n_iter: number of iterations
	    :param eps: epsilon for the random restarts
	    :param alpha_max: alpha_max
	    :param eta: overshooting
	    :param beta: backward step
	    :param loss_fn: forwarded unchanged to ``FABAttack``; not used here
	    :param verbose: forwarded unchanged to ``FABAttack``
	    :param seed: forwarded unchanged to ``FABAttack``
	    :param targeted: forwarded unchanged to ``FABAttack``
	    :param device: forwarded unchanged to ``FABAttack``
	    :param n_target_classes: forwarded unchanged to ``FABAttack``
	    """

	    def __init__(
	            self,
	            model,
	            norm='Linf',
	            n_restarts=1,
	            n_iter=100,
	            eps=None,
	            alpha_max=0.1,
	            eta=1.05,
	            beta=0.9,
	            loss_fn=None,
	            verbose=False,
	            seed=0,
	            targeted=False,
	            device=None,
	            n_target_classes=9):
	        """ FAB-attack implementation in TF2 """

	        # The model is stored before the base initialiser runs, exactly as
	        # in the original statement order.
	        self.model = model
	        # Arguments are passed positionally, so their order must keep
	        # matching the FABAttack.__init__ signature.
	        super().__init__(norm,
	                         n_restarts,
	                         n_iter,
	                         eps,
	                         alpha_max,
	                         eta,
	                         beta,
	                         loss_fn,
	                         verbose,
	                         seed,
	                         targeted,
	                         device,
	                         n_target_classes)

	    def _predict_fn(self, x):
	        """Return ``self.model.predict(x)`` without further processing."""
	        return self.model.predict(x)

	    def _get_predicted_label(self, x):
	        """Return, for each row of the model output, the index of its maximum.

	        The forward pass runs under ``torch.no_grad()``; the reduction is
	        taken over dimension 1 of the output.
	        """
	        with torch.no_grad():
	            outputs = self._predict_fn(x)
	        _, y = torch.max(outputs, dim=1)
	        return y

	    def get_diff_logits_grads_batch(self, imgs, la):
	        """Return differences of logits and of their gradients w.r.t. ``la``.

	        :param imgs: batch passed to ``self.model.grad_logits``; its first
	            dimension is used as the batch size
	        :param la: per-sample class indices used to select the reference
	            entry along dimension 1 (presumably the true labels -- confirm
	            against the caller)
	        :return: ``(df, dg)`` where ``df`` is the first output of
	            ``grad_logits`` minus its ``la`` entry and ``dg`` is the same
	            difference for the second output; the ``la`` entry of ``df`` is
	            overwritten with ``1e10``
	        """
	        logits, grads = self.model.grad_logits(imgs)
	        # Build the row index once; the same tensor serves all three lookups.
	        rows = torch.arange(imgs.shape[0])
	        df = logits - logits[rows, la].unsqueeze(1)
	        dg = grads - grads[rows, la].unsqueeze(1)
	        # The self-difference would be exactly 0; it is replaced by a large
	        # value (presumably so the reference class is never picked as the
	        # closest one -- confirm against FABAttack).
	        df[rows, la] = 1e10

	        return df, dg

	    def get_diff_logits_grads_batch_targeted(self, imgs, la, la_target):
	        """Return the targeted logit/gradient differences from the model.

	        Delegates to ``self.model.get_grad_diff_logits_target`` and inserts a
	        size-1 dimension at position 1 into both results, in place.

	        :param imgs: batch forwarded to the model
	        :param la: forwarded to the model (presumably original labels)
	        :param la_target: forwarded to the model (presumably target labels)
	        :return: ``(df, dg)`` after the in-place ``unsqueeze_(1)``
	        """
	        df, dg = self.model.get_grad_diff_logits_target(imgs, la, la_target)
	        # In-place on purpose: the tensors returned by the model are reshaped
	        # directly rather than copied.
	        df.unsqueeze_(1)
	        dg.unsqueeze_(1)

	        return df, dg