function gap = expl(Q,opts)
	%EXPL Exploitability of the policy / value function Q.
	%
	%   gap = expl(Q,opts) compares, under one fixed population, the value
	%   obtained by following Q against the value of an optimal response,
	%   and returns the population-weighted difference.
	%
	%   Inputs:
	%     Q    - policy (value function) being assessed; it is forwarded to
	%            ip() and to br() via opts.policy.
	%     opts - options struct handed to ip() and br(). Only the local copy
	%            is modified here (fields 'type' and 'policy').
	%
	%   Output:
	%     gap  - sum over the first dimension of
	%            population .* (V_best - V_policy), with singleton
	%            dimensions removed by squeeze.
	%
	%   NOTE(review): ip() and br() are defined elsewhere; the array shapes
	%   they return are assumed to be compatible for element-wise
	%   arithmetic - confirm against their implementations.

	% Quantity induced by Q (the original comment calls it the "induced
	% policy"); it serves as the fixed population for both evaluations.
	population = ip(Q,opts);

	% Settings for evaluating Q itself against the fixed population.
	evalOpts = opts;
	evalOpts.type = 'evaluate';
	evalOpts.policy = Q;

	% Settings for the optimal response; the policy field is carried over
	% unchanged and only the mode differs.
	bestOpts = evalOpts;
	bestOpts.type = 'optimize';

	valuePolicy = br(population,evalOpts);
	valueBest = br(population,bestOpts);

	% Alternative (unweighted) metric kept for reference:
	%   gap = squeeze(sum(abs(valuePolicy - valueBest),1));
	shortfall = valueBest - valuePolicy;
	weighted = population .* shortfall;
	gap = squeeze(sum(weighted,1));
end
