Add files via upload

XHWXD · Oct 31, 2017 · 1f4886d · 1f4886d
1 parent cf690f6
commit 1f4886d
Show file tree

Hide file tree

Showing 4 changed files with 118 additions and 0 deletions.
diff --git a/1.JPG b/1.JPG
diff --git a/2.JPG b/2.JPG
diff --git a/3.jpg b/3.jpg
diff --git a/vl_nnfocalloss.m b/vl_nnfocalloss.m
@@ -0,0 +1,118 @@
+function y = vl_nnfocalloss(x,c,dzdy)
+% focal_loss = -alpha * (1-p).*gamma * log(p)
+%
+% Based on VL_NNSOFTMAXLOSS. 
+%   **Deprecated: use `vl_nnloss` instead**
+%
+%   Y = VL_NNFOCALLOSS(X, C) applies the softmax operator followed by
+%   the focal loss the data X. X has dimension H x W x D x N,
+%   packing N arrays of W x H D-dimensional vectors.
+%
+%   C contains the class labels, which should be integers in the range
+%   1 to D. C can be an array with either N elements or with dimensions
+%   H x W x 1 x N dimensions. In the fist case, a given class label is
+%   applied at all spatial locations; in the second case, different
+%   class labels can be specified for different locations.
+%
+%   DZDX = VL_NNSOFTMAXLOSS(X, C, DZDY) computes the derivative of the
+%   block projected onto DZDY. DZDX and DZDY have the same dimensions
+%   as X and Y respectively.
+
+%
+% This file is part of the matconvnet and is made available under
+% the terms of the BSD license (see the COPYING file).
+
+% work around a bug in MATLAB, where native cast() would slow
+% progressively
+
+
+gamma = 2;
+alpha = 0.5;
+
+
+if isa(x, 'gpuArray')
+  switch classUnderlying(x) ;
+    case 'single', cast = @(z) single(z) ;
+    case 'double', cast = @(z) double(z) ;
+  end
+else
+  switch class(x)
+    case 'single', cast = @(z) single(z) ;
+    case 'double', cast = @(z) double(z) ;
+  end
+end
+
+%X = X + 1e-6 ;
+sz = [size(x,1) size(x,2) size(x,3) size(x,4)] ;
+
+if numel(c) == sz(4)
+  % one label per image
+  c = reshape(c, [1 1 1 sz(4)]) ;
+end
+if size(c,1) == 1 & size(c,2) == 1
+  c = repmat(c, [sz(1) sz(2)]) ;
+end
+
+% one label per spatial location
+sz_ = [size(c,1) size(c,2) size(c,3) size(c,4)] ;
+assert(isequal(sz_, [sz(1) sz(2) sz_(3) sz(4)])) ;
+assert(sz_(3)==1 | sz_(3)==2) ;
+
+% class c = 0 skips a spatial location
+mass = cast(c(:,:,1,:) > 0) ;
+if sz_(3) == 2
+  % the second channel of c (if present) is used as weights
+  mass = mass .* c(:,:,2,:) ;
+  c(:,:,2,:) = [] ;
+end
+
+% convert to indexes
+c = c - 1 ;
+c_ = 0:numel(c)-1 ;
+c_ = 1 + ...
+  mod(c_, sz(1)*sz(2)) + ...
+  (sz(1)*sz(2)) * max(c(:), 0)' + ...
+  (sz(1)*sz(2)*sz(3)) * floor(c_/(sz(1)*sz(2))) ;
+
+% compute softmaxloss
+xmax = max(x,[],3) ;
+ex = exp(bsxfun(@minus, x, xmax)) ;
+% the output of softmax function
+o = bsxfun(@rdivide, ex, sum(ex,3)) ;  
+
+
+%n = sz(1)*sz(2) ;
+if nargin <= 2
+%   % softmaxloss
+%   t = xmax + log(sum(ex,3)) - reshape(x(c_), [sz(1:2) 1 sz(4)]) ;
+%   y = sum(sum(sum(mass .* t,1),2),4) ;
+    % focal_loss = -alpha * (1-p).*gamma .* log(p), p=o(c_);
+    % p=exp(x_y)/sum(x_j) which means the probability that belongs to the true label;
+    t = alpha * reshape((1-o(c_)).^gamma, [sz(1:2) 1 sz(4)]) .* (log(sum(ex,3)) - reshape(x(c_), [sz(1:2) 1 sz(4)])) + xmax;
+    y = sum(sum(sum(mass .* t,1),2),4) ;
+else
+%   % softmaxloss
+%   y = bsxfun(@rdivide, ex, sum(ex,3)) ;
+%   y(c_) = y(c_) - 1; % for those = labels               
+%   y = bsxfun(@times, y, bsxfun(@times, mass, dzdy)) ;
+
+    % focal_loss 
+    % =label: grad1 = (1-p).*gamma .* (gamma * p .* log(p) + p - 1 )
+    % ~=label: grad2 = -(1-p).*(gamma-1) .* q .* (gamma * p .* log(p) + p - 1 ), for binary, q=1-p;
+    % q means that the probability that does not belong to the true label;
+    if isa(o,'gpuArray')
+        p = gpuArray.zeros(size(o),classUnderlying(o)) ;
+    else
+        p = zeros(size(o),'like',o) ;
+    end
+    p(c_) = alpha * (1 - o(c_)).^gamma .* ( gamma * o(c_) .* log(o(c_)+(1e-10)) + o(c_) - 1 );
+    q = o;
+    q(c_) = 0;
+    nClass = sz(1)*sz(2)*sz(3);
+    c_c = single(setdiff([1:nClass*numel(c)],c_));
+    p_tmp = repmat(o(c_),[nClass-1 1]);
+    q(c_c) = - alpha * (1 - p_tmp(:)') .^ (gamma-1) .* q(c_c) .* (gamma * p_tmp(:)' .* log(p_tmp(:)'+(1e-10)) + p_tmp(:)' - 1 );
+    y = p + q;
+    y = bsxfun(@times, y, bsxfun(@times, mass, dzdy)) ;
+end
+