Added workaround to overcome Octave's convn() bug.

albertoandreottiATgmail · albertoandreottiATgmail · commit 0e7bbaf76d94 · 2013-07-04T14:09:43.000-03:00
+ Added wrapper function 'custom_convn' to choose between three ways of
computing the convn(). The default behaviour is to use convn() and to
choose between 'valid' and 'same' according to the platform(Matlab or
Octave).
A third option is to use 'fft' which uses FFT based convolution.
Although this is very slow, the library can be compiled to support GPU.
Check the code for more info.
+ Added an utility function 'isOctave()' to tell which platform is being
used.
+ TODO: We should use custom_convn() everywhere, but this may slow
things down too much.
+ test_cnn_gradients_are_numerically_correct fails with convn(,,'same')
but works with convnfft.
diff --git a/CNN/cnnbp.m b/CNN/cnnbp.m
@@ -41,7 +41,7 @@
         if strcmp(net.layers{l}.type, 'c')
             for j = 1 : numel(net.layers{l}.a)
                 for i = 1 : numel(net.layers{l - 1}.a)
-                    net.layers{l}.dk{i}{j} = convn(flipall(net.layers{l - 1}.a{i}), net.layers{l}.d{j}, 'valid') / size(net.layers{l}.d{j}, 3);
+                    net.layers{l}.dk{i}{j} = custom_convn(flipall(net.layers{l - 1}.a{i}), net.layers{l}.d{j}, 'valid') / size(net.layers{l}.d{j}, 3);
                 end
                 net.layers{l}.db{j} = sum(net.layers{l}.d{j}(:)) / size(net.layers{l}.d{j}, 3);
             end
diff --git a/CNN/convnfft.m b/CNN/convnfft.m
@@ -0,0 +1,221 @@
+function A = convnfft(A, B, shape, dims, options)
+% CONVNFFT  FFT-BASED N-dimensional convolution.
+%   C = CONVNFFT(A, B) performs the N-dimensional convolution of
+%   matrices A and B. If nak = size(A,k) and nbk = size(B,k), then
+%   size(C,k) = max([nak+nbk-1,nak,nbk]);
+% 
+%   C = CONVNFFT(A, B, SHAPE) controls the size of the answer C:
+%       'full'   - (default) returns the full N-D convolution
+%       'same'   - returns the central part of the convolution that
+%                  is the same size as A.
+%       'valid'  - returns only the part of the result that can be
+%                  computed without assuming zero-padded arrays.
+%                  size(C,k) = max([nak-max(0,nbk-1)],0).
+%
+%   C = CONVNFFT(..., SHAPE, DIMS) with DIMS is vector of dimensions where
+%       the convolution will be carried out. By default DIMS is
+%       [1:max(ndims(A),ndims(B))] (all dimensions). A and B must have the
+%       same lengths on other dimensions.
+%   C = CONVNFFT(..., SHAPE, DIMS, GPU)
+%       GPU is boolean flag, see next
+%
+%   C = CONVNFFT(..., SHAPE, DIMS, OPTIONS)
+%
+%   OPTIONS is structure with following optional fields
+%       - 'GPU', boolean. If GPU is TRUE Jacket/GPU FFT engine will be used
+%       By default GPU is FALSE.
+%       - 'Power2Flag', boolean. If it is TRUE, use FFT with length rounded
+%       to the next power-two. It is faster but requires more memory.
+%       Default value is TRUE.
+%
+% Class support for inputs A,B:
+% float: double, single
+%
+% METHOD: CONVNFFT uses Fourier transform (FT) convolution theorem, i.e.
+%         FT of the convolution is equal to the product of the FTs of the
+%         input functions.
+%         In 1-D, the complexity is O((na+nb)*log(na+nb)), where na/nb are
+%         respectively the lengths of A and B.
+%
+% Usage recommendation:
+%         In 1D, this function is faster than CONV for nA, nB > 1000.
+%         In 2D, this function is faster than CONV2 for nA, nB > 20.
+%         In 3D, this function is faster than CONVN for nA, nB > 5.
+% 
+% See also conv, conv2, convn.
+% 
+%   Author: Bruno Luong <brunoluong@yahoo.com>
+%   History:
+%       Original: 21-Jun-2009
+%       23-Jun-2009: correct bug when ndims(A)<ndims(B)
+%       02-Sep-2009: GPU/JACKET option
+%       04-Sep-2009: options structure
+%       16-Sep-2009: inplace product
+
+if nargin<3 || isempty(shape)
+    shape = 'full';
+end
+
+if nargin<5 || isempty(options)
+    options = struct();
+elseif ~isstruct(options) % GPU options
+    options = struct('GPU', options);
+end
+
+nd = max(ndims(A),ndims(B));
+% work on all dimensions by default
+if nargin<4 || isempty(dims)
+    dims = 1:nd;
+end
+dims = reshape(dims, 1, []); % row (needed for for-loop index)
+
+% GPU enable flag
+GPU = getoption(options, 'GPU', false);
+% Check if Jacket is installed
+GPU = GPU && ~isempty(which('ginfo'));
+
+% IFUN function will be used later to truncate the result
+% M and N are respectively the length of A and B in some dimension
+switch lower(shape)
+    case 'full',
+        ifun = @(m,n) 1:m+n-1;
+    case 'same',
+        ifun = @(m,n) ceil((n-1)/2)+(1:m);
+    case 'valid',
+        ifun = @(m,n) n:m;
+    otherwise
+        error('convnfft: unknown shape %s', shape);
+end
+
+classA = class(A);
+classB = class(B);
+ABreal = isreal(A) && isreal(B);
+
+% Special case, empty convolution, try to follow MATLAB CONVN convention
+if any(size(A)==0) || any(size(B)==0)
+    szA = zeros(1,nd); szA(1:ndims(A))=size(A);
+    szB = zeros(1,nd); szB(1:ndims(B))=size(B);
+    % Matlab wants these:
+    szA = max(szA,1); szB = max(szB,1);
+    szC = szA;
+    for dim=dims
+        szC(dim) = length(ifun(szA(dim),szB(dim)));
+    end
+    A = zeros(szC,classA); % empty -> return zeros
+    return
+end
+
+power2flag = getoption(options, 'Power2Flag', true);
+if power2flag
+    % faster FFT if the dimension is power of 2
+    lfftfun = @(l) 2^nextpow2(l);
+else
+    % slower, but smaller temporary arrays
+    lfftfun = @(l) l;
+end
+
+if GPU % GPU/Jacket FFT
+    if strcmp(classA,'single')
+        A = gsingle(A);
+    else
+        A = gdouble(A);
+    end
+    if strcmp(classB,'single')
+        B = gsingle(B);
+    else
+        B = gdouble(B);
+    end
+    % Do the FFT
+    subs(1:ndims(A)) = {':'};
+    for dim=dims
+        m = size(A,dim);
+        n = size(B,dim);
+        % compute the FFT length
+        l = lfftfun(m+n-1);
+        % We need to swap dimensions because GPU FFT works along the
+        % first dimension
+        if dim~=1 % do the work when only required
+            swap = 1:nd;
+            swap([1 dim]) = swap([dim 1]);
+            A = permute(A, swap);
+            B = permute(B, swap);
+        end
+        A = fft(A,l);
+        B = fft(B,l);
+        subs{dim} = ifun(m,n);
+    end
+else % Matlab FFT
+    % Do the FFT
+    subs(1:ndims(A)) = {':'};
+    for dim=dims
+        m = size(A,dim);
+        n = size(B,dim);
+        % compute the FFT length
+        l = lfftfun(m+n-1);
+        A = fft(A,l,dim);
+        B = fft(B,l,dim);
+        subs{dim} = ifun(m,n);
+    end
+end
+ 
+if GPU
+    A = A.*B;
+    clear B
+else
+    % inplace product to save 1/3 of the memory
+	% Modified by Alberto Andreotti(albertoandreotti@gmail.com)
+    %inplaceprod(A,B);
+	A(:) = A(:).*B(:);
+end
+
+% Back to the non-Fourier space
+if GPU % GPU/Jacket FFT
+    for dim=dims(end:-1:1) % reverse loop
+        A = ifft(A,[]);
+        % Swap back the dimensions
+        if dim~=1 % do the work when only required
+            swap = 1:nd;
+            swap([1 dim]) = swap([dim 1]);
+            A = permute(A, swap);
+        end        
+    end   
+else % Matlab IFFT  
+    for dim=dims
+        A = ifft(A,[],dim);
+    end
+end
+
+% Truncate the results
+if ABreal
+    % Make sure the result is real
+    A = real(A(subs{:}));
+else
+    A = A(subs{:});
+end
+
+% GPU/Jacket
+if GPU
+    % Cast the type back
+    if strcmp(class(A),'gsingle')
+        A = single(A);
+    else
+        A = double(A);
+    end
+end
+
+end % convnfft
+
+
+%% Get defaut option
+function value = getoption(options, name, defaultvalue)
+% function value = getoption(options, name, defaultvalue)
+    value = defaultvalue;
+    fields = fieldnames(options);
+    found = strcmpi(name,fields);
+    if any(found)
+        i = find(found,1,'first');
+        if ~isempty(options.(fields{i}))
+            value = options.(fields{i});
+        end
+    end
+end
diff --git a/CNN/custom_convn.m b/CNN/custom_convn.m
@@ -0,0 +1,29 @@
+% This function is used to choose between different implementations of the convn function
+% according to the platform.
+% This is mainly useful for overcoming an Octave's bug in convn(), https://savannah.gnu.org/bugs/?39314
+% parameters: x is the chunk of the image/samples, k is the kernel.
+
+function result = custom_convn(x, k, convmode) 
+    
+    %FFT works with batchsize>50, but still really slow, about 10000 seconds. It should produce an error near 0.18.
+	%this convnfft is taken from http://www.mathworks.com/matlabcentral/fileexchange/24504-fft-based-convolution.
+    if exist('convmode') && strcmp(convmode, 'fft')
+       result = convnfft(x,k, 'valid');
+       return
+	end
+	
+	%the 'valid' version of convolution has problems in Octave, use 'same' instead.
+	if isOctave()
+	   %Alternative to convnftt, use for small batch size ~ 5, will give 2676.56 seconds, otherwise it will explode(too long running time).
+       start = size(x,1) - size(k,1);
+       fin = 2*start;
+       %note: if x and k have not the same size in the third dimension, middle could be a range.
+       middle = floor(size(x,3)/2) + 1;
+       result = convn (x, k, "same")(start:fin, start:fin, middle);
+	else
+	   %we're running matlab
+	   result = convn(x, k, 'valid');
+	end
+
+end
+
diff --git a/util/isOctave.m b/util/isOctave.m
@@ -0,0 +1,4 @@
+%detects if we're running Octave
+function result = isOctave()
+    result = exist('OCTAVE_VERSION') ~= 0;
+end