alanlukezic
diff --git a/‎compile.m
+51 b/‎compile.m
+51
diff --git a/‎create_csr_tracker.m
+257 b/‎create_csr_tracker.m
+257
diff --git a/‎csr_wrapper.m
+54 b/‎csr_wrapper.m
+54
@@ -0,0 +1,51 @@
+% compile hog and segmetation mex files
+% before compiling set the following variables to the correct paths:
+% opencv_include and opencv_libpath
+
+current_folder = pwd;
+mkdir('mex');
+
+cd(['mex_src' filesep 'hog']);
+mex gradientMex.cpp
+movefile('*.mex*', [current_folder filesep 'mex'])
+cd(current_folder);
+
+if ispc     % Windows machine
+    % set opencv include path
+    opencv_include = 'E:\development\opencv-2.4.12\opencv\build\include\';
+    % set opencv lib path
+    opencv_libpath = 'E:\development\opencv-2.4.12\opencv\build\x64\vc11\lib\';
+
+    files = dir([opencv_libpath '*opencv*.lib']);
+    lib = [];
+    for i = 1:length(files),
+        lib = [lib ' -l' files(i).name(1:end-4)];
+    end
+
+    cd(['mex_src' filesep 'segmentation']);
+    eval(['mex mex_extractforeground.cpp src\segment.cpp -Isrc\ -I' opencv_include ' -L' opencv_libpath ' ' lib]);
+    eval(['mex mex_extractbackground.cpp src\segment.cpp -Isrc\ -I' opencv_include ' -L' opencv_libpath ' ' lib]);
+    eval(['mex mex_segment.cpp src\segment.cpp -Isrc\ -I' opencv_include ' -L' opencv_libpath ' ' lib]);
+    movefile('*.mex*', [current_folder filesep 'mex'])
+    cd(current_folder);
+
+elseif isunix   % Unix machine
+    % set opencv include path
+    opencv_include = '/usr/local/include/';
+    % set opencv lib path
+    opencv_libpath = '/usr/lib/x86_64-linux-gnu/';
+
+    lib = [];
+    files = dir([opencv_libpath '*opencv*.so']);
+    for i = 1:length(files)
+        lib = [lib ' -l' files(i).name(4:end-3)];
+    end
+
+    cd(['mex_src' filesep 'segmentation']);
+    eval(['mex mex_extractforeground.cpp src/segment.cpp -Isrc/ -I' opencv_include ' -L' opencv_libpath ' ' lib]);
+    eval(['mex mex_extractbackground.cpp src/segment.cpp -Isrc/ -I' opencv_include ' -L' opencv_libpath ' ' lib]);
+    eval(['mex mex_segment.cpp src/segment.cpp -Isrc/ -I' opencv_include ' -L' opencv_libpath ' ' lib]);
+    movefile('*.mex*', [current_folder filesep 'mex'])
+    cd(current_folder);
+
+end
@@ -0,0 +1,257 @@
+function tracker = create_csr_tracker(img, init_bbox, init_params)
+
+    if nargin < 3
+        init_params = read_default_csr_parameters();
+    end
+
+    % transform polygon to axis-aligned bbox
+    if numel(init_bbox) > 4,
+        bb8 = round(init_bbox(:));
+        x1 = round(min(bb8(1:2:end)));
+        x2 = round(max(bb8(1:2:end)));
+        y1 = round(min(bb8(2:2:end)));
+        y2 = round(max(bb8(2:2:end)));
+        bb = round([x1, y1, x2 - x1, y2 - y1]);
+        
+        init_mask = poly2mask(bb8(1:2:end)-bb(1), bb8(2:2:end)-bb(2), bb(4), bb(3));
+    else
+        bb = round(init_bbox);
+        init_mask = ones(bb(4), bb(3));
+    end
+
+
+    % filter parameters
+    padding = init_params.padding;  % padding
+    learning_rate = init_params.learning_rate;  % learning rate for updating filter
+    feature_type = init_params.feature_type;
+
+    % load and store pre-computed lookup table for colornames
+    w2c = [];
+    if sum(strcmp(feature_type, 'cn'))
+        w2c = load('w2crs.mat');
+        w2c = w2c.w2crs;
+    end
+
+    % segmentation parameters
+    hist_lr = init_params.hist_lr;
+    nbins = init_params.nbins;  % N bins for segmentation
+    seg_colorspace = init_params.seg_colorspace;     % 'rgb' or 'hsv'
+    use_segmentation = init_params.use_segmentation;  % false to disable use of segmentation
+    mask_diletation_type =  init_params.mask_diletation_type;  % for function strel (square, disk, ...)
+    mask_diletation_sz = init_params.mask_diletation_sz;
+
+    % check if grayscale image (only 1 channel) or
+    % check if grayscale image (3 the same channels)
+    img0 = bsxfun(@minus, double(img), mean(img,3));
+    if size(img,3) < 3 || sum(abs(img0(:))) < 10
+        use_segmentation = false;
+        % also do not use colornames
+        [isused_cn, cn_idx] = ismember('cn', feature_type);
+        if isused_cn
+            feature_type(cn_idx) = [];
+        end
+    end
+
+    % features parameters
+    cell_size = 1.0;
+    if sum(strcmp(feature_type, 'hog'))
+        cell_size = min(4, max(1, ceil((bb(3)*bb(4))/400)));
+    end
+
+    % size parameters
+    % reference target size: [width, height]
+    base_target_sz = [bb(3), bb(4)];
+    % reference template size: [w, h], does not change during tracking
+    template_size = floor(base_target_sz + padding*sqrt(prod(base_target_sz)));
+    template_size = mean(template_size);
+    template_size = [template_size, template_size];
+
+    % rescale template after extracting to have fixed area
+    rescale_ratio = sqrt((200^2) / (template_size(1) * template_size(2)));
+    if rescale_ratio > 1  % if already smaller - do not rescale
+        rescale_ratio = 1;
+    end
+
+    rescale_template_size = floor(rescale_ratio * template_size);
+
+    % position of the target center
+    c = bb([1,2]) + base_target_sz/2;
+
+    % create gaussian shaped labels
+    sigma = init_params.y_sigma;
+    Y = fft2(gaussian_shaped_labels(1,sigma, floor(rescale_template_size([2,1]) / cell_size)));
+
+    %store pre-computed cosine window
+    cos_win = hann(size(Y,1)) * hann(size(Y,2))';
+
+    % scale adaptation parameters (from DSST)
+    currentScaleFactor = init_params.currentScaleFactor;
+    n_scales = init_params.n_scales;
+    scale_model_factor = init_params.scale_model_factor;
+    scale_sigma_factor = init_params.scale_sigma_factor;
+    scale_step = init_params.scale_step;
+    scale_model_max_area = init_params.scale_model_max_area;
+    scale_sigma = sqrt(n_scales) * scale_sigma_factor;
+    scale_lr = init_params.scale_lr;     % learning rate parameter
+
+    %label function for the scales
+    ss = (1:n_scales) - ceil(n_scales/2);
+    ys = exp(-0.5 * (ss.^2) / scale_sigma^2);
+    ysf = single(fft(ys));
+
+    if mod(n_scales,2) == 0
+        scale_window = single(hann(n_scales+1));
+        scale_window = scale_window(2:end);
+    else
+        scale_window = single(hann(n_scales));
+    end
+
+    ss = 1:n_scales;
+    scaleFactors = scale_step.^(ceil(n_scales/2) - ss);
+
+    template_size_ = template_size;
+    if scale_model_factor^2 * prod(template_size_) > scale_model_max_area
+        scale_model_factor = sqrt(scale_model_max_area/prod(template_size_));
+    end
+
+    scale_model_sz = floor(template_size_ * scale_model_factor);
+    scaleSizeFactors = scaleFactors;
+    min_scale_factor = scale_step ^ ceil(log(max(5 ./ template_size_)) / log(scale_step));
+    max_scale_factor = scale_step ^ floor(log(min([size(img,1) size(img,2)] ./ base_target_sz)) / log(scale_step));
+
+    % create dummy mask (approximation for segmentation)
+    % size of the object in feature space
+    obj_size = floor(rescale_ratio * (base_target_sz/cell_size));
+    x0 = floor((size(Y,2)-obj_size(1))/2);
+    y0 = floor((size(Y,1)-obj_size(2))/2);
+    x1 = x0 + obj_size(1);
+    y1 = y0 + obj_size(2);
+    target_dummy_mask = zeros(size(Y));
+    target_dummy_mask(y0:y1, x0:x1) = 1;
+    target_dummy_mask = single(target_dummy_mask);
+
+    target_dummy_area = sum(target_dummy_mask(:));
+    
+    if use_segmentation
+        % convert image in desired colorspace
+        if strcmp(seg_colorspace, 'rgb')
+            seg_img = img;
+        elseif strcmp(seg_colorspace, 'hsv')
+            seg_img = rgb2hsv(img);
+            seg_img = seg_img * 255;
+        else
+            error('Unknown colorspace parameter');
+        end
+
+        % object rectangle region (to zero-based coordinates)
+        obj_reg = [bb(1), bb(2), bb(1)+bb(3), bb(2)+bb(4)] - [1 1 1 1];
+
+        % extract histograms
+        hist_fg = mex_extractforeground(seg_img, obj_reg, nbins);
+        hist_bg = mex_extractbackground(seg_img, obj_reg, nbins);
+
+        % extract masked patch: mask out parts outside image
+        [seg_patch, valid_pixels_mask] = get_patch(seg_img, c, currentScaleFactor, template_size);
+
+        % segmentation
+        [fg_p, bg_p] = get_location_prior([1 1 size(seg_patch, 2) size(seg_patch, 1)], base_target_sz, [size(seg_patch,2), size(seg_patch, 1)]);
+        [~, fg, ~] = mex_segment(seg_patch, hist_fg, hist_bg, nbins, fg_p, bg_p);
+
+        % cut out regions outside from image
+        mask = single(fg).*single(valid_pixels_mask);
+        mask = binarize_softmask(mask);
+
+        % use mask from init pose
+        init_mask_padded = zeros(size(mask));
+        pm_x0 = floor(size(init_mask_padded,2) / 2 - size(init_mask,2) / 2);
+        pm_y0 = floor(size(init_mask_padded,1) / 2 - size(init_mask,1) / 2);
+        init_mask_padded(pm_y0:pm_y0+size(init_mask,1)-1, pm_x0:pm_x0+size(init_mask,2)-1) = init_mask;
+        mask = mask.*single(init_mask_padded);
+
+        % resize to filter size
+        mask = imresize(mask, size(Y), 'nearest');
+
+        % check if mask is too small (probably segmentation is not ok then)
+        if mask_normal(mask, target_dummy_area)
+            if mask_diletation_sz > 0
+                D = strel(mask_diletation_type, mask_diletation_sz);
+                mask = imdilate(mask, D);
+            end
+        else
+            mask = target_dummy_mask;
+        end
+
+    else
+        mask = target_dummy_mask;
+    end
+
+    % extract features
+    f = get_csr_features(img, c, currentScaleFactor, template_size, ...
+                rescale_template_size, cos_win, feature_type, w2c, cell_size);
+
+    % create filter - using segmentation mask
+    H = create_csr_filter(f, Y, single(mask));
+
+    % calculate per-channel feature weights
+    response = real(ifft2(fft2(f).*conj(H)));
+    chann_w = max(reshape(response, [size(response,1)*size(response,2), size(response,3)]), [], 1);
+    % normalize: sum = 1
+    chann_w = chann_w / sum(chann_w);
+
+    % make a scale search model aswell
+    xs = get_scale_subwindow(img, c([2,1]), base_target_sz([2,1]), ...
+        currentScaleFactor * scaleSizeFactors, scale_window, scale_model_sz([2,1]), []);
+    % fft over the scale dim
+    xsf = fft(xs,[],2);
+    new_sf_num = bsxfun(@times, ysf, conj(xsf));
+    new_sf_den = sum(xsf .* conj(xsf), 1);
+
+    % store all important const's and variables to the tracker structure
+    tracker.feature_type = feature_type;
+    tracker.padding = padding;
+    tracker.learning_rate = learning_rate;  % filter learning rate
+    tracker.cell_size = cell_size;
+    tracker.H = H;
+    tracker.weight_lr = init_params.channels_weight_lr;
+    tracker.use_channel_weights = init_params.use_channel_weights;
+    tracker.chann_w = chann_w;
+    tracker.Y = Y;
+    tracker.mask_diletation_type = mask_diletation_type;
+    tracker.mask_diletation_sz = mask_diletation_sz;
+    tracker.target_dummy_mask = target_dummy_mask;
+    tracker.target_dummy_area = target_dummy_area;
+    tracker.use_segmentation = use_segmentation;
+    tracker.bb = bb;
+    tracker.cos_win = cos_win;
+    tracker.w2c = w2c;
+    tracker.template_size = template_size;
+    tracker.obj_size = obj_size;
+    tracker.c = c;
+    tracker.nbins = nbins;
+    tracker.currentScaleFactor = currentScaleFactor;
+    tracker.rescale_template_size = rescale_template_size;
+    tracker.rescale_ratio = rescale_ratio;
+    if use_segmentation
+        tracker.hist_fg = hist_fg;
+        tracker.hist_bg = hist_bg;
+        tracker.hist_lr = hist_lr;
+        tracker.seg_colorspace = seg_colorspace;
+    end
+    tracker.ysf = ysf;
+    tracker.sf_num = new_sf_num;
+    tracker.sf_den = new_sf_den;
+    tracker.scale_lr = scale_lr;
+    tracker.base_target_sz = base_target_sz;
+    tracker.scaleSizeFactors = scaleSizeFactors;
+    tracker.scale_window = scale_window;
+    tracker.scale_model_sz = scale_model_sz;
+    tracker.scaleFactors = scaleFactors;
+    tracker.min_scale_factor = min_scale_factor;
+    tracker.max_scale_factor = max_scale_factor;
+    tracker.mask = mask;
+    
+    tracker.H_prev = H;
+    
+    tracker.img_prev = img;
+
+end  % endfunction
@@ -0,0 +1,54 @@
+function csr_wrapper(varargin)
+    % csr_wrapper Wrapper function for VOT-like interface
+    %
+    % This function is a wrapper for the CSR-DCF tracker using the VOT interface for input/output
+    % data loading (i.e. images, initial region) and storing (i.e. output.txt or trax output)
+    %
+    % Input:
+    % - varargin[OutputDir] (string): path to dir where some output images/data should be stored
+
+    cleanup = onCleanup(@() exit() ); % Always call exit command at the end to terminate Matlab!
+    RandStream.setGlobalStream(RandStream('mt19937ar', 'Seed', sum(clock))); % Set random seed to a different value every time as required by the VOT rules.
+    
+    [handle, image_path, region] = vot('polygon'); % Obtain communication object
+    image = imread(image_path); % Read first image from file
+
+    % matlab indexing: starts with (1,1); gt starts with (0,0)
+    if numel(region) > 4
+        % all x,y points shifted by 1
+        region = region + 1;
+    else
+        % shift x,y by 1
+        region(1:2) = region(1:2) + 1;
+    end
+
+    tracker = create_csr_tracker(image, region);
+    
+    while true
+
+        [handle, image_path] = handle.frame(handle); % Get the next frame
+
+        if isempty(image_path) % Are we done?
+            break;
+        end;
+
+        image = imread(image_path);
+
+        [tracker, region] = track_csr_tracker(tracker, image);
+
+        % matlab indexing: starts with (1,1); gt starts with (0,0)
+        if numel(region) > 4
+            % all x,y points shifted by 1
+            region = region - 1;
+        else
+            % shift x,y by 1
+            region(1:2) = region(1:2) - 1;
+        end
+ 
+        handle = handle.report(handle, double(region)); % Report position for the given frame
+
+    end;
+
+    handle.quit(handle); % Output the results and clear the resources
+
+end  % endfunction