// Features.cpp
#include "Features.h"
#include "Stereography.h"
#define _USE_MATH_DEFINES
#include <math.h>
#include <errno.h>
#include <iostream>
#include <string>
#include <sstream>
#include <algorithm>
using namespace cv;
using namespace std;
/*
Create a Gaussian kernel within the given matrix
TODO: use Eigen
*/
void CreateGaussianKernel(Mat& img, float sigma)
{
for (int y = 0; y < img.rows; ++y)
{
for (int x = 0; x < img.cols; ++x)
{
float x_u = x - img.cols / 2.f;
float y_u = y - img.rows / 2.f;
float g = (1.f / (2.f * sigma * sigma * (float)M_PI)) * exp(-1*(x_u*x_u + y_u*y_u)/(2*sigma*sigma));
img.at<float>(y, x) = g; // at() takes (row, col); harmless here since the kernel is square and g is symmetric, but this is the correct order
}
}
//cout << "gaussian kernel: " << endl << img << endl;
}
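/*
Example (illustrative sketch): building a 5x5 weighting kernel with sigma = 1.
Note the kernel is not normalised to sum to 1; that is fine for the relative
weighting used below, but it can be normalised if a true averaging filter is wanted.

    Mat kernel(5, 5, CV_32F);
    CreateGaussianKernel(kernel, 1.f);
    kernel /= sum(kernel)[0]; // optional normalisation
*/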
/*
Cluster features.
Given a vector of features, perform non-maximal suppression over a given
window size to compact clusters into single features.
For each feature, within a window around it, if it is the strongest feature then
remove all others; otherwise move on, it will be removed as part of the other feature's window
TODO: This can be made WAY more efficient with a kd-tree or a bucket grid,
since this is the most time consuming part of the feature extraction
(a grid-bucket sketch is given in the comment after this function)
*/
vector<Feature> ClusterFeatures(vector<Feature>& features, const int windowSize)
{
vector<Feature> temp;
for (unsigned int n = 0; n < features.size(); ++n)
{
auto& f = features[n];
bool thisFeatureIsTheMaximum = true;
for (int i = 0; i < features.size(); ++i)
{
if (i == n)
continue;
auto& f2 = features[i];
int xmargin = (int)abs(f.p.x - f2.p.x);
int ymargin = (int)abs(f.p.y - f2.p.y);
if (xmargin <= windowSize && ymargin <= windowSize)
{
if (f.score < f2.score)
{
thisFeatureIsTheMaximum = false;
break;
}
}
}
if (thisFeatureIsTheMaximum)
{
temp.push_back(f);
}
}
return temp;
}
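/*
A possible faster alternative to the O(n^2) pass above (a sketch only, not used anywhere
in this file): bucket the features into a grid whose cells are windowSize pixels across,
then compare each feature only against features in its own and the eight neighbouring
cells. Requires <unordered_map>. The behaviour should match ClusterFeatures, but treat
this as an illustration of the TODO above rather than a drop-in replacement.

    std::vector<Feature> ClusterFeaturesGrid(const std::vector<Feature>& features, const int windowSize)
    {
        auto key = [](int cx, int cy) { return ((long long)cx << 32) ^ (unsigned int)cy; };
        std::unordered_map<long long, std::vector<int>> grid;
        for (int n = 0; n < (int)features.size(); ++n)
        {
            int cx = (int)features[n].p.x / windowSize;
            int cy = (int)features[n].p.y / windowSize;
            grid[key(cx, cy)].push_back(n);
        }
        std::vector<Feature> kept;
        for (int n = 0; n < (int)features.size(); ++n)
        {
            const Feature& f = features[n];
            int cx = (int)f.p.x / windowSize;
            int cy = (int)f.p.y / windowSize;
            bool isMax = true;
            // Any feature within windowSize pixels must live in one of the 3x3 neighbouring cells
            for (int dy = -1; dy <= 1 && isMax; ++dy)
            {
                for (int dx = -1; dx <= 1 && isMax; ++dx)
                {
                    auto it = grid.find(key(cx + dx, cy + dy));
                    if (it == grid.end())
                        continue;
                    for (int i : it->second)
                    {
                        if (i == n)
                            continue;
                        const Feature& f2 = features[i];
                        int xmargin = (int)abs(f.p.x - f2.p.x);
                        int ymargin = (int)abs(f.p.y - f2.p.y);
                        if (xmargin <= windowSize && ymargin <= windowSize && f.score < f2.score)
                        {
                            isMax = false;
                            break;
                        }
                    }
                }
            }
            if (isMax)
                kept.push_back(f);
        }
        return kept;
    }
*/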
/*
Harris corners
Given an image, search over all pixels' structure tensors. We do this with a sliding window
approach at a certain scale and window size, and repeat over multiple scales (maybe).
If the Harris response of the structure tensor, the determinant minus a constant times
the squared trace, is above a certain value, then this is a feature. Save.
We can technically leverage the scoring function I have below, by setting up certain values of
pixels as features, but I prefer to just implement this function.
I'm going to use a sliding window of size 5 and shift by two pixels every time.
This doesn't save much time but hey
*/
// Support functions
// Actual function
vector<Feature> FindHarrisCorners(const Mat& input, int nmsWindowSize)
{
vector<Feature> features;
Mat img = input.clone();
// Get features over a scale pyramid
// At each level of the pyramid we halve the size of the image;
// this is done SCALE_PYRAMID_LEVELS - 1 times
for (int s = 1; s < SCALE_PYRAMID_LEVELS; ++s)
{
// Halve the image size
Mat dst;
resize(img, dst, Size(), 0.5, 0.5, INTER_LINEAR);
img = dst;
// Now get features
// Compute image gradient
Mat sobel;
GaussianBlur(img, sobel, Size(HARRIS_WINDOW, HARRIS_WINDOW), 1, 1, BORDER_DEFAULT);
Mat grad_x, grad_y;
int scale = 1;
int delta = 0;
int ddepth = CV_8U; // note: unsigned 8-bit output clips negative Sobel responses to zero
Sobel(sobel, grad_x, ddepth, 1, 0, HARRIS_WINDOW, scale, delta, BORDER_DEFAULT);
Sobel(sobel, grad_y, ddepth, 0, 1, HARRIS_WINDOW, scale, delta, BORDER_DEFAULT);
// We have our x and y gradients
// Now with our window size, go over the image
// Get gaussian kernel for weighting the gradients within the window
Mat gaussKernel = Mat(HARRIS_WINDOW, HARRIS_WINDOW, CV_32F, 1);
CreateGaussianKernel(gaussKernel, 1);
int width = img.cols;
int height = img.rows;
std::vector<Feature> goodFeatures;
float avgEigen = 0.f;
// Loop over all pixels in the image, and check for Harris corners
// Except this is hideously expensive, so I'm going to skip every second pixel
for (int y = HARRIS_WINDOW / 2 + 1; y < img.rows - HARRIS_WINDOW / 2; y += 2)
{
for (int x = HARRIS_WINDOW / 2 + 1; x < img.cols - HARRIS_WINDOW / 2; x += 2)
{
int winSize = HARRIS_WINDOW / 2;
Mat M = Mat::zeros(2, 2, CV_32F);
// Go through the window around the point
// Accumulate M weighted by the kernel
// This is the gradient at the point that we will use.
// We use an accumulated gradient rather than a pointwise gradient since we are
// approximating the gradient of a "smooth" function that we only know at certain points.
for (int n = -(HARRIS_WINDOW / 2); n <= HARRIS_WINDOW / 2; ++n)
{
for (int m = -(HARRIS_WINDOW / 2); m <= (HARRIS_WINDOW / 2); ++m)
{
int i = n + y;
int j = m + x;
float w = gaussKernel.at<float>(n + (HARRIS_WINDOW / 2), m + (HARRIS_WINDOW / 2));
M.at<float>(0, 0) += w * (float)(grad_x.at<uchar>(i, j) * grad_x.at<uchar>(i, j));
M.at<float>(0, 1) += w * (float)(grad_x.at<uchar>(i, j) * grad_y.at<uchar>(i, j));
M.at<float>(1, 0) += w * (float)(grad_x.at<uchar>(i, j) * grad_y.at<uchar>(i, j));
M.at<float>(1, 1) += w * (float)(grad_y.at<uchar>(i, j) * grad_y.at<uchar>(i, j));
}
}
// Compute the harris score
// This is R = det(M) - k * (trace(M))^2
float detM = M.at<float>(0, 0) * M.at<float>(1, 1) - M.at<float>(0, 1) * M.at<float>(1, 0);
float traceM = M.at<float>(0, 0) + M.at<float>(1, 1);
float score = detM - HARRIS_CONSTANT * traceM * traceM;
// Only keep points that have a score above our threshold
if (score > HARRIS_THRESH)
{
Feature f;
f.p.x = (float)x*pow(2, s);
f.p.y = (float)y*pow(2, s);
f.score = score;
f.scale = s;
//f.saddle = detM < 0; // if < 0, one eigenvalue is positive, the other negative
features.push_back(f);
}
}
}
//Mat img_i = imread(img.filename, IMREAD_GRAYSCALE);
//Mat disp = img.clone();
//for (auto& f : features)
//{
// circle(disp, f.p, 3, (255, 255, 0), -1);
//}
// Display
//imshow("Image - best features", disp);
//waitKey(0);
}
// Apply non-maximal suppression over a greater window area.
// This is exactly the same pass as ClusterFeatures above, so just reuse it.
return ClusterFeatures(features, nmsWindowSize);
}
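/*
Example usage (illustrative sketch; the filename is an assumption, not part of this project):

    Mat img = imread("left.png", IMREAD_GRAYSCALE);
    vector<Feature> corners = FindHarrisCorners(img, 20);
    // Feature positions are reported in the original image's pixel coordinates,
    // scaled back up from whichever pyramid level they were detected at.
*/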
/*
DoH Features
Given an image, return a vector of all the Determinant of Hessian features in the image.
These are directly scored by the determinant.
This is computed over a scale space - each scale up, we 'downsample' by Gaussian blur.
We compute the Hessian matrix over each window, and get the determinant. If the determinant
(optionally normalised by the fourth power of the scale) is above a threshold, then this is a feature.
Note that descriptors are computed on the original image, NOT in the scale space
*/
bool FindDoHFeatures(Mat input, Mat mask, vector<Feature>& features)
{
// First, confirm that the mask is the same size as the image
if (mask.cols != input.cols || mask.rows != input.rows)
return false;
// Get gaussian kernel for weighting the gradients within the window
Mat gaussKernel = Mat(DOH_WINDOW, DOH_WINDOW, CV_32F, 1);
CreateGaussianKernel(gaussKernel, 1);
// We run this over an image that uses normalised pixels - that is, values between 0 and 1, representing 0-255
Mat img = Mat(input.rows, input.cols, CV_32F, 1);
Mat showImg = img.clone();
for (int y = 0; y < img.rows; ++y)
{
for (int x = 0; x < img.cols; ++x)
{
if (mask.at<uchar>(y,x) < 127)
{
showImg.at<float>(y, x) = 0;
}
else
{
showImg.at<float>(y, x) = (float)input.at<uchar>(y, x) / 255.f;
}
img.at<float>(y, x) = (float)input.at<uchar>(y, x) / 255.f;
}
}
// Iterate over scale space
float maxFeatureScore = 0;
float avgFeatureScore = 0;
for (int k = 1; k < SCALE_SPACE_ITERATIONS; ++k)
{
// blur the image
GaussianBlur(img, img, Size(DOH_WINDOW, DOH_WINDOW), 1, 1, BORDER_DEFAULT);
// Only evaluate odd iterations; the Gaussian blur above is still applied every pass
if (k % 2 == 0)
{
continue;
}
// Compute image gradient
Mat sobel = img.clone();
Mat grad_x, grad_y;
int scale = 1;
int delta = 0;
int ddepth = CV_32F;
Sobel(sobel, grad_x, ddepth, 1, 0, DOH_WINDOW, scale, delta, BORDER_DEFAULT);
Sobel(sobel, grad_y, ddepth, 0, 1, DOH_WINDOW, scale, delta, BORDER_DEFAULT);
// We have our x and y gradients
// Now with our window size, go over the image
int width = img.cols;
int height = img.rows;
float avgEigen = 0.f;
// Loop over all pixels in the image, and check for DoH features
// Except this is hideously expensive, so I'm going to skip every second pixel
for (int y = DOH_WINDOW / 2 + 1; y < img.rows - DOH_WINDOW / 2; y += 2)
{
for (int x = DOH_WINDOW / 2 + 1; x < img.cols - DOH_WINDOW / 2; x += 2)
{
// If out of masked region, ignore
if (mask.at<uchar>(y, x) < 127)
{
continue;
}
int winSize = DOH_WINDOW / 2;
Mat H = Mat::zeros(2, 2, CV_32F);
// Go through the window around the point
// Accumulate H weighted by the kernel
// This is the gradient at the point that we will use.
// We use an accumulated gradient rather than a pointwise gradient since we are
// approximating the gradient of a "smooth" function that we only know at certain points.
for (int n = -(DOH_WINDOW / 2); n <= DOH_WINDOW / 2; ++n)
{
for (int m = -(DOH_WINDOW / 2); m <= (DOH_WINDOW / 2); ++m)
{
int i = n + y;
int j = m + x;
float w = gaussKernel.at<float>(n + (DOH_WINDOW / 2), m + (DOH_WINDOW / 2));
H.at<float>(0, 0) += w * (grad_x.at<float>(i, j) * grad_x.at<float>(i, j));
H.at<float>(0, 1) += w * (grad_x.at<float>(i, j) * grad_y.at<float>(i, j));
H.at<float>(1, 0) += w * (grad_x.at<float>(i, j) * grad_y.at<float>(i, j));
H.at<float>(1, 1) += w * (grad_y.at<float>(i, j) * grad_y.at<float>(i, j));
}
}
// The gradients here are already computed on normalised (0-1) pixel values.
// Compute the DoH score: the determinant of the Hessian.
// Scale normalisation (multiplying detM by the fourth power of the scale) is currently disabled.
float detM = H.at<float>(0, 0) * H.at<float>(1, 1) - H.at<float>(0, 1) * H.at<float>(1, 0);
//float traceM = H.at<float>(0, 0) + H.at<float>(1, 1);
float score = detM; // optionally: detM * k * k * k * k
//std::cout << "score: " << score << std::endl;
// Only keep points that have a score above our threshold
if (score > DOH_THRESHOLD)
{
Feature f;
f.scale = k;
f.p.x = (float)x;
f.p.y = (float)y;
f.score = score;
features.push_back(f);
avgFeatureScore += score;
if (score > maxFeatureScore)
{
maxFeatureScore = score;
}
}
}
}
}
if (!features.empty())
avgFeatureScore /= features.size();
cout << "Average score = " << avgFeatureScore << " from " << features.size() << " features" << endl;
/*namedWindow("Image first", WINDOW_AUTOSIZE);
for (auto& f : features)
{
circle(showImg, f.p, 2, (255, 255, 0), -1);
}
imshow("Image first", showImg);
waitKey(0);*/
auto temp = ClusterFeatures(features, 20);
features.clear();
features.insert(features.end(), temp.begin(), temp.end());
return true;
}
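/*
Example usage (illustrative sketch; the filename is an assumption). The mask must match the
image size; pixels where the mask value is below 127 are ignored.

    Mat img = imread("frame.png", IMREAD_GRAYSCALE);
    Mat mask(img.rows, img.cols, CV_8U, Scalar(255)); // no masking
    vector<Feature> blobs;
    if (!FindDoHFeatures(img, mask, blobs))
        cout << "Mask size does not match image size" << endl;
*/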
/*
FAST features
Given an image, return a vector of all FAST features in the image.
In 16 defined points surrounding a pixel, visualised below, we aim to
find a sequence of N=12 or more long where the points are all above or all below
the centre point value plus or minus a given threshold.
Assumed: img is grayscale
        16   1   2
    15      +       3
14          +           4
13  +   +   p   +   +   5
12          +           6
    11      +       7
        10   9   8
The threshold I use is defined in Features.h and can be tuned.
The helper functions implement an optimisation to reject bad points faster,
and another function to black box the search for a sequential 12 or more.
*/
// Support function prototypes
bool ThreeOfFourValuesBrighterOrDarker(int i1, int i5, int i9, int i13, int pb, int p_b);
bool CheckForSequential12(std::vector<int> points, int p_b, int pb);
// Actual fast features function
bool FindFASTFeatures(Mat img, vector<Feature>& features)
{
int width = img.cols;
int height = img.rows;
// Loop over each point in the image, except for a strip of width 3 around the edge. This is so we
// avoid the cases where the pixels 3 away from the point under consideration don't exist.
// There are enough features in the main body of the image that losing any in the 3-pixel border does no harm.
for (int h = FAST_SPACING; h < height - FAST_SPACING; ++h)
{
for (int w = FAST_SPACING; w < width - FAST_SPACING; ++w)
{
// Get the upper and lower thresholds we'll use.
// Everything in the sequence must be above pb - the pixel value plus the threshold,
// or below p_b - the pixel value minus the threshold
int p = img.at<uchar>(h, w);
int pb = p + FAST_THRESHOLD;
int p_b = p - FAST_THRESHOLD;
// For a speed-up, check points 1, 9, then 5, 13 first.
// At least three of 1, 5, 9, 13 must be all brighter than pb or all darker than p_b;
// if not, then this is not a corner.
// This just quickly skips many points and is not strictly necessary
int i1 = img.at<uchar>(h - FAST_SPACING, w);
int i5 = img.at<uchar>(h, w + FAST_SPACING);
int i9 = img.at<uchar>(h + FAST_SPACING, w);
int i13 = img.at<uchar>(h, w - FAST_SPACING);
if (!ThreeOfFourValuesBrighterOrDarker(i1, i5, i9, i13, pb, p_b))
{
continue;
}
else {
// Now check the rest
// need 12 or more sequential values above or below
// First, get all the values
int i2 = img.at<uchar>(h - FAST_SPACING, w + 1);
int i3 = img.at<uchar>(h - 2, w + 2);
int i4 = img.at<uchar>(h - 1, w + FAST_SPACING);
int i6 = img.at<uchar>(h + 1, w + FAST_SPACING);
int i7 = img.at<uchar>(h + 2, w + 2);
int i8 = img.at<uchar>(h + FAST_SPACING, w + 1); // points 8 and 10 sit either side of 9, keeping the circle in clockwise order
int i10 = img.at<uchar>(h + FAST_SPACING, w - 1);
int i11 = img.at<uchar>(h + 2, w - 2);
int i12 = img.at<uchar>(h + 1, w - FAST_SPACING);
int i14 = img.at<uchar>(h - 1, w - FAST_SPACING);
int i15 = img.at<uchar>(h - 2, w - 2);
int i16 = img.at<uchar>(h - FAST_SPACING, w - 1);
std::vector<int> points{ i1, i2, i3, i4, i5, i6, i7, i8, i9, i10, i11, i12, i13, i14, i15, i16 };
// Pass values into evaluation function
if (!CheckForSequential12(points, p_b, pb))
{
continue;
}
// It worked! We have a feature. Record this point in our vector
Feature feature;
feature.p.x = (float)w;
feature.p.y = (float)h;
features.push_back(feature);
}
}
}
return true;
}
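/*
Example (illustrative sketch): visualising the raw FAST candidates. The filename and window
name are assumptions. Note these candidates are unscored; ScoreAndClusterFeatures below is
normally run on them afterwards.

    Mat img = imread("frame.png", IMREAD_GRAYSCALE);
    vector<Feature> candidates;
    FindFASTFeatures(img, candidates);
    Mat disp = img.clone();
    for (auto& f : candidates)
        circle(disp, f.p, 3, Scalar(255), 1);
    imshow("FAST candidates", disp);
    waitKey(0);
*/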
/*
If three of the four i values are all brighter than pb or darker than p_b, return true.
Else, return false
*/
bool ThreeOfFourValuesBrighterOrDarker(int i1, int i5, int i9, int i13, int pb, int p_b)
{
// Fast fail
// If both i1 and i9 lie within [p_b, pb] then we do not have a corner
if ((p_b < i1 && i1 < pb) && (p_b < i9 && i9 < pb))
{
return false;
}
else if ((p_b < i5 && i5 < pb) && (p_b < i13 && i13 < pb))
{
return false;
}
else
{
int above_pb = 0;
int below_p_b = 0;
above_pb += i1 > pb ? 1 : 0;
above_pb += i5 > pb ? 1 : 0;
above_pb += i9 > pb ? 1 : 0;
above_pb += i13 > pb ? 1 : 0;
if (above_pb >= 3)
{
return true;
}
else {
below_p_b += i1 < p_b ? 1 : 0;
below_p_b += i5 < p_b ? 1 : 0;
below_p_b += i9 < p_b ? 1 : 0;
below_p_b += i13 < p_b ? 1 : 0;
if (below_p_b >= 3)
{
return true;
}
}
}
return false;
}
// Helper functions for FAST features
bool greaterthan(int i, int pb, int p_b)
{
return i > pb;
}
bool lessthan(int i, int pb, int p_b)
{
return i < p_b;
}
/*
If there is a sequence of i values that are all above pb or below p_b, return true.
Else, return false.
*/
bool CheckForSequential12(std::vector<int> points, int p_b, int pb)
{
// Do we try to do this intelligently or just brute force?
// For each in the list
// if it's above or below
// Search front and back until we find a break
// count the sequence length
assert(pb > p_b);
// Yes, there are smarter ways to do this. No, I don't care right now.
int p = (pb + p_b) / 2;
bool(*comp)(int, int, int);
for (int i = 0; i < (int)points.size(); ++i)
{
if (points[i] > pb)
{
comp = &greaterthan;
}
else if (points[i] < p_b)
{
comp = &lessthan;
}
else {
continue;
}
// Now loop over the rest of the sequence, forward and backward,
// until both sides return false
// Forward loop
int fLen = 0;
int fJ = 0;
for (fJ = i + 1; fJ != i; ++fJ)
{
// quit when we get back to i
if (fJ == 16)
fJ = 0;
if (fJ == i)
break;
if (comp(points[fJ], pb, p_b))
fLen++;
else
break;
}
fJ--;
int bLen = 0;
int bJ = 0;
for (int bJ = i - 1; bJ != i && bJ != fJ; --bJ)
{
// quit when we get back to i
if (bJ == -1)
bJ = 15;
if (bJ == i || bJ == fJ)
break;
if (comp(points[bJ], pb, p_b))
bLen++;
else
break;
}
int seqLen = fLen + bLen + 1;
assert(seqLen <= 16);
if (seqLen >= 12)
{
return true;
}
}
return false;
}
// Unit Tests for the above
void TestSequential12(void)
{
// Create some data for sequential 12 and confirm that it actually does what it should
int pb = 1;
int p_b = 0;
std::vector<int> p1{ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
// all points lie within [p_b, pb], so this should NOT detect a corner
assert(!CheckForSequential12(p1, p_b, pb));
p_b = 1;
pb = 3;
vector<int> p2{ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
// all 16 points are below p_b, so this should detect a corner
assert(CheckForSequential12(p2, p_b, pb));
p_b = 30;
pb = 90;
// pass, meaning there is a 12 or more
vector<int> p3{ 0, 91, 0, 91, 91, 91, 91, 91, 91, 91, 91, 91, 91, 91, 91, 0 };
assert(CheckForSequential12(p3, p_b, pb));
// fail
vector<int> p4{ 0, 91, 0, 0, 91, 91, 91, 91, 91, 91, 91, 91, 91, 91, 91, 0 };
assert(!CheckForSequential12(p4, p_b, pb));
// pass
vector<int> p5{ 91, 91, 0, 91, 0, 91, 91, 91, 91, 91, 91, 91, 91, 91, 91, 91 };
assert(CheckForSequential12(p5, p_b, pb));
// fail
vector<int> p6{ 0, 61, 0, 0, 61, 61, 61, 61, 61, 61, 61, 61, 61, 61, 61, 0 };
assert(!CheckForSequential12(p6, p_b, pb));
// pass
vector<int> p7{ 0, 0, 0, 91, 0, 91, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 };
assert(CheckForSequential12(p7, p_b, pb));
// fail
vector<int> p8{ 0, 91, 0, 0, 0, 0, 0, 0, 0, 0, 0, 91, 91, 91, 91, 0 };
assert(!CheckForSequential12(p8, p_b, pb));
}
/*
Feature Scoring
We loop over the list of features supplied and construct a value for each
based on the Shi-Tomasi score.
Any features below the cut-off are removed.
The Shi Tomasi score is explained here: https://aishack.in/tutorials/harris-corner-detector/
Then we do a second pass, and if there are tight groups of features,
we cull everything but the one with the highest score in the group.
This is the Non-Maximal Suppression.
The Shi-Tomasi score uses the minimum eigenvalue of the matrix
[ I_x^2     I_x*I_y ]
[ I_x*I_y   I_y^2   ]
where I_x is the derivative in X of the image i at x,y.
We compute the derivatives over a window of size ST_WINDOW centred on the point,
and use a Gaussian kernel to weight all the values' contributions to the derivative.
Parameters:
- There is a cutoff value for the Shi-Tomasi corner detector
- Window size for deformation matrix
*/
// Support function
bool FeatureCompare(Feature a, Feature b)
{
return a.score > b.score;
}
// Actual function
std::vector<Feature> ScoreAndClusterFeatures(
const Mat& img,
vector<Feature>& features,
float scoreThreshold,
float distanceForWithinCluster)
{
// let's cheat and use opencv to compute the sobel derivative, window size 3,
// over the whole image
// lol this doesn't actually save us much time but whatevs, I know how to implement this.
// here's an explanation if you don't know the theory - https://en.wikipedia.org/wiki/Sobel_operator
// Basically this gets the gradients at all points over the image, which we use for the derivative of the "image function"
Mat sobel;
GaussianBlur(img, sobel, Size(ST_WINDOW, ST_WINDOW), 1, 1, BORDER_DEFAULT);
Mat grad_x, grad_y;
int scale = 1;
int delta = 0;
int ddepth = CV_8U;
Sobel(sobel, grad_x, ddepth, 1, 0, ST_WINDOW, scale, delta, BORDER_DEFAULT);
Sobel(sobel, grad_y, ddepth, 0, 1, ST_WINDOW, scale, delta, BORDER_DEFAULT);
// We have our x and y gradients
// Now with our window size, go over the image
// Get gaussian kernel for weighting the gradients within the window
Mat gaussKernel = Mat(ST_WINDOW, ST_WINDOW, CV_32F, 1);
CreateGaussianKernel(gaussKernel, 1);
int width = img.cols;
int height = img.rows;
int numFeatures = (int)features.size();
std::vector<Feature> goodFeatures;
float avgEigen = 0.f;
// Loop over all features in the given list to score them
for (int i = 0; i < numFeatures; ++i)
{
auto& f = features[i];
int winSize = ST_WINDOW / 2;
Mat M = Mat::zeros(2, 2, CV_32F);
// Go through the window around the feature
// Accumulate M weighted by the kernel
// This is the gradient at the feature point that we will use.
// We use an accumulated gradient rather than a pointwise gradient since we are
// approximating the gradient of a "smooth" function that we only know at certain points.
for (int n = -(ST_WINDOW / 2); n <= ST_WINDOW / 2; ++n)
{
for (int m = -(ST_WINDOW / 2); m <= (ST_WINDOW / 2); ++m)
{
int i = n + (int)f.p.y;
int j = m + (int)f.p.x;
float w = gaussKernel.at<float>(n + (ST_WINDOW / 2), m + (ST_WINDOW / 2));
M.at<float>(0, 0) += w * (float)(grad_x.at<uchar>(i, j) * grad_x.at<uchar>(i, j));
M.at<float>(0, 1) += w * (float)(grad_x.at<uchar>(i, j) * grad_y.at<uchar>(i, j));
M.at<float>(1, 0) += w * (float)(grad_x.at<uchar>(i, j) * grad_y.at<uchar>(i, j));
M.at<float>(1, 1) += w * (float)(grad_y.at<uchar>(i, j) * grad_y.at<uchar>(i, j));
}
}
// Compute the eigenvalues of M
// so the equation is
// (I_x squared - E)(I_y squared - E) - I_xy squared, solve for two solutions of e
// See the ai shack link above for the equation written nicely
float a = 1.f; // yeah, unnecessary, just for show
float b = -1 * (M.at<float>(0, 0) + M.at<float>(1, 1));
float c = M.at<float>(0, 0)*M.at<float>(1, 1) - M.at<float>(1, 0)*M.at<float>(0, 1);
float eigen1 = (-b + sqrt(b*b - 4 * a*c)) / (2 * a); // note the parentheses: divide by 2a, not multiply by a
float eigen2 = (-b - sqrt(b*b - 4 * a*c)) / (2 * a);
float minEigenvalue = min(eigen1, eigen2);
f.score = minEigenvalue;
avgEigen += f.score;
// Only keep features that have a score above our threshold
if (f.score > scoreThreshold)
{
goodFeatures.push_back(f);
}
}
// Perform non-maximal suppression over a window around each feature:
// if there is another feature within distanceForWithinCluster pixels (in x and y)
// with a higher score, remove this one
vector<Feature> temp;
for (unsigned int n = 0; n < goodFeatures.size(); ++n)
{
auto& f = goodFeatures[n];
bool thisFeatureIsTheMaximum = true;
for (int i = 0; i < goodFeatures.size(); ++i)
{
if (i == n)
continue;
auto& f2 = goodFeatures[i];
int xmargin = (int)abs(f.p.x - f2.p.x);
int ymargin = (int)abs(f.p.y - f2.p.y);
if (xmargin <= distanceForWithinCluster && ymargin <= distanceForWithinCluster)
{
if (f.score < f2.score)
{
thisFeatureIsTheMaximum = false;
break;
}
}
}
if (thisFeatureIsTheMaximum)
{
temp.push_back(f);
}
}
goodFeatures = temp;
// Sort features
sort(goodFeatures.begin(), goodFeatures.end(), FeatureCompare);
return goodFeatures;
}
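/*
Example pipeline (illustrative sketch; the threshold and cluster-distance values here are
made-up numbers, not constants from Features.h):

    Mat img = imread("frame.png", IMREAD_GRAYSCALE);
    vector<Feature> candidates;
    FindFASTFeatures(img, candidates);
    vector<Feature> best = ScoreAndClusterFeatures(img, candidates, 1000.f, 5.f);
    // 'best' is sorted by descending Shi-Tomasi score
*/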
/*
Feature Description
Create SIFT descriptors for each feature given.
https://aishack.in/tutorials/sift-scale-invariant-feature-transform-features/
First, we use the SIFT method of computing the orientation of each feature point.
Every subsequent orientation, like the gradients below, is taken relative to this
to ensure invariance to feature rotation.
In a 16x16 window around the feature, we create 16 4x4 windows.
In each window, we create an 8 bin histogram for gradient orientation, weighting
each bin entry with the magnitude of the added vector. These entries are also weighted
by a gaussian function based on distance from the centre.
Then these are all put into the one big 128-long vector.
The vector is normalised, each entry clamped at 0.2 to limit the effect of illumination changes, then normalised again
(https://en.wikipedia.org/wiki/Scale-invariant_feature_transform#Keypoint_descriptor)
*/
// Support functions
template <typename T>
float L2_norm(vector<T> v)
{
T norm = (T)0;
for (unsigned int i = 0; i < v.size(); ++i)
{
norm += v[i] * v[i];
}
return sqrt(norm);
}
template <typename T>
void NormaliseVector(std::vector<T>& v)
{
float s = L2_norm(v);
if (s == 0.f)
return; // avoid dividing an all-zero vector by zero
for (unsigned int i = 0; i < v.size(); ++i)
{
v[i] /= s;
}
}
void ComputeFeatureOrientation(Feature& feature, Mat xgrad, Mat ygrad);
// Actual function
bool CreateSIFTDescriptors(cv::Mat img, std::vector<Feature>& features, std::vector<FeatureDescriptor>& descriptors)
{
// Smooth the image with a Gaussian first and get gradients
Mat smoothed;
GaussianBlur(img, smoothed, Size(ST_WINDOW, ST_WINDOW), 1, 1, BORDER_DEFAULT);
Mat grad_x, grad_y;
int scale = 1;
int delta = 0;
int ddepth = CV_8U;
Sobel(smoothed, grad_x, ddepth, 1, 0, ST_WINDOW, scale, delta, BORDER_DEFAULT);
Sobel(smoothed, grad_y, ddepth, 0, 1, ST_WINDOW, scale, delta, BORDER_DEFAULT);
// Construct a Gaussian kernel for weighting descriptor entries
Mat gaussKernel = Mat(DESC_SUB_WINDOW, DESC_SUB_WINDOW, CV_32F, 1);
CreateGaussianKernel(gaussKernel, 1);
// For each feature
for (unsigned int i = 0; i < features.size(); ++i)
{
auto& f = features[i];
// Get feature orientation
ComputeFeatureOrientation(f, grad_x, grad_y);
// Over a 16x16 window, iterate over 4x4 blocks
// For each block, compute the histogram
// Weight the histogram
// Add these to the vector
int vecEntryIndex = 0;
// I'm supposed to interpolate here and use sub-pixel values cos otherwise the feature
// point isn't aligned with the centre.
// Instead of interpolating, we're just going to create the window with
// the feature at 8,8. It'll work as an approximation
for (int j = 0; j < DESC_WINDOW; j += DESC_SUB_WINDOW)
{
for (int k = 0; k < DESC_WINDOW; k += DESC_SUB_WINDOW)
{
float hist[DESC_BINS] = {0.0f};
// For each 4x4 block
for (int n = j; n < j+DESC_SUB_WINDOW; ++n)
{
for (int m = k; m < k + DESC_SUB_WINDOW; ++m)
{
int imgX = (int)f.p.x - (DESC_WINDOW / 2) + m;
int imgY = (int)f.p.y - (DESC_WINDOW / 2) + n;
// Ensure that window stays within bounds of image. xgrad and ygrad have the same size
if (imgY < 0 || imgY >= grad_x.rows)
continue;
if (imgX < 0 || imgX >= grad_x.cols)
continue;
// Get angle and magnitude of gradient at this point, and add
// into the histogram at the right bin
float gX = (float)grad_x.at<uchar>(imgY, imgX);
float gY = (float)grad_y.at<uchar>(imgY, imgX);
float mag = sqrt(gX*gX + gY * gY);
float angle = 0.f;
if (gX != 0)
angle = RAD2DEG(atan(gY / gX));
else
angle = 90;
// Make the angle relative to the feature's dominant orientation.
// f.angle is stored in radians (see ComputeFeatureOrientation), so convert it first,
// then wrap the result into [0, 360) so the histogram bins stay circular
angle -= RAD2DEG(f.angle);
while (angle < 0)
angle += 360;
if (angle >= 360)
angle = (float)((int)angle % 360);
hist[(int)angle / DESC_BIN_SIZE] += mag * gaussKernel.at<float>(j/DESC_SUB_WINDOW,k/DESC_SUB_WINDOW);
}
}
// add this histogram to the feature vector
for (int index = 0; index < DESC_BINS; ++index)
{
f.desc.vec[vecEntryIndex] = hist[index];
vecEntryIndex++;
}
}
}
// Once the vector is created, we normalise it
vector<float> descVec(std::begin(f.desc.vec), std::end(f.desc.vec));
NormaliseVector(descVec);
// Confirm that the descriptor size is 128
if (descVec.size() != DESC_LENGTH)
{
std::cout << "Error: feature vector length = " << descVec.size() << std::endl;
continue;
}
// Cap every entry to 0.2 max, to remove illumination dependence
for (unsigned int j = 0; j < descVec.size(); ++j)
{
if (descVec[j] > ILLUMINANCE_BOUND)
{
descVec[j] = ILLUMINANCE_BOUND;
}
}
// Renormalise
NormaliseVector(descVec);
// Put back in the array
std::copy(descVec.begin(), descVec.end(), f.desc.vec);
descriptors.push_back(f.desc);
}
return true;
}
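/*
Example (illustrative sketch): describing the scored features and comparing two descriptors
with a squared L2 distance. FeatureDescriptor::vec is assumed to be an array of DESC_LENGTH
floats, as the code above implies; indexing descriptors[0] and descriptors[1] assumes at
least two features were described.

    vector<FeatureDescriptor> descriptors;
    CreateSIFTDescriptors(img, best, descriptors);

    float dist = 0.f;
    for (int i = 0; i < DESC_LENGTH; ++i)
    {
        float d = descriptors[0].vec[i] - descriptors[1].vec[i];
        dist += d * d;
    }
    // smaller dist means more similar descriptors
*/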
/*
Compute feature orientation.
This is a window around the feature of size dependent on the feature scale (to come later).
For now, we'll say a 9x9 window.
There are 36 bins in the angle histogram, entries weighted by magnitude and by gaussian.
*/
void ComputeFeatureOrientation(Feature& feature, Mat xgrad, Mat ygrad)
{
// Get the Gaussian weighting function. Ideally sigma would be 1.5 times the feature scale;
// for now we just use sigma = 1 (matching the call below)
Mat gaussKernel = Mat(ANGLE_WINDOW, ANGLE_WINDOW, CV_32F, 1);
CreateGaussianKernel(gaussKernel, 1);
// Create histogram
float hist[ORIENTATION_HIST_BINS] = { 0.0f };
for (int n = -(ANGLE_WINDOW / 2); n <= ANGLE_WINDOW / 2; ++n)
{
for (int m = -(ANGLE_WINDOW / 2); m <= (ANGLE_WINDOW / 2); ++m)
{
// Compute magnitude and angle and add to histogram
int i = n + (int)feature.p.y;
int j = m + (int)feature.p.x;
// Ensure that window stays within bounds of image. xgrad and ygrad have the same size
if (i < 0 || i >= xgrad.rows)
continue;
if (j < 0 || j >= xgrad.cols)
continue;
// Get the angle and the magnitude of the gradient at this point, and
// add it into the histogram at the right bin
float gX = (float)xgrad.at<uchar>(i,j);
float gY = (float)ygrad.at<uchar>(i,j);
float mag = sqrt(gX*gX + gY* gY);
float angle = 0.f;
if (gX != 0)
angle = RAD2DEG(atan(gY / gX));
else
angle = 90;
hist[(int)(angle / 10)] += mag * gaussKernel.at<float>(n+(ANGLE_WINDOW/2), m+(ANGLE_WINDOW/2));
}
}
// Find the dominant bin in the histogram
// and set the feature's angle to that bin's orientation, in radians
float maxBinValue = 0;
for (int i = 0; i < ORIENTATION_HIST_BINS; ++i)
{
if (hist[i] > maxBinValue)
{
maxBinValue = hist[i];
feature.angle = DEG2RAD(i*10.f);
}
}
}
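/*
Worked example for the orientation histogram above (numbers are illustrative only):
a gradient of gX = 3, gY = 4 has magnitude sqrt(3*3 + 4*4) = 5 and angle
atan(4/3) ~ 53.1 degrees, so it adds 5 (times its Gaussian weight) to bin
(int)(53.1 / 10) = 5. The bin with the largest accumulated weight then sets the
feature's dominant orientation.
*/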
/*
Match features
We only call two features a match if they are sufficiently close
and they pass the Lowe ratio test - the next closest feature's distance to the closest