Random forest options for lgn etc and progress and gpu deep net cnn f… #2

Open · wants to merge 1 commit into base: master
194 changes: 194 additions & 0 deletions ClassifyMembranes/predict_gpu_randomforest_2class.py
@@ -0,0 +1,194 @@
############################################################
# GPU Implementation of Random Forest Classifier - Prediction
# v0.1
# Seymour Knowles-Barley
############################################################
# Based on C code from:
# http://code.google.com/p/randomforest-matlab/
# License: GPLv2
############################################################

import numpy as np
import os
import sys
import h5py
import glob
import mahotas

import pycuda.autoinit
import pycuda.driver as cu
import pycuda.compiler as nvcc
import pycuda.gpuarray as gpuarray

gpu_randomforest_predict_source = """
#define NODE_TERMINAL -1
#define NODE_TOSPLIT -2
#define NODE_INTERIOR -3

__global__ void predictKernel(const float *x, int n, int mdim, const int *treemap,
                              const int *nodestatus, const float *xbestsplit,
                              const int *bestvar, const int *nodeclass,
                              int nclass,
                              int ntree, int *countts, int maxTreeSize)
                              //int *jts,
                              //int *nodex,
{
    int idx = threadIdx.x + blockDim.x * (blockIdx.x + gridDim.x * blockIdx.y);

    //Make sure we don't overrun
    if (idx < n) {
        int m, k, treei, treeOffset1, treeOffset2;

        //Repeat for each tree - this way only one thread writes to any point in the vote output array
        for (treei = 0; treei < ntree; ++treei) {
            treeOffset1 = treei*maxTreeSize;
            treeOffset2 = treei*2*maxTreeSize;
            k = 0;

            while (nodestatus[treeOffset1 + k] != NODE_TERMINAL) {
                m = bestvar[treeOffset1 + k] - 1;
                //Split by a numerical predictor
                k = (x[idx + n * m] <= xbestsplit[treeOffset1 + k]) ?
                    treemap[treeOffset2 + k * 2] - 1 : treemap[treeOffset2 + 1 + k * 2] - 1;
            }
            //We found the terminal node: assign class label
            //jts[chunki + treei] = nodeclass[treeOffset + k];
            //nodex[chunki + treei] = k + 1;
            countts[idx * nclass + nodeclass[treeOffset1 + k] - 1] += 1;
        }
    }
}
"""

# forest_file = 'D:\\dev\\datasets\\LGN1\\autoSeg\\IlasticExportViews\\joshm\\rhoana_forest_2class.h5'
# input_image_folder = 'D:\\dev\\datasets\\LGN1\\autoSeg\\IlasticExportViews\\joshm\\classifyds2\\'
# input_image_suffix = '.tif'
# input_features_suffix = '_rhoana_features.h5'
# output_folder = 'D:\\dev\\datasets\\LGN1\\autoSeg\\IlasticExportViews\\joshm\\classifyds2\\output\\'

# forest_file = 'D:\\dev\\Rhoana\\classifierTraining\\autoencoder_test\\autoencoder_forest_2class.h5'
# input_image_folder = 'D:\\dev\\Rhoana\\classifierTraining\\autoencoder_test\\'
# input_image_suffix = '.tif'
# input_features_suffix = '_autoencoder_features.h5'
# output_folder = 'D:\\dev\\Rhoana\\classifierTraining\\autoencoder_test\\autoencoder_output\\'

# forest_file = 'D:\\dev\\Rhoana\\classifierTraining\\autoencoder_test\\autoencoder_nosig_forest_2class.h5'
# input_image_folder = 'D:\\dev\\Rhoana\\classifierTraining\\autoencoder_test\\'
# input_image_suffix = '.tif'
# input_features_suffix = '_autoencoder_nosig_features.h5'
# output_folder = 'D:\\dev\\Rhoana\\classifierTraining\\autoencoder_test\\autoencoder_nosig_output\\'

forest_file = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\training2_auto1\\auto1_forest_3class.hdf5'
input_image_folder = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\original'
input_image_suffix = '.tif'
input_features_suffix = '_autoencoder_features.h5'
output_folder = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\training2_auto1\\output\\'


# Load the forest settings

model = h5py.File(forest_file, 'r')


# Prep the gpu function
gpu_predict = nvcc.SourceModule(gpu_randomforest_predict_source).get_function('predictKernel')

d_treemap = gpuarray.to_gpu(model['/forest/treemap'][...])
d_nodestatus = gpuarray.to_gpu(model['/forest/nodestatus'][...])
d_xbestsplit = gpuarray.to_gpu(model['/forest/xbestsplit'][...])
d_bestvar = gpuarray.to_gpu(model['/forest/bestvar'][...])
d_nodeclass = gpuarray.to_gpu(model['/forest/nodeclass'][...])
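# Note: the kernel expects int32 / float32 arrays; the HDF5 forest file is
# assumed to already store the tree arrays in those dtypes (gpuarray.to_gpu
# keeps whatever dtype the dataset has).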

# Forest dimensions: nrnodes is the maximum number of nodes per tree
# (maxTreeSize in the kernel), ntree the number of trees, nclass the number of classes.
nrnodes = int(model['/forest/nrnodes'][...])
ntree = int(model['/forest/ntree'][...])
nclass = int(model['/forest/nclass'][...])


files = sorted( glob.glob( input_image_folder + '\\*' + input_image_suffix ) )

print 'Found {0} images to classify.'.format(len(files))

for file in files:
    features_file = file.replace(input_image_suffix, input_features_suffix)

    # Load the features
    f = h5py.File(features_file, 'r')

    nfeatures = len(f.keys())
    image_shape = f[f.keys()[0]].shape
    fshape = (nfeatures, image_shape[0] * image_shape[1])
    features = np.zeros(fshape, dtype=np.float32)

    # One image per feature, raveled into the rows of a (nfeatures, npixels)
    # matrix; the kernel reads feature m of pixel idx as x[idx + n * m]
    for i,k in enumerate(f.keys()):
        features[i,:] = f[k][...].ravel()


    # Predict

    out_votes = np.zeros((image_shape[0], image_shape[1], nclass), dtype=np.int32)
    d_votes = gpuarray.to_gpu(out_votes)

    d_features = gpuarray.to_gpu(features)

    block = (64, 1, 1)
    grid = (1024, int(fshape[1] / block[0] / 1024 + 1))
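    # One thread per pixel: 64 threads per block and a 2-D grid with 1024
    # blocks in x, sized so that 64 * 1024 * grid_y covers all fshape[1] pixels.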

    gpu_predict(d_features, np.int32(fshape[1]), np.int32(fshape[0]),
                d_treemap, d_nodestatus, d_xbestsplit, d_bestvar, d_nodeclass,
                np.int32(nclass), np.int32(ntree), d_votes, np.int32(nrnodes),
                grid=grid, block=block)


    # Save / display results

    votes = d_votes.get()

    del d_votes
    del d_features

    prob_image = np.float32(votes) / ntree

    output_image_basename = file.replace(input_image_folder, output_folder)

    for classi in range(nclass):
        output_image_file = output_image_basename.replace(input_image_suffix, '_class{0}.png'.format(classi + 1))
        mahotas.imsave(output_image_file, np.uint8(prob_image[:,:,classi] * 255))

    if (nclass == 2):
        color_image = np.zeros((prob_image.shape[0], prob_image.shape[1], 3), dtype=np.float32)
        color_image[:,:,0] = prob_image[:,:,0]
        color_image[:,:,1] = prob_image[:,:,1]
        color_image[:,:,2] = prob_image[:,:,0]

        output_image_file = output_image_basename.replace(input_image_suffix, '_allclass.png')
        mahotas.imsave(output_image_file, np.uint8(color_image * 255))

        win_0 = prob_image[:,:,0] > prob_image[:,:,1]
        win_1 = np.logical_not(win_0)

        win_image = color_image
        win_image[:,:,0] = win_0 * 255
        win_image[:,:,1] = win_1 * 255
        win_image[:,:,2] = win_0 * 255

        output_image_file = output_image_basename.replace(input_image_suffix, '_winclass.png')
        mahotas.imsave(output_image_file, np.uint8(win_image))

    output_path = output_image_basename.replace(input_image_suffix, '_probabilities.hdf5')
    temp_path = output_path + '_tmp'
    out_hdf5 = h5py.File(temp_path, 'w')
    # copy the probabilities for future use
    probs_out = out_hdf5.create_dataset('probabilities',
                                        data = prob_image,
                                        chunks = (64,64,1),
                                        compression = 'gzip')
    out_hdf5.close()

    # Write to a temporary file first, then move it into place
    if os.path.exists(output_path):
        os.unlink(output_path)
    os.rename(temp_path, output_path)

    print '{0} done.'.format(file)
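

# ----------------------------------------------------------------------------
# Example (for reference, not executed here): reading a saved probability
# volume back, assuming the '<image>_probabilities.hdf5' layout written above.
#
#   import h5py
#   with h5py.File(output_path, 'r') as h:
#       prob = h['probabilities'][...]   # (rows, cols, nclass) float32 in [0, 1]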
176 changes: 176 additions & 0 deletions ClassifyMembranes/predict_gpu_randomforest_3class.py
@@ -0,0 +1,176 @@
############################################################
# GPU Implementation of Random Forest Classifier - Prediction
# v0.1
# Seymour Knowles-Barley
############################################################
# Based on C code from:
# http://code.google.com/p/randomforest-matlab/
# License: GPLv2
############################################################

import numpy as np
import os
import sys
import h5py
import glob
import mahotas

import pycuda.autoinit
import pycuda.driver as cu
import pycuda.compiler as nvcc
import pycuda.gpuarray as gpuarray

gpu_randomforest_predict_source = """
#define NODE_TERMINAL -1
#define NODE_TOSPLIT -2
#define NODE_INTERIOR -3

__global__ void predictKernel(const float *x, int n, int mdim, const int *treemap,
                              const int *nodestatus, const float *xbestsplit,
                              const int *bestvar, const int *nodeclass,
                              int nclass,
                              int ntree, int *countts, int maxTreeSize)
                              //int *jts,
                              //int *nodex,
{
    int idx = threadIdx.x + blockDim.x * (blockIdx.x + gridDim.x * blockIdx.y);

    //Make sure we don't overrun
    if (idx < n) {
        int m, k, treei, treeOffset1, treeOffset2;

        //Repeat for each tree - this way only one thread writes to any point in the vote output array
        for (treei = 0; treei < ntree; ++treei) {
            treeOffset1 = treei*maxTreeSize;
            treeOffset2 = treei*2*maxTreeSize;
            k = 0;

            while (nodestatus[treeOffset1 + k] != NODE_TERMINAL) {
                m = bestvar[treeOffset1 + k] - 1;
                //Split by a numerical predictor
                k = (x[idx + n * m] <= xbestsplit[treeOffset1 + k]) ?
                    treemap[treeOffset2 + k * 2] - 1 : treemap[treeOffset2 + 1 + k * 2] - 1;
            }
            //We found the terminal node: assign class label
            //jts[chunki + treei] = nodeclass[treeOffset + k];
            //nodex[chunki + treei] = k + 1;
            countts[idx * nclass + nodeclass[treeOffset1 + k] - 1] += 1;
        }
    }
}
"""

# forest_file = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\training2\\rhoana_forest_3class.hdf5'
# input_image_folder = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\all'
# input_image_suffix = '_labeled.png'
# input_features_suffix = '.hdf5'
# output_folder = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\output2\\'

forest_file = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\training2_auto1\\auto1_forest_3class.hdf5'
input_image_folder = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\original'
input_image_suffix = '.tif'
input_features_suffix = '_autoencoder_features.h5'
output_folder = 'D:\\dev\\Rhoana\\classifierTraining\\Miketraining\\training2_auto1\\output\\'

# Load the forest settings

model = h5py.File(forest_file, 'r')


# Prep the gpu function
gpu_predict = nvcc.SourceModule(gpu_randomforest_predict_source).get_function('predictKernel')

d_treemap = gpuarray.to_gpu(model['/forest/treemap'][...])
d_nodestatus = gpuarray.to_gpu(model['/forest/nodestatus'][...])
d_xbestsplit = gpuarray.to_gpu(model['/forest/xbestsplit'][...])
d_bestvar = gpuarray.to_gpu(model['/forest/bestvar'][...])
d_nodeclass = gpuarray.to_gpu(model['/forest/nodeclass'][...])

nrnodes = int(model['/forest/nrnodes'][...])
ntree = int(model['/forest/ntree'][...])
nclass = int(model['/forest/nclass'][...])


files = sorted( glob.glob( input_image_folder + '\\*' + input_image_suffix ) )

print 'Found {0} images to classify.'.format(len(files))

for file in files:
    features_file = file.replace(input_image_suffix, input_features_suffix)

    # Load the features
    f = h5py.File(features_file, 'r')

    nfeatures = len(f.keys())
    image_shape = f[f.keys()[0]].shape
    fshape = (nfeatures, image_shape[0] * image_shape[1])
    features = np.zeros(fshape, dtype=np.float32)

    for i,k in enumerate(f.keys()):
        features[i,:] = f[k][...].ravel()


    # Predict

    out_votes = np.zeros((image_shape[0], image_shape[1], nclass), dtype=np.int32)
    d_votes = gpuarray.to_gpu(out_votes)

    d_features = gpuarray.to_gpu(features)

    block = (64, 1, 1)
    grid = (1024, int(fshape[1] / block[0] / 1024 + 1))

    gpu_predict(d_features, np.int32(fshape[1]), np.int32(fshape[0]),
                d_treemap, d_nodestatus, d_xbestsplit, d_bestvar, d_nodeclass,
                np.int32(nclass), np.int32(ntree), d_votes, np.int32(nrnodes),
                grid=grid, block=block)


    # Save / display results

    votes = d_votes.get()

    del d_votes
    del d_features

    prob_image = np.float32(votes) / ntree

    output_image_basename = file.replace(input_image_folder, output_folder)

    # for classi in range(nclass):
    #     output_image_file = output_image_basename.replace(input_image_suffix, '_class{0}.png'.format(classi + 1))
    #     mahotas.imsave(output_image_file, np.uint8(prob_image[:,:,classi] * 255))

    output_image_file = output_image_basename.replace(input_image_suffix, '_allclass.png')
    mahotas.imsave(output_image_file, np.uint8(prob_image * 255))

    win_0 = np.logical_and(prob_image[:,:,0] > prob_image[:,:,1], prob_image[:,:,0] > prob_image[:,:,2])
    win_2 = np.logical_and(prob_image[:,:,2] > prob_image[:,:,0], prob_image[:,:,2] > prob_image[:,:,1])
    win_1 = np.logical_not(np.logical_or(win_0, win_2))
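    # Note: this is a per-pixel argmax over the three class probabilities, with
    # ties assigned to the middle class (index 1). A near-equivalent (differing
    # only on ties) would be:
    #   winner = np.argmax(prob_image, axis=2)
    #   win_0, win_1, win_2 = (winner == 0), (winner == 1), (winner == 2)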

    win_image = prob_image
    win_image[:,:,0] = win_0 * 255
    win_image[:,:,1] = win_1 * 255
    win_image[:,:,2] = win_2 * 255

    output_image_file = output_image_basename.replace(input_image_suffix, '_winclass.png')
    mahotas.imsave(output_image_file, np.uint8(win_image))

    output_path = output_image_basename.replace(input_image_suffix, '_probabilities.hdf5')
    temp_path = output_path + '_tmp'
    out_hdf5 = h5py.File(temp_path, 'w')
    # copy the probabilities for future use
    probs_out = out_hdf5.create_dataset('probabilities',
                                        data = prob_image,
                                        chunks = (64,64,1),
                                        compression = 'gzip')
    out_hdf5.close()

    if os.path.exists(output_path):
        os.unlink(output_path)
    os.rename(temp_path, output_path)

    print '{0} done.'.format(file)