add feature extraction

9 years ago · 391596a1b2
parent 9fdc78a302
commit 391596a1b2
10 changed files with 564 additions and 149 deletions
--- a/modules/cnn_3dobj/README.md
+++ b/modules/cnn_3dobj/README.md
@ -12,8 +12,10 @@ $ mkdir build
 $ cd build
 $ cmake ..
 $ make
-$ ./sphereview_test -radius=250 -ite_depth=1 -plymodel=../ape.ply -imagedir=../data/images_ape/
+$ ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ape.ply -imagedir=../data/images_ape/ -labeldir=../data/label_ape.txt -num_class=4 -label_class=0
 $ ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ant.ply -imagedir=../data/images_ant/ -labeldir=../data/label_ant.txt -num_class=4 -label_class=1
 $ ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/cow.ply -imagedir=../data/images_cow/ -labeldir=../data/label_cow.txt -num_class=4 -label_class=2
 $ ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/plane.ply -imagedir=../data/images_plane/ -labeldir=../data/label_plane.txt -num_class=4 -label_class=3
 ==============================================
 demo :$ ./sphereview_test -radius=250 -ite_depth=1 -plymodel=../ape.ply -imagedir=../data/images_ape/
 Then press 'q' to run the demo for images generation when you see the gray background and a coordinate.
 ==============================================
--- a/modules/cnn_3dobj/include/opencv2/cnn_3dobj.hpp
+++ b/modules/cnn_3dobj/include/opencv2/cnn_3dobj.hpp
@ -49,10 +49,12 @@ the use of this software, even if advised of the possibility of such damage.
 #include <opencv2/calib3d.hpp>
 #include <opencv2/viz/vizcore.hpp>
 #include <opencv2/highgui.hpp>
 #include <string>
 #include <fstream>
 #include <vector>
 #include <stdio.h>
 #include <iostream>
-
+using std::string;
 /** @defgroup cnn_3dobj CNN based on Caffe aimming at 3D object recognition and pose estimation
 */
 namespace cv
@ -92,6 +94,23 @@ class CV_EXPORTS_W IcoSphere
 		/** @brief Generating new view points from all triangles.
 		*/
 		CV_WRAP void subdivide(float v1[], float v2[], float v3[], int depth);
 		/** @brief Make all view points having the some distance from the focal point used by the camera view.
 		*/
 		CV_WRAP static uint32_t swap_endian(uint32_t val);
 		/** @brief Suit the position of bytes in 4 byte data structure for particular system.
 		*/
 		CV_WRAP cv::Point3d getCenter(cv::Mat cloud);
 		/** @brief Get the center of points on surface in .ply model.
 		*/
 		CV_WRAP float getRadius(cv::Mat cloud, cv::Point3d center);
 		/** @brief Get the proper camera radius from the view point to the center of model.
 		*/
 		CV_WRAP static void createHeader(int num_item, int rows, int cols, const char* headerPath);
 		/** @brief Create header in binary files collecting the image data and label.
 		*/
 		CV_WRAP static void writeBinaryfile(string filenameImg, const char* binaryPath, const char* headerPath, int num_item, int label_class);
 		/** @brief Write binary files used for training in other open source project.
 		*/
 };
 //! @}
--- a/modules/cnn_3dobj/samples/build/binary_label_test
+++ b/modules/cnn_3dobj/samples/build/binary_label_test
--- a/modules/cnn_3dobj/samples/build/binary_label_train
+++ b/modules/cnn_3dobj/samples/build/binary_label_train
--- a/modules/cnn_3dobj/samples/build/train_linemod_triplet.sh
+++ b/modules/cnn_3dobj/samples/build/train_linemod_triplet.sh
@ -8,18 +8,15 @@ cd build
 cmake -DCMAKE_INSTALL_PREFIX=/usr/local ..
 make -j4
 make test
-make install
+sudo make install
 cd ..
 cmake ..
 make -j4
-./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ape.ply -imagedir=../data/images_ape/ -labeldir=../data/label_ape.txt -num_class=2 -label_class=0
+./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ape.ply -imagedir=../data/images_ape/ -labeldir=../data/label_ape.txt -num_class=4 -label_class=0
-./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ant.ply -imagedir=../data/images_ant/ -labeldir=../data/label_ant.txt -num_class=2 -label_class=1
+./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ant.ply -imagedir=../data/images_ant/ -labeldir=../data/label_ant.txt -num_class=4 -label_class=1
-./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/apple.ply -imagedir=../data/images_apple/ -labeldir=../data/label_apple.txt -num_class=2 -label_class=2
+./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/cow.ply -imagedir=../data/images_cow/ -labeldir=../data/label_cow.txt -num_class=4 -label_class=2
-./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/lamp.ply -imagedir=../data/images_lamp/ -labeldir=../data/label_lamp.txt -num_class=2 -label_class=3
+./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/plane.ply -imagedir=../data/images_plane/ -labeldir=../data/label_plane.txt -num_class=4 -label_class=3
 ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/cow.ply -imagedir=../data/images_cow/ -labeldir=../data/label_cow.txt -num_class=2 -label_class=4
 ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/plane.ply -imagedir=../data/images_plane/ -labeldir=../data/label_plane.txt -num_class=2 -label_class=5
 ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/porsche.ply -imagedir=../data/images_porsche/ -labeldir=../data/label_porsche.txt -num_class=2 -label_class=6
 echo "Creating leveldb..."
--- a/modules/cnn_3dobj/samples/feature_extraction.cpp
+++ b/modules/cnn_3dobj/samples/feature_extraction.cpp
@ -0,0 +1,202 @@
 #include <stdio.h>  // for snprintf
 #include <string>
 #include <vector>
 #include "boost/algorithm/string.hpp"
 #include "google/protobuf/text_format.h"
 #define CPU_ONLY
 #include "caffe/blob.hpp"
 #include "caffe/common.hpp"
 #include "caffe/net.hpp"
 #include "caffe/proto/caffe.pb.h"
 #include "caffe/util/db.hpp"
 #include "caffe/util/io.hpp"
 #include "caffe/vision_layers.hpp"
 using caffe::Blob;
 using caffe::Caffe;
 using caffe::Datum;
 using caffe::Net;
 using boost::shared_ptr;
 using std::string;
 namespace db = caffe::db;
 template<typename Dtype>
 int feature_extraction_pipeline(int argc, char** argv);
 int main(int argc, char** argv) {
  return feature_extraction_pipeline<float>(argc, argv);
 //  return feature_extraction_pipeline<double>(argc, argv);
 }
 template<typename Dtype>
 int feature_extraction_pipeline(int argc, char** argv) {
  ::google::InitGoogleLogging(argv[0]);
  const int num_required_args = 7;
  /*if (argc < num_required_args) {
    LOG(ERROR)<<
    "This program takes in a trained network and an input data layer, and then"
    " extract features of the input data produced by the net.\n"
    "Usage: extract_features  pretrained_net_param"
    "  feature_extraction_proto_file  extract_feature_blob_name1[,name2,...]"
    "  save_feature_dataset_name1[,name2,...]  num_mini_batches  db_type"
    "  [CPU/GPU] [DEVICE_ID=0]\n"
    "Note: you can extract multiple features in one pass by specifying"
    " multiple feature blob names and dataset names seperated by ','."
    " The names cannot contain white space characters and the number of blobs"
    " and datasets must be equal.";
    return 1;
  }*/
  int arg_pos = num_required_args;
  arg_pos = num_required_args;
  //if (argc > arg_pos && strcmp(argv[arg_pos], "GPU") == 0) {
  if (argc > arg_pos && strcmp("CPU", "GPU") == 0) {
    LOG(ERROR)<< "Using GPU";
    int device_id = 0;
    if (argc > arg_pos + 1) {
      device_id = atoi(argv[arg_pos + 1]);
      CHECK_GE(device_id, 0);
    }
    LOG(ERROR) << "Using Device_id=" << device_id;
    Caffe::SetDevice(device_id);
    Caffe::set_mode(Caffe::GPU);
  } else {
    LOG(ERROR) << "Using CPU";
    Caffe::set_mode(Caffe::CPU);
  }
  arg_pos = 0;  // the name of the executable
  //std::string pretrained_binary_proto(argv[++arg_pos]);
  std::string pretrained_binary_proto("/home/wangyida/Desktop/caffe/examples/triplet/3d_triplet_iter_200.caffemodel");
  // Expected prototxt contains at least one data layer such as
  //  the layer data_layer_name and one feature blob such as the
  //  fc7 top blob to extract features.
  /*
   layers {
     name: "data_layer_name"
     type: DATA
     data_param {
       source: "/path/to/your/images/to/extract/feature/images_leveldb"
       mean_file: "/path/to/your/image_mean.binaryproto"
       batch_size: 128
       crop_size: 227
       mirror: false
     }
     top: "data_blob_name"
     top: "label_blob_name"
   }
   layers {
     name: "drop7"
     type: DROPOUT
     dropout_param {
       dropout_ratio: 0.5
     }
     bottom: "fc7"
     top: "fc7"
   }
   */
  //std::string feature_extraction_proto(argv[++arg_pos]);
  std::string feature_extraction_proto("/home/wangyida/Desktop/caffe/examples/triplet/3d_triplet.prototxt");
  boost::shared_ptr<Net<Dtype> > feature_extraction_net(
      new Net<Dtype>(feature_extraction_proto, caffe::TEST));
  feature_extraction_net->CopyTrainedLayersFrom(pretrained_binary_proto);
  //std::string extract_feature_blob_names(argv[++arg_pos]);
  std::string extract_feature_blob_names("feat");
  std::vector<std::string> blob_names;
  boost::split(blob_names, extract_feature_blob_names, boost::is_any_of(","));
  //std::string save_feature_dataset_names(argv[++arg_pos]);
  std::string save_feature_dataset_names("/home/wangyida/Desktop/caffe/examples/triplet/feature_extracted");
  std::vector<std::string> dataset_names;
  boost::split(dataset_names, save_feature_dataset_names,
               boost::is_any_of(","));
  CHECK_EQ(blob_names.size(), dataset_names.size()) <<
      " the number of blob names and dataset names must be equal";
  size_t num_features = blob_names.size();
  for (size_t i = 0; i < num_features; i++) {
    CHECK(feature_extraction_net->has_blob(blob_names[i]))
        << "Unknown feature blob name " << blob_names[i]
        << " in the network " << feature_extraction_proto;
  }
  //int num_mini_batches = atoi(argv[++arg_pos]);
  int num_mini_batches = atoi("6");
  /*std::vector<shared_ptr<db::DB> > feature_dbs;
  std::vector<shared_ptr<db::Transaction> > txns;
  const char* db_type = argv[++arg_pos];
  for (size_t i = 0; i < num_features; ++i) {
    LOG(INFO)<< "Opening dataset " << dataset_names[i];
    shared_ptr<db::DB> db(db::GetDB(db_type));
    db->Open(dataset_names.at(i), db::NEW);
    feature_dbs.push_back(db);
    shared_ptr<db::Transaction> txn(db->NewTransaction());
    txns.push_back(txn);
  }*/
  std::vector<FILE*> files;
  for (size_t i = 0; i < num_features; ++i)
  {
 	  LOG(INFO) << "Opening file " << dataset_names[i];
 	  FILE * temp = NULL;
 	  temp = fopen(dataset_names[i].c_str(), "wb");
 	  files.push_back(temp);
  }
  LOG(ERROR)<< "Extacting Features";
  //bool header_flag = true;
  Datum datum;
  //const int kMaxKeyStrLength = 100;
  //char key_str[kMaxKeyStrLength];
  std::vector<Blob<float>*> input_vec;
  std::vector<int> image_indices(num_features, 0);
  for (int batch_index = 0; batch_index < num_mini_batches; ++batch_index) {
    feature_extraction_net->Forward(input_vec);
    for (int i = 0; i < num_features; ++i) {
 		const boost::shared_ptr<Blob<Dtype> > feature_blob = feature_extraction_net
          ->blob_by_name(blob_names[i]);
      int batch_size = feature_blob->num();
      int dim_features = feature_blob->count() / batch_size;
 	  if (batch_index == 0)
 	  {
 		  int fea_num = batch_size*num_mini_batches;
 		  fwrite(&dim_features, sizeof(int), 1, files[i]);
 		  fwrite(&fea_num, sizeof(int), 1, files[i]);
 		  //bool header_flag = false;
 	  }
      const Dtype* feature_blob_data;
      for (int n = 0; n < batch_size; ++n) {
        feature_blob_data = feature_blob->cpu_data() +
            feature_blob->offset(n);
 		fwrite(feature_blob_data, sizeof(Dtype), dim_features, files[i]);
        ++image_indices[i];
        if (image_indices[i] % 1000 == 0) {
          LOG(ERROR)<< "Extracted features of " << image_indices[i] <<
              " query images for feature blob " << blob_names[i];
        }
      }  // for (int n = 0; n < batch_size; ++n)
    }  // for (int i = 0; i < num_features; ++i)
  }  // for (int batch_index = 0; batch_index < num_mini_batches; ++batch_index)
  // write the last batch
  for (int i = 0; i < num_features; ++i) {
   /* if (image_indices[i] % 1000 != 0) {
      txns.at(i)->Commit();
    }
    LOG(ERROR)<< "Extracted features of " << image_indices[i] <<
        " query images for feature blob " << blob_names[i];
    feature_dbs.at(i)->Close();*/
 	  fclose(files[i]);
  }
  LOG(ERROR)<< "Successfully extracted the features!";
  return 0;
 }
--- a/modules/cnn_3dobj/samples/image2db.cpp
+++ b/modules/cnn_3dobj/samples/image2db.cpp
@ -0,0 +1,191 @@
 #include <google/protobuf/text_format.h>
 #include <glog/logging.h>
 #include <leveldb/db.h>
 #include <stdint.h>
 #include <fstream>  // NOLINT(readability/streams)
 #include <string>
 #include <set>
 #include <stdio.h>
 #include <string.h>
 #include <stdlib.h>
 #include <dirent.h>
 #include <sys/stat.h>
 #include <unistd.h>
 #include <sys/types.h>
 #include "caffe/proto/caffe.pb.h"
 #include <opencv2/highgui/highgui.hpp>
 #include <opencv2/highgui/highgui_c.h>
 #include <opencv2/imgproc/imgproc.hpp>
 using std::string;
 using namespace std;
 set<string> all_class_name;
 map<string,int> class2id;
 void list_dir(const char *path,vector<string>& files,bool r = false)
 {
  DIR *pDir;
  struct dirent *ent;
  char childpath[512];
  pDir = opendir(path);
  memset(childpath, 0, sizeof(childpath));
  while ((ent = readdir(pDir)) != NULL)
  {
    if (ent->d_type & DT_DIR)
    {
      if (strcmp(ent->d_name, ".") == 0 || strcmp(ent->d_name, "..") == 0)
      {
        continue;
      }
      if(r)
      {
        sprintf(childpath, "%s/%s", path, ent->d_name);
        list_dir(childpath,files);
      }
    }
    else
    {
      files.push_back(ent->d_name);
    }
  }
  sort(files.begin(),files.end());
 }
 string get_classname(string path)
 {
  int index = path.find_last_of('_');
  return path.substr(0, index);
 }
 int get_labelid(string fileName)
 {
  string class_name_tmp = get_classname(fileName);
  all_class_name.insert(class_name_tmp);
  map<string,int>::iterator name_iter_tmp = class2id.find(class_name_tmp);
  if (name_iter_tmp == class2id.end())
  {
    int id = class2id.size();
    class2id.insert(name_iter_tmp, std::make_pair(class_name_tmp, id));
    return id;
  }
  else
  {
    return name_iter_tmp->second;
  }
 }
 void loadimg(string path,char* buffer)
 {
  cv::Mat img = cv::imread(path, CV_LOAD_IMAGE_COLOR);
  string val;
  int rows = img.rows;
  int cols = img.cols;
  int pos=0;
  for (int c = 0; c < 3; c++)
  {
    for (int row = 0; row < rows; row++)
    {
      for (int col = 0; col < cols; col++)
      {
        buffer[pos++]=img.at<cv::Vec3b>(row,col)[c];
      }
    }
  }
 }
 void convert(string imgdir,string outputdb,string attachdir,int channel,int width,int height)
 {
  leveldb::DB* db;
  leveldb::Options options;
  options.create_if_missing = true;
  options.error_if_exists = true;
  caffe::Datum datum;
  datum.set_channels(channel);
  datum.set_height(height);
  datum.set_width(width);
  int image_size = channel*width*height;
  char buffer[image_size];
  string value;
  CHECK(leveldb::DB::Open(options, outputdb, &db).ok());
  vector<string> filenames;
  list_dir(imgdir.c_str(),filenames);
  string img_log = attachdir+"image_filename";
  ofstream writefile(img_log.c_str());
  for(int i=0;i<filenames.size();i++)
  {
    string path= imgdir;
    path.append(filenames[i]);
    loadimg(path,buffer);
    int labelid = get_labelid(filenames[i]);
    datum.set_label(labelid);
    datum.set_data(buffer,image_size);
    datum.SerializeToString(&value);
    snprintf(buffer, image_size, "%05d", i);
    printf("\nclassid:%d classname:%s abspath:%s",labelid,get_classname(filenames[i]).c_str(),path.c_str());
    db->Put(leveldb::WriteOptions(),string(buffer),value);
    //printf("%d %s\n",i,fileNames[i].c_str());
    assert(writefile.is_open());
    writefile<<i<<" "<<filenames[i]<<"\n";
  }
  delete db;
  writefile.close();
  img_log = attachdir+"image_classname";
  writefile.open(img_log.c_str());
  set<string>::iterator iter = all_class_name.begin();
  while(iter != all_class_name.end())
  {
    assert(writefile.is_open());
    writefile<<(*iter)<<"\n";
    //printf("%s\n",(*iter).c_str());
    iter++;
  }
  writefile.close();
 }
 int main(int argc, char** argv)
 {
  if (argc < 6)
  {
      LOG(ERROR) << "convert_imagedata src_dir dst_dir attach_dir channel width height";
      return 0;
  }
 //./convert_imagedata.bin  /home/linger/imdata/collarTest/ /home/linger/linger/testfile/dbtest/  /home/linger/linger/testfile/test_attachment/ 3 250 250
  //   ./convert_imagedata.bin /home/linger/imdata/collar_train/ /home/linger/linger/testfile/crop_train_db/ /home/linger/linger/testfile/crop_train_attachment/ 3 50 50
  google::InitGoogleLogging(argv[0]);
  string src_dir = argv[1];
  string src_dst = argv[2];
  string attach_dir = argv[3];
  int channel = atoi(argv[4]);
  int width = atoi(argv[5]);
  int height = atoi(argv[6]);
  //for test
  /*
  src_dir = "/home/linger/imdata/collarTest/";
  src_dst = "/home/linger/linger/testfile/dbtest/";
  attach_dir = "/home/linger/linger/testfile/";
  channel = 3;
  width = 250;
  height = 250;
   */
  convert(src_dir,src_dst,attach_dir,channel,width,height);
 }
--- a/modules/cnn_3dobj/samples/sphereview_3dobj_demo.cpp
+++ b/modules/cnn_3dobj/samples/sphereview_3dobj_demo.cpp
@ -35,135 +35,12 @@
 #include <opencv2/cnn_3dobj.hpp>
 #include <opencv2/viz/vizcore.hpp>
 #include <iostream>
 #include <string>
 #include <stdio.h>
 #include <stdlib.h>
 #include <math.h>
 using namespace cv;
 using namespace std;
 using namespace cv::cnn_3dobj;
 uint32_t swap_endian(uint32_t val) {
    val = ((val << 8) & 0xFF00FF00) | ((val >> 8) & 0xFF00FF);
    return (val << 16) | (val >> 16);
 }
 Point3d getCenter(cv::Mat cloud)
 {
 	Point3f* data = cloud.ptr<cv::Point3f>();
 	Point3d dataout;
 	for(int i = 0; i < cloud.cols; ++i)
 	    {
 	        dataout.x += data[i].x;
 	        dataout.y += data[i].y;
 	        dataout.z += data[i].z;
 	    }
 	dataout.x = dataout.x/cloud.cols;
 	dataout.y = dataout.y/cloud.cols;
 	dataout.z = dataout.z/cloud.cols;
 	return dataout;
 };
 float getRadius(cv::Mat cloud, Point3d center)
 {
 	float radius = 0;
 	Point3f* data = cloud.ptr<cv::Point3f>();
 	Point3d datatemp;
 	for(int i = 0; i < cloud.cols; ++i)
 	    {
 	        datatemp.x = data[i].x - (float)center.x;
 	        datatemp.y = data[i].y - (float)center.y;
 	        datatemp.z = data[i].z - (float)center.z;
 		float Radius = sqrt(pow(datatemp.x,2)+pow(datatemp.y,2)+pow(datatemp.z,2));
 		if(Radius > radius)
 		{
 			radius = Radius;
 		}
 	    }
 	radius = radius*3;
 	return radius;
 };
 void createHeader(int num_item, int rows, int cols, const char* headerPath)
 {
 	char* a0 = new char;
 	strcpy(a0, headerPath);
 	char a1[] = "image";
 	char a2[] = "label";
 	char* headerPathimg = new char;
 	strcpy(headerPathimg, a0);
 	strcat(headerPathimg, a1);
 	char* headerPathlab = new char;
 	strcpy(headerPathlab, a0);
 	strcat(headerPathlab, a2);
 	std::ofstream headerImg(headerPathimg, ios::out|ios::binary);
 	std::ofstream headerLabel(headerPathlab, ios::out|ios::binary);
 	int headerimg[4] = {2051,num_item,rows,cols};
 	for (int i=0; i<4; i++)
 		headerimg[i] = swap_endian(headerimg[i]);
 	int headerlabel[2] = {2049,num_item};
 	for (int i=0; i<2; i++)
 		headerlabel[i] = swap_endian(headerlabel[i]);
 	headerImg.write(reinterpret_cast<const char*>(headerimg), sizeof(int)*4);
 	headerImg.close();
 	headerLabel.write(reinterpret_cast<const char*>(headerlabel), sizeof(int)*2);
 	headerLabel.close();
 };
 void writeBinaryfile(string filename, const char* binaryPath, const char* headerPath, int num_item, int label_class)
 {
 	int isrgb = 0;
 	cv::Mat ImgforBin = cv::imread(filename, isrgb);
 	char* A0 = new char;
 	strcpy(A0, binaryPath);
 	char A1[] = "image";
 	char A2[] = "label";
 	char* binPathimg = new char;
 	strcpy(binPathimg, A0);
 	strcat(binPathimg, A1);
 	char* binPathlab = new char;
 	strcpy(binPathlab, A0);
 	strcat(binPathlab, A2);
 	fstream img_file, lab_file;
 	img_file.open(binPathimg,ios::in);
 	lab_file.open(binPathlab,ios::in);
 	if(!img_file)
 	{
 		cout << "Creating the training data at: " << binaryPath << ". " << endl;
 		char* a0 = new char;
 		strcpy(a0, headerPath);
 		char a1[] = "image";
 		char a2[] = "label";
 		char* headerPathimg = new char;
 		strcpy(headerPathimg, a0);
 		strcat(headerPathimg,a1);
 		char* headerPathlab = new char;
 		strcpy(headerPathlab, a0);
 		strcat(headerPathlab,a2);
 		createHeader(num_item, 250, 250, binaryPath);
 		ofstream img_file(binPathimg,ios::out|ios::binary|ios::app);
 		ofstream lab_file(binPathlab,ios::out|ios::binary|ios::app);
 		for (int r = 0; r < ImgforBin.rows; r++)
 		  {
 			img_file.write(reinterpret_cast<const char*>(ImgforBin.ptr(r)), ImgforBin.cols*ImgforBin.elemSize());
 		  }
 		unsigned char templab = (unsigned char)label_class;
 		lab_file << templab;
 	}
 	else
 	{
 		img_file.close();
 		lab_file.close();
 		img_file.open(binPathimg,ios::out|ios::binary|ios::app);
 		lab_file.open(binPathlab,ios::out|ios::binary|ios::app);
 		cout <<"Concatenating the training data at: " << binaryPath << ". " << endl;
 		for (int r = 0; r < ImgforBin.rows; r++)
 		  {
 			img_file.write(reinterpret_cast<const char*>(ImgforBin.ptr(r)), ImgforBin.cols*ImgforBin.elemSize());
 		  }
 		unsigned char templab = (unsigned char)label_class;
 		lab_file << templab;
 	}
 	img_file.close();
 	lab_file.close();
 };
 int main(int argc, char *argv[]){
-	const String keys = "{help | | demo :$ ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ape.ply -imagedir=../data/images_ape/ -labeldir=../data/label_ape.txt -num_class=2 -label_class=0, then press 'q' to run the demo for images generation when you see the gray background and a coordinate.}"
+	const String keys = "{help | | demo :$ ./sphereview_test -ite_depth=2 -plymodel=../3Dmodel/ape.ply -imagedir=../data/images_ape/ -labeldir=../data/label_ape.txt -num_class=4 -label_class=0, then press 'q' to run the demo for images generation when you see the gray background and a coordinate.}"
 			     "{ite_depth | 1 | Iteration of sphere generation.}"
 			     "{plymodel | ../ape.ply | path of the '.ply' file for image rendering. }"
 			     "{imagedir | ../data/images_ape/ | path of the generated images for one particular .ply model. }"
@ -191,7 +68,7 @@ int main(int argc, char *argv[]){
 	bool camera_pov = (true);
 	/// Create a window
 	viz::Viz3d myWindow("Coordinate Frame");
-	myWindow.setWindowSize(Size(250,250));
+	myWindow.setWindowSize(Size(64,64));
 	/// Add coordinate axes
 	myWindow.showWidget("Coordinate Widget", viz::WCoordinateSystem());
 	myWindow.setBackgroundColor(viz::Color::gray());
@ -200,12 +77,12 @@ int main(int argc, char *argv[]){
 	/// Let's assume camera has the following properties
 	/// Create a cloud widget.
 	viz::Mesh objmesh = viz::Mesh::load(plymodel);
-	Point3d cam_focal_point = getCenter(objmesh.cloud);
+	Point3d cam_focal_point = ViewSphere.getCenter(objmesh.cloud);
-	float radius = getRadius(objmesh.cloud, cam_focal_point);
+	float radius = ViewSphere.getRadius(objmesh.cloud, cam_focal_point);
 	Point3d cam_y_dir(0.0f,0.0f,1.0f);
 	const char* headerPath = "./header_for_";
 	const char* binaryPath = "./binary_";
-	createHeader((int)campos.size(), 250, 250, headerPath);
+	ViewSphere.createHeader((int)campos.size(), 64, 64, headerPath);
 	for(int pose = 0; pose < (int)campos.size(); pose++){
 		imglabel << campos.at(pose).x << ' ' << campos.at(pose).y << ' ' << campos.at(pose).z << endl;
 		/// We can get the pose of the cam using makeCameraPoses
@ -240,7 +117,7 @@ int main(int argc, char *argv[]){
 		filename = imagedir + filename;
 		filename += ".png";
 		myWindow.saveScreenshot(filename);
-		writeBinaryfile(filename, binaryPath, headerPath,(int)campos.size()*num_class, label_class);
+		ViewSphere.writeBinaryfile(filename, binaryPath, headerPath,(int)campos.size()*num_class, label_class);
 	}
 	return 1;
 };
--- a/modules/cnn_3dobj/src/cnn_3dobj.cpp
+++ b/modules/cnn_3dobj/src/cnn_3dobj.cpp
@ -2,17 +2,18 @@
 using namespace cv;
 using namespace std;
-namespace cv{ namespace cnn_3dobj{
+namespace cv
 {
 namespace cnn_3dobj
 {
 	IcoSphere::IcoSphere(float radius_in, int depth_in)
 	{
 		X = 0.5f;
 		Z = 0.5f;
-		int radius = radius_in;
+		X *= (int)radius_in;
-		int depth = depth_in;
+		Z *= (int)radius_in;
 		X *= radius;
 		Z *= radius;
 		diff = 0.00000005964;
 		float vdata[12][3] = { { -X, 0.0f, Z }, { X, 0.0f, Z },
 				{ -X, 0.0f, -Z }, { X, 0.0f, -Z }, { 0.0f, Z, X }, { 0.0f, Z, -X },
@ -26,14 +27,11 @@ namespace cv{ namespace cnn_3dobj{
 				{ 11, 0, 6 }, { 0, 1, 6 }, { 6, 1, 10 }, { 9, 0, 11 },
 				{ 9, 11, 2 }, { 9, 2, 5 }, { 7, 2, 11 } };
 		std::vector<float>* texCoordsList = new std::vector<float>;
 		std::vector<int>* indicesList = new std::vector<int>;
 		// Iterate over points
 		for (int i = 0; i < 20; ++i) {
 			subdivide(vdata[tindices[i][0]], vdata[tindices[i][1]],
-					vdata[tindices[i][2]], depth);
+					vdata[tindices[i][2]], depth_in);
 		}
 		CameraPos_temp.push_back(CameraPos[0]);
 		for (int j = 1; j<int(CameraPos.size()); j++)
@ -114,4 +112,130 @@ namespace cv{ namespace cnn_3dobj{
 		subdivide(v3, v31, v23, depth - 1);
 		subdivide(v12, v23, v31, depth - 1);
 	}
 	uint32_t IcoSphere::swap_endian(uint32_t val)
 	{
    		val = ((val << 8) & 0xFF00FF00) | ((val >> 8) & 0xFF00FF);
    		return (val << 16) | (val >> 16);
 	}
 	cv::Point3d IcoSphere::getCenter(cv::Mat cloud)
 	{
 		Point3f* data = cloud.ptr<cv::Point3f>();
 		Point3d dataout;
 		for(int i = 0; i < cloud.cols; ++i)
 		    {
 			dataout.x += data[i].x;
 			dataout.y += data[i].y;
 			dataout.z += data[i].z;
 		    }
 		dataout.x = dataout.x/cloud.cols;
 		dataout.y = dataout.y/cloud.cols;
 		dataout.z = dataout.z/cloud.cols;
 		return dataout;
 	}
 	float IcoSphere::getRadius(cv::Mat cloud, cv::Point3d center)
 	{
 		float radiusCam = 0;
 		Point3f* data = cloud.ptr<cv::Point3f>();
 		Point3d datatemp;
 		for(int i = 0; i < cloud.cols; ++i)
 		    {
 			datatemp.x = data[i].x - (float)center.x;
 			datatemp.y = data[i].y - (float)center.y;
 			datatemp.z = data[i].z - (float)center.z;
 			float Radius = sqrt(pow(datatemp.x,2)+pow(datatemp.y,2)+pow(datatemp.z,2));
 			if(Radius > radiusCam)
 			{
 				radiusCam = Radius;
 			}
 		    }
 		radiusCam *= 4;
 		return radiusCam;
 	};
 	void IcoSphere::createHeader(int num_item, int rows, int cols, const char* headerPath)
 	{
 		char* a0 = (char*)malloc(1024);
 		strcpy(a0, headerPath);
 		char a1[] = "image";
 		char a2[] = "label";
 		char* headerPathimg = (char*)malloc(1024);
 		strcpy(headerPathimg, a0);
 		strcat(headerPathimg, a1);
 		char* headerPathlab = (char*)malloc(1024);
 		strcpy(headerPathlab, a0);
 		strcat(headerPathlab, a2);
 		std::ofstream headerImg(headerPathimg, ios::out|ios::binary);
 		std::ofstream headerLabel(headerPathlab, ios::out|ios::binary);
 		int headerimg[4] = {2051,num_item,rows,cols};
 		for (int i=0; i<4; i++)
 			headerimg[i] = swap_endian(headerimg[i]);
 		int headerlabel[2] = {2049,num_item};
 		for (int i=0; i<2; i++)
 			headerlabel[i] = swap_endian(headerlabel[i]);
 		headerImg.write(reinterpret_cast<const char*>(headerimg), sizeof(int)*4);
 		headerImg.close();
 		headerLabel.write(reinterpret_cast<const char*>(headerlabel), sizeof(int)*2);
 		headerLabel.close();
 	};
 	void IcoSphere::writeBinaryfile(string filenameImg, const char* binaryPath, const char* headerPath, int num_item, int label_class)
 	{
 		int isrgb = 0;
 		cv::Mat ImgforBin = cv::imread(filenameImg, isrgb);
 		char* A0 = (char*)malloc(1024);
 		strcpy(A0, binaryPath);
 		char A1[] = "image";
 		char A2[] = "label";
 		char* binPathimg = (char*)malloc(1024);
 		strcpy(binPathimg, A0);
 		strcat(binPathimg, A1);
 		char* binPathlab = (char*)malloc(1024);
 		strcpy(binPathlab, A0);
 		strcat(binPathlab, A2);
 		fstream img_file, lab_file;
 		img_file.open(binPathimg,ios::in);
 		lab_file.open(binPathlab,ios::in);
 		if(!img_file)
 		{
 			cout << "Creating the training data at: " << binaryPath << ". " << endl;
 			char* a0 = (char*)malloc(1024);
 			strcpy(a0, headerPath);
 			char a1[] = "image";
 			char a2[] = "label";
 			char* headerPathimg = (char*)malloc(1024);
 			strcpy(headerPathimg, a0);
 			strcat(headerPathimg,a1);
 			char* headerPathlab = (char*)malloc(1024);
 			strcpy(headerPathlab, a0);
 			strcat(headerPathlab,a2);
 			createHeader(num_item, 64, 64, binaryPath);
 			img_file.open(binPathimg,ios::out|ios::binary|ios::app);
 			lab_file.open(binPathlab,ios::out|ios::binary|ios::app);
 			for (int r = 0; r < ImgforBin.rows; r++)
 			  {
 				img_file.write(reinterpret_cast<const char*>(ImgforBin.ptr(r)), ImgforBin.cols*ImgforBin.elemSize());
 			  }
 			unsigned char templab = (unsigned char)label_class;
 			lab_file << templab;
 		}
 		else
 		{
 			img_file.close();
 			lab_file.close();
 			img_file.open(binPathimg,ios::out|ios::binary|ios::app);
 			lab_file.open(binPathlab,ios::out|ios::binary|ios::app);
 			cout <<"Concatenating the training data at: " << binaryPath << ". " << endl;
 			for (int r = 0; r < ImgforBin.rows; r++)
 			  {
 				img_file.write(reinterpret_cast<const char*>(ImgforBin.ptr(r)), ImgforBin.cols*ImgforBin.elemSize());
 			  }
 			unsigned char templab = (unsigned char)label_class;
 			lab_file << templab;
 		}
 		img_file.close();
 		lab_file.close();
 	};
 }}
--- a/modules/cnn_3dobj/src/precomp.hpp
+++ b/modules/cnn_3dobj/src/precomp.hpp
@ -48,6 +48,9 @@ the use of this software, even if advised of the possibility of such damage.
 #include <opencv2/highgui.hpp>
 #include <iostream>
 #include <vector>
 #include <string>
 #include <stdio.h>
 #include <iostream>
 #include <math.h>
 #endif