update181229

ChenYingpeng · ChenYingpeng · commit 9ed917190f6c · 2018-12-29T11:09:53.000+08:00
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -10,8 +10,9 @@ set(
 	CUDA_NVCC_FLAGS
 	${CUDA_NVCC_FLAGS}; 
     -O3 
-	-gencode arch=compute_53,code=sm_53
-	-gencode arch=compute_62,code=sm_62
+	-gencode arch=compute_53,code=sm_53  #tegra tx1 
+        -gencode arch=compute_61,code=sm_61  #gtx 1060
+	-gencode arch=compute_62,code=sm_62  #tegra tx2
 )
 
 # setup project output paths
@@ -32,8 +33,8 @@ set(CMAKE_ARCHIVE_OUTPUT_DIRECTORY ${PROJECT_OUTPUT_DIR}/lib)
 # build C/C++ interface
 include_directories(${PROJECT_INCLUDE_DIR} ${GIE_PATH}/include)
 include_directories(${PROJECT_INCLUDE_DIR} 
-	/home/nvidia/caffe/include 
-	/home/nvidia/caffe/build/include 
+	/home/chen/caffe/include 
+	/home/chen/caffe/build/include 
 )
 
 
@@ -42,11 +43,11 @@ file(GLOB inferenceIncludes *.h )
 
 cuda_add_library(sysDetectSpeed SHARED ${inferenceSources})
 target_link_libraries(sysDetectSpeed 
-	/home/nvidia/caffe/build/lib/libcaffe.so  
-	/usr/lib/aarch64-linux-gnu/libglog.so  
-	/usr/lib/aarch64-linux-gnu/libgflags.so.2
-    	/usr/lib/aarch64-linux-gnu/libboost_system.so  
-	/usr/lib/aarch64-linux-gnu/libGLEW.so.1.13  
+	/home/chen/caffe/build/lib/libcaffe.so  
+	/usr/lib/x86_64-linux-gnu/libglog.so  
+	/usr/lib/x86_64-linux-gnu/libgflags.so.2
+    	/usr/lib/x86_64-linux-gnu/libboost_system.so  
+	/usr/lib/x86_64-linux-gnu/libGLEW.so.1.13  
 )
 
 
diff --git a/activation_kernels.cu b/activation_kernels.cu
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
diff --git a/activations.h b/activations.h
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
diff --git a/blas.h b/blas.h
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
diff --git a/blas_kernels.cu b/blas_kernels.cu
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
diff --git a/box.h b/box.h
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
diff --git a/cuda.cpp b/cuda.cpp
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
diff --git a/cuda.h b/cuda.h
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
diff --git a/detectnet/detectnet.cpp b/detectnet/detectnet.cpp
@@ -1,6 +1,6 @@
 
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04	
  */
@@ -22,11 +22,12 @@
 using namespace caffe;
 using namespace cv;
 
-//YOLOV3
-const string& model_file = "/home/nvidia/projects/caffe-yolov3/data/networks/yolov3/yolov3.prototxt";
-const string& weights_file = "/home/nvidia/projects/caffe-yolov3/data/networks/yolov3/yolov3.caffemodel";
+const int timeIters = 10;
 
-const char* imgFilename = "/home/nvidia/projects/caffe-yolov3/data/images/dog.jpg";
+//YOLOV3
+const string& model_file = "/home/chen/projects/caffe-yolov3/data/yolov3/yolov3.prototxt";//modify your model file path
+const string& weights_file = "/home/chen/projects/caffe-yolov3/data/yolov3/yolov3.caffemodel";//modify your weights file path
+const char* imgFilename = "/home/chen/projects/caffe-yolov3/data/images/dog.jpg"; //modify your images file path
 
 uint64_t current_timestamp() {
     struct timeval te; 
@@ -47,7 +48,7 @@ void sig_handler(int signo)
 
 int main( int argc, char** argv )
 {
-    printf("detectnet-camera\n  args (%i):  ", argc);
+    printf("detectnet\n  args (%i):  ", argc);
 
     for( int i=0; i < argc; i++ )
 	printf("%i [%s]  ", i, argv[i]);
@@ -77,39 +78,48 @@ int main( int argc, char** argv )
 
     int size = input_data_blobs->channels()*input_data_blobs->width()*input_data_blobs->height();
 
-    uint64_t beginDataTime =  current_timestamp();
-    //load image
-    image im = load_image_color((char*)imgFilename,0,0);
-    image sized = letterbox_image(im,input_data_blobs->width(),input_data_blobs->height());
-    cuda_push_array(input_data_blobs->mutable_gpu_data(),sized.data,size);
-
-    uint64_t endDataTime =  current_timestamp();
-
-    //YOLOV3 objection detection implementation with Caffe
-    uint64_t beginDetectTime =  current_timestamp();
-
-    net->Forward();
-
-    vector<Blob<float>*> blobs;
-    blobs.clear();
-    Blob<float>* out_blob1 = net->output_blobs()[1];
-    blobs.push_back(out_blob1);
-    Blob<float>* out_blob2 = net->output_blobs()[2];
-    blobs.push_back(out_blob2);
-    Blob<float>* out_blob3 = net->output_blobs()[0];
-    blobs.push_back(out_blob3);
-
-    printf("output blob1 shape c= %d, h = %d, w = %d\n",out_blob1->channels(),out_blob1->height(),out_blob1->width());
-    printf("output blob2 shape c= %d, h = %d, w = %d\n",out_blob2->channels(),out_blob2->height(),out_blob2->width());
-    printf("output blob3 shape c= %d, h = %d, w = %d\n",out_blob3->channels(),out_blob3->height(),out_blob3->width());
-
+    uint64_t dataTime = 0;
+    uint64_t networkTime = 0;
+    image im,sized;
     int nboxes = 0;
-    detection *dets = get_detections(blobs,im.w,im.h,&nboxes);
-
-    uint64_t endDetectTime = current_timestamp();
-    printf("object-detection:  finished processing data operation  (%zu)ms\n", endDataTime - beginDataTime);
-    printf("object-detection:  finished processing yolov3 network  (%zu)ms\n", endDetectTime - beginDetectTime);
-
+    detection *dets = NULL;
+    for(int i=0;i<timeIters;++i){
+    	uint64_t beginDataTime =  current_timestamp();
+    	//load image
+    	im = load_image_color((char*)imgFilename,0,0);
+    	sized = letterbox_image(im,input_data_blobs->width(),input_data_blobs->height());
+    	cuda_push_array(input_data_blobs->mutable_gpu_data(),sized.data,size);
+
+    	uint64_t endDataTime =  current_timestamp();
+        dataTime += (endDataTime - beginDataTime);
+
+    	//YOLOV3 objection detection implementation with Caffe
+
+    	net->Forward();
+
+    	vector<Blob<float>*> blobs;
+    	blobs.clear();
+    	Blob<float>* out_blob1 = net->output_blobs()[1];
+    	blobs.push_back(out_blob1);
+    	Blob<float>* out_blob2 = net->output_blobs()[2];
+    	blobs.push_back(out_blob2);
+    	Blob<float>* out_blob3 = net->output_blobs()[0];
+    	blobs.push_back(out_blob3);
+
+    	//printf("output blob1 shape c= %d, h = %d, w = %d\n",out_blob1->channels(),out_blob1->height(),out_blob1->width());
+    	//printf("output blob2 shape c= %d, h = %d, w = %d\n",out_blob2->channels(),out_blob2->height(),out_blob2->width());
+    	//printf("output blob3 shape c= %d, h = %d, w = %d\n",out_blob3->channels(),out_blob3->height(),out_blob3->width());
+
+    	//int nboxes = 0;
+    	//printf("img width =%d, height = %d\n",im.w,im.h);
+    	dets = get_detections(blobs,im.w,im.h,&nboxes);
+
+    	uint64_t endDetectTime = current_timestamp();
+        networkTime += (endDetectTime - endDataTime);
+    }
+    
+    printf("object-detection: total iters = %d done, processing data operation avergae time is  (%zu)ms\n", timeIters,dataTime/timeIters);
+    printf("object-detection: total iters = %d done, processing network yolov3 avergae time is (%zu)ms\n", timeIters,networkTime/timeIters);
 
     //show detection results
     Mat img = imread(imgFilename);
diff --git a/image.h b/image.h
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/07
  */
diff --git a/yolo_layer.cpp b/yolo_layer.cpp
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04
  */
@@ -35,17 +35,17 @@ layer make_yolo_layer(int batch,int w,int h,int n,int total,int classes)
         l.biases[i] = biases[i];
     }
     l.mask = (int*)calloc(n,sizeof(int));
-    if(l.w == 13){
+    if(l.w == netW / 32){
         int j = 6;
         for(int i =0;i<l.n;++i)
             l.mask[i] = j++;
     }
-    if(l.w == 26){
+    if(l.w == netW / 16){
         int j = 3;
         for(int i =0;i<l.n;++i)
             l.mask[i] = j++;
     }
-    if(l.w == 52){
+    if(l.w == netW / 8){
         int j = 0;
         for(int i =0;i<l.n;++i)
             l.mask[i] = j++;
@@ -111,8 +111,10 @@ int yolo_num_detections(layer l,float thresh)
             if(l.output[obj_index] > thresh)
                 ++count;
         }
+	
     }
   }
+  //printf("count = %d\n",count);
     return count;
 }
 
diff --git a/yolo_layer.h b/yolo_layer.h
@@ -1,5 +1,5 @@
 /*
- * Company:	Systhesis
+ * Company:	Synthesis
  * Author: 	Chen
  * Date:	2018/06/04	
  */

Original file line number	Diff line number	Diff line change
`@@ -1,5 +1,5 @@`
`1`	`1`	`/*`
`2`		`- * Company: Systhesis`
	`2`	`+ * Company: Synthesis`
`3`	`3`	`* Author: Chen`
`4`	`4`	`* Date: 2018/06/04`
`5`	`5`	`*/`
`@@ -35,17 +35,17 @@ layer make_yolo_layer(int batch,int w,int h,int n,int total,int classes)`
`35`	`35`	`l.biases[i] = biases[i];`
`36`	`36`	`}`
`37`	`37`	`l.mask = (int*)calloc(n,sizeof(int));`
`38`		`- if(l.w == 13){`
	`38`	`+ if(l.w == netW / 32){`
`39`	`39`	`int j = 6;`
`40`	`40`	`for(int i =0;i<l.n;++i)`
`41`	`41`	`l.mask[i] = j++;`
`42`	`42`	`}`
`43`		`- if(l.w == 26){`
	`43`	`+ if(l.w == netW / 16){`
`44`	`44`	`int j = 3;`
`45`	`45`	`for(int i =0;i<l.n;++i)`
`46`	`46`	`l.mask[i] = j++;`
`47`	`47`	`}`
`48`		`- if(l.w == 52){`
	`48`	`+ if(l.w == netW / 8){`
`49`	`49`	`int j = 0;`
`50`	`50`	`for(int i =0;i<l.n;++i)`
`51`	`51`	`l.mask[i] = j++;`
`@@ -111,8 +111,10 @@ int yolo_num_detections(layer l,float thresh)`
`111`	`111`	`if(l.output[obj_index] > thresh)`
`112`	`112`	`++count;`
`113`	`113`	`}`
	`114`	`+`
`114`	`115`	`}`
`115`	`116`	`}`
	`117`	`+ //printf("count = %d\n",count);`
`116`	`118`	`return count;`
`117`	`119`	`}`
`118`	`120`