perseusdg
diff --git a/‎README.md
Lines changed: 6 additions & 1 deletion b/‎README.md
Lines changed: 6 additions & 1 deletion
diff --git a/‎demo/demo/demo.cpp
Lines changed: 46 additions & 21 deletions b/‎demo/demo/demo.cpp
Lines changed: 46 additions & 21 deletions
diff --git a/‎demo/demo/map.cpp
Lines changed: 47 additions & 25 deletions b/‎demo/demo/map.cpp
Lines changed: 47 additions & 25 deletions
diff --git a/‎include/tkDNN/CenternetDetection.h
Lines changed: 3 additions & 3 deletions b/‎include/tkDNN/CenternetDetection.h
Lines changed: 3 additions & 3 deletions
@@ -123,13 +123,16 @@ rm yolo3_fp32.rt        # be sure to delete(or move) old tensorRT files
 ```
 In general the demo program takes 6 parameters:
 ```
-./demo <network-rt-file> <path-to-video> <kind-of-network> <number-of-classes>
+./demo <network-rt-file> <path-to-video> <kind-of-network> <number-of-classes> <n-batches> <show-flag>
 ```
 where
 *  ```<network-rt-file>``` is the rt file generated by a test
 *  ```<path-to-video>``` is the path to a video file or a camera input  
 *  ```<kind-of-network>``` is the type of network. Three types are currently supported: ```y``` (YOLO family), ```c``` (CenterNet family) and ```m``` (MobileNet-SSD family)
 *  ```<number-of-classes>``` is the number of classes the network is trained on
+*  ```<n-batches>``` is the number of batches to use in inference (N.B. you must first export TKDNN_BATCHSIZE set to the required number of batches and then regenerate the rt file for the network).
+*  ```<show-flag>``` if set to 0, the demo will not show the visualization but will save the video to result.mp4 (only if n-batches == 1)
+
 N.B. FP32 inference is used by default.
 
 ![demo](https://user-images.githubusercontent.com/11562617/72547657-540e7800-388d-11ea-83c6-49dfea2a0607.gif)
@@ -218,6 +221,8 @@ cd build
 ./map_demo dla34_cnet_FP32.rt c ../demo/COCO_val2017/all_labels.txt ../demo/config.yaml
 ```
 
+This demo also creates a json file named ```net_name_COCO_res.json``` containing all the detections computed. The detections are in COCO format, the correct format to submit the results to the [CodaLab COCO detection challenge](https://competitions.codalab.org/competitions/20794#participate).
+
 ## Existing tests and supported networks
 
 | Test Name         | Network                                       | Dataset                                                       | N Classes | Input size    | Weights                                                                   |
 
@@ -34,6 +34,18 @@ int main(int argc, char *argv[]) {
     int n_classes = 80;
     if(argc > 4)
         n_classes = atoi(argv[4]); 
+    int n_batch = 1;
+    if(argc > 5)
+        n_batch = atoi(argv[5]); 
+    bool show = true;
+    if(argc > 6)
+        show = atoi(argv[6]); 
+
+    if(n_batch < 1 || n_batch > 64)
+        FatalError("Batch dim not supported");
+
+    if(!show)
+        SAVE_RESULT = true;
 
     tk::dnn::Yolo3Detection yolo;
     tk::dnn::CenternetDetection cnet;
@@ -57,7 +69,7 @@ int main(int argc, char *argv[]) {
         FatalError("Network type not allowed (3rd parameter)\n");
     }
 
-    detNN->init(net, n_classes);
+    detNN->init(net, n_classes, n_batch);
 
     gRun = true;
 
@@ -75,38 +87,51 @@ int main(int argc, char *argv[]) {
     }
 
     cv::Mat frame;
-    cv::Mat dnn_input;
-    cv::namedWindow("detection", cv::WINDOW_NORMAL);
-    
-    std::vector<tk::dnn::box> detected_bbox;
+    if(show)
+        cv::namedWindow("detection", cv::WINDOW_NORMAL);
+
+    std::vector<cv::Mat> batch_frame;
+    std::vector<cv::Mat> batch_dnn_input;
 
     while(gRun) {
-        cap >> frame; 
-        if(!frame.data) {
-            break;
-        }  
- 
-        // this will be resized to the net format
-        dnn_input = frame.clone();
+        batch_dnn_input.clear();
+        batch_frame.clear();
 
+        for(int bi=0; bi< n_batch; ++bi){
+            cap >> frame; 
+            if(!frame.data) 
+                break;
+            
+            batch_frame.push_back(frame);
+
+            // this will be resized to the net format
+            batch_dnn_input.push_back(frame.clone());
+        } 
+        if(!frame.data) 
+            break;
+    
         //inference
-        detNN->update(dnn_input);
-        frame = detNN->draw(frame);
-
-        cv::imshow("detection", frame);
-        cv::waitKey(1);
-        if(SAVE_RESULT)
+        detNN->update(batch_dnn_input, n_batch);
+        detNN->draw(batch_frame);
+
+        if(show){
+            for(int bi=0; bi< n_batch; ++bi){
+                cv::imshow("detection", batch_frame[bi]);
+                cv::waitKey(1);
+            }
+        }
+        if(n_batch == 1 && SAVE_RESULT)
             resultVideo << frame;
     }
 
     std::cout<<"detection end\n";   
     double mean = 0; 
 
     std::cout<<COL_GREENB<<"\n\nTime stats:\n";
-    std::cout<<"Min: "<<*std::min_element(detNN->stats.begin(), detNN->stats.end())<<" ms\n";    
-    std::cout<<"Max: "<<*std::max_element(detNN->stats.begin(), detNN->stats.end())<<" ms\n";    
+    std::cout<<"Min: "<<*std::min_element(detNN->stats.begin(), detNN->stats.end())/n_batch<<" ms\n";    
+    std::cout<<"Max: "<<*std::max_element(detNN->stats.begin(), detNN->stats.end())/n_batch<<" ms\n";    
     for(int i=0; i<detNN->stats.size(); i++) mean += detNN->stats[i]; mean /= detNN->stats.size();
-    std::cout<<"Avg: "<<mean<<" ms\n"<<COL_END;   
+    std::cout<<"Avg: "<<mean/n_batch<<" ms\t"<<1000/(mean/n_batch)<<" FPS\n"<<COL_END;   
 
 
     return 0;
 
@@ -34,6 +34,7 @@ int main(int argc, char *argv[])
     bool show = false;
     bool write_dets = false;
     bool write_res_on_file = true;
+    bool write_coco_json = true;
     int n_images = 5000;
 
     bool verbose;
@@ -43,6 +44,7 @@ int main(int argc, char *argv[])
     double vm_total = 0, rss_total = 0;
     double vm, rss;
 
+    //read args
     if(argc > 1)
         net = argv[1]; 
     if(argc > 2)
@@ -52,6 +54,7 @@ int main(int argc, char *argv[])
     if(argc > 4)
         config_filename = argv[4]; 
 
+    //check if files needed exist
     if(!fileExist(config_filename))
         FatalError("Wrong config file path.");
     if(!fileExist(net))
@@ -63,26 +66,31 @@ int main(int argc, char *argv[])
     tk::dnn::readmAPParams( config_filename, classes,  map_points, map_levels, map_step,
                 IoU_thresh, conf_thresh, verbose);
 
-    std::ofstream times, memory;
+    //extract network name from rt path
     std::string net_name;
     removePathAndExtension(net, net_name);
     std::cout<<"Network: "<<net_name<<std::endl;
 
+    //open files (if needed)
+    std::ofstream times, memory, coco_json;
+
+    if(write_coco_json){
+        coco_json.open(net_name+"_COCO_res.json");
+        coco_json << "[\n";
+    }
+
     if(write_res_on_file){
         times.open("times_"+net_name+".csv");
         memory.open("memory.csv", std::ios_base::app);
         memory<<net<<";";
     }
 
+    // instantiate detector
     tk::dnn::Yolo3Detection yolo;
     tk::dnn::CenternetDetection cnet;
     tk::dnn::MobilenetDetection mbnet;
-
     tk::dnn::DetectionNN *detNN;  
-
     int n_classes = classes;   
-    
-    
     switch(ntype){
         case 'y':
             detNN = &yolo;
@@ -97,9 +105,9 @@ int main(int argc, char *argv[])
         default:
             FatalError("Network type not allowed (3rd parameter)\n");
     }
-
     detNN->init(net, n_classes);
 
+    //read images 
     std::ifstream all_labels(labels_path);
     std::string l_filename;
     std::vector<tk::dnn::Frame> images;
@@ -124,21 +132,25 @@ int main(int argc, char *argv[])
             FatalError("Wrong image file path.");
 
         cv::Mat frame = cv::imread(f.iFilename.c_str(), cv::IMREAD_COLOR);
+        std::vector<cv::Mat> batch_frames;
+        batch_frames.push_back(frame);
         int height = frame.rows;
         int width = frame.cols;
 
-        cv::Mat dnn_input;
         if(!frame.data) 
             break;
-        dnn_input = frame.clone();
+        std::vector<cv::Mat> batch_dnn_input;
+        batch_dnn_input.push_back(frame.clone());
 
         //inference 
-        
         detected_bbox.clear();
-        detNN->update(dnn_input, write_res_on_file, &times);
-        frame = detNN->draw(frame);
+        detNN->update(batch_dnn_input,1,write_res_on_file, &times, write_coco_json);
+        detNN->draw(batch_frames);
         detected_bbox = detNN->detected;
-        
+
+        if(write_coco_json)
+            printJsonCOCOFormat(&coco_json, f.iFilename.c_str(), detected_bbox, classes,  width, height);        
+
         std::ofstream myfile;
         if(write_dets)
             myfile.open ("det/"+f.lFilename.substr(f.lFilename.find("000")));
@@ -160,30 +172,33 @@ int main(int argc, char *argv[])
                 myfile << d.cl << " "<< d.prob << " "<< d.x << " "<< d.y << " "<< d.w << " "<< d.h <<"\n";
 
 			if(show)// draw rectangle for detection
-                cv::rectangle(frame, cv::Point(d.x, d.y), cv::Point(d.x + d.w, d.y + d.h), cv::Scalar(0, 0, 255), 2);             
+                cv::rectangle(batch_frames[0], cv::Point(d.x, d.y), cv::Point(d.x + d.w, d.y + d.h), cv::Scalar(0, 0, 255), 2);             
         }
 
         if(write_dets)
             myfile.close();
 
         // read and save groundtruth labels
-        std::ifstream labels(l_filename);
-        for(std::string line; std::getline(labels, line); ){
-            std::istringstream in(line); 
-            tk::dnn::BoundingBox b;
-            in >> b.cl >> b.x >> b.y >> b.w >> b.h;  
-            b.prob = 1;
-            b.truthFlag = 1;
-            f.gt.push_back(b);
-
-            if(show)// draw rectangle for groundtruth
-                cv::rectangle(frame, cv::Point((b.x-b.w/2)*width, (b.y-b.h/2)*height), cv::Point((b.x+b.w/2)*width,(b.y+b.h/2)*height), cv::Scalar(0, 255, 0), 2);             
+        if(fileExist(f.lFilename.c_str()))
+        {
+            std::ifstream labels(l_filename);
+            for(std::string line; std::getline(labels, line); ){
+                std::istringstream in(line); 
+                tk::dnn::BoundingBox b;
+                in >> b.cl >> b.x >> b.y >> b.w >> b.h;  
+                b.prob = 1;
+                b.truthFlag = 1;
+                f.gt.push_back(b);
+
+                if(show)// draw rectangle for groundtruth
+                    cv::rectangle(batch_frames[0], cv::Point((b.x-b.w/2)*width, (b.y-b.h/2)*height), cv::Point((b.x+b.w/2)*width,(b.y+b.h/2)*height), cv::Scalar(0, 255, 0), 2);             
+            }
         }    
 
         images.push_back(f);
 
         if(show){
-            cv::imshow("detection", frame);
+            cv::imshow("detection", batch_frames[0]);
             cv::waitKey(0);
         }
 
@@ -193,6 +208,13 @@ int main(int argc, char *argv[])
 
 
     }
+
+    if(write_coco_json){
+        coco_json.seekp (coco_json.tellp() - std::streampos(2));
+        coco_json << "\n]\n";
+        coco_json.close();
+    }
+
     std::cout << "Avg VM[MB]: " << vm_total/images_done/1024.0 << ";Avg RSS[MB]: " << rss_total/images_done/1024.0 << std::endl;
 
     //compute mAP
 
@@ -73,9 +73,9 @@ class CenternetDetection : public DetectionNN
     CenternetDetection() {};
     ~CenternetDetection() {}; 
 
-    bool init(const std::string& tensor_path, const int n_classes=80);
-    void preprocess(cv::Mat &frame);
-    void postprocess();
+    bool init(const std::string& tensor_path, const int n_classes=80, const int n_batches=1);
+    void preprocess(cv::Mat &frame, const int bi=0);
+    void postprocess(const int bi=0,const bool mAP=false);
 };