开发者论坛

全部回复

LV.2 #4 lanhao回复
#3zwb回复
您好，请问为什么会出现同一张图检测框结果不一样的情况呢，是因为outputdata的值的问题吗
1、生成离线模型时，batch size是固定的。比如生成batch size=1的离线模型，那么推理时每次只能推理一张图；生成batch size=4的离线模型，那么推理时每次必须输入四张图片。 2、根据您的代码，推理完成后的后处理部分只处理了batch size=1的推理结果，并没有处理batch size=4的推理结果。
2022-01-18 10:41:22 1| 回复

LV.2 #3 zwb回复

#1lanhao回复

batch size=1没有问题说明离线模型生成方式以及前后处理的方法是没有问题的。首先需要检查batch size=4时的cambricon_twins文件里，batchsize的大小。其次检查融合模式batchsize=4时的推理结果对不对。最后如果融合模式batch size=4的推理结果是正确的，检查融合模式的前后处理与离线模型的前后处理的区别，目前看起来可能是模型推理完进行的batch size=4的后处理有问题。

展开

您好，请问为什么会出现同一张图检测框结果不一样的情况呢，是因为outputdata的值的问题吗

2022-01-17 16:52:10 1| 回复

LV.2 #2 zwb回复

因为只有mlu220边缘设备，所以无法看到融合模式结果，只能生成离线模型，对于同一张图在batchsize=4的情况下，输出的boxnumber分别为56，27，0，0，为什么会出现检测框数目不一样的情况呢，后处理部分代码如下

void writeVisualizeBBox(
    const vector<cv::Mat>& images,
    const vector<vector<vector<float>>> detections,
    const vector<string>& labelToDisplayName, 
    const vector<string>& imageNames,
    int input_dim) {
  // Retrieve detections.
  for (int i = 0; i < images.size(); ++i) {
    if (imageNames[i] == "null") continue;
    cv::Mat image;
    image = images[i];
    vector<vector<float>> result = detections[i];
    std::string name = imageNames[i];
    int positionMap = imageNames[i].rfind("/");
    if (positionMap > 0 && positionMap < imageNames[i].size()) {
      name = name.substr(positionMap + 1);
    }
    positionMap = name.find(".");
    if (positionMap > 0 && positionMap < name.size()) {
      name = name.substr(0, positionMap);
    }
    string filename = "result/"+name + ".txt";
    std::ofstream fileMap(filename);
    float scaling_factors = std::min(
        static_cast<float>(input_dim) / static_cast<float>(images[i].cols),
        static_cast<float>(input_dim) / static_cast<float>(images[i].rows));
    for (int j = 0; j < result.size(); j++) {
      result[j][0] =
          result[j][0]  -
          static_cast<float>(input_dim - scaling_factors * image.cols) / 2.0;
      result[j][2] =
          result[j][2]  -
          static_cast<float>(input_dim - scaling_factors * image.cols) / 2.0;
      result[j][1] =
          result[j][1]  -
          static_cast<float>(input_dim - scaling_factors * image.rows) / 2.0;
      result[j][3] =
          result[j][3]  -
          static_cast<float>(input_dim - scaling_factors * image.rows) / 2.0;

      for (int k = 0; k < 4; k++) {
        result[j][k] = result[j][k] / scaling_factors;
       // cout << result[j][k] << " ";
      }
     // cout << endl;
    }

    for (int j = 0; j < result.size(); j++) {
      result[j][0] = result[j][0] < 0 ? 0 : result[j][0];
      result[j][2] = result[j][2] < 0 ? 0 : result[j][2];
      result[j][1] = result[j][1] < 0 ? 0 : result[j][1];
      result[j][3] = result[j][3] < 0 ? 0 : result[j][3];
      result[j][0] = result[j][0] > image.cols ? image.cols : result[j][0];
      result[j][2] = result[j][2] > image.cols ? image.cols : result[j][2];
      result[j][1] = result[j][1] > image.rows ? image.rows : result[j][1];
      result[j][3] = result[j][3] > image.rows ? image.rows : result[j][3];
    }
    for (int j = 0; j < result.size(); j++) {
      int x0 = static_cast<int>(result[j][0]);
      int y0 = static_cast<int>(result[j][1]);
      int x1 = static_cast<int>(result[j][2]);
      int y1 = static_cast<int>(result[j][3]);
      //cout << "(" <<x0 << "," << y0 << ")" << "(" << y0 << "," << y1 << ")" << endl;
      cv::Point p1(x0, y0);
      cv::Point p2(x1, y1);
      cv::rectangle(image, p1, p2, cv::Scalar(0, 0, 255), 2);
      stringstream ss;
      ss << round(result[j][4] * 1000) / 1000.0;
      std::string str = labelToDisplayName[static_cast<int>(result[j][5])] + ":" + ss.str();
      //std::string str = ss.str();
      cv::Point p5(x0, y0 - 2);
     // cv::rectanle(image, p1, p2, )
      cv::putText(image, str, p5, cv::FONT_HERSHEY_SIMPLEX, 0.6,
                  cv::Scalar(255, 0, 0), 2);
      //std::cout << "it is "  << result[j][5] << ":" << result[j][4] << std::endl;
      fileMap << labelToDisplayName[static_cast<int>(result[j][5])] << " "
              << ss.str() << " "
              << static_cast<float>(result[j][0])  << " "
              << static_cast<float>(result[j][1])  << " "
              << static_cast<float>(result[j][2])  << " "
              << static_cast<float>(result[j][3])  << " "
              << image.cols << " " << image.rows << std::endl;
    }
    fileMap.close();
    stringstream ss;
    string outFile;
    ss <<  "result/yolov5_" << name << ".jpg";
    ss >> outFile;
    cv::imwrite(outFile.c_str(), image);
  }
}

// Appends every line of the text file `filename` to `labels`, one label per
// line, in file order.
//
// Parameters:
//   filename - path of the label file.
//   labels   - output vector; existing entries are kept and new ones appended.
//
// If the file cannot be opened an error is printed to stderr and `labels` is
// left untouched. A trailing '\r' is removed from each line so that label
// files saved with CRLF line endings do not yield labels ending in a carriage
// return.
void readLabels(string filename, vector<string>& labels) {
  std::ifstream file(filename);
  if (file.fail()) {
    std::cerr << "failed to open labels file!";
    return;
  }

  std::string line;
  while (getline(file, line)) {
    if (!line.empty() && line.back() == '\r') {
      line.pop_back();
    }
    labels.push_back(line);
  }
  // `file` is closed by its destructor.
}

using std::vector;
using std::string;
/*vector<vector<vector<float>>> getResults(float* outputData,
                                         int dimNumm,
                                         int *dimValues) {
  vector<vector<vector<float>>> detections;

  // BangOp implementation
  float max_limit = 1;
  float min_limit = 0;
  float input_size = 640;
  int batchSize = dimValues[0];
  int count = dimValues[3];
  for (int i = 0; i < batchSize; i++) {
    int num_boxes = static_cast<int>(outputData[i * count]);
    vector<vector<float>> batch_box;
    for (int k = 0; k < num_boxes; k++) {
      int index = i * count + 64 + k * 7;
      vector<float> single_box;
      float bl = std::max(
          min_limit, std::min(max_limit, outputData[index + 3]/input_size));  // x1
      float br = std::max(
          min_limit, std::min(max_limit, outputData[index + 5]/input_size));  // x2
      float bt = std::max(
          min_limit, std::min(max_limit, outputData[index + 4]/input_size));  // y1
      float bb = std::max(
          min_limit, std::min(max_limit, outputData[index + 6]/input_size));  // y2
      single_box.push_back(bl);
      single_box.push_back(bt);
      single_box.push_back(br);
      single_box.push_back(bb);
      single_box.push_back(outputData[index + 2]);
      single_box.push_back(outputData[index + 1]);
      for(auto s:single_box)
        cout << s << " ";
      cout << endl;
      if ((br - bl) > 0 && (bb - bt) > 0) {
        batch_box.push_back(single_box);
      }
    }
    detections.push_back(batch_box);
  }
  return detections;
}*/

// Unpacks the raw detection output buffer into per-image box lists.
//
// Buffer layout, as read by this function:
//   * dimValues[0] is the batch size and dimValues[3] the number of floats
//     that belong to one batch entry (the stride between entries),
//   * float 0 of each entry holds the number of boxes for that image,
//   * boxes start at float 64 of the entry and take 7 floats each; floats
//     +3, +4, +5, +6 of a box are x1, y1, x2, y2, float +2 is stored as
//     element 4 of the result row and float +1 as element 5 (the caller in
//     this file treats them as score and class id).
//
// Parameters:
//   outputData - raw output buffer; must hold dimValues[0] * dimValues[3] floats.
//   dimNumm    - not consulted (kept for interface compatibility).
//                NOTE(review): presumably the number of entries in dimValues;
//                dimValues[3] is read regardless, so callers must pass at
//                least four dimensions.
//   dimValues  - output tensor dimensions.
//
// Returns one vector per batch entry; each row is {x1, y1, x2, y2, f2, f1}.
// Boxes with non-positive width or height are dropped.
//
// The box count is read from the buffer itself, so it is clamped to the number
// of boxes that actually fit in one entry, (stride - 64) / 7. Without this
// clamp a stale or corrupted count makes the loop read into the next image's
// data or past the end of the buffer. Null pointers yield an empty result.
vector<vector<vector<float>>> getResults(float* outputData,
                                         int dimNumm,
                                         int *dimValues) {
  vector<vector<vector<float>>> detections;
  (void)dimNumm;
  if (outputData == nullptr || dimValues == nullptr) {
    return detections;
  }

  const int kHeaderFloats = 64;  // offset of the first box inside an entry
  const int kFloatsPerBox = 7;   // stride between consecutive boxes

  const int batchSize = dimValues[0];
  const int count = dimValues[3];
  if (batchSize <= 0) {
    return detections;
  }

  // Largest number of boxes one entry can physically hold.
  const int capacity =
      count > kHeaderFloats ? (count - kHeaderFloats) / kFloatsPerBox : 0;

  detections.reserve(batchSize);
  for (int i = 0; i < batchSize; i++) {
    vector<vector<float>> batch_box;
    if (count >= 1) {
      // 64-bit offset: i * count may not fit in an int for large buffers.
      const float* entry = outputData + static_cast<long long>(i) * count;

      // Compare as float first so an out-of-range value is never cast to int.
      const float reported = entry[0];
      int num_boxes = 0;
      if (reported >= static_cast<float>(capacity)) {
        num_boxes = capacity;
      } else if (reported > 0.0f) {
        num_boxes = static_cast<int>(reported);
      }

      const float* box = entry + kHeaderFloats;
      for (int k = 0; k < num_boxes; k++, box += kFloatsPerBox) {
        const float bl = box[3];
        const float bt = box[4];
        const float br = box[5];
        const float bb = box[6];
        if ((br - bl) > 0 && (bb - bt) > 0) {
          vector<float> single_box;
          single_box.reserve(6);
          single_box.push_back(bl);
          single_box.push_back(bt);
          single_box.push_back(br);
          single_box.push_back(bb);
          single_box.push_back(box[2]);
          single_box.push_back(box[1]);
          batch_box.push_back(single_box);
        }
      }
    }
    // Always emit one entry per image so detections[i] lines up with image i.
    detections.push_back(batch_box);
  }
  return detections;
}

2022-01-17 16:50:43 1| 回复

LV.2 #1 lanhao回复

batch size=1没有问题说明离线模型生成方式以及前后处理的方法是没有问题的。首先需要检查batch size=4时的cambricon_twins文件里，batchsize的大小。其次检查融合模式batchsize=4时的推理结果对不对。最后如果融合模式batch size=4的推理结果是正确的，检查融合模式的前后处理与离线模型的前后处理的区别，目前看起来可能是模型推理完进行的batch size=4的后处理有问题。

2022-01-17 15:48:00 1| 回复

请登录后评论