test_int8_layers.cpp 57 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442
  1. // This file is part of OpenCV project.
  2. // It is subject to the license terms in the LICENSE file found in the top-level directory
  3. // of this distribution and at http://opencv.org/license.html.
  4. #include "test_precomp.hpp"
  5. #include "npy_blob.hpp"
  6. #include <opencv2/dnn/shape_utils.hpp>
  7. #include <opencv2/dnn/all_layers.hpp>
  8. namespace opencv_test { namespace {
  9. testing::internal::ParamGenerator< tuple<Backend, Target> > dnnBackendsAndTargetsInt8()
  10. {
  11. std::vector< tuple<Backend, Target> > targets;
  12. targets.push_back(make_tuple(DNN_BACKEND_OPENCV, DNN_TARGET_CPU));
  13. #ifdef HAVE_TIMVX
  14. targets.push_back(make_tuple(DNN_BACKEND_TIMVX, DNN_TARGET_NPU));
  15. #endif
  16. #ifdef HAVE_INF_ENGINE
  17. targets.push_back(make_tuple(DNN_BACKEND_INFERENCE_ENGINE_NGRAPH, DNN_TARGET_CPU));
  18. #endif
  19. return testing::ValuesIn(targets);
  20. }
  21. template<typename TString>
  22. static std::string _tf(TString filename)
  23. {
  24. return (getOpenCVExtraDir() + "dnn/") + filename;
  25. }
  26. class Test_Int8_layers : public DNNTestLayer
  27. {
  28. public:
  29. void testLayer(const String& basename, const String& importer, double l1, double lInf,
  30. int numInps = 1, int numOuts = 1, bool useCaffeModel = false,
  31. bool useCommonInputBlob = true, bool hasText = false, bool perChannel = true)
  32. {
  33. CV_Assert_N(numInps >= 1, numInps <= 10, numOuts >= 1, numOuts <= 10);
  34. std::vector<Mat> inps(numInps), inps_int8(numInps);
  35. std::vector<Mat> refs(numOuts), outs_int8(numOuts), outs_dequantized(numOuts);
  36. std::vector<float> inputScale, outputScale;
  37. std::vector<int> inputZp, outputZp;
  38. String inpPath, outPath;
  39. Net net, qnet;
  40. if (importer == "Caffe")
  41. {
  42. String prototxt = _tf("layers/" + basename + ".prototxt");
  43. String caffemodel = _tf("layers/" + basename + ".caffemodel");
  44. net = readNetFromCaffe(prototxt, useCaffeModel ? caffemodel : String());
  45. inpPath = _tf("layers/" + (useCommonInputBlob ? "blob" : basename + ".input"));
  46. outPath = _tf("layers/" + basename);
  47. }
  48. else if (importer == "TensorFlow")
  49. {
  50. String netPath = _tf("tensorflow/" + basename + "_net.pb");
  51. String netConfig = hasText ? _tf("tensorflow/" + basename + "_net.pbtxt") : "";
  52. net = readNetFromTensorflow(netPath, netConfig);
  53. inpPath = _tf("tensorflow/" + basename + "_in");
  54. outPath = _tf("tensorflow/" + basename + "_out");
  55. }
  56. else if (importer == "ONNX")
  57. {
  58. String onnxmodel = _tf("onnx/models/" + basename + ".onnx");
  59. net = readNetFromONNX(onnxmodel);
  60. inpPath = _tf("onnx/data/input_" + basename);
  61. outPath = _tf("onnx/data/output_" + basename);
  62. }
  63. ASSERT_FALSE(net.empty());
  64. for (int i = 0; i < numInps; i++)
  65. inps[i] = blobFromNPY(inpPath + ((numInps > 1) ? cv::format("_%d.npy", i) : ".npy"));
  66. for (int i = 0; i < numOuts; i++)
  67. refs[i] = blobFromNPY(outPath + ((numOuts > 1) ? cv::format("_%d.npy", i) : ".npy"));
  68. qnet = net.quantize(inps, CV_8S, CV_8S, perChannel);
  69. qnet.getInputDetails(inputScale, inputZp);
  70. qnet.getOutputDetails(outputScale, outputZp);
  71. qnet.setPreferableBackend(backend);
  72. qnet.setPreferableTarget(target);
  73. // Quantize inputs to int8
  74. // int8_value = float_value/scale + zero-point
  75. for (int i = 0; i < numInps; i++)
  76. {
  77. inps[i].convertTo(inps_int8[i], CV_8S, 1.f/inputScale[i], inputZp[i]);
  78. String inp_name = numInps > 1 ? (importer == "Caffe" ? cv::format("input_%d", i) : cv::format("%d", i)) : "";
  79. qnet.setInput(inps_int8[i], inp_name);
  80. }
  81. qnet.forward(outs_int8);
  82. // Dequantize outputs and compare with reference outputs
  83. // float_value = scale*(int8_value - zero-point)
  84. for (int i = 0; i < numOuts; i++)
  85. {
  86. outs_int8[i].convertTo(outs_dequantized[i], CV_32F, outputScale[i], -(outputScale[i] * outputZp[i]));
  87. normAssert(refs[i], outs_dequantized[i], basename.c_str(), l1, lInf);
  88. }
  89. }
  90. };
  91. TEST_P(Test_Int8_layers, Convolution1D)
  92. {
  93. testLayer("conv1d", "ONNX", 0.00302, 0.00909);
  94. testLayer("conv1d_bias", "ONNX", 0.00306, 0.00948);
  95. {
  96. SCOPED_TRACE("Per-tensor quantize");
  97. testLayer("conv1d", "ONNX", 0.00302, 0.00909, 1, 1, false, true, false, false);
  98. testLayer("conv1d_bias", "ONNX", 0.00319, 0.00948, 1, 1, false, true, false, false);
  99. }
  100. }
  101. TEST_P(Test_Int8_layers, Convolution2D)
  102. {
  103. if(backend == DNN_BACKEND_TIMVX)
  104. testLayer("single_conv", "TensorFlow", 0.00424, 0.02201);
  105. else
  106. testLayer("single_conv", "TensorFlow", 0.00413, 0.02201);
  107. testLayer("atrous_conv2d_valid", "TensorFlow", 0.0193, 0.0633);
  108. testLayer("atrous_conv2d_same", "TensorFlow", 0.0185, 0.1322);
  109. testLayer("keras_atrous_conv2d_same", "TensorFlow", 0.0056, 0.0244);
  110. if(backend == DNN_BACKEND_TIMVX)
  111. testLayer("convolution", "ONNX", 0.00534, 0.01516);
  112. else
  113. testLayer("convolution", "ONNX", 0.0052, 0.01516);
  114. if(backend == DNN_BACKEND_TIMVX)
  115. testLayer("two_convolution", "ONNX", 0.0033, 0.01);
  116. else
  117. testLayer("two_convolution", "ONNX", 0.00295, 0.00840);
  118. if(backend == DNN_BACKEND_TIMVX)
  119. applyTestTag(CV_TEST_TAG_DNN_SKIP_TIMVX);
  120. testLayer("layer_convolution", "Caffe", 0.0174, 0.0758, 1, 1, true);
  121. testLayer("depthwise_conv2d", "TensorFlow", 0.0388, 0.169);
  122. {
  123. SCOPED_TRACE("Per-tensor quantize");
  124. testLayer("single_conv", "TensorFlow", 0.00413, 0.02301, 1, 1, false, true, false, false);
  125. testLayer("atrous_conv2d_valid", "TensorFlow", 0.027967, 0.07808, 1, 1, false, true, false, false);
  126. testLayer("atrous_conv2d_same", "TensorFlow", 0.01945, 0.1322, 1, 1, false, true, false, false);
  127. testLayer("keras_atrous_conv2d_same", "TensorFlow", 0.005677, 0.03327, 1, 1, false, true, false, false);
  128. testLayer("convolution", "ONNX", 0.00538, 0.01517, 1, 1, false, true, false, false);
  129. testLayer("two_convolution", "ONNX", 0.00295, 0.00926, 1, 1, false, true, false, false);
  130. testLayer("layer_convolution", "Caffe", 0.0175, 0.0759, 1, 1, true, true, false, false);
  131. testLayer("depthwise_conv2d", "TensorFlow", 0.041847, 0.18744, 1, 1, false, true, false, false);
  132. }
  133. }
  134. TEST_P(Test_Int8_layers, Convolution3D)
  135. {
  136. testLayer("conv3d", "TensorFlow", 0.00734, 0.02434);
  137. testLayer("conv3d", "ONNX", 0.00353, 0.00941);
  138. testLayer("conv3d_bias", "ONNX", 0.00129, 0.00249);
  139. }
  140. TEST_P(Test_Int8_layers, Flatten)
  141. {
  142. testLayer("flatten", "TensorFlow", 0.0036, 0.0069, 1, 1, false, true, true);
  143. testLayer("unfused_flatten", "TensorFlow", 0.0014, 0.0028);
  144. testLayer("unfused_flatten_unknown_batch", "TensorFlow", 0.0043, 0.0051);
  145. {
  146. SCOPED_TRACE("Per-tensor quantize");
  147. testLayer("conv3d", "TensorFlow", 0.00734, 0.02434, 1, 1, false, true, false, false);
  148. testLayer("conv3d", "ONNX", 0.00377, 0.01362, 1, 1, false, true, false, false);
  149. testLayer("conv3d_bias", "ONNX", 0.00201, 0.0039, 1, 1, false, true, false, false);
  150. }
  151. }
  152. TEST_P(Test_Int8_layers, Padding)
  153. {
  154. if (backend == DNN_BACKEND_TIMVX)
  155. testLayer("padding_valid", "TensorFlow", 0.0292, 0.0105);
  156. else
  157. testLayer("padding_valid", "TensorFlow", 0.0026, 0.0064);
  158. if (backend == DNN_BACKEND_TIMVX)
  159. testLayer("padding_same", "TensorFlow", 0.0085, 0.032);
  160. else
  161. testLayer("padding_same", "TensorFlow", 0.0081, 0.032);
  162. if (backend == DNN_BACKEND_TIMVX)
  163. testLayer("spatial_padding", "TensorFlow", 0.0079, 0.028);
  164. else
  165. testLayer("spatial_padding", "TensorFlow", 0.0078, 0.028);
  166. testLayer("mirror_pad", "TensorFlow", 0.0064, 0.013);
  167. testLayer("pad_and_concat", "TensorFlow", 0.0021, 0.0098);
  168. testLayer("padding", "ONNX", 0.0005, 0.0069);
  169. testLayer("ReflectionPad2d", "ONNX", 0.00062, 0.0018);
  170. testLayer("ZeroPad2d", "ONNX", 0.00037, 0.0018);
  171. }
  172. TEST_P(Test_Int8_layers, AvePooling)
  173. {
  174. // Some tests failed with OpenVINO due to wrong padded area calculation
  175. if (backend != DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  176. testLayer("layer_pooling_ave", "Caffe", 0.0021, 0.0075);
  177. testLayer("ave_pool_same", "TensorFlow", 0.00153, 0.0041);
  178. testLayer("average_pooling_1d", "ONNX", 0.002, 0.0048);
  179. if (backend != DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  180. testLayer("average_pooling", "ONNX", 0.0014, 0.0032);
  181. testLayer("average_pooling_dynamic_axes", "ONNX", 0.0014, 0.006);
  182. if (target != DNN_TARGET_CPU)
  183. throw SkipTestException("Only CPU is supported");
  184. testLayer("ave_pool3d", "TensorFlow", 0.00175, 0.0047);
  185. testLayer("ave_pool3d", "ONNX", 0.00063, 0.0016);
  186. }
  187. TEST_P(Test_Int8_layers, MaxPooling)
  188. {
  189. testLayer("pool_conv_1d", "ONNX", 0.0006, 0.0015);
  190. if (target != DNN_TARGET_CPU)
  191. throw SkipTestException("Only CPU is supported");
  192. testLayer("pool_conv_3d", "ONNX", 0.0033, 0.0124);
  193. testLayer("layer_pooling_max", "Caffe", 0.0021, 0.004);
  194. testLayer("max_pool_even", "TensorFlow", 0.0048, 0.0139);
  195. testLayer("max_pool_odd_valid", "TensorFlow", 0.0043, 0.012);
  196. testLayer("conv_pool_nchw", "TensorFlow", 0.007, 0.025);
  197. testLayer("max_pool3d", "TensorFlow", 0.0025, 0.0058);
  198. testLayer("maxpooling_1d", "ONNX", 0.0018, 0.0037);
  199. testLayer("two_maxpooling_1d", "ONNX", 0.0037, 0.0052);
  200. testLayer("maxpooling", "ONNX", 0.0034, 0.0065);
  201. testLayer("two_maxpooling", "ONNX", 0.0025, 0.0052);
  202. testLayer("max_pool3d", "ONNX", 0.0028, 0.0069);
  203. }
  204. TEST_P(Test_Int8_layers, Reduce)
  205. {
  206. testLayer("reduce_mean", "TensorFlow", 0.0005, 0.0014);
  207. testLayer("reduce_mean", "ONNX", 0.00062, 0.0014);
  208. testLayer("reduce_mean_axis1", "ONNX", 0.00032, 0.0007);
  209. testLayer("reduce_mean_axis2", "ONNX", 0.00033, 0.001);
  210. testLayer("reduce_sum", "TensorFlow", 0.015, 0.031);
  211. testLayer("reduce_sum_channel", "TensorFlow", 0.008, 0.019);
  212. testLayer("sum_pool_by_axis", "TensorFlow", 0.012, 0.032);
  213. testLayer("reduce_sum", "ONNX", 0.0025, 0.0048);
  214. testLayer("reduce_max", "ONNX", 0, 0);
  215. testLayer("reduce_max_axis_0", "ONNX", 0.0042, 0.007);
  216. testLayer("reduce_max_axis_1", "ONNX", 0.0018, 0.0036);
  217. if (target != DNN_TARGET_CPU)
  218. throw SkipTestException("Only CPU is supported");
  219. testLayer("reduce_mean3d", "ONNX", 0.00048, 0.0016);
  220. }
  221. TEST_P(Test_Int8_layers, ReLU)
  222. {
  223. testLayer("layer_relu", "Caffe", 0.0005, 0.002);
  224. testLayer("ReLU", "ONNX", 0.0012, 0.0047);
  225. }
  226. TEST_P(Test_Int8_layers, LeakyReLU)
  227. {
  228. testLayer("leaky_relu", "TensorFlow", 0.0002, 0.0004);
  229. }
  230. TEST_P(Test_Int8_layers, ReLU6)
  231. {
  232. testLayer("keras_relu6", "TensorFlow", 0.0018, 0.0062);
  233. testLayer("keras_relu6", "TensorFlow", 0.0018, 0.0062, 1, 1, false, true, true);
  234. testLayer("clip_by_value", "TensorFlow", 0.0009, 0.002);
  235. testLayer("clip", "ONNX", 0.00006, 0.00037);
  236. }
  237. TEST_P(Test_Int8_layers, Sigmoid)
  238. {
  239. testLayer("maxpooling_sigmoid", "ONNX", 0.0011, 0.0032);
  240. }
  241. TEST_P(Test_Int8_layers, Sigmoid_dynamic_axes)
  242. {
  243. testLayer("maxpooling_sigmoid_dynamic_axes", "ONNX", 0.002, 0.0032);
  244. }
  245. TEST_P(Test_Int8_layers, Sigmoid_1d)
  246. {
  247. testLayer("maxpooling_sigmoid_1d", "ONNX", 0.002, 0.0037);
  248. }
  249. TEST_P(Test_Int8_layers, Mish)
  250. {
  251. testLayer("mish", "ONNX", 0.0015, 0.0025);
  252. }
  253. TEST_P(Test_Int8_layers, Softmax_Caffe)
  254. {
  255. testLayer("layer_softmax", "Caffe", 0.0011, 0.0036);
  256. }
  257. TEST_P(Test_Int8_layers, Softmax_keras_TF)
  258. {
  259. testLayer("keras_softmax", "TensorFlow", 0.00093, 0.0027);
  260. }
  261. TEST_P(Test_Int8_layers, Softmax_slim_TF)
  262. {
  263. testLayer("slim_softmax", "TensorFlow", 0.0016, 0.0034);
  264. }
  265. TEST_P(Test_Int8_layers, Softmax_slim_v2_TF)
  266. {
  267. testLayer("slim_softmax_v2", "TensorFlow", 0.0029, 0.017);
  268. }
  269. TEST_P(Test_Int8_layers, Softmax_ONNX)
  270. {
  271. testLayer("softmax", "ONNX", 0.0016, 0.0028);
  272. }
  273. TEST_P(Test_Int8_layers, Softmax_log_ONNX)
  274. {
  275. testLayer("log_softmax", "ONNX", 0.014, 0.025);
  276. }
  277. TEST_P(Test_Int8_layers, DISABLED_Softmax_unfused_ONNX) // FIXIT Support 'Identity' layer for outputs (#22022)
  278. {
  279. testLayer("softmax_unfused", "ONNX", 0.0009, 0.0021);
  280. }
  281. TEST_P(Test_Int8_layers, Concat)
  282. {
  283. testLayer("layer_concat_shared_input", "Caffe", 0.0076, 0.029, 1, 1, true, false);
  284. if (backend != DNN_BACKEND_INFERENCE_ENGINE_NGRAPH) {
  285. // Crashes with segfault
  286. testLayer("concat_axis_1", "TensorFlow", 0.0056, 0.017);
  287. }
  288. testLayer("keras_pad_concat", "TensorFlow", 0.0032, 0.0089);
  289. testLayer("concat_3d", "TensorFlow", 0.005, 0.014);
  290. testLayer("concatenation", "ONNX", 0.0032, 0.009);
  291. }
  292. TEST_P(Test_Int8_layers, BatchNorm)
  293. {
  294. testLayer("layer_batch_norm", "Caffe", 0.0061, 0.019, 1, 1, true);
  295. testLayer("fused_batch_norm", "TensorFlow", 0.0063, 0.02);
  296. testLayer("batch_norm_text", "TensorFlow", 0.0048, 0.013, 1, 1, false, true, true);
  297. testLayer("unfused_batch_norm", "TensorFlow", 0.0076, 0.019);
  298. testLayer("fused_batch_norm_no_gamma", "TensorFlow", 0.0067, 0.015);
  299. testLayer("unfused_batch_norm_no_gamma", "TensorFlow", 0.0123, 0.044);
  300. testLayer("switch_identity", "TensorFlow", 0.0035, 0.011);
  301. testLayer("batch_norm3d", "TensorFlow", 0.0077, 0.02);
  302. testLayer("batch_norm", "ONNX", 0.0012, 0.0049);
  303. testLayer("batch_norm_3d", "ONNX", 0.0039, 0.012);
  304. testLayer("frozenBatchNorm2d", "ONNX", 0.001, 0.0018);
  305. testLayer("batch_norm_subgraph", "ONNX", 0.0049, 0.0098);
  306. }
  307. TEST_P(Test_Int8_layers, Scale)
  308. {
  309. testLayer("batch_norm", "TensorFlow", 0.0028, 0.0098);
  310. testLayer("scale", "ONNX", 0.0025, 0.0071);
  311. testLayer("expand_hw", "ONNX", 0.0012, 0.0012);
  312. testLayer("flatten_const", "ONNX", 0.0024, 0.0048);
  313. }
  314. TEST_P(Test_Int8_layers, InnerProduct)
  315. {
  316. testLayer("layer_inner_product", "Caffe", 0.005, 0.02, 1, 1, true);
  317. testLayer("matmul", "TensorFlow", 0.0061, 0.019);
  318. if (backend == DNN_BACKEND_TIMVX)
  319. testLayer("nhwc_transpose_reshape_matmul", "TensorFlow", 0.0018, 0.0175);
  320. else
  321. testLayer("nhwc_transpose_reshape_matmul", "TensorFlow", 0.0009, 0.0091);
  322. testLayer("nhwc_reshape_matmul", "TensorFlow", 0.03, 0.071);
  323. testLayer("matmul_layout", "TensorFlow", 0.035, 0.06);
  324. testLayer("tf2_dense", "TensorFlow", 0, 0);
  325. testLayer("matmul_add", "ONNX", 0.041, 0.082);
  326. testLayer("linear", "ONNX", 0.0027, 0.0046);
  327. if (backend == DNN_BACKEND_TIMVX)
  328. testLayer("constant", "ONNX", 0.00048, 0.0013);
  329. else
  330. testLayer("constant", "ONNX", 0.00021, 0.0006);
  331. testLayer("lin_with_constant", "ONNX", 0.0011, 0.0016);
  332. {
  333. SCOPED_TRACE("Per-tensor quantize");
  334. testLayer("layer_inner_product", "Caffe", 0.0055, 0.02, 1, 1, true, true, false, false);
  335. testLayer("matmul", "TensorFlow", 0.0075, 0.019, 1, 1, false, true, false, false);
  336. testLayer("nhwc_transpose_reshape_matmul", "TensorFlow", 0.0009, 0.0091, 1, 1, false, true, false, false);
  337. testLayer("nhwc_reshape_matmul", "TensorFlow", 0.037, 0.071, 1, 1, false, true, false, false);
  338. testLayer("matmul_layout", "TensorFlow", 0.035, 0.095, 1, 1, false, true, false, false);
  339. testLayer("tf2_dense", "TensorFlow", 0, 0, 1, 1, false, true, false, false);
  340. testLayer("matmul_add", "ONNX", 0.041, 0.082, 1, 1, false, true, false, false);
  341. testLayer("linear", "ONNX", 0.0027, 0.005, 1, 1, false, true, false, false);
  342. testLayer("constant", "ONNX", 0.00038, 0.0012, 1, 1, false, true, false, false);
  343. testLayer("lin_with_constant", "ONNX", 0.0011, 0.0016, 1, 1, false, true, false, false);
  344. }
  345. }
  346. TEST_P(Test_Int8_layers, Reshape)
  347. {
  348. testLayer("reshape_layer", "TensorFlow", 0.0032, 0.0082);
  349. if (backend == DNN_BACKEND_TIMVX)
  350. testLayer("reshape_nchw", "TensorFlow", 0.0092, 0.0495);
  351. else
  352. testLayer("reshape_nchw", "TensorFlow", 0.0089, 0.029);
  353. testLayer("reshape_conv", "TensorFlow", 0.035, 0.054);
  354. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  355. testLayer("reshape_reduce", "TensorFlow", 0.0053, 0.011);
  356. else
  357. testLayer("reshape_reduce", "TensorFlow", 0.0042, 0.0078);
  358. testLayer("reshape_as_shape", "TensorFlow", 0.0014, 0.0028);
  359. testLayer("reshape_no_reorder", "TensorFlow", 0.0014, 0.0028);
  360. testLayer("shift_reshape_no_reorder", "TensorFlow", 0.0063, backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH ? 0.016 : 0.014);
  361. testLayer("dynamic_reshape", "ONNX", 0.0047, 0.0079);
  362. testLayer("dynamic_reshape_opset_11", "ONNX", 0.0048, 0.0081);
  363. testLayer("flatten_by_prod", "ONNX", 0.0048, 0.0081);
  364. testLayer("squeeze", "ONNX", 0.0048, 0.0081);
  365. testLayer("unsqueeze", "ONNX", 0.0033, 0.0053);
  366. if (backend == DNN_BACKEND_TIMVX)
  367. testLayer("squeeze_and_conv_dynamic_axes", "ONNX", 0.006, 0.0212);
  368. else
  369. testLayer("squeeze_and_conv_dynamic_axes", "ONNX", 0.0054, 0.0154);
  370. testLayer("unsqueeze_and_conv_dynamic_axes", "ONNX", 0.0037, 0.0151);
  371. }
  372. TEST_P(Test_Int8_layers, Permute)
  373. {
  374. testLayer("tf2_permute_nhwc_ncwh", "TensorFlow", 0.0028, 0.006);
  375. testLayer("transpose", "ONNX", 0.0015, 0.0046);
  376. }
  377. TEST_P(Test_Int8_layers, Identity)
  378. {
  379. testLayer("expand_batch", "ONNX", 0.0027, 0.0036);
  380. testLayer("expand_channels", "ONNX", 0.0013, 0.0019);
  381. testLayer("expand_neg_batch", "ONNX", 0.00071, 0.0019);
  382. }
  383. TEST_P(Test_Int8_layers, Slice_split_tf)
  384. {
  385. testLayer("split", "TensorFlow", 0.0033, 0.0056);
  386. }
  387. TEST_P(Test_Int8_layers, Slice_4d_tf)
  388. {
  389. testLayer("slice_4d", "TensorFlow", 0.003, 0.0073);
  390. }
  391. TEST_P(Test_Int8_layers, Slice_strided_tf)
  392. {
  393. testLayer("strided_slice", "TensorFlow", 0.008, 0.0142);
  394. }
  395. TEST_P(Test_Int8_layers, DISABLED_Slice_onnx) // FIXIT Support 'Identity' layer for outputs (#22022)
  396. {
  397. testLayer("slice", "ONNX", 0.0046, 0.0077);
  398. }
  399. TEST_P(Test_Int8_layers, Slice_dynamic_axes_onnx)
  400. {
  401. testLayer("slice_dynamic_axes", "ONNX", 0.0039, 0.02);
  402. }
  403. TEST_P(Test_Int8_layers, Slice_steps_2d_onnx11)
  404. {
  405. testLayer("slice_opset_11_steps_2d", "ONNX", 0.01, 0.0124);
  406. }
  407. TEST_P(Test_Int8_layers, Slice_steps_3d_onnx11)
  408. {
  409. testLayer("slice_opset_11_steps_3d", "ONNX", 0.0068, 0.014);
  410. }
  411. TEST_P(Test_Int8_layers, Slice_steps_4d_onnx11)
  412. {
  413. testLayer("slice_opset_11_steps_4d", "ONNX", 0.0041, 0.008);
  414. }
  415. TEST_P(Test_Int8_layers, Slice_steps_5d_onnx11)
  416. {
  417. testLayer("slice_opset_11_steps_5d", "ONNX", 0.0085, 0.021);
  418. }
  419. TEST_P(Test_Int8_layers, Dropout)
  420. {
  421. testLayer("layer_dropout", "Caffe", 0.0021, 0.004);
  422. testLayer("dropout", "ONNX", 0.0029, 0.004);
  423. }
  424. TEST_P(Test_Int8_layers, Eltwise)
  425. {
  426. testLayer("layer_eltwise", "Caffe", 0.062, 0.15);
  427. if (backend == DNN_BACKEND_TIMVX)
  428. applyTestTag(CV_TEST_TAG_DNN_SKIP_TIMVX);
  429. testLayer("conv_2_inps", "Caffe", 0.0086, 0.0232, 2, 1, true, false);
  430. testLayer("eltwise_sub", "TensorFlow", 0.015, 0.047);
  431. testLayer("eltwise_add_vec", "TensorFlow", 0.037, backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH ? 0.24 : 0.21); // tflite 0.0095, 0.0365
  432. testLayer("eltwise_mul_vec", "TensorFlow", 0.173, 1.14); // tflite 0.0028, 0.017
  433. testLayer("channel_broadcast", "TensorFlow", 0.0025, 0.0063);
  434. testLayer("split_equals", "TensorFlow", backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH ? 0.021 : 0.02, 0.065);
  435. testLayer("mul", "ONNX", 0.0039, 0.014);
  436. testLayer("split_max", "ONNX", 0.004, 0.012);
  437. }
  438. TEST_P(Test_Int8_layers, DepthSpaceOps) {
  439. auto test_layer_with_onnx_conformance_models = [&](const std::string &model_name, double l1, double lInf) {
  440. std::string model_path = _tf("onnx/conformance/node/test_" + model_name + "/model.onnx");
  441. auto net = readNet(model_path);
  442. // load reference inputs and outputs
  443. std::string data_base_path = _tf("onnx/conformance/node/test_" + model_name + "/test_data_set_0");
  444. Mat input = readTensorFromONNX(data_base_path + "/input_0.pb");
  445. Mat ref_output = readTensorFromONNX(data_base_path + "/output_0.pb");
  446. std::vector<float> input_scales, output_scales;
  447. std::vector<int> input_zeropoints, output_zeropoints;
  448. auto qnet = net.quantize(std::vector<Mat>{input}, CV_8S, CV_8S, false);
  449. qnet.getInputDetails(input_scales, input_zeropoints);
  450. qnet.getOutputDetails(output_scales, output_zeropoints);
  451. qnet.setPreferableBackend(backend);
  452. qnet.setPreferableTarget(target);
  453. Mat quantized_input, quantized_output;
  454. input.convertTo(quantized_input, CV_8S, 1.f / input_scales.front(), input_zeropoints.front());
  455. qnet.setInput(quantized_input);
  456. quantized_output = qnet.forward();
  457. Mat output;
  458. quantized_output.convertTo(output, CV_32F, output_scales.front(), -(output_scales.front() * output_zeropoints.front()));
  459. normAssert(ref_output, output, model_name.c_str(), l1, lInf);
  460. };
  461. double l1 = default_l1, lInf = default_lInf;
  462. {
  463. l1 = 0.001; lInf = 0.002;
  464. if (backend == DNN_BACKEND_TIMVX) { l1 = 0.001; lInf = 0.002; }
  465. test_layer_with_onnx_conformance_models("spacetodepth", l1, lInf);
  466. }
  467. {
  468. l1 = 0.022; lInf = 0.044;
  469. if (backend == DNN_BACKEND_TIMVX) { l1 = 0.022; lInf = 0.044; }
  470. test_layer_with_onnx_conformance_models("spacetodepth_example", l1, lInf);
  471. }
  472. {
  473. l1 = 0.001; lInf = 0.002;
  474. if (backend == DNN_BACKEND_TIMVX) { l1 = 0.24; lInf = 0.99; }
  475. test_layer_with_onnx_conformance_models("depthtospace_crd_mode", l1, lInf);
  476. }
  477. test_layer_with_onnx_conformance_models("depthtospace_dcr_mode", 0.001, 0.002);
  478. test_layer_with_onnx_conformance_models("depthtospace_example", 0.07, 0.14);
  479. {
  480. l1 = 0.07; lInf = 0.14;
  481. if (backend == DNN_BACKEND_TIMVX) // diff too huge, l1 = 13.6; lInf = 27.2
  482. applyTestTag(CV_TEST_TAG_DNN_SKIP_TIMVX);
  483. test_layer_with_onnx_conformance_models("depthtospace_crd_mode_example", l1, lInf);
  484. }
  485. }
  486. INSTANTIATE_TEST_CASE_P(/**/, Test_Int8_layers, dnnBackendsAndTargetsInt8());
  487. class Test_Int8_nets : public DNNTestLayer
  488. {
  489. public:
  490. void testClassificationNet(Net baseNet, const Mat& blob, const Mat& ref, double l1, double lInf, bool perChannel = true)
  491. {
  492. Net qnet = baseNet.quantize(blob, CV_32F, CV_32F, perChannel);
  493. qnet.setPreferableBackend(backend);
  494. qnet.setPreferableTarget(target);
  495. qnet.setInput(blob);
  496. Mat out = qnet.forward();
  497. normAssert(ref, out, "", l1, lInf);
  498. }
  499. void testDetectionNet(Net baseNet, const Mat& blob, const Mat& ref,
  500. double confThreshold, double scoreDiff, double iouDiff, bool perChannel = true)
  501. {
  502. Net qnet = baseNet.quantize(blob, CV_32F, CV_32F, perChannel);
  503. qnet.setPreferableBackend(backend);
  504. qnet.setPreferableTarget(target);
  505. qnet.setInput(blob);
  506. Mat out = qnet.forward();
  507. normAssertDetections(ref, out, "", confThreshold, scoreDiff, iouDiff);
  508. }
  509. void testFaster(Net baseNet, const Mat& ref, double confThreshold, double scoreDiff, double iouDiff, bool perChannel = true)
  510. {
  511. Mat inp = imread(_tf("dog416.png"));
  512. resize(inp, inp, Size(800, 600));
  513. Mat blob = blobFromImage(inp, 1.0, Size(), Scalar(102.9801, 115.9465, 122.7717), false, false);
  514. Mat imInfo = (Mat_<float>(1, 3) << inp.rows, inp.cols, 1.6f);
  515. Net qnet = baseNet.quantize(std::vector<Mat>{blob, imInfo}, CV_32F, CV_32F, perChannel);
  516. qnet.setPreferableBackend(backend);
  517. qnet.setPreferableTarget(target);
  518. qnet.setInput(blob, "data");
  519. qnet.setInput(imInfo, "im_info");
  520. Mat out = qnet.forward();
  521. normAssertDetections(ref, out, "", confThreshold, scoreDiff, iouDiff);
  522. }
  523. void testONNXNet(const String& basename, double l1, double lInf, bool useSoftmax = false, bool perChannel = true)
  524. {
  525. String onnxmodel = findDataFile("dnn/onnx/models/" + basename + ".onnx", false);
  526. Mat blob = readTensorFromONNX(findDataFile("dnn/onnx/data/input_" + basename + ".pb"));
  527. Mat ref = readTensorFromONNX(findDataFile("dnn/onnx/data/output_" + basename + ".pb"));
  528. Net baseNet = readNetFromONNX(onnxmodel);
  529. Net qnet = baseNet.quantize(blob, CV_32F, CV_32F, perChannel);
  530. qnet.setPreferableBackend(backend);
  531. qnet.setPreferableTarget(target);
  532. qnet.setInput(blob);
  533. Mat out = qnet.forward();
  534. if (useSoftmax)
  535. {
  536. LayerParams lp;
  537. Net netSoftmax;
  538. netSoftmax.addLayerToPrev("softmaxLayer", "Softmax", lp);
  539. netSoftmax.setPreferableBackend(DNN_BACKEND_OPENCV);
  540. netSoftmax.setInput(out);
  541. out = netSoftmax.forward();
  542. netSoftmax.setInput(ref);
  543. ref = netSoftmax.forward();
  544. }
  545. normAssert(ref, out, "", l1, lInf);
  546. }
  547. void testDarknetModel(const std::string& cfg, const std::string& weights,
  548. const cv::Mat& ref, double scoreDiff, double iouDiff,
  549. float confThreshold = 0.24, float nmsThreshold = 0.4, bool perChannel = true)
  550. {
  551. CV_Assert(ref.cols == 7);
  552. std::vector<std::vector<int> > refClassIds;
  553. std::vector<std::vector<float> > refScores;
  554. std::vector<std::vector<Rect2d> > refBoxes;
  555. for (int i = 0; i < ref.rows; ++i)
  556. {
  557. int batchId = static_cast<int>(ref.at<float>(i, 0));
  558. int classId = static_cast<int>(ref.at<float>(i, 1));
  559. float score = ref.at<float>(i, 2);
  560. float left = ref.at<float>(i, 3);
  561. float top = ref.at<float>(i, 4);
  562. float right = ref.at<float>(i, 5);
  563. float bottom = ref.at<float>(i, 6);
  564. Rect2d box(left, top, right - left, bottom - top);
  565. if (batchId >= refClassIds.size())
  566. {
  567. refClassIds.resize(batchId + 1);
  568. refScores.resize(batchId + 1);
  569. refBoxes.resize(batchId + 1);
  570. }
  571. refClassIds[batchId].push_back(classId);
  572. refScores[batchId].push_back(score);
  573. refBoxes[batchId].push_back(box);
  574. }
  575. Mat img1 = imread(_tf("dog416.png"));
  576. Mat img2 = imread(_tf("street.png"));
  577. std::vector<Mat> samples(2);
  578. samples[0] = img1; samples[1] = img2;
  579. // determine test type, whether batch or single img
  580. int batch_size = refClassIds.size();
  581. CV_Assert(batch_size == 1 || batch_size == 2);
  582. samples.resize(batch_size);
  583. Mat inp = blobFromImages(samples, 1.0/255, Size(416, 416), Scalar(), true, false);
  584. Net baseNet = readNetFromDarknet(findDataFile("dnn/" + cfg), findDataFile("dnn/" + weights, false));
  585. Net qnet = baseNet.quantize(inp, CV_32F, CV_32F, perChannel);
  586. qnet.setPreferableBackend(backend);
  587. qnet.setPreferableTarget(target);
  588. qnet.setInput(inp);
  589. std::vector<Mat> outs;
  590. qnet.forward(outs, qnet.getUnconnectedOutLayersNames());
  591. for (int b = 0; b < batch_size; ++b)
  592. {
  593. std::vector<int> classIds;
  594. std::vector<float> confidences;
  595. std::vector<Rect2d> boxes;
  596. for (int i = 0; i < outs.size(); ++i)
  597. {
  598. Mat out;
  599. if (batch_size > 1){
  600. // get the sample slice from 3D matrix (batch, box, classes+5)
  601. Range ranges[3] = {Range(b, b+1), Range::all(), Range::all()};
  602. out = outs[i](ranges).reshape(1, outs[i].size[1]);
  603. }else{
  604. out = outs[i];
  605. }
  606. for (int j = 0; j < out.rows; ++j)
  607. {
  608. Mat scores = out.row(j).colRange(5, out.cols);
  609. double confidence;
  610. Point maxLoc;
  611. minMaxLoc(scores, 0, &confidence, 0, &maxLoc);
  612. if (confidence > confThreshold) {
  613. float* detection = out.ptr<float>(j);
  614. double centerX = detection[0];
  615. double centerY = detection[1];
  616. double width = detection[2];
  617. double height = detection[3];
  618. boxes.push_back(Rect2d(centerX - 0.5 * width, centerY - 0.5 * height,
  619. width, height));
  620. confidences.push_back(confidence);
  621. classIds.push_back(maxLoc.x);
  622. }
  623. }
  624. }
  625. // here we need NMS of boxes
  626. std::vector<int> indices;
  627. NMSBoxes(boxes, confidences, confThreshold, nmsThreshold, indices);
  628. std::vector<int> nms_classIds;
  629. std::vector<float> nms_confidences;
  630. std::vector<Rect2d> nms_boxes;
  631. for (size_t i = 0; i < indices.size(); ++i)
  632. {
  633. int idx = indices[i];
  634. Rect2d box = boxes[idx];
  635. float conf = confidences[idx];
  636. int class_id = classIds[idx];
  637. nms_boxes.push_back(box);
  638. nms_confidences.push_back(conf);
  639. nms_classIds.push_back(class_id);
  640. }
  641. if (cvIsNaN(iouDiff))
  642. {
  643. if (b == 0)
  644. std::cout << "Skip accuracy checks" << std::endl;
  645. continue;
  646. }
  647. normAssertDetections(refClassIds[b], refScores[b], refBoxes[b], nms_classIds, nms_confidences, nms_boxes,
  648. format("batch size %d, sample %d\n", batch_size, b).c_str(), confThreshold, scoreDiff, iouDiff);
  649. }
  650. }
  651. };
  652. TEST_P(Test_Int8_nets, AlexNet)
  653. {
  654. #if defined(OPENCV_32BIT_CONFIGURATION) && defined(HAVE_OPENCL)
  655. applyTestTag(CV_TEST_TAG_MEMORY_2GB);
  656. #else
  657. applyTestTag(target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_1GB);
  658. #endif
  659. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  660. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  661. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  662. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  663. Net net = readNetFromCaffe(findDataFile("dnn/bvlc_alexnet.prototxt"),
  664. findDataFile("dnn/bvlc_alexnet.caffemodel", false));
  665. Mat inp = imread(_tf("grace_hopper_227.png"));
  666. Mat blob = blobFromImage(inp, 1.0, Size(227, 227), Scalar(), false);
  667. Mat ref = blobFromNPY(_tf("caffe_alexnet_prob.npy"));
  668. float l1 = 1e-4, lInf = 0.003;
  669. testClassificationNet(net, blob, ref, l1, lInf);
  670. }
  671. TEST_P(Test_Int8_nets, GoogLeNet)
  672. {
  673. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  674. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  675. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  676. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  677. Net net = readNetFromCaffe(findDataFile("dnn/bvlc_googlenet.prototxt"),
  678. findDataFile("dnn/bvlc_googlenet.caffemodel", false));
  679. std::vector<Mat> inpMats;
  680. inpMats.push_back( imread(_tf("googlenet_0.png")) );
  681. inpMats.push_back( imread(_tf("googlenet_1.png")) );
  682. Mat blob = blobFromImages(inpMats, 1.0, Size(224, 224), Scalar(), false);
  683. Mat ref = blobFromNPY(_tf("googlenet_prob.npy"));
  684. float l1 = 2e-4, lInf = 0.07;
  685. testClassificationNet(net, blob, ref, l1, lInf);
  686. }
  687. TEST_P(Test_Int8_nets, ResNet50)
  688. {
  689. applyTestTag(
  690. target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_1GB,
  691. CV_TEST_TAG_DEBUG_VERYLONG
  692. );
  693. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  694. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  695. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  696. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  697. Net net = readNetFromCaffe(findDataFile("dnn/ResNet-50-deploy.prototxt"),
  698. findDataFile("dnn/ResNet-50-model.caffemodel", false));
  699. Mat inp = imread(_tf("googlenet_0.png"));
  700. Mat blob = blobFromImage(inp, 1.0, Size(224, 224), Scalar(), false);
  701. Mat ref = blobFromNPY(_tf("resnet50_prob.npy"));
  702. float l1 = 3e-4, lInf = 0.05;
  703. testClassificationNet(net, blob, ref, l1, lInf);
  704. {
  705. SCOPED_TRACE("Per-tensor quantize");
  706. testClassificationNet(net, blob, ref, l1, lInf, false);
  707. }
  708. }
  709. TEST_P(Test_Int8_nets, DenseNet121)
  710. {
  711. applyTestTag(CV_TEST_TAG_MEMORY_512MB);
  712. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  713. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  714. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  715. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  716. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  717. applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_NGRAPH);
  718. Net net = readNetFromCaffe(findDataFile("dnn/DenseNet_121.prototxt", false),
  719. findDataFile("dnn/DenseNet_121.caffemodel", false));
  720. Mat inp = imread(_tf("dog416.png"));
  721. Mat blob = blobFromImage(inp, 1.0 / 255.0, Size(224, 224), Scalar(), true, true);
  722. Mat ref = blobFromNPY(_tf("densenet_121_output.npy"));
  723. float l1 = 0.76, lInf = 3.31; // seems wrong
  724. testClassificationNet(net, blob, ref, l1, lInf);
  725. }
  726. TEST_P(Test_Int8_nets, SqueezeNet_v1_1)
  727. {
  728. if(target == DNN_TARGET_OPENCL_FP16)
  729. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  730. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  731. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  732. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  733. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  734. Net net = readNetFromCaffe(findDataFile("dnn/squeezenet_v1.1.prototxt"),
  735. findDataFile("dnn/squeezenet_v1.1.caffemodel", false));
  736. Mat inp = imread(_tf("googlenet_0.png"));
  737. Mat blob = blobFromImage(inp, 1.0, Size(227, 227), Scalar(), false, true);
  738. Mat ref = blobFromNPY(_tf("squeezenet_v1.1_prob.npy"));
  739. float l1 = 3e-4, lInf = 0.056;
  740. testClassificationNet(net, blob, ref, l1, lInf);
  741. }
  742. TEST_P(Test_Int8_nets, CaffeNet)
  743. {
  744. #if defined(OPENCV_32BIT_CONFIGURATION) && (defined(HAVE_OPENCL) || defined(_WIN32))
  745. applyTestTag(CV_TEST_TAG_MEMORY_2GB);
  746. #else
  747. applyTestTag(target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_1GB);
  748. #endif
  749. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  750. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  751. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  752. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  753. float l1 = 4e-5, lInf = 0.0025;
  754. testONNXNet("caffenet", l1, lInf);
  755. }
  756. TEST_P(Test_Int8_nets, RCNN_ILSVRC13)
  757. {
  758. #if defined(OPENCV_32BIT_CONFIGURATION) && (defined(HAVE_OPENCL) || defined(_WIN32))
  759. applyTestTag(CV_TEST_TAG_MEMORY_2GB);
  760. #else
  761. applyTestTag(target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_1GB);
  762. #endif
  763. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  764. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  765. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  766. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  767. float l1 = 0.02, lInf = 0.047;
  768. testONNXNet("rcnn_ilsvrc13", l1, lInf);
  769. }
  770. TEST_P(Test_Int8_nets, Inception_v2)
  771. {
  772. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  773. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  774. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  775. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  776. testONNXNet("inception_v2", default_l1, default_lInf, true);
  777. }
  778. TEST_P(Test_Int8_nets, MobileNet_v2)
  779. {
  780. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  781. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  782. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  783. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  784. testONNXNet("mobilenetv2", default_l1, default_lInf, true);
  785. }
  786. TEST_P(Test_Int8_nets, Shufflenet)
  787. {
  788. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  789. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  790. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  791. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  792. testONNXNet("shufflenet", default_l1, default_lInf);
  793. }
  794. TEST_P(Test_Int8_nets, MobileNet_SSD)
  795. {
  796. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  797. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  798. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  799. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  800. Net net = readNetFromCaffe(findDataFile("dnn/MobileNetSSD_deploy_19e3ec3.prototxt", false),
  801. findDataFile("dnn/MobileNetSSD_deploy_19e3ec3.caffemodel", false));
  802. Mat inp = imread(_tf("street.png"));
  803. Mat blob = blobFromImage(inp, 1.0 / 127.5, Size(300, 300), Scalar(127.5, 127.5, 127.5), false);
  804. Mat ref = blobFromNPY(_tf("mobilenet_ssd_caffe_out.npy"));
  805. float confThreshold = FLT_MIN, scoreDiff = 0.084, iouDiff = 0.43;
  806. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  807. }
  808. TEST_P(Test_Int8_nets, MobileNet_v1_SSD)
  809. {
  810. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  811. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  812. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  813. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  814. Net net = readNetFromTensorflow(findDataFile("dnn/ssd_mobilenet_v1_coco_2017_11_17.pb", false),
  815. findDataFile("dnn/ssd_mobilenet_v1_coco_2017_11_17.pbtxt"));
  816. Mat inp = imread(_tf("dog416.png"));
  817. Mat blob = blobFromImage(inp, 1.0, Size(300, 300), Scalar(), true, false);
  818. Mat ref = blobFromNPY(_tf("tensorflow/ssd_mobilenet_v1_coco_2017_11_17.detection_out.npy"));
  819. float confThreshold = 0.5, scoreDiff = 0.034, iouDiff = 0.13;
  820. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  821. }
  822. TEST_P(Test_Int8_nets, MobileNet_v1_SSD_PPN)
  823. {
  824. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  825. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  826. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  827. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  828. Net net = readNetFromTensorflow(findDataFile("dnn/ssd_mobilenet_v1_ppn_coco.pb", false),
  829. findDataFile("dnn/ssd_mobilenet_v1_ppn_coco.pbtxt"));
  830. Mat inp = imread(_tf("dog416.png"));
  831. Mat blob = blobFromImage(inp, 1.0, Size(300, 300), Scalar(), true, false);
  832. Mat ref = blobFromNPY(_tf("tensorflow/ssd_mobilenet_v1_ppn_coco.detection_out.npy"));
  833. float confThreshold = 0.51, scoreDiff = 0.05, iouDiff = 0.06;
  834. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  835. }
  836. TEST_P(Test_Int8_nets, Inception_v2_SSD)
  837. {
  838. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  839. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  840. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  841. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  842. applyTestTag(target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_1GB);
  843. Net net = readNetFromTensorflow(findDataFile("dnn/ssd_inception_v2_coco_2017_11_17.pb", false),
  844. findDataFile("dnn/ssd_inception_v2_coco_2017_11_17.pbtxt"));
  845. Mat inp = imread(_tf("street.png"));
  846. Mat blob = blobFromImage(inp, 1.0, Size(300, 300), Scalar(), true, false);
  847. Mat ref = (Mat_<float>(5, 7) << 0, 1, 0.90176028, 0.19872092, 0.36311883, 0.26461923, 0.63498729,
  848. 0, 3, 0.93569964, 0.64865261, 0.45906419, 0.80675775, 0.65708131,
  849. 0, 3, 0.75838411, 0.44668293, 0.45907149, 0.49459291, 0.52197015,
  850. 0, 10, 0.95932811, 0.38349164, 0.32528657, 0.40387636, 0.39165527,
  851. 0, 10, 0.93973452, 0.66561931, 0.37841269, 0.68074018, 0.42907384);
  852. float confThreshold = 0.5, scoreDiff = 0.0114, iouDiff = 0.22;
  853. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  854. }
  855. TEST_P(Test_Int8_nets, opencv_face_detector)
  856. {
  857. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  858. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  859. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  860. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  861. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  862. applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_NGRAPH);
  863. Net net = readNetFromCaffe(findDataFile("dnn/opencv_face_detector.prototxt"),
  864. findDataFile("dnn/opencv_face_detector.caffemodel", false));
  865. Mat inp = imread(findDataFile("gpu/lbpcascade/er.png"));
  866. Mat blob = blobFromImage(inp, 1.0, Size(), Scalar(104.0, 177.0, 123.0), false, false);
  867. Mat ref = (Mat_<float>(6, 7) << 0, 1, 0.99520785, 0.80997437, 0.16379407, 0.87996572, 0.26685631,
  868. 0, 1, 0.9934696, 0.2831718, 0.50738752, 0.345781, 0.5985168,
  869. 0, 1, 0.99096733, 0.13629119, 0.24892329, 0.19756334, 0.3310290,
  870. 0, 1, 0.98977017, 0.23901358, 0.09084064, 0.29902688, 0.1769477,
  871. 0, 1, 0.97203469, 0.67965847, 0.06876482, 0.73999709, 0.1513494,
  872. 0, 1, 0.95097077, 0.51901293, 0.45863652, 0.5777427, 0.5347801);
  873. float confThreshold = 0.5, scoreDiff = 0.002, iouDiff = 0.4;
  874. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  875. }
  876. TEST_P(Test_Int8_nets, EfficientDet)
  877. {
  878. if (cvtest::skipUnstableTests)
  879. throw SkipTestException("Skip unstable test"); // detail: https://github.com/opencv/opencv/pull/23167
  880. applyTestTag(CV_TEST_TAG_DEBUG_VERYLONG);
  881. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  882. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  883. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  884. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  885. if (backend == DNN_BACKEND_TIMVX)
  886. applyTestTag(CV_TEST_TAG_DNN_SKIP_TIMVX);
  887. if (target != DNN_TARGET_CPU)
  888. {
  889. if (target == DNN_TARGET_OPENCL_FP16) applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  890. if (target == DNN_TARGET_OPENCL) applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  891. if (target == DNN_TARGET_MYRIAD) applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_MYRIAD);
  892. }
  893. Net net = readNetFromTensorflow(findDataFile("dnn/efficientdet-d0.pb", false),
  894. findDataFile("dnn/efficientdet-d0.pbtxt"));
  895. Mat inp = imread(_tf("dog416.png"));
  896. Mat blob = blobFromImage(inp, 1.0/255, Size(512, 512), Scalar(123.675, 116.28, 103.53));
  897. Mat ref = (Mat_<float>(3, 7) << 0, 1, 0.8437444, 0.153996080160141, 0.20534580945968628, 0.7463544607162476, 0.7414066195487976,
  898. 0, 17, 0.8245924, 0.16657517850399017, 0.3996818959712982, 0.4111558794975281, 0.9306337833404541,
  899. 0, 7, 0.8039304, 0.6118435263633728, 0.13175517320632935, 0.9065558314323425, 0.2943994700908661);
  900. float confThreshold = 0.65, scoreDiff = 0.3, iouDiff = 0.18;
  901. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  902. {
  903. SCOPED_TRACE("Per-tensor quantize");
  904. testDetectionNet(net, blob, ref, 0.85, scoreDiff, iouDiff, false);
  905. }
  906. }
  907. TEST_P(Test_Int8_nets, FasterRCNN_resnet50)
  908. {
  909. applyTestTag(
  910. (target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_1GB : CV_TEST_TAG_MEMORY_2GB),
  911. CV_TEST_TAG_LONG,
  912. CV_TEST_TAG_DEBUG_VERYLONG
  913. );
  914. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  915. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  916. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  917. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  918. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  919. applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_NGRAPH);
  920. if (backend == DNN_BACKEND_OPENCV && target == DNN_TARGET_OPENCL_FP16)
  921. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  922. Net net = readNetFromTensorflow(findDataFile("dnn/faster_rcnn_resnet50_coco_2018_01_28.pb", false),
  923. findDataFile("dnn/faster_rcnn_resnet50_coco_2018_01_28.pbtxt"));
  924. Mat inp = imread(_tf("dog416.png"));
  925. Mat blob = blobFromImage(inp, 1.0, Size(800, 600), Scalar(), true, false);
  926. Mat ref = blobFromNPY(_tf("tensorflow/faster_rcnn_resnet50_coco_2018_01_28.detection_out.npy"));
  927. float confThreshold = 0.8, scoreDiff = 0.05, iouDiff = 0.15;
  928. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  929. }
  930. TEST_P(Test_Int8_nets, FasterRCNN_inceptionv2)
  931. {
  932. applyTestTag(
  933. (target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_1GB : CV_TEST_TAG_MEMORY_2GB),
  934. CV_TEST_TAG_LONG,
  935. CV_TEST_TAG_DEBUG_VERYLONG
  936. );
  937. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  938. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  939. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  940. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  941. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  942. applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_NGRAPH);
  943. if (backend == DNN_BACKEND_OPENCV && target == DNN_TARGET_OPENCL_FP16)
  944. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  945. Net net = readNetFromTensorflow(findDataFile("dnn/faster_rcnn_inception_v2_coco_2018_01_28.pb", false),
  946. findDataFile("dnn/faster_rcnn_inception_v2_coco_2018_01_28.pbtxt"));
  947. Mat inp = imread(_tf("dog416.png"));
  948. Mat blob = blobFromImage(inp, 1.0, Size(800, 600), Scalar(), true, false);
  949. Mat ref = blobFromNPY(_tf("tensorflow/faster_rcnn_inception_v2_coco_2018_01_28.detection_out.npy"));
  950. float confThreshold = 0.5, scoreDiff = 0.21, iouDiff = 0.1;
  951. testDetectionNet(net, blob, ref, confThreshold, scoreDiff, iouDiff);
  952. }
  953. TEST_P(Test_Int8_nets, FasterRCNN_vgg16)
  954. {
  955. applyTestTag(
  956. #if defined(OPENCV_32BIT_CONFIGURATION) && defined(HAVE_OPENCL)
  957. CV_TEST_TAG_MEMORY_2GB,
  958. #else
  959. CV_TEST_TAG_MEMORY_2GB,
  960. #endif
  961. CV_TEST_TAG_LONG,
  962. CV_TEST_TAG_DEBUG_VERYLONG
  963. );
  964. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  965. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  966. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  967. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  968. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  969. applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_NGRAPH);
  970. Net net = readNetFromCaffe(findDataFile("dnn/faster_rcnn_vgg16.prototxt"),
  971. findDataFile("dnn/VGG16_faster_rcnn_final.caffemodel", false));
  972. Mat ref = (Mat_<float>(3, 7) << 0, 2, 0.949398, 99.2454, 210.141, 601.205, 462.849,
  973. 0, 7, 0.997022, 481.841, 92.3218, 722.685, 175.953,
  974. 0, 12, 0.993028, 133.221, 189.377, 350.994, 563.166);
  975. float confThreshold = 0.8, scoreDiff = 0.048, iouDiff = 0.35;
  976. testFaster(net, ref, confThreshold, scoreDiff, iouDiff);
  977. }
  978. TEST_P(Test_Int8_nets, FasterRCNN_zf)
  979. {
  980. applyTestTag(
  981. #if defined(OPENCV_32BIT_CONFIGURATION) && defined(HAVE_OPENCL)
  982. CV_TEST_TAG_MEMORY_2GB,
  983. #else
  984. (target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_1GB),
  985. #endif
  986. CV_TEST_TAG_DEBUG_VERYLONG
  987. );
  988. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  989. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  990. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  991. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  992. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  993. applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_NGRAPH);
  994. Net net = readNetFromCaffe(findDataFile("dnn/faster_rcnn_zf.prototxt"),
  995. findDataFile("dnn/ZF_faster_rcnn_final.caffemodel", false));
  996. Mat ref = (Mat_<float>(3, 7) << 0, 2, 0.90121, 120.407, 115.83, 570.586, 528.395,
  997. 0, 7, 0.988779, 469.849, 75.1756, 718.64, 186.762,
  998. 0, 12, 0.967198, 138.588, 206.843, 329.766, 553.176);
  999. float confThreshold = 0.8, scoreDiff = 0.021, iouDiff = 0.1;
  1000. testFaster(net, ref, confThreshold, scoreDiff, iouDiff);
  1001. }
  1002. TEST_P(Test_Int8_nets, RFCN)
  1003. {
  1004. applyTestTag(
  1005. (target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_2GB),
  1006. CV_TEST_TAG_LONG,
  1007. CV_TEST_TAG_DEBUG_VERYLONG
  1008. );
  1009. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  1010. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  1011. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  1012. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  1013. Net net = readNetFromCaffe(findDataFile("dnn/rfcn_pascal_voc_resnet50.prototxt"),
  1014. findDataFile("dnn/resnet50_rfcn_final.caffemodel", false));
  1015. Mat ref = (Mat_<float>(2, 7) << 0, 7, 0.991359, 491.822, 81.1668, 702.573, 178.234,
  1016. 0, 12, 0.94786, 132.093, 223.903, 338.077, 566.16);
  1017. float confThreshold = 0.8, scoreDiff = 0.15, iouDiff = 0.11;
  1018. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH) {
  1019. iouDiff = 0.12;
  1020. }
  1021. testFaster(net, ref, confThreshold, scoreDiff, iouDiff);
  1022. }
  1023. TEST_P(Test_Int8_nets, YoloVoc)
  1024. {
  1025. applyTestTag(
  1026. #if defined(OPENCV_32BIT_CONFIGURATION) && defined(HAVE_OPENCL)
  1027. CV_TEST_TAG_MEMORY_2GB,
  1028. #else
  1029. CV_TEST_TAG_MEMORY_1GB,
  1030. #endif
  1031. CV_TEST_TAG_LONG,
  1032. CV_TEST_TAG_DEBUG_VERYLONG
  1033. );
  1034. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  1035. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  1036. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  1037. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  1038. Mat ref = (Mat_<float>(6, 7) << 0, 6, 0.750469f, 0.577374f, 0.127391f, 0.902949f, 0.300809f,
  1039. 0, 1, 0.780879f, 0.270762f, 0.264102f, 0.732475f, 0.745412f,
  1040. 0, 11, 0.901615f, 0.1386f, 0.338509f, 0.421337f, 0.938789f,
  1041. 1, 14, 0.623813f, 0.183179f, 0.381921f, 0.247726f, 0.625847f,
  1042. 1, 6, 0.667770f, 0.446555f, 0.453578f, 0.499986f, 0.519167f,
  1043. 1, 6, 0.844947f, 0.637058f, 0.460398f, 0.828508f, 0.66427f);
  1044. std::string config_file = "yolo-voc.cfg";
  1045. std::string weights_file = "yolo-voc.weights";
  1046. double scoreDiff = 0.12, iouDiff = 0.3;
  1047. {
  1048. SCOPED_TRACE("batch size 1");
  1049. testDarknetModel(config_file, weights_file, ref.rowRange(0, 3), scoreDiff, iouDiff);
  1050. }
  1051. {
  1052. SCOPED_TRACE("batch size 2");
  1053. testDarknetModel(config_file, weights_file, ref, scoreDiff, iouDiff);
  1054. }
  1055. }
  1056. TEST_P(Test_Int8_nets, TinyYoloVoc)
  1057. {
  1058. applyTestTag(
  1059. CV_TEST_TAG_MEMORY_512MB,
  1060. CV_TEST_TAG_DEBUG_VERYLONG
  1061. );
  1062. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  1063. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  1064. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  1065. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  1066. Mat ref = (Mat_<float>(4, 7) << 0, 6, 0.761967f, 0.579042f, 0.159161f, 0.894482f, 0.31994f,
  1067. 0, 11, 0.780595f, 0.129696f, 0.386467f, 0.445275f, 0.920994f,
  1068. 1, 6, 0.651450f, 0.460526f, 0.458019f, 0.522527f, 0.5341f,
  1069. 1, 6, 0.928758f, 0.651024f, 0.463539f, 0.823784f, 0.654998f);
  1070. std::string config_file = "tiny-yolo-voc.cfg";
  1071. std::string weights_file = "tiny-yolo-voc.weights";
  1072. double scoreDiff = 0.043, iouDiff = 0.12;
  1073. {
  1074. SCOPED_TRACE("batch size 1");
  1075. testDarknetModel(config_file, weights_file, ref.rowRange(0, 2), scoreDiff, iouDiff);
  1076. {
  1077. SCOPED_TRACE("Per-tensor quantize");
  1078. testDarknetModel(config_file, weights_file, ref.rowRange(0, 2), 0.1, 0.2, 0.24, 0.6, false);
  1079. }
  1080. }
  1081. {
  1082. SCOPED_TRACE("batch size 2");
  1083. testDarknetModel(config_file, weights_file, ref, scoreDiff, iouDiff);
  1084. {
  1085. SCOPED_TRACE("Per-tensor quantize");
  1086. testDarknetModel(config_file, weights_file, ref, 0.1, 0.2, 0.24, 0.6, false);
  1087. }
  1088. }
  1089. }
  1090. TEST_P(Test_Int8_nets, YOLOv3)
  1091. {
  1092. applyTestTag(
  1093. CV_TEST_TAG_LONG,
  1094. (target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_1GB : CV_TEST_TAG_MEMORY_2GB),
  1095. CV_TEST_TAG_DEBUG_VERYLONG
  1096. );
  1097. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  1098. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  1099. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  1100. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  1101. const int N0 = 3;
  1102. const int N1 = 6;
  1103. static const float ref_[/* (N0 + N1) * 7 */] = {
  1104. 0, 16, 0.998836f, 0.160024f, 0.389964f, 0.417885f, 0.943716f,
  1105. 0, 1, 0.987908f, 0.150913f, 0.221933f, 0.742255f, 0.746261f,
  1106. 0, 7, 0.952983f, 0.614621f, 0.150257f, 0.901368f, 0.289251f,
  1107. 1, 2, 0.997412f, 0.647584f, 0.459939f, 0.821037f, 0.663947f,
  1108. 1, 2, 0.989633f, 0.450719f, 0.463353f, 0.496306f, 0.522258f,
  1109. 1, 0, 0.980053f, 0.195856f, 0.378454f, 0.258626f, 0.629257f,
  1110. 1, 9, 0.785341f, 0.665503f, 0.373543f, 0.688893f, 0.439244f,
  1111. 1, 9, 0.733275f, 0.376029f, 0.315694f, 0.401776f, 0.395165f,
  1112. 1, 9, 0.384815f, 0.659824f, 0.372389f, 0.673927f, 0.429412f,
  1113. };
  1114. Mat ref(N0 + N1, 7, CV_32FC1, (void*)ref_);
  1115. std::string config_file = "yolov3.cfg";
  1116. std::string weights_file = "yolov3.weights";
  1117. double scoreDiff = 0.08, iouDiff = 0.21, confThreshold = 0.25;
  1118. {
  1119. SCOPED_TRACE("batch size 1");
  1120. testDarknetModel(config_file, weights_file, ref.rowRange(0, N0), scoreDiff, iouDiff, confThreshold);
  1121. }
  1122. {
  1123. SCOPED_TRACE("batch size 2");
  1124. testDarknetModel(config_file, weights_file, ref, scoreDiff, iouDiff, confThreshold);
  1125. }
  1126. }
  1127. TEST_P(Test_Int8_nets, YOLOv4)
  1128. {
  1129. applyTestTag(
  1130. CV_TEST_TAG_LONG,
  1131. (target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_1GB : CV_TEST_TAG_MEMORY_2GB),
  1132. CV_TEST_TAG_DEBUG_VERYLONG
  1133. );
  1134. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  1135. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  1136. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  1137. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  1138. const int N0 = 3;
  1139. const int N1 = 7;
  1140. static const float ref_[/* (N0 + N1) * 7 */] = {
  1141. 0, 16, 0.992194f, 0.172375f, 0.402458f, 0.403918f, 0.932801f,
  1142. 0, 1, 0.988326f, 0.166708f, 0.228236f, 0.737208f, 0.735803f,
  1143. 0, 7, 0.94639f, 0.602523f, 0.130399f, 0.901623f, 0.298452f,
  1144. 1, 2, 0.99761f, 0.646556f, 0.45985f, 0.816041f, 0.659067f,
  1145. 1, 0, 0.988913f, 0.201726f, 0.360282f, 0.266181f, 0.631728f,
  1146. 1, 2, 0.98233f, 0.452007f, 0.462217f, 0.495612f, 0.521687f,
  1147. 1, 9, 0.919195f, 0.374642f, 0.316524f, 0.398126f, 0.393714f,
  1148. 1, 9, 0.856303f, 0.666842f, 0.372215f, 0.685539f, 0.44141f,
  1149. 1, 9, 0.313516f, 0.656791f, 0.374734f, 0.671959f, 0.438371f,
  1150. 1, 9, 0.256625f, 0.940232f, 0.326931f, 0.967586f, 0.374002f,
  1151. };
  1152. Mat ref(N0 + N1, 7, CV_32FC1, (void*)ref_);
  1153. std::string config_file = "yolov4.cfg";
  1154. std::string weights_file = "yolov4.weights";
  1155. double scoreDiff = 0.15, iouDiff = 0.2;
  1156. {
  1157. SCOPED_TRACE("batch size 1");
  1158. testDarknetModel(config_file, weights_file, ref.rowRange(0, N0), scoreDiff, iouDiff);
  1159. }
  1160. {
  1161. SCOPED_TRACE("batch size 2");
  1162. testDarknetModel(config_file, weights_file, ref, scoreDiff, iouDiff);
  1163. }
  1164. }
  1165. TEST_P(Test_Int8_nets, YOLOv4_tiny)
  1166. {
  1167. applyTestTag(
  1168. target == DNN_TARGET_CPU ? CV_TEST_TAG_MEMORY_512MB : CV_TEST_TAG_MEMORY_1GB
  1169. );
  1170. if (target == DNN_TARGET_OPENCL_FP16 && !ocl::Device::getDefault().isIntel())
  1171. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL_FP16);
  1172. if (target == DNN_TARGET_OPENCL && !ocl::Device::getDefault().isIntel())
  1173. applyTestTag(CV_TEST_TAG_DNN_SKIP_OPENCL);
  1174. if (backend == DNN_BACKEND_INFERENCE_ENGINE_NGRAPH)
  1175. applyTestTag(CV_TEST_TAG_DNN_SKIP_IE_NGRAPH);
  1176. const float confThreshold = 0.6;
  1177. const int N0 = 2;
  1178. const int N1 = 3;
  1179. static const float ref_[/* (N0 + N1) * 7 */] = {
  1180. 0, 16, 0.912199f, 0.169926f, 0.350896f, 0.422704f, 0.941837f,
  1181. 0, 7, 0.845388f, 0.617568f, 0.13961f, 0.9008f, 0.29315f,
  1182. 1, 2, 0.997789f, 0.657455f, 0.459714f, 0.809122f, 0.656829f,
  1183. 1, 2, 0.924423f, 0.442872f, 0.470127f, 0.49816f, 0.516516f,
  1184. 1, 0, 0.728307f, 0.202607f, 0.369828f, 0.259445f, 0.613846f,
  1185. };
  1186. Mat ref(N0 + N1, 7, CV_32FC1, (void*)ref_);
  1187. std::string config_file = "yolov4-tiny-2020-12.cfg";
  1188. std::string weights_file = "yolov4-tiny-2020-12.weights";
  1189. double scoreDiff = 0.12;
  1190. double iouDiff = target == DNN_TARGET_OPENCL_FP16 ? 0.2 : 0.118;
  1191. {
  1192. SCOPED_TRACE("batch size 1");
  1193. testDarknetModel(config_file, weights_file, ref.rowRange(0, N0), scoreDiff, iouDiff, confThreshold);
  1194. {
  1195. SCOPED_TRACE("Per-tensor quantize");
  1196. testDarknetModel(config_file, weights_file, ref.rowRange(0, N0), scoreDiff, 0.224, 0.7, 0.4, false);
  1197. }
  1198. }
  1199. throw SkipTestException("batch2: bad accuracy on second image");
  1200. /* bad accuracy on second image
  1201. {
  1202. SCOPED_TRACE("batch size 2");
  1203. testDarknetModel(config_file, weights_file, ref, scoreDiff, iouDiff, confThreshold);
  1204. }
  1205. */
  1206. }
  1207. INSTANTIATE_TEST_CASE_P(/**/, Test_Int8_nets, dnnBackendsAndTargetsInt8());
  1208. }} // namespace