fp16 ocl support for more layers

Signed-off-by: Li Peng <peng.li@intel.com>
2018-04-26 19:36:19 +08:00
parent 3dd916882a
commit ba5e8befa9
14 changed files with 121 additions and 50 deletions
@@ -96,9 +96,10 @@ public:
        std::vector<UMat> inputs;
        std::vector<UMat> outputs;

+        bool use_half = (inps.depth() == CV_16S);
        inps.getUMatVector(inputs);
        outs.getUMatVector(outputs);
-        String buildopt = String("-DDtype=") + ocl::typeToStr(inputs[0].type()) + String(" ");
+        String buildopt= format("-DDtype=%s ", use_half ? "half" : "float");

        for (size_t i = 0; i < inputs.size(); i++)
        {
@@ -134,7 +135,7 @@ public:
        CV_TRACE_FUNCTION();
        CV_TRACE_ARG_VALUE(name, "name", name.c_str());

-        CV_OCL_RUN((preferableTarget == DNN_TARGET_OPENCL) &&
+        CV_OCL_RUN(IS_DNN_OPENCL_TARGET(preferableTarget) &&
                   OCL_PERFORMANCE_CHECK(ocl::Device::getDefault().isIntel()),
                   forward_ocl(inputs_arr, outputs_arr, internals_arr))