[GPU] Remove property

vladimir-paramuzov · Sep 19, 2024 · 89ff672 · 89ff672
1 parent dd4d729
commit 89ff672
Show file tree

Hide file tree

Showing 8 changed files with 5 additions and 39 deletions.
diff --git a/src/inference/include/openvino/runtime/intel_gpu/properties.hpp b/src/inference/include/openvino/runtime/intel_gpu/properties.hpp
@@ -132,15 +132,6 @@ static constexpr Property<bool> enable_sdpa_optimization{"GPU_ENABLE_SDPA_OPTIMI
  * @ingroup ov_runtime_ocl_gpu_prop_cpp_api
  */
 static constexpr Property<bool> enable_kernels_reuse{"GPU_ENABLE_KERNELS_REUSE"};
-
-/**
- * @brief Turning on this key switches addressing mode to allow allocations larger than 4GB
- * as described here
- * https://github.com/intel/compute-runtime/blob/master/programmers-guide/ALLOCATIONS_GREATER_THAN_4GB.md#creating-allocations-greater-than-4GB
- * Note: On some platform performance of primitives with i64 data type may be lower with this option enabled.
- * @ingroup ov_runtime_ocl_gpu_prop_cpp_api
- */
-static constexpr Property<bool> enable_large_allocations{"GPU_ENABLE_LARGE_ALLOCATIONS"};
 }  // namespace hint
 
 /**

diff --git a/src/plugins/intel_gpu/src/graph/impls/ocl/kernel_selector_helper.cpp b/src/plugins/intel_gpu/src/graph/impls/ocl/kernel_selector_helper.cpp
@@ -1132,7 +1132,6 @@ void set_params(const kernel_impl_params& param_info, kernel_selector::params& p
     params.engineInfo.supports_imad = device_info.supports_imad;
     params.engineInfo.supports_immad = device_info.supports_immad;
     params.engineInfo.enable_sub_groups_emulation = true;
-    params.engineInfo.enable_large_allocations = config.get_property(ov::intel_gpu::hint::enable_large_allocations);
     params.engineInfo.bOptHintsSupport = false;
 
     params.engineInfo.bLocalBlockIOSupport = query_local_block_io_supported(engine, config);

diff --git a/src/plugins/intel_gpu/src/kernel_selector/kernel_base_opencl.cpp b/src/plugins/intel_gpu/src/kernel_selector/kernel_base_opencl.cpp
@@ -173,8 +173,7 @@ std::shared_ptr<KernelString> KernelBaseOpenCL::GetKernelString(const std::strin
         kernel_string->undefs = jit.second;
         if (engine_info.vendor_id == cldnn::INTEL_VENDOR_ID) {
             kernel_string->options = exe_mode + " -cl-mad-enable";
-            if (engine_info.enable_large_allocations)
-                kernel_string->options += " -cl-intel-greater-than-4GB-buffer-required";
+            kernel_string->options += " -cl-intel-greater-than-4GB-buffer-required";
             if (engine_info.bOptHintsSupport)
                 kernel_string->options += " -DOPT_HINTS_SUPPORTED=1";
             if (engine_info.bLocalBlockIOSupport)

diff --git a/src/plugins/intel_gpu/src/kernel_selector/kernel_selector_params.h b/src/plugins/intel_gpu/src/kernel_selector/kernel_selector_params.h
@@ -390,7 +390,6 @@ struct EngineInfo {
     bool supports_imad = false;
     bool supports_immad = false;
     bool enable_sub_groups_emulation = false;
-    bool enable_large_allocations = false;
     bool bOptHintsSupport = false;
     bool bLocalBlockIOSupport = false;
     bool supports_microkernels = false;

diff --git a/src/plugins/intel_gpu/src/plugin/program_builder.cpp b/src/plugins/intel_gpu/src/plugin/program_builder.cpp
@@ -2,7 +2,6 @@
 // SPDX-License-Identifier: Apache-2.0
 //
 
-#include "openvino/core/shape.hpp"
 #include "openvino/op/constant.hpp"
 #include "openvino/op/split.hpp"
 #include "openvino/op/variadic_split.hpp"
@@ -17,7 +16,6 @@
 #include "intel_gpu/primitives/data.hpp"
 #include "intel_gpu/op/fully_connected_compressed.hpp"
 #include "intel_gpu/op/placeholder.hpp"
-#include "openvino/runtime/intel_gpu/properties.hpp"
 #include "openvino/util/pp.hpp"
 
 #ifdef __linux__
@@ -28,18 +26,6 @@
 #include <malloc.h>
 #endif
 
-namespace {
-bool requires_large_allocations(const std::shared_ptr<ov::Node>& op, size_t max_alloc_size) {
-    for (size_t i = 0; i < op->get_output_size(); i++) {
-        const auto& out_pshape = op->get_output_partial_shape(i);
-        if (out_pshape.is_static() && ov::shape_size(out_pshape.to_shape()) * op->get_output_element_type(i).size() >= max_alloc_size) {
-            return true;
-        }
-    }
-
-    return false;
-}
-}  // namespace
 
 namespace ov {
 namespace intel_gpu {
@@ -168,22 +154,13 @@ std::shared_ptr<cldnn::program> ProgramBuilder::build(const std::vector<std::sha
         }
     }
 
-    bool enable_large_allocations = false;
-    for (const auto& op : ops) {
-        if (requires_large_allocations(op, m_engine.get_device_info().max_alloc_mem_size)) {
-            enable_large_allocations = true;
-            break;
-        }
-    }
-
     if (is_inner_program) {
         allow_new_shape_infer = (m_config.get_property(ov::intel_gpu::allow_new_shape_infer) || allow_new_shape_infer);
     }
 
     m_config.set_property(ov::intel_gpu::partial_build_program(partial_build));
     m_config.set_property(ov::intel_gpu::optimize_data(true));
     m_config.set_property(ov::intel_gpu::allow_new_shape_infer(allow_new_shape_infer));
-    m_config.set_property(ov::intel_gpu::hint::enable_large_allocations(enable_large_allocations));
 
     prepare_build();
     {

diff --git a/src/plugins/intel_gpu/src/runtime/execution_config.cpp b/src/plugins/intel_gpu/src/runtime/execution_config.cpp
@@ -4,7 +4,6 @@
 
 #include "intel_gpu/runtime/execution_config.hpp"
 #include "intel_gpu/runtime/debug_configuration.hpp"
-#include "openvino/runtime/intel_gpu/properties.hpp"
 #include "openvino/runtime/internal_properties.hpp"
 
 #include <thread>
@@ -53,7 +52,6 @@ void ExecutionConfig::set_default() {
         std::make_tuple(ov::intel_gpu::hint::queue_throttle, ov::intel_gpu::hint::ThrottleLevel::MEDIUM),
         std::make_tuple(ov::intel_gpu::hint::queue_priority, ov::hint::Priority::MEDIUM),
         std::make_tuple(ov::intel_gpu::hint::enable_sdpa_optimization, true),
-        std::make_tuple(ov::intel_gpu::hint::enable_large_allocations, false),
         std::make_tuple(ov::intel_gpu::enable_loop_unrolling, true),
         std::make_tuple(ov::intel_gpu::disable_winograd_convolution, false),
         std::make_tuple(ov::internal::exclusive_async_requests, false),

diff --git a/src/plugins/intel_gpu/src/runtime/ocl/ocl_memory.cpp b/src/plugins/intel_gpu/src/runtime/ocl/ocl_memory.cpp
@@ -461,6 +461,8 @@ gpu_usm::gpu_usm(ocl_engine* engine, const layout& layout, allocation_type type)
     std::vector<cl_mem_properties_intel> properties;
     if (engine->get_device_info().vendor_id == INTEL_VENDOR_ID) {
         properties = {CL_MEM_FLAGS, CL_MEM_ALLOW_UNRESTRICTED_SIZE_INTEL, 0};
+    } else {
+        properties = {0};
     }
 
     switch (get_allocation_type()) {

diff --git a/src/plugins/intel_gpu/tests/unit/test_cases/reduce_gpu_test.cpp b/src/plugins/intel_gpu/tests/unit/test_cases/reduce_gpu_test.cpp
@@ -2229,9 +2229,10 @@ TEST(reduce_f32_fw_gpu, large_buffer) {
 
     layout in_l = { sz_8gb, data_types::f32, format::bfyx };
 
+    auto config = get_test_default_config(*engine);
     topology topology(input_layout("input", in_l),
                       reduce("reduce", input_info("input"), reduce_mode::mean, {2}, true));
-    network network(*engine, topology, get_test_default_config(*engine));
+    network network(*engine, topology, config);
     auto input = network.get_output_memory("input");
     {
         mem_lock<float, mem_lock_type::write> l(input, get_test_stream());