Skip to content

Commit 7d56aeb

Browse files
authored
[NPU] Use the friendly name of the tensor instead of its legacy name (openvinotoolkit#23945)
### Details: - *Use the friendly name of the tensor instead of its legacy name* - *...* ### Tickets: - *ticket-id*
1 parent fe84092 commit 7d56aeb

10 files changed

+82
-63
lines changed

src/plugins/intel_npu/src/al/include/sync_infer_request.hpp

+1
Original file line numberDiff line numberDiff line change
@@ -201,6 +201,7 @@ class SyncInferRequest : public ov::IInferRequest {
201201
std::vector<std::string> _outputAndStateOutputNames;
202202

203203
std::unordered_map<std::string, std::string> _nodeNameToLegacyName;
204+
std::unordered_map<std::string, std::string> _legacyNameToNodeName;
204205
};
205206

206207
} // namespace intel_npu

src/plugins/intel_npu/src/al/src/sync_infer_request.cpp

+14-17
Original file line numberDiff line numberDiff line change
@@ -24,11 +24,9 @@ SyncInferRequest::SyncInferRequest(const std::shared_ptr<const ICompiledModel>&
2424

2525
// Map the node names to the legacy ones used by the I/O tensors in order to allow an easier access to the tensors'
2626
// contents
27-
for (const auto& [legacyName, parameterDescriptor] : _metadata.parameters) {
28-
_nodeNameToLegacyName[parameterDescriptor.currentNodeName] = legacyName;
29-
}
30-
for (const auto& [legacyName, resultDescriptor] : _metadata.results) {
31-
_nodeNameToLegacyName[resultDescriptor.currentNodeName] = legacyName;
27+
for (const auto& [name, resultDescriptor] : _metadata.results) {
28+
_nodeNameToLegacyName[name] = resultDescriptor.legacyName;
29+
_legacyNameToNodeName[resultDescriptor.legacyName] = name;
3230
}
3331

3432
_inputAndStateInputNames = _metadata.inputNames;
@@ -48,8 +46,12 @@ SyncInferRequest::SyncInferRequest(const std::shared_ptr<const ICompiledModel>&
4846
if (contains(_inputAndStateInputNames, shapeName)) {
4947
_inputAndStateInputNames.push_back(SHAPE_TENSOR_PREFIX + shapeName);
5048
}
51-
if (contains(_outputAndStateOutputNames, shapeName)) {
52-
_outputAndStateOutputNames.push_back(SHAPE_TENSOR_PREFIX + shapeName);
49+
50+
const auto& shapeNameMatch = _legacyNameToNodeName.find(shapeName);
51+
if (shapeNameMatch != _legacyNameToNodeName.end()) {
52+
if (contains(_outputAndStateOutputNames, shapeNameMatch->second)) {
53+
_outputAndStateOutputNames.push_back(SHAPE_TENSOR_PREFIX + shapeName);
54+
}
5355
}
5456
}
5557
}
@@ -83,10 +85,7 @@ std::vector<ov::SoPtr<ov::IVariableState>> SyncInferRequest::query_state() const
8385
}
8486

8587
ov::SoPtr<ov::ITensor> SyncInferRequest::get_tensor(const ov::Output<const ov::Node>& port) const {
86-
const auto& nodeNameMatch = _nodeNameToLegacyName.find(port.get_node()->get_friendly_name());
87-
OPENVINO_ASSERT(nodeNameMatch != _nodeNameToLegacyName.end(), "Cannot find tensor for port ", port);
88-
89-
return _allTensors.at(nodeNameMatch->second);
88+
return _allTensors.at(port.get_node()->get_friendly_name());
9089
}
9190

9291
void SyncInferRequest::set_tensor(const ov::Output<const ov::Node>& port, const ov::SoPtr<ov::ITensor>& tensor) {
@@ -97,8 +96,7 @@ void SyncInferRequest::set_tensor(const ov::Output<const ov::Node>& port, const
9796
OPENVINO_THROW("Failed to set tensor. ", ex.what());
9897
}
9998

100-
const std::string& legacyName = _nodeNameToLegacyName.at(port.get_node()->get_friendly_name());
101-
_allTensors[legacyName] = tensor._ptr;
99+
_allTensors[port.get_node()->get_friendly_name()] = tensor._ptr;
102100
}
103101

104102
std::vector<ov::SoPtr<ov::ITensor>> SyncInferRequest::get_tensors(const ov::Output<const ov::Node>& /*port*/) const {
@@ -151,14 +149,12 @@ void SyncInferRequest::check_tensor(const ov::Output<const ov::Node>& port,
151149
void SyncInferRequest::check_tensors() const {
152150
const auto& inputs = _compiledModel->inputs();
153151
for (size_t i = 0; i < inputs.size(); i++) {
154-
const std::string& legacyName = _nodeNameToLegacyName.at(inputs[i].get_node()->get_friendly_name());
155-
check_tensor(inputs[i], _allTensors.at(legacyName));
152+
check_tensor(inputs[i], _allTensors.at(inputs[i].get_node()->get_friendly_name()));
156153
}
157154

158155
const auto& outputs = _compiledModel->outputs();
159156
for (size_t i = 0; i < outputs.size(); i++) {
160-
const std::string& legacyName = _nodeNameToLegacyName.at(outputs[i].get_node()->get_friendly_name());
161-
check_tensor(outputs[i], _allTensors.at(legacyName));
157+
check_tensor(outputs[i], _allTensors.at(outputs[i].get_node()->get_friendly_name()));
162158
}
163159
}
164160

@@ -180,6 +176,7 @@ void SyncInferRequest::allocate_tensor(std::string tensorName,
180176
_shapesTensors[tensorName] = tensor;
181177
tensorName = SHAPE_TENSOR_PREFIX + tensorName;
182178
}
179+
183180
if (tensorType == TensorType::State) {
184181
_variableStates[tensorName] = std::make_shared<VariableState>(tensorName, tensor);
185182

src/plugins/intel_npu/src/backend/include/zero_executor.hpp

+2-1
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,7 @@ class ZeroExecutor final : public IExecutor {
2727
~ZeroExecutor() override;
2828

2929
struct ArgumentDescriptor {
30-
ze_graph_argument_properties_t info;
30+
ze_graph_argument_properties_3_t info;
3131
uint32_t idx;
3232
};
3333

@@ -67,6 +67,7 @@ class ZeroExecutor final : public IExecutor {
6767

6868
ze_graph_handle_t _graph = nullptr;
6969
ze_graph_properties_t _props{};
70+
7071
std::unordered_map<std::string, ArgumentDescriptor> _inputs_desc_map;
7172
std::unordered_map<std::string, ArgumentDescriptor> _outputs_desc_map;
7273

src/plugins/intel_npu/src/backend/include/zero_memory.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -96,7 +96,7 @@ class HostMemAllocator final {
9696
struct MemoryManagementUnit {
9797
MemoryManagementUnit() = default;
9898

99-
void appendArgument(const std::string& name, const ze_graph_argument_properties_t& argument);
99+
void appendArgument(const std::string& name, const std::size_t argSize);
100100
/* Allocate Device memories */
101101
void allocate(const ze_device_handle_t device_handle, const ze_context_handle_t context);
102102

src/plugins/intel_npu/src/backend/include/zero_utils.hpp

+1-1
Original file line numberDiff line numberDiff line change
@@ -164,7 +164,7 @@ static inline std::size_t layoutCount(const ze_graph_argument_layout_t val) {
164164
}
165165
}
166166

167-
static inline std::size_t getSizeIOBytes(const ze_graph_argument_properties_t& argument) {
167+
static inline std::size_t getSizeIOBytes(const ze_graph_argument_properties_3_t& argument) {
168168
std::size_t num_elements = 1;
169169
for (std::size_t i = 0; i < layoutCount(argument.deviceLayout); ++i) {
170170
num_elements *= argument.dims[i];

src/plugins/intel_npu/src/backend/src/zero_executor.cpp

+29-10
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,7 @@
1313

1414
#include "intel_npu/al/config/common.hpp"
1515
#include "intel_npu/al/itt.hpp"
16+
#include "intel_npu/al/prefix.hpp"
1617
#include "zero_device.hpp"
1718
#include "zero_utils.hpp"
1819

@@ -55,11 +56,9 @@ ZeroExecutor::ZeroExecutor(const std::shared_ptr<const ZeroInitStructsHolder>& i
5556
_config,
5657
_group_ordinal);
5758
Fence fence(graph_command_queue, _config);
58-
ze_device_properties_t properties = {};
59-
properties.stype = ZE_STRUCTURE_TYPE_DEVICE_PROPERTIES;
60-
zeroUtils::throwOnFail("zeDeviceGetProperties", zeDeviceGetProperties(_initStructs->getDevice(), &properties));
6159

6260
OV_ITT_TASK_CHAIN(ZERO_EXECUTOR_GRAPH, itt::domains::LevelZeroBackend, "Executor::ZeroExecutor", "graphCreate");
61+
6362
ze_graph_desc_t desc{ZE_STRUCTURE_TYPE_GRAPH_DESC_PROPERTIES,
6463
nullptr,
6564
ZE_GRAPH_FORMAT_NATIVE,
@@ -73,17 +72,37 @@ ZeroExecutor::ZeroExecutor(const std::shared_ptr<const ZeroInitStructsHolder>& i
7372
OV_ITT_TASK_NEXT(ZERO_EXECUTOR_GRAPH, "pfnGetProperties");
7473
zeroUtils::throwOnFail("pfnGetProperties", _graph_ddi_table_ext->pfnGetProperties(_graph, &_props));
7574

76-
OV_ITT_TASK_NEXT(ZERO_EXECUTOR_GRAPH, "pfnGetArgumentProperties");
75+
auto targetDriverExtVersion = _initStructs->getDriverExtVersion();
76+
if (targetDriverExtVersion <= ZE_GRAPH_EXT_VERSION_1_1) {
77+
OPENVINO_THROW("Incompatibility between the NPU plugin and driver! The driver version is too old, please "
78+
"update the driver version");
79+
}
80+
81+
OV_ITT_TASK_NEXT(ZERO_EXECUTOR_GRAPH, "pfnGetArgumentProperties3");
7782
for (uint32_t index = 0; index < _props.numGraphArgs; ++index) {
78-
ze_graph_argument_properties_t arg;
79-
zeroUtils::throwOnFail("pfnGetArgumentProperties",
80-
_graph_ddi_table_ext->pfnGetArgumentProperties(_graph, index, &arg));
81-
if (ZE_GRAPH_ARGUMENT_TYPE_INPUT == arg.type) {
82-
_inputs_desc_map.emplace(std::make_pair(std::string(arg.name), ArgumentDescriptor{arg, index}));
83+
ze_graph_argument_properties_3_t arg3;
84+
zeroUtils::throwOnFail("pfnGetArgumentProperties3",
85+
_graph_ddi_table_ext->pfnGetArgumentProperties3(_graph, index, &arg3));
86+
87+
if (ZE_GRAPH_ARGUMENT_TYPE_INPUT == arg3.type) {
88+
if (isStateInputName(arg3.name) || isShapeTensorName(arg3.name)) {
89+
_inputs_desc_map.emplace(std::make_pair(std::string(arg3.name), ArgumentDescriptor{arg3, index}));
90+
91+
} else {
92+
_inputs_desc_map.emplace(
93+
std::make_pair(std::string(arg3.debug_friendly_name), ArgumentDescriptor{arg3, index}));
94+
}
8395
} else {
84-
_outputs_desc_map.emplace(std::make_pair(std::string(arg.name), ArgumentDescriptor{arg, index}));
96+
if (isStateOutputName(arg3.name) || isShapeTensorName(arg3.name)) {
97+
_outputs_desc_map.emplace(std::make_pair(std::string(arg3.name), ArgumentDescriptor{arg3, index}));
98+
99+
} else {
100+
_outputs_desc_map.emplace(
101+
std::make_pair(std::string(arg3.debug_friendly_name), ArgumentDescriptor{arg3, index}));
102+
}
85103
}
86104
}
105+
87106
OV_ITT_TASK_NEXT(ZERO_EXECUTOR_GRAPH, "appendGraphInitialize");
88107
graph_command_list.appendGraphInitialize(_graph);
89108
graph_command_list.close();

src/plugins/intel_npu/src/backend/src/zero_infer_request.cpp

+29-27
Original file line numberDiff line numberDiff line change
@@ -91,6 +91,8 @@ ZeroInferRequest::ZeroInferRequest(const std::shared_ptr<ZeroInitStructsHolder>&
9191
return std::find(container.begin(), container.end(), value) != container.end();
9292
};
9393

94+
auto allocator = zeroMemory::HostMemAllocator(backendPtr);
95+
9496
for (const std::string& inputName : _metadata.inputNames) {
9597
if (!executorInputDescriptors.count(inputName)) {
9698
OPENVINO_THROW("Invalid graph input descriptor key: " + inputName);
@@ -99,15 +101,15 @@ ZeroInferRequest::ZeroInferRequest(const std::shared_ptr<ZeroInitStructsHolder>&
99101
const IONodeDescriptor& parameterDescriptor = _metadata.parameters.at(inputName);
100102
check_level_zero_attributes_match(parameterDescriptor, executorInputDescriptors.at(inputName), inputName);
101103

102-
ov::Allocator allocator;
104+
ov::Allocator inputAllocator;
103105
if (properties.flags & ZE_DEVICE_PROPERTY_FLAG_INTEGRATED) {
104-
allocator = zeroMemory::HostMemAllocator(backendPtr, ZE_HOST_MEM_ALLOC_FLAG_BIAS_WRITE_COMBINED);
106+
inputAllocator = zeroMemory::HostMemAllocator(backendPtr, ZE_HOST_MEM_ALLOC_FLAG_BIAS_WRITE_COMBINED);
105107
} else {
106-
allocator = zeroMemory::HostMemAllocator(backendPtr);
107-
}
108+
inputAllocator = zeroMemory::HostMemAllocator(backendPtr);
109+
};
108110

109111
// The I/O buffers already allocated using the Level Zero API are being reused here
110-
allocate_tensor(inputName, parameterDescriptor, TensorType::InputOrOutput, allocator);
112+
allocate_tensor(inputName, parameterDescriptor, TensorType::InputOrOutput, inputAllocator);
111113

112114
if (contains(_metadata.shapeNames, inputName)) {
113115
const std::string shapeBufferName = SHAPE_TENSOR_PREFIX + inputName;
@@ -117,8 +119,7 @@ ZeroInferRequest::ZeroInferRequest(const std::shared_ptr<ZeroInitStructsHolder>&
117119
executorInputDescriptors.at(shapeBufferName),
118120
shapeBufferName);
119121

120-
auto allocator = zeroMemory::HostMemAllocator(backendPtr);
121-
allocate_tensor(inputName, shapeDescriptor, TensorType::Shape, allocator);
122+
allocate_tensor(inputName, shapeDescriptor, TensorType::Shape, inputAllocator);
122123
}
123124
}
124125

@@ -130,20 +131,20 @@ ZeroInferRequest::ZeroInferRequest(const std::shared_ptr<ZeroInitStructsHolder>&
130131
const IONodeDescriptor& resultDescriptor = _metadata.results.at(outputName);
131132
check_level_zero_attributes_match(resultDescriptor, executorOutputDescriptors.at(outputName), outputName);
132133

133-
auto allocator = zeroMemory::HostMemAllocator(backendPtr);
134-
135134
allocate_tensor(outputName, resultDescriptor, TensorType::InputOrOutput, allocator);
136135

137-
if (contains(_metadata.shapeNames, outputName)) {
138-
const std::string shapeBufferName = SHAPE_TENSOR_PREFIX + outputName;
139-
const IONodeDescriptor& shapeDescriptor = _metadata.shapes.at(outputName);
136+
const auto& shapeNameMatch = _nodeNameToLegacyName.find(outputName);
137+
if (shapeNameMatch != _nodeNameToLegacyName.end()) {
138+
if (contains(_metadata.shapeNames, shapeNameMatch->second)) {
139+
const std::string shapeBufferName = SHAPE_TENSOR_PREFIX + shapeNameMatch->second;
140+
const IONodeDescriptor& shapeDescriptor = _metadata.shapes.at(shapeNameMatch->second);
140141

141-
check_level_zero_attributes_match(shapeDescriptor,
142-
executorOutputDescriptors.at(shapeBufferName),
143-
shapeBufferName);
142+
check_level_zero_attributes_match(shapeDescriptor,
143+
executorOutputDescriptors.at(shapeBufferName),
144+
shapeBufferName);
144145

145-
auto allocator = zeroMemory::HostMemAllocator(backendPtr);
146-
allocate_tensor(outputName, shapeDescriptor, TensorType::Shape, allocator);
146+
allocate_tensor(shapeNameMatch->second, shapeDescriptor, TensorType::Shape, allocator);
147+
}
147148
}
148149
}
149150

@@ -166,8 +167,6 @@ ZeroInferRequest::ZeroInferRequest(const std::shared_ptr<ZeroInitStructsHolder>&
166167
executorOutputDescriptors.at(stateOutputBufferName),
167168
stateOutputBufferName);
168169

169-
auto allocator = zeroMemory::HostMemAllocator(backendPtr);
170-
171170
// Only one buffer per state variable is required, we'll use the "output" one since this one captures the latest
172171
// tensor value
173172
allocate_tensor(stateName, stateDescriptor, TensorType::State, allocator);
@@ -226,15 +225,18 @@ void ZeroInferRequest::get_result() {
226225

227226
if (isShapeTensorName(name)) {
228227
const auto actualTensorName = name.substr(SHAPE_TENSOR_PREFIX.size());
229-
ov::Shape actualDims;
230-
actualDims.reserve(outputTensor->get_size());
231-
232-
for (size_t i = 0; i < outputTensor->get_size(); ++i) {
233-
const auto reverseIdx = outputTensor->get_size() - 1 - i;
234-
actualDims.push_back(outputTensor->data<uint32_t>()[reverseIdx]);
228+
const auto& shapeNameMatch = _legacyNameToNodeName.find(actualTensorName);
229+
if (shapeNameMatch != _legacyNameToNodeName.end()) {
230+
ov::Shape actualDims;
231+
actualDims.reserve(outputTensor->get_size());
232+
233+
for (size_t i = 0; i < outputTensor->get_size(); ++i) {
234+
const auto reverseIdx = outputTensor->get_size() - 1 - i;
235+
actualDims.push_back(outputTensor->data<uint32_t>()[reverseIdx]);
236+
}
237+
auto& tensorToBeReshaped = _allTensors.at(shapeNameMatch->second);
238+
tensorToBeReshaped->set_shape(actualDims);
235239
}
236-
auto& tensorToBeReshaped = _allTensors.at(actualTensorName);
237-
tensorToBeReshaped->set_shape(actualDims);
238240
}
239241

240242
uint8_t* tensorBuffer = reinterpret_cast<uint8_t*>(outputTensor->data());

src/plugins/intel_npu/src/backend/src/zero_memory.cpp

+1-2
Original file line numberDiff line numberDiff line change
@@ -69,10 +69,9 @@ bool HostMemAllocator::is_equal(const HostMemAllocator& other) const {
6969
return other._data != nullptr && _data != nullptr && other._data == _data;
7070
}
7171

72-
void MemoryManagementUnit::appendArgument(const std::string& name, const ze_graph_argument_properties_t& argument) {
72+
void MemoryManagementUnit::appendArgument(const std::string& name, const std::size_t argSize) {
7373
_offsets.emplace(std::make_pair(name, _size));
7474

75-
const std::size_t argSize = zeroUtils::getSizeIOBytes(argument);
7675
_size += argSize + alignment -
7776
(argSize % alignment); // is this really necessary? if 0==argSize%alignment -> add 1 * alignment
7877
}

src/plugins/intel_npu/src/backend/src/zero_pipeline.cpp

+2-2
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@ struct DiscretePipeline final : public Pipeline {
4141

4242
OV_ITT_SCOPED_TASK(itt::domains::LevelZeroBackend, "Zero_infer_request::DiscretePipeline::DiscretePipeline");
4343
for (const auto& desc : executor->inputs_desc_map()) {
44-
_deviceInputs.appendArgument(desc.first, desc.second.info);
44+
_deviceInputs.appendArgument(desc.first, zeroUtils::getSizeIOBytes(desc.second.info));
4545
}
4646
_deviceInputs.allocate(device_handle, context);
4747

@@ -61,7 +61,7 @@ struct DiscretePipeline final : public Pipeline {
6161
_event[stage::UPLOAD].AppendSignalEvent(_command_list[stage::UPLOAD]);
6262

6363
for (const auto& desc : executor->outputs_desc_map()) {
64-
_deviceOutputs.appendArgument(desc.first, desc.second.info);
64+
_deviceOutputs.appendArgument(desc.first, zeroUtils::getSizeIOBytes(desc.second.info));
6565
}
6666
_deviceOutputs.allocate(device_handle, context);
6767

src/plugins/intel_npu/src/compiler/src/zero_compiler_in_driver.cpp

+2-2
Original file line numberDiff line numberDiff line change
@@ -996,8 +996,8 @@ static void getNodeDescriptor(IONodeDescriptorMap& nodeDescriptors,
996996
}
997997
const std::string& legacyName = arg.name;
998998

999-
names.push_back(legacyName);
1000-
nodeDescriptors[legacyName] =
999+
names.push_back(arg.debug_friendly_name);
1000+
nodeDescriptors[arg.debug_friendly_name] =
10011001
{legacyName, arg.debug_friendly_name, std::move(outputTensorNames), precision, shape, shape};
10021002
}
10031003

0 commit comments

Comments
 (0)