Skip to content

Commit

Permalink
NPUW memory and L0 pipeline hotfixes
Browse files Browse the repository at this point in the history
  • Loading branch information
smirnov-alexey committed Nov 29, 2024
1 parent 76cca6c commit cbb3760
Show file tree
Hide file tree
Showing 2 changed files with 7 additions and 8 deletions.
5 changes: 3 additions & 2 deletions src/plugins/intel_npu/src/plugin/npuw/compiled_model.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -705,8 +705,9 @@ std::shared_ptr<ov::ISyncInferRequest> ov::npuw::CompiledModel::create_sync_infe
const auto num_submodels = m_compiled_submodels.size();
for (std::size_t idx = 0u; idx < num_submodels; idx++) {
const auto& comp_model_desc = m_compiled_submodels[idx];
if (!comp_model_desc.replaced_by.has_value()) {
// not a funcall, do nothing
if (!comp_model_desc.replaced_by.has_value() || comp_model_desc.forced_to_fcall) {
// Skip subgraphs that are not function calls, as well as subgraphs
// that were forced to be function calls (i.e. 1-call functions)
continue;
}
const auto real_idx = comp_model_desc.replaced_by.value();
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -96,12 +96,10 @@ ClosureRemap build_remap(const Function& fbody, const DCOFFParams& params_to) {
LOG_DEBUG("This is an OK parameter, will be kept");
m.closure_remap.push_back(i - fbody._param_offset);

// Check if unpack is indeed required
const auto& type = param->get_element_type();
if (type == ov::element::i4 || type == ov::element::u4 || type == ov::element::i8 ||
type == ov::element::u8) {
m.weights_to_unpack.insert(i - fbody._param_offset);
}
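// FIXME: the type should be queried from a lazy tensor and compared
// against param->get_element_type() to decide with certainty whether
// unpacking is required. Until then, every kept parameter is marked for unpack.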
m.weights_to_unpack.insert(i - fbody._param_offset);
}

// Process zero points for parameters
Expand Down

0 comments on commit cbb3760

Please sign in to comment.