Skip to content

Commit b806f94

Browse files
2024UD24 RC2 Content (#110)
1 parent d5d219e commit b806f94

File tree

5 files changed

+14
-13
lines changed

5 files changed

+14
-13
lines changed

src/vpux_compiler/include/vpux/compiler/NPU37XX/dialect/IE/transforms/passes.hpp

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -94,9 +94,6 @@ struct DefaultHWOptions : public IE::DefaultHWOptionsDialectBase, virtual vpux::
9494
BoolOption mergeUnrolledMatmul{*this, "merge-unrolled-matmul", llvm::cl::desc("Enable merging urolled Matmul ops"),
9595
llvm::cl::init(false)};
9696

97-
BoolOption enableRuntimeDequant{*this, "enable-runtime-dequant",
98-
llvm::cl::desc("Enable runtime dequantization of asymmetricly quantized weight"),
99-
llvm::cl::init(false)};
10097
Int64Option runtimeDequantizationLimit{
10198
*this, "runtime-dequantization-limit",
10299
llvm::cl::desc("Lower limit on weight size for runtime dequantization"

src/vpux_compiler/include/vpux/compiler/NPU40XX/dialect/IE/transforms/passes.hpp

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -43,9 +43,6 @@ struct DefaultHWOptions : public IE::DefaultHWOptionsDialectBase, virtual vpux::
4343
BoolOption mergeUnrolledMatmul{*this, "merge-unrolled-matmul", llvm::cl::desc("Enable merging urolled Matmul ops"),
4444
llvm::cl::init(true)};
4545

46-
BoolOption enableRuntimeDequant{*this, "enable-runtime-dequant",
47-
llvm::cl::desc("Enable runtime dequantization of asymmetricly quantized weight"),
48-
llvm::cl::init(true)};
4946
BoolOption enableApplyDynamicBoundaryCorrection{*this, "enable-apply-dynamic-boundary-correction",
5047
llvm::cl::desc("Enable apply-dynamic-boundary-correction pass"),
5148
llvm::cl::init(false)};

src/vpux_compiler/include/vpux/compiler/compilation_options.hpp

Lines changed: 1 addition & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -13,11 +13,8 @@
1313
namespace vpux {
1414

1515
constexpr bool arePrivateOptionsEnabled() {
16-
#ifdef PRIVATE_COMPILER_OPTIONS_ENABLED
16+
// Note: private options have been intentionally made public for the time being
1717
return true;
18-
#else
19-
return false;
20-
#endif
2118
}
2219

2320
template <typename T>

src/vpux_compiler/include/vpux/compiler/core/pipelines_options.hpp

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -149,9 +149,6 @@ struct ReferenceSWOptions : mlir::PassPipelineOptions<T> {
149149
llvm::cl::desc("Enable weights dequantization for weights as input"),
150150
llvm::cl::init(false)};
151151

152-
BoolOption enableRuntimeDequant{*this, "enable-runtime-dequant",
153-
llvm::cl::desc("Enable runtime dequantization of asymmetricly quantized weight"),
154-
llvm::cl::init(false)};
155152
Int64Option runtimeDequantizationLimit{
156153
*this, "runtime-dequantization-limit",
157154
llvm::cl::desc("Lower limit on weight size for runtime dequantization"

src/vpux_compiler/include/vpux/compiler/core/public_options.hpp

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -141,6 +141,18 @@ struct PublicOptions : mlir::PassPipelineOptions<PublicOptions> {
141141
BoolOption shaveDryRun{*this, "shave-dry-run", llvm::cl::desc("Enable shave dry run stripping"),
142142
llvm::cl::init(false)};
143143

144+
BoolOption enableRuntimeDequant{*this, "enable-runtime-dequant",
145+
llvm::cl::desc("Enable runtime dequantization of asymmetricly quantized weight"),
146+
llvm::cl::init(false)};
147+
static bool getDefaultEnableRuntimeDequant(VPU::ArchKind arch) {
148+
switch (arch) {
149+
case VPU::ArchKind::NPU40XX:
150+
return true;
151+
default:
152+
return false;
153+
}
154+
}
155+
144156
//
145157
// Constructors
146158
//
@@ -152,6 +164,7 @@ struct PublicOptions : mlir::PassPipelineOptions<PublicOptions> {
152164
workloadManagementMode = getDefaultWorkloadManagementMode(arch);
153165
}
154166
enableDMAProfiling = getDefaultEnableDMAProfiling(arch);
167+
enableRuntimeDequant = getDefaultEnableRuntimeDequant(arch);
155168
}
156169

157170
static std::unique_ptr<PublicOptions> createFromString(StringRef options, VPU::ArchKind arch) {

0 commit comments

Comments
 (0)