bobbyliujb
diff --git a/‎.clang-tidy‎
Lines changed: 1 addition & 0 deletions b/‎.clang-tidy‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎CMakeLists.txt‎
Lines changed: 3 additions & 0 deletions b/‎CMakeLists.txt‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎bench/AlignedVec.h‎
Lines changed: 1 addition & 2 deletions b/‎bench/AlignedVec.h‎
Lines changed: 1 addition & 2 deletions
diff --git a/‎bench/BenchUtils.cc‎
Lines changed: 1 addition & 2 deletions b/‎bench/BenchUtils.cc‎
Lines changed: 1 addition & 2 deletions
diff --git a/‎bench/BenchUtils.h‎
Lines changed: 5 additions & 5 deletions b/‎bench/BenchUtils.h‎
Lines changed: 5 additions & 5 deletions
diff --git a/‎bench/EmbeddingIndexRemappingBenchmark.cc‎
Lines changed: 3 additions & 3 deletions b/‎bench/EmbeddingIndexRemappingBenchmark.cc‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎bench/EmbeddingSpMDMBenchmark.cc‎
Lines changed: 0 additions & 1 deletion b/‎bench/EmbeddingSpMDMBenchmark.cc‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎bench/EmbeddingSpMDMNBit2Benchmark.cc‎
Lines changed: 0 additions & 1 deletion b/‎bench/EmbeddingSpMDMNBit2Benchmark.cc‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎bench/EmbeddingSpMDMNBitBenchmark.cc‎
Lines changed: 4 additions & 4 deletions b/‎bench/EmbeddingSpMDMNBitBenchmark.cc‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎bench/EmbeddingSpMDMNBitRowWiseSparseBenchmark.cc‎
Lines changed: 4 additions & 4 deletions b/‎bench/EmbeddingSpMDMNBitRowWiseSparseBenchmark.cc‎
Lines changed: 4 additions & 4 deletions
@@ -7,6 +7,7 @@ InheritParentConfig: true
 # @nolint
 Checks: '
 -*,
+cppcoreguidelines-init-variables,
 bugprone-argument-comment,
 misc-use-internal-linkage,
 modernize*,
 
@@ -208,8 +208,11 @@ else(MSVC)
   string(APPEND CMAKE_CXX_FLAGS " -Wunknown-pragmas")
   string(APPEND CMAKE_CXX_FLAGS " -Wimplicit-fallthrough")
   string(APPEND CMAKE_CXX_FLAGS " -Wno-strict-aliasing")
+  string(APPEND CMAKE_CXX_FLAGS " -Wunused-variable")
   if("${CMAKE_CXX_COMPILER_ID}" MATCHES "Clang" AND CMAKE_CXX_COMPILER_VERSION VERSION_GREATER 17.0.0)
     string(APPEND CMAKE_CXX_FLAGS " -Wno-vla-cxx-extension")
+  elseif(CMAKE_CXX_COMPILER_ID STREQUAL "GNU")
+    string(APPEND CMAKE_CXX_FLAGS " -Wmaybe-uninitialized")
   endif()
   target_compile_options(fbgemm_avx2 PRIVATE
     "-m64" "-mavx2" "-mf16c" "-mfma")
 
@@ -107,10 +107,9 @@ class aligned_allocator {
 
     // Mallocator wraps malloc().
     void* pv = nullptr;
-    int ret;
+    int ret = 0;
 #ifdef _MSC_VER
     pv = _aligned_malloc(n * sizeof(T), Alignment);
-    ret = 0;
 #else
     ret = posix_memalign(&pv, Alignment, n * sizeof(T));
 #endif
 
@@ -150,9 +150,8 @@ aligned_vector<float> getRandomSparseVector(
   std::sort(sorted_res.begin(), sorted_res.end());
   int32_t numZeros =
       size - static_cast<int32_t>(std::round(size * fractionNonZeros));
-  float thr;
   if (numZeros) {
-    thr = sorted_res[numZeros - 1];
+    float thr = sorted_res[numZeros - 1];
 
     for (auto& f : res) {
       if (f <= thr) {
 
@@ -28,6 +28,7 @@
 
 #ifdef _OPENMP
 #include <omp.h>
 #endif
+#include <cmath>
 
 #ifdef USE_MKL
@@ -136,8 +137,6 @@ double measureWithWarmup(
   {
 #endif
     for (int i = 0; i < measuredIterations; ++i) {
-      std::chrono::time_point<std::chrono::high_resolution_clock> start, end;
-
       const auto thread_id = useOpenMP ? fbgemm_get_thread_num() : 0;
 
       if (thread_id == 0) {
@@ -149,7 +148,7 @@ double measureWithWarmup(
 #pragma omp barrier
       }
 #endif
-      start = std::chrono::high_resolution_clock::now();
+      auto start = std::chrono::high_resolution_clock::now();
 
       fn();
 
@@ -159,7 +158,7 @@ double measureWithWarmup(
       }
 #endif
 
-      end = std::chrono::high_resolution_clock::now();
+      auto end = std::chrono::high_resolution_clock::now();
       auto dur =
           std::chrono::duration_cast<std::chrono::nanoseconds>(end - start);
 
@@ -256,7 +255,6 @@ void performance_test(
 #endif
 
   std::string type;
-  double gflops, gbs, ttot;
   for (auto s : shapes) {
     int m = s[0];
     int n = s[1];
@@ -266,6 +264,7 @@ void performance_test(
     aligned_vector<int> Aint(m * k);
     randFill(Aint, 0, 4);
     std::vector<aligned_vector<float>> A;
+    A.reserve(num_instances);
     for (int i = 0; i < num_instances; ++i) {
       A.emplace_back(Aint.begin(), Aint.end());
     }
@@ -321,6 +320,7 @@ void performance_test(
 
     double nflops = 2.0 * m * n * k;
     double nbytes = 4.0 * m * k + sizeof(btype) * 1.0 * k * n + 4.0 * m * n;
+    double gflops = 0, gbs = 0, ttot = 0.0;
 
     // warm up MKL and fbgemm
     // check correctness at the same time
 
@@ -135,9 +135,9 @@ static int run_benchmark(
 }
 
 int main() {
-  int batch_size;
-  int num_rows;
-  int average_len;
+  int batch_size = 0;
+  int num_rows = 0;
+  int average_len = 0;
 
   vector<vector<int>> inputs(GetInputs_());
 
 
@@ -12,7 +12,6 @@
 #endif
 #include <algorithm>
 #include <cassert>
-#include <chrono>
 #include <cmath>
 #include <cstdint>
 #include <iomanip>
 
@@ -12,7 +12,6 @@
 #endif
 #include <algorithm>
 #include <cassert>
-#include <chrono>
 #include <cmath>
 #include <cstdint>
 #include <iomanip>
 
@@ -492,10 +492,10 @@ static int run_benchmark(
 }
 
 int main() {
-  int batch_size;
-  int num_rows;
-  int embedding_dim;
-  int average_len;
+  int batch_size = 0;
+  int num_rows = 0;
+  int embedding_dim = 0;
+  int average_len = 0;
 
   vector<vector<int>> inputs(GetInputs_());
 
 
@@ -325,10 +325,10 @@ static int run_benchmark(
 }
 
 int main() {
-  int batch_size;
-  int num_rows;
-  int embedding_dim;
-  int average_len;
+  int batch_size = 0;
+  int num_rows = 0;
+  int embedding_dim = 0;
+  int average_len = 0;
 
   vector<vector<int>> inputs(GetInputs_());