Skip to content

Commit 64375f8

Browse files
cyyever authored and facebook-github-bot committed
Use static functions/variables if possible (pytorch#4432)
Summary: Pull Request resolved: pytorch#4432 X-link: facebookresearch/FBGEMM#1497 There are two changes: 1. Marks in-file templates and other inner functions as static; this provides more opportunities to optimise code, i.e. followed by enabling link time optimization. An unused function in test code is removed. 2. Enables `misc-use-internal-linkage` check. Pull Request resolved: pytorch#4423 Reviewed By: cthi Differential Revision: D77635949 Pulled By: q10 fbshipit-source-id: 3ce5cfd435be216ccc48c5be9eb30e91dcfcfbb5
1 parent 0dbd1bc commit 64375f8

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

48 files changed

+99
-149
lines changed

.clang-tidy

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,10 @@
44
# Get options for config files in parent directories,
55
# but override them if there's a conflict.
66
InheritParentConfig: true
7+
# @nolint
78
Checks: '
89
bugprone-argument-comment,
10+
misc-use-internal-linkage,
911
'
1012
CheckOptions:
1113
- key: facebook-cuda-safe-api-call-check.HandlerName

bench/BenchUtils.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@
1919

2020
namespace fbgemm {
2121

22-
std::default_random_engine eng;
22+
static std::default_random_engine eng;
2323

2424
template <typename T>
2525
void randFill(aligned_vector<T>& vec, T low, T high, std::true_type) {

bench/ConvUnifiedBenchmark.cc

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ using namespace fbgemm;
2828

2929
// clang-format off
3030
// 1D conv shapes
31-
vector<conv_param_t<1>> shapes_1d = {
31+
static vector<conv_param_t<1>> shapes_1d = {
3232
// MB, IC, OC, IW, G, KW, stride_w, pad_w_left, pad_w_right,
3333
// (dilation, output_padding_w, tranpose)
3434
// regular
@@ -46,7 +46,7 @@ vector<conv_param_t<1>> shapes_1d = {
4646
};
4747

4848
// 2D conv shapes
49-
vector<conv_param_t<2>> shapes_2d = {
49+
static vector<conv_param_t<2>> shapes_2d = {
5050
// MB, IC, OC, IH, IW, G, KH, KW, stride_h, stride_w,
5151
// pad_h_top, pad_w_left, pad_h_bottom, pad_w_right,
5252
// (dilation_h, dilation_w, output_padding_h, output_padding_w, tranpose)
@@ -84,7 +84,7 @@ vector<conv_param_t<2>> shapes_2d = {
8484
{1, 1}, {0, 0, 0, 0})
8585
};
8686

87-
vector<conv_param_t<2>> shapes_2d_resnext_101 = {
87+
static vector<conv_param_t<2>> shapes_2d_resnext_101 = {
8888
// ResNext-101 (unique shapes only)
8989
// conv_param_t<>(N, C, M, H, W, groups, /* kern */ {KH, KW}, /* stride */
9090
// {stride_h, stride_w}, /* padding pad_l = pad_h */ {pad_l, pad_l, pad_l, pad_l}, /* dialation */
@@ -143,7 +143,7 @@ vector<conv_param_t<2>> shapes_2d_resnext_101 = {
143143
};
144144

145145
// 3D conv shapes
146-
vector<conv_param_t<3>> shapes_3d = {
146+
static vector<conv_param_t<3>> shapes_3d = {
147147
// MB, IC, OC, {IT, IH, IW}, G, {KT, KH, KW}, {stride_t, stride_h,
148148
// stride_w},
149149
// {pad_prev, pad_h_top, pad_w_left, pad_next, pad_h_bottom, pad_w_right},
@@ -216,7 +216,7 @@ vector<conv_param_t<3>> shapes_3d = {
216216
// clang-format on
217217

218218
template <int SPATIAL_DIM, typename Acc_t>
219-
void performance_test(
219+
static void performance_test(
220220
const vector<conv_param_t<SPATIAL_DIM>>& shapes,
221221
bool flush,
222222
int repetitions) {

bench/ConvertBenchmark.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121
using namespace std;
2222
using namespace fbgemm;
2323

24-
void performance_test() {
24+
static void performance_test() {
2525
constexpr int NWARMUP = 4;
2626
constexpr int NITER = 256;
2727

bench/EmbeddingIndexRemappingBenchmark.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -37,7 +37,7 @@ static vector<vector<int>> GetInputs_() {
3737
return input_dims;
3838
}
3939

40-
int run_benchmark(
40+
static int run_benchmark(
4141
int batch_size,
4242
int num_rows,
4343
int average_len,

bench/EmbeddingQuantizeBenchmark.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@ using namespace fbgemm;
2525

2626
// T is the type of scale and bias
2727
template <typename T>
28-
void performance_test() {
28+
static void performance_test() {
2929
constexpr int NWARMUP = 4;
3030
constexpr int NITER = 256;
3131

bench/EmbeddingQuantizeFloatToFloatOrHalfBenchmark.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@ using namespace fbgemm;
2525

2626
// T is the type of scale and bias
2727
template <typename T>
28-
void performance_test() {
28+
static void performance_test() {
2929
constexpr int NWARMUP = 4;
3030
constexpr int NITER = 256;
3131

bench/EmbeddingSpMDM8BitBenchmark.cc

Lines changed: 8 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -30,15 +30,16 @@
3030
using namespace std;
3131
using namespace fbgemm;
3232

33-
void print_fused_table(int rows, int embedding_dim, const uint8_t* table) {
34-
for (int i = 0; i < rows; i++) {
35-
cout << "row: " << i << " : " << endl;
36-
for (int ii = 0; ii < embedding_dim; ii++) {
37-
cout << (int)table[i * (embedding_dim + 2 * sizeof(float)) + ii] << ",";
33+
/*
34+
static void print_fused_table(int rows, int embedding_dim, const uint8_t* table)
35+
{ for (int i = 0; i < rows; i++) { cout << "row: " << i << " : " << endl; for
36+
(int ii = 0; ii < embedding_dim; ii++) { cout << (int)table[i * (embedding_dim +
37+
2 * sizeof(float)) + ii] << ",";
3838
}
3939
cout << endl;
4040
}
4141
}
42+
*/
4243

4344
static vector<vector<int>> GetInputs_() {
4445
vector<vector<int>> input_dims = {
@@ -58,10 +59,10 @@ static vector<vector<int>> GetInputs_() {
5859
return input_dims;
5960
}
6061

61-
vector<double> benchmarkTimes;
62+
static vector<double> benchmarkTimes;
6263

6364
template <typename OutType>
64-
int run_benchmark(
65+
static int run_benchmark(
6566
int batch_size,
6667
int num_rows,
6768
int embedding_dim,

bench/EmbeddingSpMDMBenchmark.cc

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -49,7 +49,7 @@ static vector<vector<int>> GetInputs_() {
4949
return input_dims;
5050
}
5151

52-
void run_benchmark(
52+
static void run_benchmark(
5353
int batch_size,
5454
int num_rows,
5555
int embedding_dim,

bench/EmbeddingSpMDMNBit2Benchmark.cc

Lines changed: 2 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -171,17 +171,6 @@ static void print_benchmark_results() {
171171
}
172172
}
173173

174-
void print_fused_table(int rows, int embedding_dim, const uint8_t* table) {
175-
for (int i = 0; i < rows; i++) {
176-
std::cout << "row: " << i << " : " << std::endl;
177-
for (int ii = 0; ii < embedding_dim; ii++) {
178-
std::cout << (int)table[i * (embedding_dim + 2 * sizeof(float)) + ii]
179-
<< ",";
180-
}
181-
std::cout << std::endl;
182-
}
183-
}
184-
185174
static vector<vector<int>> GetInputs_() {
186175
vector<vector<int>> input_dims = {
187176
// batch size, number of rows of table, emb dim , avg lengthl
@@ -200,7 +189,7 @@ static vector<vector<int>> GetInputs_() {
200189
return input_dims;
201190
}
202191

203-
int run_benchmark(
192+
static int run_benchmark(
204193
int bit_rate,
205194
int batch_size,
206195
int num_rows,
@@ -488,7 +477,7 @@ int run_benchmark(
488477
return 0;
489478
}
490479

491-
void sweep_benchmark(KernelType kern_type) {
480+
static void sweep_benchmark(KernelType kern_type) {
492481
int batch_size;
493482
int num_rows;
494483
int embedding_dim;

0 commit comments

Comments (0)