sevagh
diff --git a/.gitmodules b/.gitmodules
Lines changed: 3 additions & 0 deletions
diff --git a/CMakeLists.txt b/CMakeLists.txt
Lines changed: 14 additions & 9 deletions
diff --git a/cli-apps/demucs.cpp b/cli-apps/demucs.cpp
Lines changed: 12 additions & 4 deletions
diff --git a/cli-apps/demucs_ft.cpp b/cli-apps/demucs_ft.cpp
Lines changed: 67 additions & 28 deletions
diff --git a/src/conv.hpp b/src/conv.hpp
Lines changed: 12 additions & 12 deletions
@@ -8,3 +8,6 @@
 [submodule "vendor/libnyquist"]
 	path = vendor/libnyquist
 	url = https://github.com/ddiakopoulos/libnyquist
+[submodule "vendor/googletest"]
+	path = vendor/googletest
+	url = https://github.com/google/googletest
@@ -28,13 +28,8 @@ enable_testing()
 set(CMAKE_CXX_STANDARD 17)
 set(CMAKE_POSITION_INDEPENDENT_CODE ON)
 
-# compile vendored submodule libnyquist
-set(LIBNYQUIST_BUILD_EXAMPLE OFF CACHE BOOL "Disable libnyquist example")
-add_subdirectory(vendor/libnyquist)
-
 # add library Eigen3
 include_directories(vendor/eigen)
-include_directories(vendor/libnyquist/include)
 include_directories(src)
 
 if (USE_AMD_AOCL)
@@ -80,17 +75,23 @@ file(GLOB SOURCES "src/*.cpp")
 
 add_library(demucs.cpp.lib ${SOURCES})
 
-target_link_libraries(demucs.cpp.lib libnyquist ${LIBRARIES_TO_LINK})
+target_link_libraries(demucs.cpp.lib ${LIBRARIES_TO_LINK})
+
+# compile vendored submodule libnyquist for driver programs
+set(LIBNYQUIST_BUILD_EXAMPLE OFF CACHE BOOL "Disable libnyquist example" FORCE)
+add_subdirectory(vendor/libnyquist)
 
 # Add target to compile demucs.cpp.main, the main driver program for demucs.cpp
 add_executable(demucs.cpp.main "cli-apps/demucs.cpp")
-target_link_libraries(demucs.cpp.main demucs.cpp.lib)
+target_include_directories(demucs.cpp.main PRIVATE vendor/libnyquist/include)
+target_link_libraries(demucs.cpp.main demucs.cpp.lib libnyquist)
 
 # Add target to compile demucs_ft.cpp.main, the fine-tuned driver program for demucs.cpp
 add_executable(demucs_ft.cpp.main "cli-apps/demucs_ft.cpp")
-target_link_libraries(demucs_ft.cpp.main demucs.cpp.lib)
+target_include_directories(demucs_ft.cpp.main PRIVATE vendor/libnyquist/include)
+target_link_libraries(demucs_ft.cpp.main demucs.cpp.lib libnyquist)
 
-file(GLOB SOURCES_TO_LINT "src/*.cpp" "src/*.hpp" "demucs.cpp" "test/*.cpp")
+file(GLOB SOURCES_TO_LINT "src/*.cpp" "src/*.hpp" "cli-apps/*.cpp")
 
 # add target to run standard lints and formatters
 add_custom_target(lint
@@ -104,6 +105,10 @@ add_custom_target(lint
 
 # add target to run cpp tests in test/ directory with gtest
 
+# get gtest from vendor/googletest
+set(BUILD_GMOCK OFF CACHE BOOL "Disable gmock in googletest" FORCE)
+add_subdirectory(vendor/googletest)
+
 # include test/*.cpp as test files
 file(GLOB TEST_SOURCES "test/*.cpp")
 
 
@@ -5,6 +5,7 @@
 #include <Eigen/Dense>
 #include <cassert>
 #include <filesystem>
+#include <iomanip>
 #include <iostream>
 #include <libnyquist/Common.h>
 #include <libnyquist/Decoders.h>
@@ -146,13 +147,19 @@ int main(int argc, const char **argv)
     std::cout << "Starting Demucs (" << std::to_string(nb_sources)
               << "-source) inference" << std::endl;
 
-    demucscpp::ProgressCallback progressCallback = [](float progress)
-    { std::cout << "Progress: " << progress * 100 << "%\n"; };
+    // set output precision to 3 decimal places
+    std::cout << std::fixed << std::setprecision(3);
+
+    demucscpp::ProgressCallback progressCallback =
+        [](float progress, const std::string &log_message)
+    {
+        std::cout << "(" << std::setw(3) << std::setfill(' ')
+                  << progress * 100.0f << "%) " << log_message << std::endl;
+    };
 
     // create 4 audio matrix same size, to hold output
     Eigen::Tensor3dXf audio_targets =
         demucscpp::demucs_inference(model, audio, progressCallback);
-    std::cout << "returned!" << std::endl;
 
     out_targets = audio_targets;
 
@@ -203,7 +210,8 @@ int main(int argc, const char **argv)
 
         // insert target_name into the path after the digit
         // e.g. target_0_drums.wav
-        p_target.replace_filename("target_" + std::to_string(target) + "_" + target_name + ".wav");
+        p_target.replace_filename("target_" + std::to_string(target) + "_" +
+                                  target_name + ".wav");
 
         std::cout << "Writing wav file " << p_target << std::endl;
 
 
@@ -5,6 +5,7 @@
 #include <Eigen/Dense>
 #include <cassert>
 #include <filesystem>
+#include <iomanip>
 #include <iostream>
 #include <libnyquist/Common.h>
 #include <libnyquist/Decoders.h>
@@ -107,8 +108,8 @@ int main(int argc, const char **argv)
 {
     if (argc != 4)
     {
-        std::cerr << "Usage: " << argv[0]
-                  << " <model dir> <wav file> <out dir>" << std::endl;
+        std::cerr << "Usage: " << argv[0] << " <model dir> <wav file> <out dir>"
+                  << std::endl;
         exit(1);
     }
 
@@ -135,63 +136,100 @@ int main(int argc, const char **argv)
     std::string model_file;
     for (const auto &entry : std::filesystem::directory_iterator(model_dir))
     {
-        bool ret;
+        bool ret = false;
 
         // check if entry contains the name "htdemucs_ft_drums"
         if (entry.path().string().find("htdemucs_ft_drums") !=
             std::string::npos)
         {
-            ret =  load_demucs_model(entry.path().string(), &models[0]);
-            std::cout << "Loading ft model " << entry.path().string() << " for drums" << std::endl;
-        } else if (entry.path().string().find("htdemucs_ft_bass") !=
-            std::string::npos)
+            ret = load_demucs_model(entry.path().string(), &models[0]);
+            std::cout << "Loading ft model " << entry.path().string()
+                      << " for drums" << std::endl;
+        }
+        else if (entry.path().string().find("htdemucs_ft_bass") !=
+                 std::string::npos)
         {
-            ret =  load_demucs_model(entry.path().string(), &models[1]);
-            std::cout << "Loading ft model " << entry.path().string() << " for bass" << std::endl;
-        } else if (entry.path().string().find("htdemucs_ft_other") !=
-            std::string::npos)
+            ret = load_demucs_model(entry.path().string(), &models[1]);
+            std::cout << "Loading ft model " << entry.path().string()
+                      << " for bass" << std::endl;
+        }
+        else if (entry.path().string().find("htdemucs_ft_other") !=
+                 std::string::npos)
         {
-            ret =  load_demucs_model(entry.path().string(), &models[2]);
-            std::cout << "Loading ft model " << entry.path().string() << " for other" << std::endl;
-        } else if (entry.path().string().find("htdemucs_ft_vocals") !=
-            std::string::npos)
+            ret = load_demucs_model(entry.path().string(), &models[2]);
+            std::cout << "Loading ft model " << entry.path().string()
+                      << " for other" << std::endl;
+        }
+        else if (entry.path().string().find("htdemucs_ft_vocals") !=
+                 std::string::npos)
         {
-            ret =  load_demucs_model(entry.path().string(), &models[3]);
-            std::cout << "Loading ft model " << entry.path().string() << " for vocals" << std::endl;
+            ret = load_demucs_model(entry.path().string(), &models[3]);
+            std::cout << "Loading ft model " << entry.path().string()
+                      << " for vocals" << std::endl;
         }
 
         // debug some members of model
         std::cout << "demucs_model_load returned " << (ret ? "true" : "false")
-                << std::endl;
+                  << std::endl;
         if (!ret)
         {
             std::cerr << "Error loading model" << std::endl;
             exit(1);
         }
-
     }
 
     const int nb_sources = 4;
 
     std::cout << "Starting Demucs fine-tuned (" << std::to_string(nb_sources)
               << "-source) inference" << std::endl;
 
-    demucscpp::ProgressCallback progressCallback = [](float progress)
-    { std::cout << "Progress: " << progress * 100 << "%\n"; };
+    // set output precision to 3 decimal places
+    std::cout << std::fixed << std::setprecision(3);
+
+    demucscpp::ProgressCallback progressCallback1 =
+        [](float progress, const std::string &log_message)
+    {
+        std::cout << "[DRUMS] \t(" << std::setw(3) << std::setfill(' ')
+                  << progress * 25.0f << "%) " << log_message << std::endl;
+    };
+    demucscpp::ProgressCallback progressCallback2 =
+        [](float progress, const std::string &log_message)
+    {
+        std::cout << "[BASS] \t(" << std::setw(3) << std::setfill(' ')
+                  << 25.0f + progress * 25.0f << "%) " << log_message
+                  << std::endl;
+    };
+    demucscpp::ProgressCallback progressCallback3 =
+        [](float progress, const std::string &log_message)
+    {
+        std::cout << "[OTHER] \t(" << std::setw(3) << std::setfill(' ')
+                  << 50.0f + progress * 25.0f << "%) " << log_message
+                  << std::endl;
+    };
+    demucscpp::ProgressCallback progressCallback4 =
+        [](float progress, const std::string &log_message)
+    {
+        std::cout << "[VOCALS] \t(" << std::setw(3) << std::setfill(' ')
+                  << 75.0f + progress * 25.0f << "%) " << log_message
+                  << std::endl;
+    };
 
     // create 4 audio matrix same size, to hold output
     Eigen::Tensor3dXf drums_targets =
-        demucscpp::demucs_inference(models[0], audio, progressCallback);
+        demucscpp::demucs_inference(models[0], audio, progressCallback1);
+
     Eigen::Tensor3dXf bass_targets =
-        demucscpp::demucs_inference(models[1], audio, progressCallback);
+        demucscpp::demucs_inference(models[1], audio, progressCallback2);
+
     Eigen::Tensor3dXf other_targets =
-        demucscpp::demucs_inference(models[2], audio, progressCallback);
+        demucscpp::demucs_inference(models[2], audio, progressCallback3);
+
     Eigen::Tensor3dXf vocals_targets =
-        demucscpp::demucs_inference(models[3], audio, progressCallback);
+        demucscpp::demucs_inference(models[3], audio, progressCallback4);
 
     out_targets = Eigen::Tensor3dXf(drums_targets.dimension(0),
-                                     drums_targets.dimension(1),
-                                     drums_targets.dimension(2));
+                                    drums_targets.dimension(1),
+                                    drums_targets.dimension(2));
 
     // simply use the respective stem from each independent fine-tuned model
     out_targets.chip<0>(0) = drums_targets.chip<0>(0);
@@ -246,7 +284,8 @@ int main(int argc, const char **argv)
 
         // insert target_name into the path after the digit
         // e.g. target_0_drums.wav
-        p_target.replace_filename("target_" + std::to_string(target) + "_" + target_name + ".wav");
+        p_target.replace_filename("target_" + std::to_string(target) + "_" +
+                                  target_name + ".wav");
 
         std::cout << "Writing wav file " << p_target << std::endl;
 
 
@@ -118,13 +118,13 @@ Eigen::Tensor3dXf conv2d_gemm(const Eigen::Tensor3dXf &x,
     {
         for (int h = 0; h < out_height; ++h)
         {
-            for (int w = 0; w < out_width; ++w)
+            for (int w_ = 0; w_ < out_width; ++w_)
             {
-                int row_idx = h * out_width + w;
+                int row_idx = h * out_width + w_;
                 // Assign the value from the GEMM output to the output tensor
                 if (row_idx < result.rows())
                 {
-                    y_out(chout, h, w) = result(row_idx, chout);
+                    y_out(chout, h, w_) = result(row_idx, chout);
                 }
             }
         }
@@ -187,16 +187,16 @@ Eigen::Tensor3dXf conv2d_gemm_fused_gelu(const Eigen::Tensor3dXf &x,
     {
         for (int h = 0; h < out_height; ++h)
         {
-            for (int w = 0; w < out_width; ++w)
+            for (int w_ = 0; w_ < out_width; ++w_)
             {
-                int row_idx = h * out_width + w;
+                int row_idx = h * out_width + w_;
                 // Assign the value from the GEMM output to the output tensor
                 // with gelu
                 float value = result(row_idx, chout);
                 float activated_value =
                     0.5f * value * (1.0f + std::erf(value / std::sqrt(2.0f)));
                 // Assign the activated value to the output tensor
-                y_out(chout, h, w) = activated_value;
+                y_out(chout, h, w_) = activated_value;
             }
         }
     }
@@ -378,15 +378,15 @@ Eigen::Tensor3dXf conv2d_tr_gemm(const Eigen::Tensor3dXf &x,
     {
         for (int h = 0; h < out_height; ++h)
         {
-            for (int w = 0; w < out_width; ++w)
+            for (int w_ = 0; w_ < out_width; ++w_)
             {
                 // Calculate the linear index in the GEMM result corresponding
                 // to this output location
-                int gemm_row = h * out_width + w;
+                int gemm_row = h * out_width + w_;
                 int gemm_col = ch;
 
                 // Assign the value from the GEMM result to the output tensor
-                y_out(ch, h, w) += result(gemm_row, gemm_col);
+                y_out(ch, h, w_) += result(gemm_row, gemm_col);
             }
         }
     }
@@ -455,11 +455,11 @@ Eigen::Tensor3dXf conv2d_tr_gemm_fused_gelu(const Eigen::Tensor3dXf &x,
     {
         for (int h = 0; h < out_height; ++h)
         {
-            for (int w = 0; w < out_width; ++w)
+            for (int w_ = 0; w_ < out_width; ++w_)
             {
                 // Calculate the linear index in the GEMM result corresponding
                 // to this output location
-                int gemm_row = h * out_width + w;
+                int gemm_row = h * out_width + w_;
                 int gemm_col = ch;
 
                 // Compute the value from the GEMM result
@@ -470,7 +470,7 @@ Eigen::Tensor3dXf conv2d_tr_gemm_fused_gelu(const Eigen::Tensor3dXf &x,
                     0.5f * value * (1.0f + std::erf(value / std::sqrt(2.0f)));
 
                 // Assign the activated value to the output tensor
-                y_out(ch, h, w) += activated_value;
+                y_out(ch, h, w_) += activated_value;
             }
         }
     }
Original file line number	Diff line number	Diff line change
`@@ -118,13 +118,13 @@ Eigen::Tensor3dXf conv2d_gemm(const Eigen::Tensor3dXf &x,`
`118`	`118`	`{`
`119`	`119`	`for (int h = 0; h < out_height; ++h)`
`120`	`120`	`{`
`121`		`- for (int w = 0; w < out_width; ++w)`
	`121`	`+ for (int w_ = 0; w_ < out_width; ++w_)`
`122`	`122`	`{`
`123`		`- int row_idx = h * out_width + w;`
	`123`	`+ int row_idx = h * out_width + w_;`
`124`	`124`	`// Assign the value from the GEMM output to the output tensor`
`125`	`125`	`if (row_idx < result.rows())`
`126`	`126`	`{`
`127`		`- y_out(chout, h, w) = result(row_idx, chout);`
	`127`	`+ y_out(chout, h, w_) = result(row_idx, chout);`
`128`	`128`	`}`
`129`	`129`	`}`
`130`	`130`	`}`
`@@ -187,16 +187,16 @@ Eigen::Tensor3dXf conv2d_gemm_fused_gelu(const Eigen::Tensor3dXf &x,`
`187`	`187`	`{`
`188`	`188`	`for (int h = 0; h < out_height; ++h)`
`189`	`189`	`{`
`190`		`- for (int w = 0; w < out_width; ++w)`
	`190`	`+ for (int w_ = 0; w_ < out_width; ++w_)`
`191`	`191`	`{`
`192`		`- int row_idx = h * out_width + w;`
	`192`	`+ int row_idx = h * out_width + w_;`
`193`	`193`	`// Assign the value from the GEMM output to the output tensor`
`194`	`194`	`// with gelu`
`195`	`195`	`float value = result(row_idx, chout);`
`196`	`196`	`float activated_value =`
`197`	`197`	`0.5f * value * (1.0f + std::erf(value / std::sqrt(2.0f)));`
`198`	`198`	`// Assign the activated value to the output tensor`
`199`		`- y_out(chout, h, w) = activated_value;`
	`199`	`+ y_out(chout, h, w_) = activated_value;`
`200`	`200`	`}`
`201`	`201`	`}`
`202`	`202`	`}`
`@@ -378,15 +378,15 @@ Eigen::Tensor3dXf conv2d_tr_gemm(const Eigen::Tensor3dXf &x,`
`378`	`378`	`{`
`379`	`379`	`for (int h = 0; h < out_height; ++h)`
`380`	`380`	`{`
`381`		`- for (int w = 0; w < out_width; ++w)`
	`381`	`+ for (int w_ = 0; w_ < out_width; ++w_)`
`382`	`382`	`{`
`383`	`383`	`// Calculate the linear index in the GEMM result corresponding`
`384`	`384`	`// to this output location`
`385`		`- int gemm_row = h * out_width + w;`
	`385`	`+ int gemm_row = h * out_width + w_;`
`386`	`386`	`int gemm_col = ch;`
`387`	`387`
`388`	`388`	`// Assign the value from the GEMM result to the output tensor`
`389`		`- y_out(ch, h, w) += result(gemm_row, gemm_col);`
	`389`	`+ y_out(ch, h, w_) += result(gemm_row, gemm_col);`
`390`	`390`	`}`
`391`	`391`	`}`
`392`	`392`	`}`
`@@ -455,11 +455,11 @@ Eigen::Tensor3dXf conv2d_tr_gemm_fused_gelu(const Eigen::Tensor3dXf &x,`
`455`	`455`	`{`
`456`	`456`	`for (int h = 0; h < out_height; ++h)`
`457`	`457`	`{`
`458`		`- for (int w = 0; w < out_width; ++w)`
	`458`	`+ for (int w_ = 0; w_ < out_width; ++w_)`
`459`	`459`	`{`
`460`	`460`	`// Calculate the linear index in the GEMM result corresponding`
`461`	`461`	`// to this output location`
`462`		`- int gemm_row = h * out_width + w;`
	`462`	`+ int gemm_row = h * out_width + w_;`
`463`	`463`	`int gemm_col = ch;`
`464`	`464`
`465`	`465`	`// Compute the value from the GEMM result`
`@@ -470,7 +470,7 @@ Eigen::Tensor3dXf conv2d_tr_gemm_fused_gelu(const Eigen::Tensor3dXf &x,`
`470`	`470`	`0.5f * value * (1.0f + std::erf(value / std::sqrt(2.0f)));`
`471`	`471`
`472`	`472`	`// Assign the activated value to the output tensor`
`473`		`- y_out(ch, h, w) += activated_value;`
	`473`	`+ y_out(ch, h, w_) += activated_value;`
`474`	`474`	`}`
`475`	`475`	`}`
`476`	`476`	`}`