diff --git a/docker/logduration.def b/docker/logduration.def
index fdc392a..e416838 100644
--- a/docker/logduration.def
+++ b/docker/logduration.def
@@ -27,7 +27,7 @@ From: rocm/rocm-build-ubuntu-22.04:6.3
     apt-get update 
     apt-get install -y software-properties-common 
     apt-get upgrade -y 
-    apt-get install -y git build-essential wget clang lld libzstd-dev libomp-dev ccache libdwarf-dev python3-dev 
+    apt-get install -y git build-essential wget clang lld libzstd-dev libomp-dev ccache libdwarf-dev python3-dev
     python3 -m pip install --upgrade pip 
     python3 -m pip install --upgrade setuptools 
     
diff --git a/external/dh_comms b/external/dh_comms
index b87a31c..ec5d9d4 160000
--- a/external/dh_comms
+++ b/external/dh_comms
@@ -1 +1 @@
-Subproject commit b87a31ce2c400d92263eb6979328283a0674edc8
+Subproject commit ec5d9d42a00f68fa1f37c9a118e5ffe7eb609f1f
diff --git a/external/instrument-amdgpu-kernels b/external/instrument-amdgpu-kernels
index 1be4597..70fcfa6 160000
--- a/external/instrument-amdgpu-kernels
+++ b/external/instrument-amdgpu-kernels
@@ -1 +1 @@
-Subproject commit 1be4597cc2d018d38df9fdb4a115a979ea9bd49e
+Subproject commit 70fcfa6606d1fceb0269a263e00e01d74a9a23b9
diff --git a/inc/memory_analysis_wrapper.h b/inc/memory_analysis_wrapper.h
index 1d6b653..80dcd9b 100644
--- a/inc/memory_analysis_wrapper.h
+++ b/inc/memory_analysis_wrapper.h
@@ -37,8 +37,10 @@ class memory_analysis_wrapper_t : public dh_comms::message_handler_base {
   virtual void report() override;
   virtual void clear() override;
 
+private:
   const std::string& kernel_;
   uint64_t dispatch_id_;
   const std::string& location_;
+  bool verbose_;
   dh_comms::memory_analysis_handler_t wrapped_;
 };
diff --git a/omniprobe/omniprobe b/omniprobe/omniprobe
index 5f3147c..98cfed9 100755
--- a/omniprobe/omniprobe
+++ b/omniprobe/omniprobe
@@ -263,7 +263,13 @@ def setup_env(parms):
             env['LOGDUR_LOG_FORMAT'] = parms.log_format
             env_dump['LOGDUR_LOG_FORMAT'] = parms.log_format
 
-            
+    if parms.verbose:
+        env['LOGDUR_VERBOSE'] = "true"
+        env_dump['LOGDUR_VERBOSE'] = "true"
+    else:
+        env['LOGDUR_VERBOSE'] = "false"
+        env_dump['LOGDUR_VERBOSE'] = "false"
+
     if len(parms.log_location):
         if parms.log_location != "console":
             if not os.path.isdir(parms.log_location):
diff --git a/plugins/memory_analysis_plugin.cc b/plugins/memory_analysis_plugin.cc
index 42a5251..94cc375 100644
--- a/plugins/memory_analysis_plugin.cc
+++ b/plugins/memory_analysis_plugin.cc
@@ -8,6 +8,14 @@ extern "C"{
         const char* logDurLogLocation = std::getenv("LOGDUR_LOG_LOCATION");
         if (logDurLogLocation != NULL)
             location = logDurLogLocation;
-        outHandlers.push_back(new memory_analysis_wrapper_t(kernel, dispatch_id, location, false));
+
+        // Read verbose setting from environment
+        bool verbose = false;
+        const char* logDurVerbose = std::getenv("LOGDUR_VERBOSE");
+        if (logDurVerbose != NULL && (strcmp(logDurVerbose, "1") == 0 || strcmp(logDurVerbose, "true") == 0)) {
+            verbose = true;
+        }
+        
+        outHandlers.push_back(new memory_analysis_wrapper_t(kernel, dispatch_id, location, verbose));
     }
 }
diff --git a/src/memory_analysis_wrapper.cc b/src/memory_analysis_wrapper.cc
index 4b39c9b..3fc4d50 100644
--- a/src/memory_analysis_wrapper.cc
+++ b/src/memory_analysis_wrapper.cc
@@ -8,13 +8,31 @@
 #include <set>
 #include <string>
 #include <iostream>
+#include <filesystem>
 
 __attribute__((constructor)) void on_library_load() { std::cout << "Memory Analysis Wrapper loaded." << std::endl; }
-__attribute__((destructor)) void on_library_unload() { std::cout << "Memory Analysis Wrapper unloaded." << std::endl; }
+
+// Manual cleanup when we're truly done
+void on_library_unload() { 
+    std::cout << "Memory Analysis Wrapper manual unload requested." << std::endl;
+    // Only cleanup JsonOutputManager after we're done with all analysis
+    dh_comms::JsonOutputManager::cleanup();
+}
 
 memory_analysis_wrapper_t::memory_analysis_wrapper_t(const std::string& kernel, uint64_t dispatch_id, const std::string& location,  bool verbose) :
     kernel_(kernel), dispatch_id_(dispatch_id), location_(location), wrapped_(verbose)
 {
+    std::cout << "[MemoryAnalysisWrapper] Initializing wrapper for kernel: " << kernel << std::endl;
+    dh_comms::JsonOutputManager::getInstance().initializeKernelAnalysis(kernel, dispatch_id);
+    
+    // Get GPU architecture and cache line size
+    hipDeviceProp_t props;
+    hipGetDeviceProperties(&props, 0);
+    std::string gpu_arch = props.gcnArchName;
+    
+    // Initialize metadata with default kernels_found (will be updated in report)
+    dh_comms::JsonOutputManager::getInstance().setMetadata(gpu_arch, 128, 0); // Using default cache line size of 128
+    std::cout << "[MemoryAnalysisWrapper] Initialization complete" << std::endl;
 }
 
 bool memory_analysis_wrapper_t::handle(const dh_comms::message_t &message, const std::string& kernel, kernelDB::kernelDB& kdb)
@@ -29,19 +47,57 @@ bool memory_analysis_wrapper_t::handle(const dh_comms::message_t &message) {
 
 void memory_analysis_wrapper_t::report(const std::string& kernel_name, kernelDB::kernelDB& kdb)
 {
-    if (kernel_name.length() == 0)
-    {
+    // Get all kernels and update the count
+    std::vector<std::string> kernels;
+    kdb.getKernels(kernels);
+    dh_comms::JsonOutputManager::getInstance().updateKernelsFound(kernels.size());
+    
+    // Only get lines if kernel_name is provided
+    if (!kernel_name.empty()) {
         std::vector<uint32_t> lines;
         kdb.getKernelLines(kernel_name, lines);
     }
+    
     report();
 }
 
 void memory_analysis_wrapper_t::report() {
-  std::cout << "Memory analysis for " << kernel_ << " dispatch_id[" << std::dec << dispatch_id_ << "]" << std::endl;
-  wrapped_.report();
+  if (verbose_) {
+    std::cout << "Memory analysis for " << kernel_ << " dispatch_id[" << std::dec << dispatch_id_ << "]" << std::endl;
+  }
+  
+  std::cout << "[MemoryAnalysisWrapper] Starting wrapped_.report()..." << std::endl;
+  try {
+    wrapped_.report();
+    std::cout << "[MemoryAnalysisWrapper] Completed wrapped_.report() successfully" << std::endl;
+    std::cout << "[MemoryAnalysisWrapper] Current analysis size after report: " 
+              << dh_comms::JsonOutputManager::getInstance().getCurrentAnalysisSize() << std::endl;
+  } catch (const std::exception& e) {
+    std::cerr << "[MemoryAnalysisWrapper] ERROR: Exception in wrapped_.report(): " << e.what() << std::endl;
+  } catch (...) {
+    std::cerr << "[MemoryAnalysisWrapper] ERROR: Unknown exception in wrapped_.report()" << std::endl;
+  }
+  
+  // Write to single output file
+  std::string filename = (std::filesystem::current_path() / "memory_analysis_output.json").string();
+  std::cout << "[MemoryAnalysisWrapper] Writing memory analysis to " << filename << std::endl;
+  
+  // Dump current state before writing
+  std::cout << "[MemoryAnalysisWrapper] Dumping current JsonOutputManager state..." << std::endl;
+  auto& manager = dh_comms::JsonOutputManager::getInstance();
+  std::cout << "[MemoryAnalysisWrapper] Current analysis size before dump: " << manager.getCurrentAnalysisSize() << std::endl;
+  manager.dumpCurrentState();
+  
+  // Attempt to write the file
+  try {
+    manager.writeToFile(filename);
+    std::cout << "[MemoryAnalysisWrapper] Report completed successfully" << std::endl;
+  } catch (const std::exception& e) {
+    std::cerr << "[MemoryAnalysisWrapper] ERROR: Unexpected error writing file: " << e.what() << std::endl;
+  }
 }
 
 void memory_analysis_wrapper_t::clear() {
   wrapped_.clear();
+  dh_comms::JsonOutputManager::getInstance().clear();
 }