diff --git a/.gitignore b/.gitignore
deleted file mode 100644
index 25f9674..0000000
--- a/.gitignore
+++ /dev/null
@@ -1,2 +0,0 @@
-/Testing/
-/CMakeFiles/
diff --git a/CMakeCache.txt b/CMakeCache.txt
deleted file mode 100644
index df96834..0000000
--- a/CMakeCache.txt
+++ /dev/null
@@ -1,423 +0,0 @@
-# This is the CMakeCache file.
-# For build in directory: /home/justin/Thesis/topo code/SAND
-# It was generated by CMake: /usr/bin/cmake
-# You can edit this file to change values found and used by cmake.
-# If you do not want to change any of the values, simply exit the editor.
-# If you do want to change a value, simply edit, save, and exit the editor.
-# The syntax for the file is as follows:
-# KEY:TYPE=VALUE
-# KEY is the name of a variable in the cache.
-# TYPE is a hint to GUIs for the type of VALUE, DO NOT EDIT TYPE!.
-# VALUE is the current value for the KEY.
-
-########################
-# EXTERNAL cache entries
-########################
-
-//Path to a program.
-CMAKE_ADDR2LINE:FILEPATH=/usr/bin/addr2line
-
-//Path to a program.
-CMAKE_AR:FILEPATH=/usr/bin/ar
-
-//Choose the type of build, options are: Debug, Release
-CMAKE_BUILD_TYPE:STRING=Debug
-
-//Enable/Disable color output during build.
-CMAKE_COLOR_MAKEFILE:BOOL=ON
-
-//CXX compiler
-CMAKE_CXX_COMPILER:STRING=/usr/bin/c++
-
-//A wrapper around 'ar' adding the appropriate '--plugin' option
-// for the GCC compiler
-CMAKE_CXX_COMPILER_AR:FILEPATH=/usr/bin/gcc-ar-9
-
-//A wrapper around 'ranlib' adding the appropriate '--plugin' option
-// for the GCC compiler
-CMAKE_CXX_COMPILER_RANLIB:FILEPATH=/usr/bin/gcc-ranlib-9
-
-//Flags used by the compiler during all build types.
-CMAKE_CXX_FLAGS:STRING=
-
-//Flags used by the compiler during debug builds.
-CMAKE_CXX_FLAGS_DEBUG:STRING=
-
-//Flags used by the CXX compiler during MINSIZEREL builds.
-CMAKE_CXX_FLAGS_MINSIZEREL:STRING=-Os -DNDEBUG
-
-//Flags used by the compiler during release builds.
-CMAKE_CXX_FLAGS_RELEASE:STRING=
-
-//Flags used by the CXX compiler during RELWITHDEBINFO builds.
-CMAKE_CXX_FLAGS_RELWITHDEBINFO:STRING=-O2 -g -DNDEBUG
-
-//C compiler
-CMAKE_C_COMPILER:STRING=/usr/bin/cc
-
-//A wrapper around 'ar' adding the appropriate '--plugin' option
-// for the GCC compiler
-CMAKE_C_COMPILER_AR:FILEPATH=/usr/bin/gcc-ar-9
-
-//A wrapper around 'ranlib' adding the appropriate '--plugin' option
-// for the GCC compiler
-CMAKE_C_COMPILER_RANLIB:FILEPATH=/usr/bin/gcc-ranlib-9
-
-//Flags used by the C compiler during all build types.
-CMAKE_C_FLAGS:STRING=
-
-//Flags used by the C compiler during DEBUG builds.
-CMAKE_C_FLAGS_DEBUG:STRING=-g
-
-//Flags used by the C compiler during MINSIZEREL builds.
-CMAKE_C_FLAGS_MINSIZEREL:STRING=-Os -DNDEBUG
-
-//Flags used by the C compiler during RELEASE builds.
-CMAKE_C_FLAGS_RELEASE:STRING=-O3 -DNDEBUG
-
-//Flags used by the C compiler during RELWITHDEBINFO builds.
-CMAKE_C_FLAGS_RELWITHDEBINFO:STRING=-O2 -g -DNDEBUG
-
-//No help, variable specified on the command line.
-CMAKE_DEPENDS_USE_COMPILER:UNINITIALIZED=FALSE
-
-//Path to a program.
-CMAKE_DLLTOOL:FILEPATH=CMAKE_DLLTOOL-NOTFOUND
-
-//The Eclipse executable
-CMAKE_ECLIPSE_EXECUTABLE:FILEPATH=CMAKE_ECLIPSE_EXECUTABLE-NOTFOUND
-
-//If disabled, CMake will not generate linked resource to the subprojects
-// and to the source files within targets
-CMAKE_ECLIPSE_GENERATE_LINKED_RESOURCES:BOOL=TRUE
-
-//If enabled, CMake will generate a source project for Eclipse
-// in CMAKE_SOURCE_DIR
-CMAKE_ECLIPSE_GENERATE_SOURCE_PROJECT:BOOL=FALSE
-
-//Additional command line arguments when Eclipse invokes make.
-// Enter e.g. -j<some_number> to get parallel builds
-CMAKE_ECLIPSE_MAKE_ARGUMENTS:STRING=-j8
-
-//The version of Eclipse. If Eclipse has not been found, 3.6 (Helios)
-// is assumed.
-CMAKE_ECLIPSE_VERSION:STRING=3.6 (Helios)
-
-//Flags used by the linker during all build types.
-CMAKE_EXE_LINKER_FLAGS:STRING=
-
-//Flags used by the linker during DEBUG builds.
-CMAKE_EXE_LINKER_FLAGS_DEBUG:STRING=
-
-//Flags used by the linker during MINSIZEREL builds.
-CMAKE_EXE_LINKER_FLAGS_MINSIZEREL:STRING=
-
-//Flags used by the linker during RELEASE builds.
-CMAKE_EXE_LINKER_FLAGS_RELEASE:STRING=
-
-//Flags used by the linker during RELWITHDEBINFO builds.
-CMAKE_EXE_LINKER_FLAGS_RELWITHDEBINFO:STRING=
-
-//Enable/Disable output of compile commands during generation.
-CMAKE_EXPORT_COMPILE_COMMANDS:BOOL=OFF
-
-//Install path prefix, prepended onto install directories.
-CMAKE_INSTALL_PREFIX:PATH=/usr/local
-
-//Path to a program.
-CMAKE_LINKER:FILEPATH=/usr/bin/ld
-
-//Path to a program.
-CMAKE_MAKE_PROGRAM:FILEPATH=/usr/bin/make
-
-//Flags used by the linker during the creation of modules during
-// all build types.
-CMAKE_MODULE_LINKER_FLAGS:STRING=
-
-//Flags used by the linker during the creation of modules during
-// DEBUG builds.
-CMAKE_MODULE_LINKER_FLAGS_DEBUG:STRING=
-
-//Flags used by the linker during the creation of modules during
-// MINSIZEREL builds.
-CMAKE_MODULE_LINKER_FLAGS_MINSIZEREL:STRING=
-
-//Flags used by the linker during the creation of modules during
-// RELEASE builds.
-CMAKE_MODULE_LINKER_FLAGS_RELEASE:STRING=
-
-//Flags used by the linker during the creation of modules during
-// RELWITHDEBINFO builds.
-CMAKE_MODULE_LINKER_FLAGS_RELWITHDEBINFO:STRING=
-
-//Path to a program.
-CMAKE_NM:FILEPATH=/usr/bin/nm
-
-//Path to a program.
-CMAKE_OBJCOPY:FILEPATH=/usr/bin/objcopy
-
-//Path to a program.
-CMAKE_OBJDUMP:FILEPATH=/usr/bin/objdump
-
-//Value Computed by CMake
-CMAKE_PROJECT_DESCRIPTION:STATIC=
-
-//Value Computed by CMake
-CMAKE_PROJECT_HOMEPAGE_URL:STATIC=
-
-//Value Computed by CMake
-CMAKE_PROJECT_NAME:STATIC=SAND
-
-//Path to a program.
-CMAKE_RANLIB:FILEPATH=/usr/bin/ranlib
-
-//Path to a program.
-CMAKE_READELF:FILEPATH=/usr/bin/readelf
-
-//Flags used by the linker during the creation of shared libraries
-// during all build types.
-CMAKE_SHARED_LINKER_FLAGS:STRING=
-
-//Flags used by the linker during the creation of shared libraries
-// during DEBUG builds.
-CMAKE_SHARED_LINKER_FLAGS_DEBUG:STRING=
-
-//Flags used by the linker during the creation of shared libraries
-// during MINSIZEREL builds.
-CMAKE_SHARED_LINKER_FLAGS_MINSIZEREL:STRING=
-
-//Flags used by the linker during the creation of shared libraries
-// during RELEASE builds.
-CMAKE_SHARED_LINKER_FLAGS_RELEASE:STRING=
-
-//Flags used by the linker during the creation of shared libraries
-// during RELWITHDEBINFO builds.
-CMAKE_SHARED_LINKER_FLAGS_RELWITHDEBINFO:STRING=
-
-//If set, runtime paths are not added when installing shared libraries,
-// but are added when building.
-CMAKE_SKIP_INSTALL_RPATH:BOOL=NO
-
-//If set, runtime paths are not added when using shared libraries.
-CMAKE_SKIP_RPATH:BOOL=NO
-
-//Flags used by the linker during the creation of static libraries
-// during all build types.
-CMAKE_STATIC_LINKER_FLAGS:STRING=
-
-//Flags used by the linker during the creation of static libraries
-// during DEBUG builds.
-CMAKE_STATIC_LINKER_FLAGS_DEBUG:STRING=
-
-//Flags used by the linker during the creation of static libraries
-// during MINSIZEREL builds.
-CMAKE_STATIC_LINKER_FLAGS_MINSIZEREL:STRING=
-
-//Flags used by the linker during the creation of static libraries
-// during RELEASE builds.
-CMAKE_STATIC_LINKER_FLAGS_RELEASE:STRING=
-
-//Flags used by the linker during the creation of static libraries
-// during RELWITHDEBINFO builds.
-CMAKE_STATIC_LINKER_FLAGS_RELWITHDEBINFO:STRING=
-
-//Path to a program.
-CMAKE_STRIP:FILEPATH=/usr/bin/strip
-
-//If this value is on, makefiles will be generated without the
-// .SILENT directive, and all commands will be echoed to the console
-// during the make.  This is useful for debugging only. With Visual
-// Studio IDE projects all commands are done without /nologo.
-CMAKE_VERBOSE_MAKEFILE:BOOL=FALSE
-
-//No help, variable specified on the command line.
-DEAL_II_DIR:UNINITIALIZED=/home/justin/Dealii/installed
-
-//Path to a program.
-PERL_EXECUTABLE:FILEPATH=/usr/bin/perl
-
-//Path to a program.
-ProcessorCount_cmd_nproc:FILEPATH=/usr/bin/nproc
-
-//Path to a program.
-ProcessorCount_cmd_sysctl:FILEPATH=/usr/sbin/sysctl
-
-//Value Computed by CMake
-SAND_BINARY_DIR:STATIC=/home/justin/Thesis/topo code/SAND
-
-//Value Computed by CMake
-SAND_SOURCE_DIR:STATIC=/home/justin/Thesis/topo code/SAND
-
-//The directory containing a CMake configuration file for deal.II.
-deal.II_DIR:PATH=/home/justin/Dealii/installed/lib/cmake/deal.II
-
-
-########################
-# INTERNAL cache entries
-########################
-
-//ADVANCED property for variable: CMAKE_ADDR2LINE
-CMAKE_ADDR2LINE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_AR
-CMAKE_AR-ADVANCED:INTERNAL=1
-//This is the directory where this CMakeCache.txt was created
-CMAKE_CACHEFILE_DIR:INTERNAL=/home/justin/Thesis/topo code/SAND
-//Major version of cmake used to create the current loaded cache
-CMAKE_CACHE_MAJOR_VERSION:INTERNAL=3
-//Minor version of cmake used to create the current loaded cache
-CMAKE_CACHE_MINOR_VERSION:INTERNAL=16
-//Patch version of cmake used to create the current loaded cache
-CMAKE_CACHE_PATCH_VERSION:INTERNAL=3
-//ADVANCED property for variable: CMAKE_COLOR_MAKEFILE
-CMAKE_COLOR_MAKEFILE-ADVANCED:INTERNAL=1
-//Path to CMake executable.
-CMAKE_COMMAND:INTERNAL=/usr/bin/cmake
-//Path to cpack program executable.
-CMAKE_CPACK_COMMAND:INTERNAL=/usr/bin/cpack
-//Path to ctest program executable.
-CMAKE_CTEST_COMMAND:INTERNAL=/usr/bin/ctest
-//ADVANCED property for variable: CMAKE_CXX_COMPILER
-CMAKE_CXX_COMPILER-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_CXX_COMPILER_AR
-CMAKE_CXX_COMPILER_AR-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_CXX_COMPILER_RANLIB
-CMAKE_CXX_COMPILER_RANLIB-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_CXX_FLAGS
-CMAKE_CXX_FLAGS-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_CXX_FLAGS_DEBUG
-CMAKE_CXX_FLAGS_DEBUG-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_CXX_FLAGS_MINSIZEREL
-CMAKE_CXX_FLAGS_MINSIZEREL-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_CXX_FLAGS_RELEASE
-CMAKE_CXX_FLAGS_RELEASE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_CXX_FLAGS_RELWITHDEBINFO
-CMAKE_CXX_FLAGS_RELWITHDEBINFO-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_COMPILER
-CMAKE_C_COMPILER-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_COMPILER_AR
-CMAKE_C_COMPILER_AR-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_COMPILER_RANLIB
-CMAKE_C_COMPILER_RANLIB-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_FLAGS
-CMAKE_C_FLAGS-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_FLAGS_DEBUG
-CMAKE_C_FLAGS_DEBUG-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_FLAGS_MINSIZEREL
-CMAKE_C_FLAGS_MINSIZEREL-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_FLAGS_RELEASE
-CMAKE_C_FLAGS_RELEASE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_C_FLAGS_RELWITHDEBINFO
-CMAKE_C_FLAGS_RELWITHDEBINFO-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_DLLTOOL
-CMAKE_DLLTOOL-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_ECLIPSE_GENERATE_SOURCE_PROJECT
-CMAKE_ECLIPSE_GENERATE_SOURCE_PROJECT-ADVANCED:INTERNAL=1
-//STRINGS property for variable: CMAKE_ECLIPSE_VERSION
-CMAKE_ECLIPSE_VERSION-STRINGS:INTERNAL=3.2 (Callisto);3.3 (Europa);3.4 (Ganymede);3.5 (Galileo);3.6 (Helios);3.7 (Indigo);4.2 (Juno);4.3 (Kepler);4.4 (Luna);4.5 (Mars)
-//Executable file format
-CMAKE_EXECUTABLE_FORMAT:INTERNAL=ELF
-//ADVANCED property for variable: CMAKE_EXE_LINKER_FLAGS
-CMAKE_EXE_LINKER_FLAGS-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_EXE_LINKER_FLAGS_DEBUG
-CMAKE_EXE_LINKER_FLAGS_DEBUG-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_EXE_LINKER_FLAGS_MINSIZEREL
-CMAKE_EXE_LINKER_FLAGS_MINSIZEREL-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_EXE_LINKER_FLAGS_RELEASE
-CMAKE_EXE_LINKER_FLAGS_RELEASE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_EXE_LINKER_FLAGS_RELWITHDEBINFO
-CMAKE_EXE_LINKER_FLAGS_RELWITHDEBINFO-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_EXPORT_COMPILE_COMMANDS
-CMAKE_EXPORT_COMPILE_COMMANDS-ADVANCED:INTERNAL=1
-//Name of external makefile project generator.
-CMAKE_EXTRA_GENERATOR:INTERNAL=Eclipse CDT4
-//CXX compiler system defined macros
-CMAKE_EXTRA_GENERATOR_CXX_SYSTEM_DEFINED_MACROS:INTERNAL=__STDC__;1;__STDC_VERSION__;201710L;__STDC_UTF_16__;1;__STDC_UTF_32__;1;__STDC_HOSTED__;1;__GNUC__;9;__GNUC_MINOR__;3;__GNUC_PATCHLEVEL__;0;__VERSION__;"9.3.0";__ATOMIC_RELAXED;0;__ATOMIC_SEQ_CST;5;__ATOMIC_ACQUIRE;2;__ATOMIC_RELEASE;3;__ATOMIC_ACQ_REL;4;__ATOMIC_CONSUME;1;__pic__;2;__PIC__;2;__pie__;2;__PIE__;2;__FINITE_MATH_ONLY__;0;_LP64;1;__LP64__;1;__SIZEOF_INT__;4;__SIZEOF_LONG__;8;__SIZEOF_LONG_LONG__;8;__SIZEOF_SHORT__;2;__SIZEOF_FLOAT__;4;__SIZEOF_DOUBLE__;8;__SIZEOF_LONG_DOUBLE__;16;__SIZEOF_SIZE_T__;8;__CHAR_BIT__;8;__BIGGEST_ALIGNMENT__;16;__ORDER_LITTLE_ENDIAN__;1234;__ORDER_BIG_ENDIAN__;4321;__ORDER_PDP_ENDIAN__;3412;__BYTE_ORDER__;__ORDER_LITTLE_ENDIAN__;__FLOAT_WORD_ORDER__;__ORDER_LITTLE_ENDIAN__;__SIZEOF_POINTER__;8;__SIZE_TYPE__;long unsigned int;__PTRDIFF_TYPE__;long int;__WCHAR_TYPE__;int;__WINT_TYPE__;unsigned int;__INTMAX_TYPE__;long int;__UINTMAX_TYPE__;long unsigned int;__CHAR16_TYPE__;short unsigned int;__CHAR32_TYPE__;unsigned int;__SIG_ATOMIC_TYPE__;int;__INT8_TYPE__;signed char;__INT16_TYPE__;short int;__INT32_TYPE__;int;__INT64_TYPE__;long int;__UINT8_TYPE__;unsigned char;__UINT16_TYPE__;short unsigned int;__UINT32_TYPE__;unsigned int;__UINT64_TYPE__;long unsigned int;__INT_LEAST8_TYPE__;signed char;__INT_LEAST16_TYPE__;short int;__INT_LEAST32_TYPE__;int;__INT_LEAST64_TYPE__;long int;__UINT_LEAST8_TYPE__;unsigned char;__UINT_LEAST16_TYPE__;short unsigned int;__UINT_LEAST32_TYPE__;unsigned int;__UINT_LEAST64_TYPE__;long unsigned int;__INT_FAST8_TYPE__;signed char;__INT_FAST16_TYPE__;long int;__INT_FAST32_TYPE__;long int;__INT_FAST64_TYPE__;long int;__UINT_FAST8_TYPE__;unsigned char;__UINT_FAST16_TYPE__;long unsigned int;__UINT_FAST32_TYPE__;long unsigned int;__UINT_FAST64_TYPE__;long unsigned int;__INTPTR_TYPE__;long int;__UINTPTR_TYPE__;long unsigned 
int;__has_include(STR);__has_include__(STR);__has_include_next(STR);__has_include_next__(STR);__GXX_ABI_VERSION;1013;__SCHAR_MAX__;0x7f;__SHRT_MAX__;0x7fff;__INT_MAX__;0x7fffffff;__LONG_MAX__;0x7fffffffffffffffL;__LONG_LONG_MAX__;0x7fffffffffffffffLL;__WCHAR_MAX__;0x7fffffff;__WCHAR_MIN__;(-__WCHAR_MAX__ - 1);__WINT_MAX__;0xffffffffU;__WINT_MIN__;0U;__PTRDIFF_MAX__;0x7fffffffffffffffL;__SIZE_MAX__;0xffffffffffffffffUL;__SCHAR_WIDTH__;8;__SHRT_WIDTH__;16;__INT_WIDTH__;32;__LONG_WIDTH__;64;__LONG_LONG_WIDTH__;64;__WCHAR_WIDTH__;32;__WINT_WIDTH__;32;__PTRDIFF_WIDTH__;64;__SIZE_WIDTH__;64;__INTMAX_MAX__;0x7fffffffffffffffL;__INTMAX_C(c);c ## L;__UINTMAX_MAX__;0xffffffffffffffffUL;__UINTMAX_C(c);c ## UL;__INTMAX_WIDTH__;64;__SIG_ATOMIC_MAX__;0x7fffffff;__SIG_ATOMIC_MIN__;(-__SIG_ATOMIC_MAX__ - 1);__SIG_ATOMIC_WIDTH__;32;__INT8_MAX__;0x7f;__INT16_MAX__;0x7fff;__INT32_MAX__;0x7fffffff;__INT64_MAX__;0x7fffffffffffffffL;__UINT8_MAX__;0xff;__UINT16_MAX__;0xffff;__UINT32_MAX__;0xffffffffU;__UINT64_MAX__;0xffffffffffffffffUL;__INT_LEAST8_MAX__;0x7f;__INT8_C(c);c;__INT_LEAST8_WIDTH__;8;__INT_LEAST16_MAX__;0x7fff;__INT16_C(c);c;__INT_LEAST16_WIDTH__;16;__INT_LEAST32_MAX__;0x7fffffff;__INT32_C(c);c;__INT_LEAST32_WIDTH__;32;__INT_LEAST64_MAX__;0x7fffffffffffffffL;__INT64_C(c);c ## L;__INT_LEAST64_WIDTH__;64;__UINT_LEAST8_MAX__;0xff;__UINT8_C(c);c;__UINT_LEAST16_MAX__;0xffff;__UINT16_C(c);c;__UINT_LEAST32_MAX__;0xffffffffU;__UINT32_C(c);c ## U;__UINT_LEAST64_MAX__;0xffffffffffffffffUL;__UINT64_C(c);c ## 
UL;__INT_FAST8_MAX__;0x7f;__INT_FAST8_WIDTH__;8;__INT_FAST16_MAX__;0x7fffffffffffffffL;__INT_FAST16_WIDTH__;64;__INT_FAST32_MAX__;0x7fffffffffffffffL;__INT_FAST32_WIDTH__;64;__INT_FAST64_MAX__;0x7fffffffffffffffL;__INT_FAST64_WIDTH__;64;__UINT_FAST8_MAX__;0xff;__UINT_FAST16_MAX__;0xffffffffffffffffUL;__UINT_FAST32_MAX__;0xffffffffffffffffUL;__UINT_FAST64_MAX__;0xffffffffffffffffUL;__INTPTR_MAX__;0x7fffffffffffffffL;__INTPTR_WIDTH__;64;__UINTPTR_MAX__;0xffffffffffffffffUL;__GCC_IEC_559;2;__GCC_IEC_559_COMPLEX;2;__FLT_EVAL_METHOD__;0;__FLT_EVAL_METHOD_TS_18661_3__;0;__DEC_EVAL_METHOD__;2;__FLT_RADIX__;2;__FLT_MANT_DIG__;24;__FLT_DIG__;6;__FLT_MIN_EXP__;(-125);__FLT_MIN_10_EXP__;(-37);__FLT_MAX_EXP__;128;__FLT_MAX_10_EXP__;38;__FLT_DECIMAL_DIG__;9;__FLT_MAX__;3.40282346638528859811704183484516925e+38F;__FLT_MIN__;1.17549435082228750796873653722224568e-38F;__FLT_EPSILON__;1.19209289550781250000000000000000000e-7F;__FLT_DENORM_MIN__;1.40129846432481707092372958328991613e-45F;__FLT_HAS_DENORM__;1;__FLT_HAS_INFINITY__;1;__FLT_HAS_QUIET_NAN__;1;__DBL_MANT_DIG__;53;__DBL_DIG__;15;__DBL_MIN_EXP__;(-1021);__DBL_MIN_10_EXP__;(-307);__DBL_MAX_EXP__;1024;__DBL_MAX_10_EXP__;308;__DBL_DECIMAL_DIG__;17;__DBL_MAX__;((double)1.79769313486231570814527423731704357e+308L);__DBL_MIN__;((double)2.22507385850720138309023271733240406e-308L);__DBL_EPSILON__;((double)2.22044604925031308084726333618164062e-16L);__DBL_DENORM_MIN__;((double)4.94065645841246544176568792868221372e-324L);__DBL_HAS_DENORM__;1;__DBL_HAS_INFINITY__;1;__DBL_HAS_QUIET_NAN__;1;__LDBL_MANT_DIG__;64;__LDBL_DIG__;18;__LDBL_MIN_EXP__;(-16381);__LDBL_MIN_10_EXP__;(-4931);__LDBL_MAX_EXP__;16384;__LDBL_MAX_10_EXP__;4932;__DECIMAL_DIG__;21;__LDBL_DECIMAL_DIG__;21;__LDBL_MAX__;1.18973149535723176502126385303097021e+4932L;__LDBL_MIN__;3.36210314311209350626267781732175260e-4932L;__LDBL_EPSILON__;1.08420217248550443400745280086994171e-19L;__LDBL_DENORM_MIN__;3.64519953188247460252840593361941982e-4951L;__LDBL_HAS_DENORM__;1;__LDBL_H
AS_INFINITY__;1;__LDBL_HAS_QUIET_NAN__;1;__FLT32_MANT_DIG__;24;__FLT32_DIG__;6;__FLT32_MIN_EXP__;(-125);__FLT32_MIN_10_EXP__;(-37);__FLT32_MAX_EXP__;128;__FLT32_MAX_10_EXP__;38;__FLT32_DECIMAL_DIG__;9;__FLT32_MAX__;3.40282346638528859811704183484516925e+38F32;__FLT32_MIN__;1.17549435082228750796873653722224568e-38F32;__FLT32_EPSILON__;1.19209289550781250000000000000000000e-7F32;__FLT32_DENORM_MIN__;1.40129846432481707092372958328991613e-45F32;__FLT32_HAS_DENORM__;1;__FLT32_HAS_INFINITY__;1;__FLT32_HAS_QUIET_NAN__;1;__FLT64_MANT_DIG__;53;__FLT64_DIG__;15;__FLT64_MIN_EXP__;(-1021);__FLT64_MIN_10_EXP__;(-307);__FLT64_MAX_EXP__;1024;__FLT64_MAX_10_EXP__;308;__FLT64_DECIMAL_DIG__;17;__FLT64_MAX__;1.79769313486231570814527423731704357e+308F64;__FLT64_MIN__;2.22507385850720138309023271733240406e-308F64;__FLT64_EPSILON__;2.22044604925031308084726333618164062e-16F64;__FLT64_DENORM_MIN__;4.94065645841246544176568792868221372e-324F64;__FLT64_HAS_DENORM__;1;__FLT64_HAS_INFINITY__;1;__FLT64_HAS_QUIET_NAN__;1;__FLT128_MANT_DIG__;113;__FLT128_DIG__;33;__FLT128_MIN_EXP__;(-16381);__FLT128_MIN_10_EXP__;(-4931);__FLT128_MAX_EXP__;16384;__FLT128_MAX_10_EXP__;4932;__FLT128_DECIMAL_DIG__;36;__FLT128_MAX__;1.18973149535723176508575932662800702e+4932F128;__FLT128_MIN__;3.36210314311209350626267781732175260e-4932F128;__FLT128_EPSILON__;1.92592994438723585305597794258492732e-34F128;__FLT128_DENORM_MIN__;6.47517511943802511092443895822764655e-4966F128;__FLT128_HAS_DENORM__;1;__FLT128_HAS_INFINITY__;1;__FLT128_HAS_QUIET_NAN__;1;__FLT32X_MANT_DIG__;53;__FLT32X_DIG__;15;__FLT32X_MIN_EXP__;(-1021);__FLT32X_MIN_10_EXP__;(-307);__FLT32X_MAX_EXP__;1024;__FLT32X_MAX_10_EXP__;308;__FLT32X_DECIMAL_DIG__;17;__FLT32X_MAX__;1.79769313486231570814527423731704357e+308F32x;__FLT32X_MIN__;2.22507385850720138309023271733240406e-308F32x;__FLT32X_EPSILON__;2.22044604925031308084726333618164062e-16F32x;__FLT32X_DENORM_MIN__;4.94065645841246544176568792868221372e-324F32x;__FLT32X_HAS_DENORM__;1;__FLT32X_HAS_INFIN
ITY__;1;__FLT32X_HAS_QUIET_NAN__;1;__FLT64X_MANT_DIG__;64;__FLT64X_DIG__;18;__FLT64X_MIN_EXP__;(-16381);__FLT64X_MIN_10_EXP__;(-4931);__FLT64X_MAX_EXP__;16384;__FLT64X_MAX_10_EXP__;4932;__FLT64X_DECIMAL_DIG__;21;__FLT64X_MAX__;1.18973149535723176502126385303097021e+4932F64x;__FLT64X_MIN__;3.36210314311209350626267781732175260e-4932F64x;__FLT64X_EPSILON__;1.08420217248550443400745280086994171e-19F64x;__FLT64X_DENORM_MIN__;3.64519953188247460252840593361941982e-4951F64x;__FLT64X_HAS_DENORM__;1;__FLT64X_HAS_INFINITY__;1;__FLT64X_HAS_QUIET_NAN__;1;__DEC32_MANT_DIG__;7;__DEC32_MIN_EXP__;(-94);__DEC32_MAX_EXP__;97;__DEC32_MIN__;1E-95DF;__DEC32_MAX__;9.999999E96DF;__DEC32_EPSILON__;1E-6DF;__DEC32_SUBNORMAL_MIN__;0.000001E-95DF;__DEC64_MANT_DIG__;16;__DEC64_MIN_EXP__;(-382);__DEC64_MAX_EXP__;385;__DEC64_MIN__;1E-383DD;__DEC64_MAX__;9.999999999999999E384DD;__DEC64_EPSILON__;1E-15DD;__DEC64_SUBNORMAL_MIN__;0.000000000000001E-383DD;__DEC128_MANT_DIG__;34;__DEC128_MIN_EXP__;(-6142);__DEC128_MAX_EXP__;6145;__DEC128_MIN__;1E-6143DL;__DEC128_MAX__;9.999999999999999999999999999999999E6144DL;__DEC128_EPSILON__;1E-33DL;__DEC128_SUBNORMAL_MIN__;0.000000000000000000000000000000001E-6143DL;__REGISTER_PREFIX__; ;__USER_LABEL_PREFIX__; 
;__GNUC_STDC_INLINE__;1;__NO_INLINE__;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_1;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_2;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_4;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_8;1;__GCC_ATOMIC_BOOL_LOCK_FREE;2;__GCC_ATOMIC_CHAR_LOCK_FREE;2;__GCC_ATOMIC_CHAR16_T_LOCK_FREE;2;__GCC_ATOMIC_CHAR32_T_LOCK_FREE;2;__GCC_ATOMIC_WCHAR_T_LOCK_FREE;2;__GCC_ATOMIC_SHORT_LOCK_FREE;2;__GCC_ATOMIC_INT_LOCK_FREE;2;__GCC_ATOMIC_LONG_LOCK_FREE;2;__GCC_ATOMIC_LLONG_LOCK_FREE;2;__GCC_ATOMIC_TEST_AND_SET_TRUEVAL;1;__GCC_ATOMIC_POINTER_LOCK_FREE;2;__HAVE_SPECULATION_SAFE_VALUE;1;__GCC_HAVE_DWARF2_CFI_ASM;1;__PRAGMA_REDEFINE_EXTNAME;1;__SSP_STRONG__;3;__SIZEOF_INT128__;16;__SIZEOF_WCHAR_T__;4;__SIZEOF_WINT_T__;4;__SIZEOF_PTRDIFF_T__;8;__amd64;1;__amd64__;1;__x86_64;1;__x86_64__;1;__SIZEOF_FLOAT80__;16;__SIZEOF_FLOAT128__;16;__ATOMIC_HLE_ACQUIRE;65536;__ATOMIC_HLE_RELEASE;131072;__GCC_ASM_FLAG_OUTPUTS__;1;__k8;1;__k8__;1;__code_model_small__;1;__MMX__;1;__SSE__;1;__SSE2__;1;__FXSR__;1;__SSE_MATH__;1;__SSE2_MATH__;1;__SEG_FS;1;__SEG_GS;1;__CET__;3;__gnu_linux__;1;__linux;1;__linux__;1;linux;1;__unix;1;__unix__;1;unix;1;__ELF__;1;__DECIMAL_BID_FORMAT__;1;_STDC_PREDEF_H;1;__STDC_IEC_559__;1;__STDC_IEC_559_COMPLEX__;1;__STDC_ISO_10646__;201706L;__STDC__;1;__cplusplus;201402L;__STDC_UTF_16__;1;__STDC_UTF_32__;1;__STDC_HOSTED__;1;__GNUC__;9;__GNUC_MINOR__;3;__GNUC_PATCHLEVEL__;0;__VERSION__;"9.3.0";__ATOMIC_RELAXED;0;__ATOMIC_SEQ_CST;5;__ATOMIC_ACQUIRE;2;__ATOMIC_RELEASE;3;__ATOMIC_ACQ_REL;4;__ATOMIC_CONSUME;1;__pic__;2;__PIC__;2;__pie__;2;__PIE__;2;__FINITE_MATH_ONLY__;0;_LP64;1;__LP64__;1;__SIZEOF_INT__;4;__SIZEOF_LONG__;8;__SIZEOF_LONG_LONG__;8;__SIZEOF_SHORT__;2;__SIZEOF_FLOAT__;4;__SIZEOF_DOUBLE__;8;__SIZEOF_LONG_DOUBLE__;16;__SIZEOF_SIZE_T__;8;__CHAR_BIT__;8;__BIGGEST_ALIGNMENT__;16;__ORDER_LITTLE_ENDIAN__;1234;__ORDER_BIG_ENDIAN__;4321;__ORDER_PDP_ENDIAN__;3412;__BYTE_ORDER__;__ORDER_LITTLE_ENDIAN__;__FLOAT_WORD_ORDER__;__ORDER_LITTLE_ENDIAN__;__SIZEOF_POINTER__;8;__GNUG__;9;__SIZE
_TYPE__;long unsigned int;__PTRDIFF_TYPE__;long int;__WCHAR_TYPE__;int;__WINT_TYPE__;unsigned int;__INTMAX_TYPE__;long int;__UINTMAX_TYPE__;long unsigned int;__CHAR16_TYPE__;short unsigned int;__CHAR32_TYPE__;unsigned int;__SIG_ATOMIC_TYPE__;int;__INT8_TYPE__;signed char;__INT16_TYPE__;short int;__INT32_TYPE__;int;__INT64_TYPE__;long int;__UINT8_TYPE__;unsigned char;__UINT16_TYPE__;short unsigned int;__UINT32_TYPE__;unsigned int;__UINT64_TYPE__;long unsigned int;__INT_LEAST8_TYPE__;signed char;__INT_LEAST16_TYPE__;short int;__INT_LEAST32_TYPE__;int;__INT_LEAST64_TYPE__;long int;__UINT_LEAST8_TYPE__;unsigned char;__UINT_LEAST16_TYPE__;short unsigned int;__UINT_LEAST32_TYPE__;unsigned int;__UINT_LEAST64_TYPE__;long unsigned int;__INT_FAST8_TYPE__;signed char;__INT_FAST16_TYPE__;long int;__INT_FAST32_TYPE__;long int;__INT_FAST64_TYPE__;long int;__UINT_FAST8_TYPE__;unsigned char;__UINT_FAST16_TYPE__;long unsigned int;__UINT_FAST32_TYPE__;long unsigned int;__UINT_FAST64_TYPE__;long unsigned int;__INTPTR_TYPE__;long int;__UINTPTR_TYPE__;long unsigned 
int;__has_include(STR);__has_include__(STR);__has_include_next(STR);__has_include_next__(STR);__GXX_WEAK__;1;__DEPRECATED;1;__GXX_RTTI;1;__cpp_rtti;199711;__GXX_EXPERIMENTAL_CXX0X__;1;__cpp_binary_literals;201304;__cpp_hex_float;201603;__cpp_runtime_arrays;198712;__cpp_unicode_characters;200704;__cpp_raw_strings;200710;__cpp_unicode_literals;200710;__cpp_user_defined_literals;200809;__cpp_lambdas;200907;__cpp_range_based_for;200907;__cpp_static_assert;200410;__cpp_decltype;200707;__cpp_attributes;200809;__cpp_rvalue_reference;200610;__cpp_rvalue_references;200610;__cpp_variadic_templates;200704;__cpp_initializer_lists;200806;__cpp_delegating_constructors;200604;__cpp_nsdmi;200809;__cpp_inheriting_constructors;201511;__cpp_ref_qualifiers;200710;__cpp_alias_templates;200704;__cpp_return_type_deduction;201304;__cpp_init_captures;201304;__cpp_generic_lambdas;201304;__cpp_constexpr;201304;__cpp_decltype_auto;201304;__cpp_aggregate_nsdmi;201304;__cpp_variable_templates;201304;__cpp_digit_separators;201309;__cpp_sized_deallocation;201309;__cpp_threadsafe_static_init;200806;__EXCEPTIONS;1;__cpp_exceptions;199711;__GXX_ABI_VERSION;1013;__SCHAR_MAX__;0x7f;__SHRT_MAX__;0x7fff;__INT_MAX__;0x7fffffff;__LONG_MAX__;0x7fffffffffffffffL;__LONG_LONG_MAX__;0x7fffffffffffffffLL;__WCHAR_MAX__;0x7fffffff;__WCHAR_MIN__;(-__WCHAR_MAX__ - 1);__WINT_MAX__;0xffffffffU;__WINT_MIN__;0U;__PTRDIFF_MAX__;0x7fffffffffffffffL;__SIZE_MAX__;0xffffffffffffffffUL;__SCHAR_WIDTH__;8;__SHRT_WIDTH__;16;__INT_WIDTH__;32;__LONG_WIDTH__;64;__LONG_LONG_WIDTH__;64;__WCHAR_WIDTH__;32;__WINT_WIDTH__;32;__PTRDIFF_WIDTH__;64;__SIZE_WIDTH__;64;__GLIBCXX_TYPE_INT_N_0;__int128;__GLIBCXX_BITSIZE_INT_N_0;128;__INTMAX_MAX__;0x7fffffffffffffffL;__INTMAX_C(c);c ## L;__UINTMAX_MAX__;0xffffffffffffffffUL;__UINTMAX_C(c);c ## UL;__INTMAX_WIDTH__;64;__SIG_ATOMIC_MAX__;0x7fffffff;__SIG_ATOMIC_MIN__;(-__SIG_ATOMIC_MAX__ - 
1);__SIG_ATOMIC_WIDTH__;32;__INT8_MAX__;0x7f;__INT16_MAX__;0x7fff;__INT32_MAX__;0x7fffffff;__INT64_MAX__;0x7fffffffffffffffL;__UINT8_MAX__;0xff;__UINT16_MAX__;0xffff;__UINT32_MAX__;0xffffffffU;__UINT64_MAX__;0xffffffffffffffffUL;__INT_LEAST8_MAX__;0x7f;__INT8_C(c);c;__INT_LEAST8_WIDTH__;8;__INT_LEAST16_MAX__;0x7fff;__INT16_C(c);c;__INT_LEAST16_WIDTH__;16;__INT_LEAST32_MAX__;0x7fffffff;__INT32_C(c);c;__INT_LEAST32_WIDTH__;32;__INT_LEAST64_MAX__;0x7fffffffffffffffL;__INT64_C(c);c ## L;__INT_LEAST64_WIDTH__;64;__UINT_LEAST8_MAX__;0xff;__UINT8_C(c);c;__UINT_LEAST16_MAX__;0xffff;__UINT16_C(c);c;__UINT_LEAST32_MAX__;0xffffffffU;__UINT32_C(c);c ## U;__UINT_LEAST64_MAX__;0xffffffffffffffffUL;__UINT64_C(c);c ## UL;__INT_FAST8_MAX__;0x7f;__INT_FAST8_WIDTH__;8;__INT_FAST16_MAX__;0x7fffffffffffffffL;__INT_FAST16_WIDTH__;64;__INT_FAST32_MAX__;0x7fffffffffffffffL;__INT_FAST32_WIDTH__;64;__INT_FAST64_MAX__;0x7fffffffffffffffL;__INT_FAST64_WIDTH__;64;__UINT_FAST8_MAX__;0xff;__UINT_FAST16_MAX__;0xffffffffffffffffUL;__UINT_FAST32_MAX__;0xffffffffffffffffUL;__UINT_FAST64_MAX__;0xffffffffffffffffUL;__INTPTR_MAX__;0x7fffffffffffffffL;__INTPTR_WIDTH__;64;__UINTPTR_MAX__;0xffffffffffffffffUL;__GCC_IEC_559;2;__GCC_IEC_559_COMPLEX;2;__FLT_EVAL_METHOD__;0;__FLT_EVAL_METHOD_TS_18661_3__;0;__DEC_EVAL_METHOD__;2;__FLT_RADIX__;2;__FLT_MANT_DIG__;24;__FLT_DIG__;6;__FLT_MIN_EXP__;(-125);__FLT_MIN_10_EXP__;(-37);__FLT_MAX_EXP__;128;__FLT_MAX_10_EXP__;38;__FLT_DECIMAL_DIG__;9;__FLT_MAX__;3.40282346638528859811704183484516925e+38F;__FLT_MIN__;1.17549435082228750796873653722224568e-38F;__FLT_EPSILON__;1.19209289550781250000000000000000000e-7F;__FLT_DENORM_MIN__;1.40129846432481707092372958328991613e-45F;__FLT_HAS_DENORM__;1;__FLT_HAS_INFINITY__;1;__FLT_HAS_QUIET_NAN__;1;__DBL_MANT_DIG__;53;__DBL_DIG__;15;__DBL_MIN_EXP__;(-1021);__DBL_MIN_10_EXP__;(-307);__DBL_MAX_EXP__;1024;__DBL_MAX_10_EXP__;308;__DBL_DECIMAL_DIG__;17;__DBL_MAX__;double(1.79769313486231570814527423731704357e+308L);__DBL_MIN__;double(
2.22507385850720138309023271733240406e-308L);__DBL_EPSILON__;double(2.22044604925031308084726333618164062e-16L);__DBL_DENORM_MIN__;double(4.94065645841246544176568792868221372e-324L);__DBL_HAS_DENORM__;1;__DBL_HAS_INFINITY__;1;__DBL_HAS_QUIET_NAN__;1;__LDBL_MANT_DIG__;64;__LDBL_DIG__;18;__LDBL_MIN_EXP__;(-16381);__LDBL_MIN_10_EXP__;(-4931);__LDBL_MAX_EXP__;16384;__LDBL_MAX_10_EXP__;4932;__DECIMAL_DIG__;21;__LDBL_DECIMAL_DIG__;21;__LDBL_MAX__;1.18973149535723176502126385303097021e+4932L;__LDBL_MIN__;3.36210314311209350626267781732175260e-4932L;__LDBL_EPSILON__;1.08420217248550443400745280086994171e-19L;__LDBL_DENORM_MIN__;3.64519953188247460252840593361941982e-4951L;__LDBL_HAS_DENORM__;1;__LDBL_HAS_INFINITY__;1;__LDBL_HAS_QUIET_NAN__;1;__FLT32_MANT_DIG__;24;__FLT32_DIG__;6;__FLT32_MIN_EXP__;(-125);__FLT32_MIN_10_EXP__;(-37);__FLT32_MAX_EXP__;128;__FLT32_MAX_10_EXP__;38;__FLT32_DECIMAL_DIG__;9;__FLT32_MAX__;3.40282346638528859811704183484516925e+38F32;__FLT32_MIN__;1.17549435082228750796873653722224568e-38F32;__FLT32_EPSILON__;1.19209289550781250000000000000000000e-7F32;__FLT32_DENORM_MIN__;1.40129846432481707092372958328991613e-45F32;__FLT32_HAS_DENORM__;1;__FLT32_HAS_INFINITY__;1;__FLT32_HAS_QUIET_NAN__;1;__FLT64_MANT_DIG__;53;__FLT64_DIG__;15;__FLT64_MIN_EXP__;(-1021);__FLT64_MIN_10_EXP__;(-307);__FLT64_MAX_EXP__;1024;__FLT64_MAX_10_EXP__;308;__FLT64_DECIMAL_DIG__;17;__FLT64_MAX__;1.79769313486231570814527423731704357e+308F64;__FLT64_MIN__;2.22507385850720138309023271733240406e-308F64;__FLT64_EPSILON__;2.22044604925031308084726333618164062e-16F64;__FLT64_DENORM_MIN__;4.94065645841246544176568792868221372e-324F64;__FLT64_HAS_DENORM__;1;__FLT64_HAS_INFINITY__;1;__FLT64_HAS_QUIET_NAN__;1;__FLT128_MANT_DIG__;113;__FLT128_DIG__;33;__FLT128_MIN_EXP__;(-16381);__FLT128_MIN_10_EXP__;(-4931);__FLT128_MAX_EXP__;16384;__FLT128_MAX_10_EXP__;4932;__FLT128_DECIMAL_DIG__;36;__FLT128_MAX__;1.18973149535723176508575932662800702e+4932F128;__FLT128_MIN__;3.362103143112093506262677817
32175260e-4932F128;__FLT128_EPSILON__;1.92592994438723585305597794258492732e-34F128;__FLT128_DENORM_MIN__;6.47517511943802511092443895822764655e-4966F128;__FLT128_HAS_DENORM__;1;__FLT128_HAS_INFINITY__;1;__FLT128_HAS_QUIET_NAN__;1;__FLT32X_MANT_DIG__;53;__FLT32X_DIG__;15;__FLT32X_MIN_EXP__;(-1021);__FLT32X_MIN_10_EXP__;(-307);__FLT32X_MAX_EXP__;1024;__FLT32X_MAX_10_EXP__;308;__FLT32X_DECIMAL_DIG__;17;__FLT32X_MAX__;1.79769313486231570814527423731704357e+308F32x;__FLT32X_MIN__;2.22507385850720138309023271733240406e-308F32x;__FLT32X_EPSILON__;2.22044604925031308084726333618164062e-16F32x;__FLT32X_DENORM_MIN__;4.94065645841246544176568792868221372e-324F32x;__FLT32X_HAS_DENORM__;1;__FLT32X_HAS_INFINITY__;1;__FLT32X_HAS_QUIET_NAN__;1;__FLT64X_MANT_DIG__;64;__FLT64X_DIG__;18;__FLT64X_MIN_EXP__;(-16381);__FLT64X_MIN_10_EXP__;(-4931);__FLT64X_MAX_EXP__;16384;__FLT64X_MAX_10_EXP__;4932;__FLT64X_DECIMAL_DIG__;21;__FLT64X_MAX__;1.18973149535723176502126385303097021e+4932F64x;__FLT64X_MIN__;3.36210314311209350626267781732175260e-4932F64x;__FLT64X_EPSILON__;1.08420217248550443400745280086994171e-19F64x;__FLT64X_DENORM_MIN__;3.64519953188247460252840593361941982e-4951F64x;__FLT64X_HAS_DENORM__;1;__FLT64X_HAS_INFINITY__;1;__FLT64X_HAS_QUIET_NAN__;1;__DEC32_MANT_DIG__;7;__DEC32_MIN_EXP__;(-94);__DEC32_MAX_EXP__;97;__DEC32_MIN__;1E-95DF;__DEC32_MAX__;9.999999E96DF;__DEC32_EPSILON__;1E-6DF;__DEC32_SUBNORMAL_MIN__;0.000001E-95DF;__DEC64_MANT_DIG__;16;__DEC64_MIN_EXP__;(-382);__DEC64_MAX_EXP__;385;__DEC64_MIN__;1E-383DD;__DEC64_MAX__;9.999999999999999E384DD;__DEC64_EPSILON__;1E-15DD;__DEC64_SUBNORMAL_MIN__;0.000000000000001E-383DD;__DEC128_MANT_DIG__;34;__DEC128_MIN_EXP__;(-6142);__DEC128_MAX_EXP__;6145;__DEC128_MIN__;1E-6143DL;__DEC128_MAX__;9.999999999999999999999999999999999E6144DL;__DEC128_EPSILON__;1E-33DL;__DEC128_SUBNORMAL_MIN__;0.000000000000000000000000000000001E-6143DL;__REGISTER_PREFIX__; ;__USER_LABEL_PREFIX__; 
;__GNUC_STDC_INLINE__;1;__NO_INLINE__;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_1;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_2;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_4;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_8;1;__GCC_ATOMIC_BOOL_LOCK_FREE;2;__GCC_ATOMIC_CHAR_LOCK_FREE;2;__GCC_ATOMIC_CHAR16_T_LOCK_FREE;2;__GCC_ATOMIC_CHAR32_T_LOCK_FREE;2;__GCC_ATOMIC_WCHAR_T_LOCK_FREE;2;__GCC_ATOMIC_SHORT_LOCK_FREE;2;__GCC_ATOMIC_INT_LOCK_FREE;2;__GCC_ATOMIC_LONG_LOCK_FREE;2;__GCC_ATOMIC_LLONG_LOCK_FREE;2;__GCC_ATOMIC_TEST_AND_SET_TRUEVAL;1;__GCC_ATOMIC_POINTER_LOCK_FREE;2;__HAVE_SPECULATION_SAFE_VALUE;1;__GCC_HAVE_DWARF2_CFI_ASM;1;__PRAGMA_REDEFINE_EXTNAME;1;__SSP_STRONG__;3;__SIZEOF_INT128__;16;__SIZEOF_WCHAR_T__;4;__SIZEOF_WINT_T__;4;__SIZEOF_PTRDIFF_T__;8;__amd64;1;__amd64__;1;__x86_64;1;__x86_64__;1;__SIZEOF_FLOAT80__;16;__SIZEOF_FLOAT128__;16;__ATOMIC_HLE_ACQUIRE;65536;__ATOMIC_HLE_RELEASE;131072;__GCC_ASM_FLAG_OUTPUTS__;1;__k8;1;__k8__;1;__code_model_small__;1;__MMX__;1;__SSE__;1;__SSE2__;1;__FXSR__;1;__SSE_MATH__;1;__SSE2_MATH__;1;__SEG_FS;1;__SEG_GS;1;__CET__;3;__gnu_linux__;1;__linux;1;__linux__;1;linux;1;__unix;1;__unix__;1;unix;1;__ELF__;1;__DECIMAL_BID_FORMAT__;1;_GNU_SOURCE;1;_STDC_PREDEF_H;1;__STDC_IEC_559__;1;__STDC_IEC_559_COMPLEX__;1;__STDC_ISO_10646__;201706L
-//CXX compiler system include directories
-CMAKE_EXTRA_GENERATOR_CXX_SYSTEM_INCLUDE_DIRS:INTERNAL=/usr/local/cgns/4.1.1_gcc-8.3.0/include;/usr/local/hdf5/1.10.6_gcc-8.3.0/include;/usr/local/szip/2.1.1/include;/usr/include/c++/9;/usr/include/x86_64-linux-gnu/c++/9;/usr/include/c++/9/backward;/usr/lib/gcc/x86_64-linux-gnu/9/include;/usr/local/include;/usr/include/x86_64-linux-gnu;/usr/include
-//C compiler system defined macros
-CMAKE_EXTRA_GENERATOR_C_SYSTEM_DEFINED_MACROS:INTERNAL=__STDC__;1;__STDC_VERSION__;201710L;__STDC_UTF_16__;1;__STDC_UTF_32__;1;__STDC_HOSTED__;1;__GNUC__;9;__GNUC_MINOR__;3;__GNUC_PATCHLEVEL__;0;__VERSION__;"9.3.0";__ATOMIC_RELAXED;0;__ATOMIC_SEQ_CST;5;__ATOMIC_ACQUIRE;2;__ATOMIC_RELEASE;3;__ATOMIC_ACQ_REL;4;__ATOMIC_CONSUME;1;__pic__;2;__PIC__;2;__pie__;2;__PIE__;2;__FINITE_MATH_ONLY__;0;_LP64;1;__LP64__;1;__SIZEOF_INT__;4;__SIZEOF_LONG__;8;__SIZEOF_LONG_LONG__;8;__SIZEOF_SHORT__;2;__SIZEOF_FLOAT__;4;__SIZEOF_DOUBLE__;8;__SIZEOF_LONG_DOUBLE__;16;__SIZEOF_SIZE_T__;8;__CHAR_BIT__;8;__BIGGEST_ALIGNMENT__;16;__ORDER_LITTLE_ENDIAN__;1234;__ORDER_BIG_ENDIAN__;4321;__ORDER_PDP_ENDIAN__;3412;__BYTE_ORDER__;__ORDER_LITTLE_ENDIAN__;__FLOAT_WORD_ORDER__;__ORDER_LITTLE_ENDIAN__;__SIZEOF_POINTER__;8;__SIZE_TYPE__;long unsigned int;__PTRDIFF_TYPE__;long int;__WCHAR_TYPE__;int;__WINT_TYPE__;unsigned int;__INTMAX_TYPE__;long int;__UINTMAX_TYPE__;long unsigned int;__CHAR16_TYPE__;short unsigned int;__CHAR32_TYPE__;unsigned int;__SIG_ATOMIC_TYPE__;int;__INT8_TYPE__;signed char;__INT16_TYPE__;short int;__INT32_TYPE__;int;__INT64_TYPE__;long int;__UINT8_TYPE__;unsigned char;__UINT16_TYPE__;short unsigned int;__UINT32_TYPE__;unsigned int;__UINT64_TYPE__;long unsigned int;__INT_LEAST8_TYPE__;signed char;__INT_LEAST16_TYPE__;short int;__INT_LEAST32_TYPE__;int;__INT_LEAST64_TYPE__;long int;__UINT_LEAST8_TYPE__;unsigned char;__UINT_LEAST16_TYPE__;short unsigned int;__UINT_LEAST32_TYPE__;unsigned int;__UINT_LEAST64_TYPE__;long unsigned int;__INT_FAST8_TYPE__;signed char;__INT_FAST16_TYPE__;long int;__INT_FAST32_TYPE__;long int;__INT_FAST64_TYPE__;long int;__UINT_FAST8_TYPE__;unsigned char;__UINT_FAST16_TYPE__;long unsigned int;__UINT_FAST32_TYPE__;long unsigned int;__UINT_FAST64_TYPE__;long unsigned int;__INTPTR_TYPE__;long int;__UINTPTR_TYPE__;long unsigned 
int;__has_include(STR);__has_include__(STR);__has_include_next(STR);__has_include_next__(STR);__GXX_ABI_VERSION;1013;__SCHAR_MAX__;0x7f;__SHRT_MAX__;0x7fff;__INT_MAX__;0x7fffffff;__LONG_MAX__;0x7fffffffffffffffL;__LONG_LONG_MAX__;0x7fffffffffffffffLL;__WCHAR_MAX__;0x7fffffff;__WCHAR_MIN__;(-__WCHAR_MAX__ - 1);__WINT_MAX__;0xffffffffU;__WINT_MIN__;0U;__PTRDIFF_MAX__;0x7fffffffffffffffL;__SIZE_MAX__;0xffffffffffffffffUL;__SCHAR_WIDTH__;8;__SHRT_WIDTH__;16;__INT_WIDTH__;32;__LONG_WIDTH__;64;__LONG_LONG_WIDTH__;64;__WCHAR_WIDTH__;32;__WINT_WIDTH__;32;__PTRDIFF_WIDTH__;64;__SIZE_WIDTH__;64;__INTMAX_MAX__;0x7fffffffffffffffL;__INTMAX_C(c);c ## L;__UINTMAX_MAX__;0xffffffffffffffffUL;__UINTMAX_C(c);c ## UL;__INTMAX_WIDTH__;64;__SIG_ATOMIC_MAX__;0x7fffffff;__SIG_ATOMIC_MIN__;(-__SIG_ATOMIC_MAX__ - 1);__SIG_ATOMIC_WIDTH__;32;__INT8_MAX__;0x7f;__INT16_MAX__;0x7fff;__INT32_MAX__;0x7fffffff;__INT64_MAX__;0x7fffffffffffffffL;__UINT8_MAX__;0xff;__UINT16_MAX__;0xffff;__UINT32_MAX__;0xffffffffU;__UINT64_MAX__;0xffffffffffffffffUL;__INT_LEAST8_MAX__;0x7f;__INT8_C(c);c;__INT_LEAST8_WIDTH__;8;__INT_LEAST16_MAX__;0x7fff;__INT16_C(c);c;__INT_LEAST16_WIDTH__;16;__INT_LEAST32_MAX__;0x7fffffff;__INT32_C(c);c;__INT_LEAST32_WIDTH__;32;__INT_LEAST64_MAX__;0x7fffffffffffffffL;__INT64_C(c);c ## L;__INT_LEAST64_WIDTH__;64;__UINT_LEAST8_MAX__;0xff;__UINT8_C(c);c;__UINT_LEAST16_MAX__;0xffff;__UINT16_C(c);c;__UINT_LEAST32_MAX__;0xffffffffU;__UINT32_C(c);c ## U;__UINT_LEAST64_MAX__;0xffffffffffffffffUL;__UINT64_C(c);c ## 
UL;__INT_FAST8_MAX__;0x7f;__INT_FAST8_WIDTH__;8;__INT_FAST16_MAX__;0x7fffffffffffffffL;__INT_FAST16_WIDTH__;64;__INT_FAST32_MAX__;0x7fffffffffffffffL;__INT_FAST32_WIDTH__;64;__INT_FAST64_MAX__;0x7fffffffffffffffL;__INT_FAST64_WIDTH__;64;__UINT_FAST8_MAX__;0xff;__UINT_FAST16_MAX__;0xffffffffffffffffUL;__UINT_FAST32_MAX__;0xffffffffffffffffUL;__UINT_FAST64_MAX__;0xffffffffffffffffUL;__INTPTR_MAX__;0x7fffffffffffffffL;__INTPTR_WIDTH__;64;__UINTPTR_MAX__;0xffffffffffffffffUL;__GCC_IEC_559;2;__GCC_IEC_559_COMPLEX;2;__FLT_EVAL_METHOD__;0;__FLT_EVAL_METHOD_TS_18661_3__;0;__DEC_EVAL_METHOD__;2;__FLT_RADIX__;2;__FLT_MANT_DIG__;24;__FLT_DIG__;6;__FLT_MIN_EXP__;(-125);__FLT_MIN_10_EXP__;(-37);__FLT_MAX_EXP__;128;__FLT_MAX_10_EXP__;38;__FLT_DECIMAL_DIG__;9;__FLT_MAX__;3.40282346638528859811704183484516925e+38F;__FLT_MIN__;1.17549435082228750796873653722224568e-38F;__FLT_EPSILON__;1.19209289550781250000000000000000000e-7F;__FLT_DENORM_MIN__;1.40129846432481707092372958328991613e-45F;__FLT_HAS_DENORM__;1;__FLT_HAS_INFINITY__;1;__FLT_HAS_QUIET_NAN__;1;__DBL_MANT_DIG__;53;__DBL_DIG__;15;__DBL_MIN_EXP__;(-1021);__DBL_MIN_10_EXP__;(-307);__DBL_MAX_EXP__;1024;__DBL_MAX_10_EXP__;308;__DBL_DECIMAL_DIG__;17;__DBL_MAX__;((double)1.79769313486231570814527423731704357e+308L);__DBL_MIN__;((double)2.22507385850720138309023271733240406e-308L);__DBL_EPSILON__;((double)2.22044604925031308084726333618164062e-16L);__DBL_DENORM_MIN__;((double)4.94065645841246544176568792868221372e-324L);__DBL_HAS_DENORM__;1;__DBL_HAS_INFINITY__;1;__DBL_HAS_QUIET_NAN__;1;__LDBL_MANT_DIG__;64;__LDBL_DIG__;18;__LDBL_MIN_EXP__;(-16381);__LDBL_MIN_10_EXP__;(-4931);__LDBL_MAX_EXP__;16384;__LDBL_MAX_10_EXP__;4932;__DECIMAL_DIG__;21;__LDBL_DECIMAL_DIG__;21;__LDBL_MAX__;1.18973149535723176502126385303097021e+4932L;__LDBL_MIN__;3.36210314311209350626267781732175260e-4932L;__LDBL_EPSILON__;1.08420217248550443400745280086994171e-19L;__LDBL_DENORM_MIN__;3.64519953188247460252840593361941982e-4951L;__LDBL_HAS_DENORM__;1;__LDBL_H
AS_INFINITY__;1;__LDBL_HAS_QUIET_NAN__;1;__FLT32_MANT_DIG__;24;__FLT32_DIG__;6;__FLT32_MIN_EXP__;(-125);__FLT32_MIN_10_EXP__;(-37);__FLT32_MAX_EXP__;128;__FLT32_MAX_10_EXP__;38;__FLT32_DECIMAL_DIG__;9;__FLT32_MAX__;3.40282346638528859811704183484516925e+38F32;__FLT32_MIN__;1.17549435082228750796873653722224568e-38F32;__FLT32_EPSILON__;1.19209289550781250000000000000000000e-7F32;__FLT32_DENORM_MIN__;1.40129846432481707092372958328991613e-45F32;__FLT32_HAS_DENORM__;1;__FLT32_HAS_INFINITY__;1;__FLT32_HAS_QUIET_NAN__;1;__FLT64_MANT_DIG__;53;__FLT64_DIG__;15;__FLT64_MIN_EXP__;(-1021);__FLT64_MIN_10_EXP__;(-307);__FLT64_MAX_EXP__;1024;__FLT64_MAX_10_EXP__;308;__FLT64_DECIMAL_DIG__;17;__FLT64_MAX__;1.79769313486231570814527423731704357e+308F64;__FLT64_MIN__;2.22507385850720138309023271733240406e-308F64;__FLT64_EPSILON__;2.22044604925031308084726333618164062e-16F64;__FLT64_DENORM_MIN__;4.94065645841246544176568792868221372e-324F64;__FLT64_HAS_DENORM__;1;__FLT64_HAS_INFINITY__;1;__FLT64_HAS_QUIET_NAN__;1;__FLT128_MANT_DIG__;113;__FLT128_DIG__;33;__FLT128_MIN_EXP__;(-16381);__FLT128_MIN_10_EXP__;(-4931);__FLT128_MAX_EXP__;16384;__FLT128_MAX_10_EXP__;4932;__FLT128_DECIMAL_DIG__;36;__FLT128_MAX__;1.18973149535723176508575932662800702e+4932F128;__FLT128_MIN__;3.36210314311209350626267781732175260e-4932F128;__FLT128_EPSILON__;1.92592994438723585305597794258492732e-34F128;__FLT128_DENORM_MIN__;6.47517511943802511092443895822764655e-4966F128;__FLT128_HAS_DENORM__;1;__FLT128_HAS_INFINITY__;1;__FLT128_HAS_QUIET_NAN__;1;__FLT32X_MANT_DIG__;53;__FLT32X_DIG__;15;__FLT32X_MIN_EXP__;(-1021);__FLT32X_MIN_10_EXP__;(-307);__FLT32X_MAX_EXP__;1024;__FLT32X_MAX_10_EXP__;308;__FLT32X_DECIMAL_DIG__;17;__FLT32X_MAX__;1.79769313486231570814527423731704357e+308F32x;__FLT32X_MIN__;2.22507385850720138309023271733240406e-308F32x;__FLT32X_EPSILON__;2.22044604925031308084726333618164062e-16F32x;__FLT32X_DENORM_MIN__;4.94065645841246544176568792868221372e-324F32x;__FLT32X_HAS_DENORM__;1;__FLT32X_HAS_INFIN
ITY__;1;__FLT32X_HAS_QUIET_NAN__;1;__FLT64X_MANT_DIG__;64;__FLT64X_DIG__;18;__FLT64X_MIN_EXP__;(-16381);__FLT64X_MIN_10_EXP__;(-4931);__FLT64X_MAX_EXP__;16384;__FLT64X_MAX_10_EXP__;4932;__FLT64X_DECIMAL_DIG__;21;__FLT64X_MAX__;1.18973149535723176502126385303097021e+4932F64x;__FLT64X_MIN__;3.36210314311209350626267781732175260e-4932F64x;__FLT64X_EPSILON__;1.08420217248550443400745280086994171e-19F64x;__FLT64X_DENORM_MIN__;3.64519953188247460252840593361941982e-4951F64x;__FLT64X_HAS_DENORM__;1;__FLT64X_HAS_INFINITY__;1;__FLT64X_HAS_QUIET_NAN__;1;__DEC32_MANT_DIG__;7;__DEC32_MIN_EXP__;(-94);__DEC32_MAX_EXP__;97;__DEC32_MIN__;1E-95DF;__DEC32_MAX__;9.999999E96DF;__DEC32_EPSILON__;1E-6DF;__DEC32_SUBNORMAL_MIN__;0.000001E-95DF;__DEC64_MANT_DIG__;16;__DEC64_MIN_EXP__;(-382);__DEC64_MAX_EXP__;385;__DEC64_MIN__;1E-383DD;__DEC64_MAX__;9.999999999999999E384DD;__DEC64_EPSILON__;1E-15DD;__DEC64_SUBNORMAL_MIN__;0.000000000000001E-383DD;__DEC128_MANT_DIG__;34;__DEC128_MIN_EXP__;(-6142);__DEC128_MAX_EXP__;6145;__DEC128_MIN__;1E-6143DL;__DEC128_MAX__;9.999999999999999999999999999999999E6144DL;__DEC128_EPSILON__;1E-33DL;__DEC128_SUBNORMAL_MIN__;0.000000000000000000000000000000001E-6143DL;__REGISTER_PREFIX__; ;__USER_LABEL_PREFIX__; 
;__GNUC_STDC_INLINE__;1;__NO_INLINE__;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_1;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_2;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_4;1;__GCC_HAVE_SYNC_COMPARE_AND_SWAP_8;1;__GCC_ATOMIC_BOOL_LOCK_FREE;2;__GCC_ATOMIC_CHAR_LOCK_FREE;2;__GCC_ATOMIC_CHAR16_T_LOCK_FREE;2;__GCC_ATOMIC_CHAR32_T_LOCK_FREE;2;__GCC_ATOMIC_WCHAR_T_LOCK_FREE;2;__GCC_ATOMIC_SHORT_LOCK_FREE;2;__GCC_ATOMIC_INT_LOCK_FREE;2;__GCC_ATOMIC_LONG_LOCK_FREE;2;__GCC_ATOMIC_LLONG_LOCK_FREE;2;__GCC_ATOMIC_TEST_AND_SET_TRUEVAL;1;__GCC_ATOMIC_POINTER_LOCK_FREE;2;__HAVE_SPECULATION_SAFE_VALUE;1;__GCC_HAVE_DWARF2_CFI_ASM;1;__PRAGMA_REDEFINE_EXTNAME;1;__SSP_STRONG__;3;__SIZEOF_INT128__;16;__SIZEOF_WCHAR_T__;4;__SIZEOF_WINT_T__;4;__SIZEOF_PTRDIFF_T__;8;__amd64;1;__amd64__;1;__x86_64;1;__x86_64__;1;__SIZEOF_FLOAT80__;16;__SIZEOF_FLOAT128__;16;__ATOMIC_HLE_ACQUIRE;65536;__ATOMIC_HLE_RELEASE;131072;__GCC_ASM_FLAG_OUTPUTS__;1;__k8;1;__k8__;1;__code_model_small__;1;__MMX__;1;__SSE__;1;__SSE2__;1;__FXSR__;1;__SSE_MATH__;1;__SSE2_MATH__;1;__SEG_FS;1;__SEG_GS;1;__CET__;3;__gnu_linux__;1;__linux;1;__linux__;1;linux;1;__unix;1;__unix__;1;unix;1;__ELF__;1;__DECIMAL_BID_FORMAT__;1;_STDC_PREDEF_H;1;__STDC_IEC_559__;1;__STDC_IEC_559_COMPLEX__;1;__STDC_ISO_10646__;201706L
-//C compiler system include directories
-CMAKE_EXTRA_GENERATOR_C_SYSTEM_INCLUDE_DIRS:INTERNAL=/usr/local/cgns/4.1.1_gcc-8.3.0/include;/usr/local/hdf5/1.10.6_gcc-8.3.0/include;/usr/local/szip/2.1.1/include;/usr/lib/gcc/x86_64-linux-gnu/9/include;/usr/local/include;/usr/include/x86_64-linux-gnu;/usr/include
-//Name of generator.
-CMAKE_GENERATOR:INTERNAL=Unix Makefiles
-//Generator instance identifier.
-CMAKE_GENERATOR_INSTANCE:INTERNAL=
-//Name of generator platform.
-CMAKE_GENERATOR_PLATFORM:INTERNAL=
-//Name of generator toolset.
-CMAKE_GENERATOR_TOOLSET:INTERNAL=
-//Source directory with the top level CMakeLists.txt file for this
-// project
-CMAKE_HOME_DIRECTORY:INTERNAL=/home/justin/Thesis/topo code/SAND
-//ADVANCED property for variable: CMAKE_INSTALL_PREFIX
-CMAKE_INSTALL_PREFIX-ADVANCED:INTERNAL=1
-//Install .so files without execute permission.
-CMAKE_INSTALL_SO_NO_EXE:INTERNAL=1
-//ADVANCED property for variable: CMAKE_LINKER
-CMAKE_LINKER-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_MAKE_PROGRAM
-CMAKE_MAKE_PROGRAM-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_MODULE_LINKER_FLAGS
-CMAKE_MODULE_LINKER_FLAGS-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_MODULE_LINKER_FLAGS_DEBUG
-CMAKE_MODULE_LINKER_FLAGS_DEBUG-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_MODULE_LINKER_FLAGS_MINSIZEREL
-CMAKE_MODULE_LINKER_FLAGS_MINSIZEREL-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_MODULE_LINKER_FLAGS_RELEASE
-CMAKE_MODULE_LINKER_FLAGS_RELEASE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_MODULE_LINKER_FLAGS_RELWITHDEBINFO
-CMAKE_MODULE_LINKER_FLAGS_RELWITHDEBINFO-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_NM
-CMAKE_NM-ADVANCED:INTERNAL=1
-//number of local generators
-CMAKE_NUMBER_OF_MAKEFILES:INTERNAL=1
-//ADVANCED property for variable: CMAKE_OBJCOPY
-CMAKE_OBJCOPY-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_OBJDUMP
-CMAKE_OBJDUMP-ADVANCED:INTERNAL=1
-//Platform information initialized
-CMAKE_PLATFORM_INFO_INITIALIZED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_RANLIB
-CMAKE_RANLIB-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_READELF
-CMAKE_READELF-ADVANCED:INTERNAL=1
-//Path to CMake installation.
-CMAKE_ROOT:INTERNAL=/usr/share/cmake-3.16
-//ADVANCED property for variable: CMAKE_SHARED_LINKER_FLAGS
-CMAKE_SHARED_LINKER_FLAGS-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_SHARED_LINKER_FLAGS_DEBUG
-CMAKE_SHARED_LINKER_FLAGS_DEBUG-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_SHARED_LINKER_FLAGS_MINSIZEREL
-CMAKE_SHARED_LINKER_FLAGS_MINSIZEREL-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_SHARED_LINKER_FLAGS_RELEASE
-CMAKE_SHARED_LINKER_FLAGS_RELEASE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_SHARED_LINKER_FLAGS_RELWITHDEBINFO
-CMAKE_SHARED_LINKER_FLAGS_RELWITHDEBINFO-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_SKIP_INSTALL_RPATH
-CMAKE_SKIP_INSTALL_RPATH-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_SKIP_RPATH
-CMAKE_SKIP_RPATH-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_STATIC_LINKER_FLAGS
-CMAKE_STATIC_LINKER_FLAGS-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_STATIC_LINKER_FLAGS_DEBUG
-CMAKE_STATIC_LINKER_FLAGS_DEBUG-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_STATIC_LINKER_FLAGS_MINSIZEREL
-CMAKE_STATIC_LINKER_FLAGS_MINSIZEREL-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_STATIC_LINKER_FLAGS_RELEASE
-CMAKE_STATIC_LINKER_FLAGS_RELEASE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_STATIC_LINKER_FLAGS_RELWITHDEBINFO
-CMAKE_STATIC_LINKER_FLAGS_RELWITHDEBINFO-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: CMAKE_STRIP
-CMAKE_STRIP-ADVANCED:INTERNAL=1
-//uname command
-CMAKE_UNAME:INTERNAL=/usr/bin/uname
-//ADVANCED property for variable: CMAKE_VERBOSE_MAKEFILE
-CMAKE_VERBOSE_MAKEFILE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: PERL_EXECUTABLE
-PERL_EXECUTABLE-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: ProcessorCount_cmd_nproc
-ProcessorCount_cmd_nproc-ADVANCED:INTERNAL=1
-//ADVANCED property for variable: ProcessorCount_cmd_sysctl
-ProcessorCount_cmd_sysctl-ADVANCED:INTERNAL=1
-USAGE_PRINTED:INTERNAL=TRUE
-
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 6625bfd..c416efe 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -1,6 +1,7 @@
 # Set the name of the project and target:
 SET(TARGET "SAND")
 
+
 # Declare all source files the target consists of. Here, this is only
 # the one step-X.cc file, but as you expand your project you may wish
 # to add other source files as well. If your project becomes much larger,
@@ -21,9 +22,8 @@ SET(  TARGET_SRC ${TARGET_SRC} ${TARGET_INC}
   
 # Usually, you will not need to modify anything beyond this point...
 
-CMAKE_MINIMUM_REQUIRED(VERSION 2.8.12)
-
-FIND_PACKAGE(deal.II 9.2.0 QUIET
+CMAKE_MINIMUM_REQUIRED(VERSION 3.1.0)
+FIND_PACKAGE(deal.II 9.4.0 QUIET
   HINTS ${deal.II_DIR} ${DEAL_II_DIR} ../ ../../ $ENV{DEAL_II_DIR}
   )
 IF(NOT ${deal.II_FOUND})
diff --git a/cmake_install.cmake b/cmake_install.cmake
deleted file mode 100644
index 417d8e3..0000000
--- a/cmake_install.cmake
+++ /dev/null
@@ -1,49 +0,0 @@
-# Install script for directory: /home/justin/Thesis/topo code/SAND
-
-# Set the install prefix
-if(NOT DEFINED CMAKE_INSTALL_PREFIX)
-  set(CMAKE_INSTALL_PREFIX "/usr/local")
-endif()
-string(REGEX REPLACE "/$" "" CMAKE_INSTALL_PREFIX "${CMAKE_INSTALL_PREFIX}")
-
-# Set the install configuration name.
-if(NOT DEFINED CMAKE_INSTALL_CONFIG_NAME)
-  if(BUILD_TYPE)
-    string(REGEX REPLACE "^[^A-Za-z0-9_]+" ""
-           CMAKE_INSTALL_CONFIG_NAME "${BUILD_TYPE}")
-  else()
-    set(CMAKE_INSTALL_CONFIG_NAME "Release")
-  endif()
-  message(STATUS "Install configuration: \"${CMAKE_INSTALL_CONFIG_NAME}\"")
-endif()
-
-# Set the component getting installed.
-if(NOT CMAKE_INSTALL_COMPONENT)
-  if(COMPONENT)
-    message(STATUS "Install component: \"${COMPONENT}\"")
-    set(CMAKE_INSTALL_COMPONENT "${COMPONENT}")
-  else()
-    set(CMAKE_INSTALL_COMPONENT)
-  endif()
-endif()
-
-# Install shared libraries without execute permission?
-if(NOT DEFINED CMAKE_INSTALL_SO_NO_EXE)
-  set(CMAKE_INSTALL_SO_NO_EXE "1")
-endif()
-
-# Is this installation the result of a crosscompile?
-if(NOT DEFINED CMAKE_CROSSCOMPILING)
-  set(CMAKE_CROSSCOMPILING "FALSE")
-endif()
-
-if(CMAKE_INSTALL_COMPONENT)
-  set(CMAKE_INSTALL_MANIFEST "install_manifest_${CMAKE_INSTALL_COMPONENT}.txt")
-else()
-  set(CMAKE_INSTALL_MANIFEST "install_manifest.txt")
-endif()
-
-string(REPLACE ";" "\n" CMAKE_INSTALL_MANIFEST_CONTENT
-       "${CMAKE_INSTALL_MANIFEST_FILES}")
-file(WRITE "/home/justin/Thesis/topo code/SAND/${CMAKE_INSTALL_MANIFEST}"
-     "${CMAKE_INSTALL_MANIFEST_CONTENT}")
diff --git a/include/density_filter.h b/include/density_filter.h
index 0a23cc9..51daba2 100644
--- a/include/density_filter.h
+++ b/include/density_filter.h
@@ -20,10 +20,13 @@
 #include <deal.II/lac/packaged_operation.h>
 #include <deal.II/lac/sparse_direct.h>
 #include <deal.II/lac/affine_constraints.h>
+#include <deal.II/lac/trilinos_parallel_block_vector.h>
+#include <deal.II/lac/generic_linear_algebra.h>
 
 #include <deal.II/grid/tria.h>
 #include <deal.II/grid/grid_generator.h>
 #include <deal.II/grid/grid_refinement.h>
+#include <deal.II/grid/cell_id.h>
 
 #include <deal.II/dofs/dof_handler.h>
 #include <deal.II/dofs/dof_renumbering.h>
@@ -47,20 +50,37 @@
  * Once formed, we have F*\sigma = \rho*/
 namespace SAND {
     using namespace dealii;
-
+    namespace LA
+    {
+        using namespace dealii::LinearAlgebraTrilinos;
+    }
     template<int dim>
     class DensityFilter {
     public:
 
-        DensityFilter()=default;
+        MPI_Comm  mpi_communicator;
+        std::vector<IndexSet> owned_partitioning;
+        std::vector<IndexSet> relevant_partitioning;
 
-        SparseMatrix<double> filter_matrix;
+        DensityFilter();
+        DynamicSparsityPattern filter_dsp;
+        LA::MPI::SparseMatrix filter_matrix;
+        LA::MPI::SparseMatrix filter_matrix_transpose;
         SparsityPattern filter_sparsity_pattern;
-        void initialize(Triangulation<dim> &triangulation);
-
+        void initialize(DoFHandler<dim> &dof_handler);
+        std::set<types::global_dof_index> find_relevant_neighbors(types::global_dof_index cell_index) const;
 
     private:
-        std::set<typename Triangulation<dim>::cell_iterator> find_relevant_neighbors(typename Triangulation<dim>::cell_iterator cell) const;
+        std::vector<double> cell_m;
+        std::vector<double> x_coord;
+        std::vector<double> y_coord;
+        std::vector<double> z_coord;
+        std::vector<double> cell_m_part;
+        std::vector<double> x_coord_part;
+        std::vector<double> y_coord_part;
+        std::vector<double> z_coord_part;
+
+        ConditionalOStream pcout;
 
     };
 }
diff --git a/include/input_information.h b/include/input_information.h
index 51e796e..8e95b17 100644
--- a/include/input_information.h
+++ b/include/input_information.h
@@ -16,19 +16,23 @@ namespace SAND {
 
         //geometry options
         constexpr unsigned int geometry_base = GeometryOptions::mbb;
-        constexpr unsigned int dim = 2;
-        constexpr unsigned int refinements =  3;
+
+        constexpr unsigned int dim = 3;
+        // Former compile-time setting, replaced by the extern declaration below: constexpr unsigned int refinements = 3;
+        extern unsigned int refinements;
 
         //nonlinear algorithm options
         constexpr double initial_barrier_size = 25;
-        constexpr double min_barrier_size = .00000;
-        constexpr double fraction_to_boundary = .9;
-        constexpr unsigned int max_steps=75;
+        constexpr double min_barrier_size = 1e-12;
+
+        constexpr double fraction_to_boundary = .7;
+        constexpr unsigned int max_steps=100;
+
         constexpr unsigned int barrier_reduction=BarrierOptions::loqo;
         constexpr double required_norm = .0001;
 
         //density filter options
-        constexpr double filter_r = .251;
+        constexpr double filter_r = .25;
 
         //other options
         constexpr double density_penalty_exponent = 3;
@@ -39,11 +43,22 @@ namespace SAND {
         constexpr bool output_parts_of_matrix = false;
 
         //Linear solver options
-        constexpr unsigned int solver_choice = SolverOptions::inexact_K_with_exact_A_gmres;
+        constexpr unsigned int solver_choice = SolverOptions::inexact_K_with_inexact_A_gmres;
         constexpr bool use_eisenstat_walker = false;
         constexpr double default_gmres_tolerance = 1e-6;
 
+        extern unsigned int a_inv_iterations;
+        extern unsigned int k_inv_iterations;
+
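+        // Disabled compile-time alternatives to the extern counts above (note: double here, unsigned int above):
+        // constexpr double a_inv_iterations = 5; constexpr double k_inv_iterations = 30;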
+
+        constexpr double a_rel_tol = 1e-12;
+        constexpr double k_rel_tol = 1e-12;
 
+        //Material Options
+        constexpr double material_lambda = 1.;
+        constexpr double material_mu = 1.;
     }
 }
-#endif //SAND_INPUT_INFORMATION_H
+#endif //SAND_INPUT_INFORMATION_H
\ No newline at end of file
diff --git a/include/kkt_system.h b/include/kkt_system.h
index 89f1d48..bb264a1 100644
--- a/include/kkt_system.h
+++ b/include/kkt_system.h
@@ -5,11 +5,15 @@
 #ifndef SAND_KKT_SYSTEM_H
 #define SAND_KKT_SYSTEM_H
 #include <deal.II/base/quadrature_lib.h>
+#include <deal.II/base/utilities.h>
+#include <deal.II/base/conditional_ostream.h>
+#include <deal.II/base/index_set.h>
 #include <deal.II/base/function.h>
 #include <deal.II/base/tensor.h>
 #include <deal.II/base/timer.h>
 
 #include <deal.II/lac/block_vector.h>
+#include <deal.II/lac/vector.h>
 #include <deal.II/lac/full_matrix.h>
 #include <deal.II/lac/block_sparse_matrix.h>
 #include <deal.II/lac/solver_cg.h>
@@ -18,10 +22,18 @@
 #include <deal.II/lac/packaged_operation.h>
 #include <deal.II/lac/sparse_direct.h>
 #include <deal.II/lac/affine_constraints.h>
+#include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/lac/dynamic_sparsity_pattern.h>
+#include <deal.II/lac/sparsity_tools.h>
+#include <deal.II/lac/trilinos_sparse_matrix.h>
+#include <deal.II/lac/trilinos_block_sparse_matrix.h>
+#include <deal.II/lac/trilinos_parallel_block_vector.h>
+#include <deal.II/lac/trilinos_vector.h>
 
-#include <deal.II/grid/tria.h>
 #include <deal.II/grid/grid_generator.h>
+#include <deal.II/grid/manifold_lib.h>
 #include <deal.II/grid/grid_refinement.h>
+#include <deal.II/grid/grid_tools.h>
 
 #include <deal.II/dofs/dof_handler.h>
 #include <deal.II/dofs/dof_renumbering.h>
@@ -38,19 +50,50 @@
 #include <deal.II/numerics/error_estimator.h>
 #include <deal.II/hp/fe_collection.h>
 
+#include <deal.II/distributed/tria.h>
+#include <deal.II/distributed/grid_refinement.h>
+
+#include <deal.II/multigrid/multigrid.h>
+#include <deal.II/multigrid/mg_transfer_matrix_free.h>
+#include <deal.II/multigrid/mg_tools.h>
+#include <deal.II/multigrid/mg_coarse.h>
+#include <deal.II/multigrid/mg_smoother.h>
+#include <deal.II/multigrid/mg_matrix.h>
+
+#include <deal.II/matrix_free/matrix_free.h>
+#include <deal.II/matrix_free/operators.h>
+#include <deal.II/matrix_free/fe_evaluation.h>
+
+
 #include "../include/schur_preconditioner.h"
 #include "../include/density_filter.h"
+#include "matrix_free_elasticity.h"
+
+#include <deal.II/base/conditional_ostream.h>
 
 #include <iostream>
 #include <fstream>
 #include <algorithm>
 namespace SAND {
+
+
+
+    namespace LA
+    {
+        using namespace dealii::LinearAlgebraTrilinos;
+    }
     using namespace dealii;
 
     template<int dim>
     class KktSystem {
 
+    using SystemMFMatrixType = MF_Elasticity_Operator<dim, 1, double>;
+    using LevelMFMatrixType = MF_Elasticity_Operator<dim, 1, double>;
     public:
+        MPI_Comm  mpi_communicator;
+        std::vector<IndexSet> owned_partitioning;
+        std::vector<IndexSet> relevant_partitioning;
+
         KktSystem();
 
         void
@@ -66,63 +109,101 @@ namespace SAND {
         setup_block_system();
 
         void
-        assemble_block_system(const BlockVector<double> &state, const double barrier_size);
+        assemble_block_system(const LA::MPI::BlockVector &state, const double barrier_size);
 
-        BlockVector<double>
-        solve(const BlockVector<double> &state, double barrier_size);
+        LA::MPI::BlockVector
+        solve(const LA::MPI::BlockVector &state);
 
-        BlockVector<double>
+        LA::MPI::BlockVector
         get_initial_state();
 
         double
-        calculate_objective_value(const BlockVector<double> &state) const;
+        calculate_objective_value(const LA::MPI::BlockVector &state) const;
 
         double
-        calculate_barrier_distance(const BlockVector<double> &state) const;
+        calculate_barrier_distance(const LA::MPI::BlockVector &state) const;
 
         double
-        calculate_feasibility(const BlockVector<double> &state, const double barrier_size) const;
+        calculate_feasibility(const LA::MPI::BlockVector &state, const double barrier_size) const;
 
         double
-        calculate_convergence(const BlockVector<double> &state) const;
+        calculate_convergence(const LA::MPI::BlockVector &state) const;
 
         void
-        output(const BlockVector<double> &state, const unsigned int j) const;
+        output(const LA::MPI::BlockVector &state, const unsigned int j) const;
 
         void
         calculate_initial_rhs_error();
 
         double
-        calculate_rhs_norm(const BlockVector<double> &state, const double barrier_size) const;
+        calculate_rhs_norm(const LA::MPI::BlockVector &state, const double barrier_size) const;
 
         void
-        output_stl(const BlockVector<double> &state);
+        output_stl(const LA::MPI::BlockVector &state);
 
     private:
 
-        BlockVector<double>
-        calculate_rhs(const BlockVector<double> &test_solution, const double barrier_size) const;
+        LA::MPI::BlockVector
+        calculate_rhs(const LA::MPI::BlockVector &test_solution, const double barrier_size) const;
 
+        BlockDynamicSparsityPattern dsp;
         BlockSparsityPattern sparsity_pattern;
-        BlockSparseMatrix<double> system_matrix;
-        BlockVector<double> linear_solution;
-        BlockVector<double> system_rhs;
-        Triangulation<dim> triangulation;
+        mutable LA::MPI::BlockSparseMatrix system_matrix;
+        mutable LA::MPI::BlockVector locally_relevant_solution;
+        mutable LA::MPI::BlockVector distributed_solution;
+        LA::MPI::BlockVector system_rhs;
+        parallel::distributed::Triangulation<dim> triangulation;
         DoFHandler<dim> dof_handler;
+        DoFHandler<dim> dof_handler_displacement;
+        DoFHandler<dim> dof_handler_density;
+
+        std::map<types::global_dof_index,types::global_dof_index> displacement_to_system_dof_index_map;
+        MGLevelObject<std::map<types::global_dof_index,types::global_dof_index>> level_displacement_to_system_dof_index_map;
+
         AffineConstraints<double> constraints;
+        AffineConstraints<double> displacement_constraints;
         FESystem<dim> fe_nine;
         FESystem<dim> fe_ten;
         hp::FECollection<dim> fe_collection;
+        FESystem<dim> fe_displacement;
+        FE_DGQ<dim> fe_density;
         const double density_ratio;
         const double density_penalty_exponent;
 
-        DensityFilter<dim> density_filter;
+        mutable DensityFilter<dim> density_filter;
 
         std::map<types::global_dof_index, double> boundary_values;
-
+        MGLevelObject<std::map<types::global_dof_index, double>> level_boundary_values;
+        ConditionalOStream pcout;
 
         double initial_rhs_error;
 
+        MGConstrainedDoFs mg_constrained_dofs;
+        SystemMFMatrixType elasticity_matrix_mf;
+        MGLevelObject<LevelMFMatrixType> mg_matrices;
+
+        OperatorCellData<dim, GMGNumberType> active_cell_data;
+        MGLevelObject<OperatorCellData<dim, GMGNumberType>> level_cell_data;
+        dealii::LinearAlgebra::distributed::Vector<double> active_density_vector;
+        dealii::LinearAlgebra::distributed::Vector<double> relevant_density_vector;
+        MGLevelObject<dealii::LinearAlgebra::distributed::Vector<double>> level_density_vector;
+
+        MGTransferMatrixFree<dim,GMGNumberType> transfer;
+        MGTransferMatrixFree<dim, double> mg_transfer;
+
+        using SmootherType = PreconditionChebyshev<LevelMFMatrixType, LinearAlgebra::distributed::Vector<double>>;
+        mg::SmootherRelaxation<SmootherType,LinearAlgebra::distributed::Vector<double>> mg_smoother;
+        MGLevelObject<typename SmootherType::AdditionalData> smoother_data;
+        MGCoarseGridApplySmoother<LinearAlgebra::distributed::Vector<double>> mg_coarse;
+        MGLevelObject<std::set<types::boundary_id>> level_dirichlet_boundary_dofs;
+        MGLevelObject<AffineConstraints<double>> mg_level_constraints;
+        MGLevelObject<MatrixFreeOperators::MGInterfaceOperator<LevelMFMatrixType>> mg_interface_matrices;
+
+        std::set<types::boundary_id> dirichlet_boundary;
+
+        LinearAlgebra::distributed::Vector<double> distributed_displacement_sol;
+        LinearAlgebra::distributed::Vector<double> distributed_displacement_rhs;
+
     };
 }
 
diff --git a/include/matrix_free_elasticity.h b/include/matrix_free_elasticity.h
new file mode 100644
index 0000000..525136f
--- /dev/null
+++ b/include/matrix_free_elasticity.h
@@ -0,0 +1,108 @@
+#ifndef MATRIX_FREE_GMG_H
+#define MATRIX_FREE_GMG_H
+
+#include <deal.II/base/quadrature_lib.h>
+#include <deal.II/base/function.h>
+#include <deal.II/base/timer.h>
+#include <deal.II/lac/affine_constraints.h>
+#include <deal.II/lac/solver_cg.h>
+#include <deal.II/lac/la_parallel_vector.h>
+#include <deal.II/lac/precondition.h>
+#include <deal.II/fe/fe_q.h>
+#include <deal.II/fe/fe_system.h>
+#include <deal.II/grid/tria.h>
+#include <deal.II/grid/grid_generator.h>
+#include <deal.II/dofs/dof_handler.h>
+#include <deal.II/dofs/dof_renumbering.h>
+#include <deal.II/dofs/dof_tools.h>
+#include <deal.II/multigrid/multigrid.h>
+#include <deal.II/multigrid/mg_transfer_matrix_free.h>
+#include <deal.II/multigrid/mg_tools.h>
+#include <deal.II/multigrid/mg_coarse.h>
+#include <deal.II/multigrid/mg_smoother.h>
+#include <deal.II/multigrid/mg_matrix.h>
+#include <deal.II/numerics/data_out.h>
+#include <deal.II/numerics/vector_tools.h>
+#include <deal.II/matrix_free/matrix_free.h>
+#include <deal.II/matrix_free/operators.h>
+#include <deal.II/matrix_free/fe_evaluation.h>
+#include <deal.II/base/utilities.h>
+
+#include "../include/parameters_and_components.h"
+#include "../include/input_information.h"
+
+
+
+namespace SAND
+{
+using GMGNumberType = double;
+using namespace dealii;
+/// Per-cell data container passed to MF_Elasticity_Operator::set_cell_data().
+template <int dim, typename number>
+struct OperatorCellData
+{
+    Table<2, VectorizedArray<number>> density; // 2-index table of vectorized values; index meaning is fixed where it is filled (not in this header)
+    std::size_t
+    memory_consumption() const; // declaration only; no definition appears in this header
+};
+/// Matrix-free operator derived from MatrixFreeOperators::Base; all member functions are only declared in this header.
+template <int dim, int fe_degree, typename number>
+class MF_Elasticity_Operator
+        : public MatrixFreeOperators::
+        Base<dim, LinearAlgebra::distributed::Vector<number>>
+{
+public:
+
+    MPI_Comm  mpi_communicator;
+
+    using value_type = number;
+
+    MF_Elasticity_Operator();
+    /// Takes the per-cell data by const reference. NOTE(review): presumably kept via cell_data, so `data` must outlive the operator - confirm.
+    void set_cell_data (const OperatorCellData<dim,number> &data);
+    /// Overrides the base-class compute_diagonal().
+    void compute_diagonal() override;
+    /// Overrides the base-class clear().
+    void clear() override;
+
+private:
+    // Overrides the base-class apply_add(dst, src).
+    void apply_add (dealii::LinearAlgebra::distributed::Vector<number> &dst,
+                    const dealii::LinearAlgebra::distributed::Vector<number> &src) const override;
+
+    // Worker taking a cell range. NOTE(review): presumably the callback handed to MatrixFree::cell_loop - confirm in the definition.
+    void local_apply (const dealii::MatrixFree<dim, number> &data,
+                      dealii::LinearAlgebra::distributed::Vector<number> &dst,
+                      const dealii::LinearAlgebra::distributed::Vector<number> &src,
+                      const std::pair<unsigned int, unsigned int> &cell_range) const;
+    // Same parameter list as local_apply, but the index pair is a face range.
+    void local_apply_face (const dealii::MatrixFree<dim, number> &data,
+                           dealii::LinearAlgebra::distributed::Vector<number> &dst,
+                           const dealii::LinearAlgebra::distributed::Vector<number> &src,
+                           const std::pair<unsigned int, unsigned int> &face_range) const;
+
+    // Same parameter list as local_apply_face; by its name intended for boundary faces - confirm usage.
+    void local_apply_boundary_face (const dealii::MatrixFree<dim, number> &data,
+                                    dealii::LinearAlgebra::distributed::Vector<number> &dst,
+                                    const dealii::LinearAlgebra::distributed::Vector<number> &src,
+                                    const std::pair<unsigned int, unsigned int> &face_range) const;
+    // Diagonal worker: writes to dst only; the third argument is an unnamed unsigned int.
+    void local_compute_diagonal (const MatrixFree<dim,number>                     &data,
+                              dealii::LinearAlgebra::distributed::Vector<number>  &dst,
+                              const unsigned int &,
+                              const std::pair<unsigned int,unsigned int>       &cell_range) const;
+
+    // Raw pointer with no in-class initialiser. NOTE(review): confirm the constructor sets it and that it is non-owning.
+    const OperatorCellData<dim,number> *cell_data;
+
+    ConditionalOStream pcout;
+
+};
+
+
+}
+
+
+
+
+#endif // MATRIX_FREE_GMG_H
diff --git a/include/parameters_and_components.h b/include/parameters_and_components.h
index 192b085..978cd96 100644
--- a/include/parameters_and_components.h
+++ b/include/parameters_and_components.h
@@ -63,6 +63,6 @@ namespace SAND {
         static constexpr unsigned int mbb = 1;
         static constexpr unsigned int l_shape = 2;
     }
-
+    static constexpr unsigned int block_number = 10;
 }
 #endif //SAND_PARAMETERS_AND_COMPONENTS_H
diff --git a/include/sand_tools.h b/include/sand_tools.h
index 767a203..4d19664 100644
--- a/include/sand_tools.h
+++ b/include/sand_tools.h
@@ -4,26 +4,80 @@
 
 #ifndef SAND_MY_TOOLS_H
 #define SAND_MY_TOOLS_H
+#include <deal.II/base/quadrature_lib.h>
+#include <deal.II/base/function.h>
+#include <deal.II/base/tensor.h>
+#include <deal.II/base/timer.h>
+
+#include <deal.II/lac/block_vector.h>
+#include <deal.II/lac/full_matrix.h>
+#include <deal.II/lac/block_sparse_matrix.h>
+#include <deal.II/lac/precondition.h>
+#include <deal.II/lac/linear_operator.h>
+#include <deal.II/lac/linear_operator_tools.h>
+#include <deal.II/lac/packaged_operation.h>
+#include <deal.II/lac/sparse_direct.h>
+#include <deal.II/lac/solver_gmres.h>
+#include <deal.II/lac/solver_cg.h>
+#include <deal.II/lac/solver_bicgstab.h>
+#include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/lac/matrix_out.h>
+#include <deal.II/lac/trilinos_sparse_matrix.h>
+#include <deal.II/lac/trilinos_block_sparse_matrix.h>
+
+#include <deal.II/grid/tria.h>
+#include <deal.II/grid/grid_generator.h>
+#include <deal.II/grid/grid_refinement.h>
+
+#include <deal.II/dofs/dof_handler.h>
+#include <deal.II/dofs/dof_renumbering.h>
+#include <deal.II/dofs/dof_tools.h>
+
+#include <deal.II/fe/fe_values.h>
+#include <deal.II/fe/fe_dgq.h>
+#include <deal.II/fe/fe_system.h>
+#include <deal.II/fe/fe_q.h>
+
+#include <deal.II/numerics/vector_tools.h>
+#include <deal.II/numerics/matrix_tools.h>
+#include <deal.II/numerics/data_out.h>
+#include <deal.II/numerics/error_estimator.h>
+#include <deal.II/base/config.h>
+#include <deal.II/base/numbers.h>
+#include <deal.II/base/table.h>
+#include <deal.II/base/tensor.h>
+#include <deal.II/base/timer.h>
+
+#include <deal.II/differentiation/ad/ad_number_traits.h>
+
+#include <deal.II/lac/exceptions.h>
+#include <deal.II/lac/identity_matrix.h>
+
 
 
 namespace SAND{
+    namespace LA
+    {
+        using namespace dealii::LinearAlgebraTrilinos;
+    }
+
     using namespace dealii;
 
-    void build_matrix_element_by_element (const auto &X,
-                                          FullMatrix<double>   &X_matrix)
-    {
 
+    void build_matrix_element_by_element (const LinearOperator<LA::MPI::Vector,LA::MPI::Vector,dealii::TrilinosWrappers::internal::LinearOperatorImplementation::TrilinosPayload> &op_X,
+                                          FullMatrix<double>   &X_matrix,
+                                          LA::MPI::Vector &exemplar_vector)
+    {
         Threads::TaskGroup<void> tasks;
         for (unsigned int j=0; j<X_matrix.n(); ++j)
-            tasks += Threads::new_task ([&X, &X_matrix, j]()
+            tasks += Threads::new_task ([&op_X, &X_matrix, &exemplar_vector, j]()
                                         {
-                                            Vector<double> e_j (X_matrix.m());
-                                            Vector<double> r_j (X_matrix.n());
+                                            LA::MPI::Vector e_j (exemplar_vector);
+                                            LA::MPI::Vector r_j (exemplar_vector);
 
                                             e_j = 0;
                                             e_j(j) = 1;
-
-                                            X.vmult (r_j, e_j);
+                                            r_j = op_X * e_j;
 
                                             for (unsigned int i=0; i<X_matrix.m(); ++i)
                                                 X_matrix(i,j) = r_j(i);
@@ -32,41 +86,60 @@ namespace SAND{
         tasks.join_all();
     }
 
-//    void print_matrix (std::string &name, FullMatrix<double>   &X_matrix)
-//    {
-////        const unsigned int n = X_matrix.n();
-////        const unsigned int m = X_matrix.m();
-////        std::ofstream Xmat(name);
-////        for (unsigned int i = 0; i < m; i++)
-////        {
-////            Xmat << X_matrix(i, 0);
-////            for (unsigned int j = 1; j < n; j++)
-////            {
-////                Xmat << "," << X_matrix(i, j);
-////            }
-////            Xmat << "\n";
-////        }
-////        Xmat.close();
-//    }
-
-//    void print_matrix (std::string &name, SparseMatrix<double>   &X_matrix)
-//    {
-////        const unsigned int n = X_matrix.n();
-////        const unsigned int m = X_matrix.m();
-////        std::ofstream Xmat(name);
-////        for (unsigned int i = 0; i < m; i++)
-////        {
-////            Xmat << X_matrix.el(i, 0);
-////            for (unsigned int j = 1; j < n; j++)
-////            {
-////                Xmat << "," << X_matrix.el(i, j);
-////            }
-////            Xmat << "\n";
-////        }
-////        Xmat.close();
-//    }
+    /// Write X_matrix to the file `name` as comma-separated text, one matrix row per output line.
+    /// @param name path handed to std::ofstream; @param X_matrix matrix to dump (only read).
+    /// Defined in a header, hence `inline` so that several translation units can include it.
+    inline void print_matrix (const std::string &name, const FullMatrix<double> &X_matrix)
+    {
+        const unsigned int n = X_matrix.n();
+        const unsigned int m = X_matrix.m();
+        std::ofstream Xmat(name);   // closed by its destructor when the function returns
+        for (unsigned int i = 0; i < m; i++)
+        {
+            // A comma precedes every entry but the first, so a matrix with n == 0 reads no entry.
+            for (unsigned int j = 0; j < n; j++)
+                Xmat << (j == 0 ? "" : ",") << X_matrix(i, j);
+            Xmat << "\n";
+        }
+    }
+
+    /// Write X_matrix to the file `name` as comma-separated text, one matrix row per output line.
+    /// Every (i,j) is queried through el(), so positions outside the sparsity pattern are written too.
+    /// Defined in a header, hence `inline` so that several translation units can include it.
+    inline void print_matrix (const std::string &name, const SparseMatrix<double> &X_matrix)
+    {
+        const unsigned int n = X_matrix.n();
+        const unsigned int m = X_matrix.m();
+        std::ofstream Xmat(name);   // closed by its destructor when the function returns
+        for (unsigned int i = 0; i < m; i++)
+        {
+            // A comma precedes every entry but the first, so a matrix with n == 0 reads no entry.
+            for (unsigned int j = 0; j < n; j++)
+                Xmat << (j == 0 ? "" : ",") << X_matrix.el(i, j);
+            Xmat << "\n";
+        }
+    }
+
+    /// Write X_matrix to the file `name` as comma-separated text, one matrix row per output line.
+    /// NOTE(review): every calling process opens the same file and el() only sees locally stored rows
+    /// - confirm callers use this on a single MPI rank. `inline` because this is defined in a header.
+    inline void print_matrix (const std::string &name, const LA::MPI::SparseMatrix &X_matrix)
+    {
+        const unsigned int n = X_matrix.n();
+        const unsigned int m = X_matrix.m();
+        std::ofstream Xmat(name);   // closed by its destructor when the function returns
+        for (unsigned int i = 0; i < m; i++)
+        {
+            // A comma precedes every entry but the first, so a matrix with n == 0 reads no entry.
+            for (unsigned int j = 0; j < n; j++)
+                Xmat << (j == 0 ? "" : ",") << X_matrix.el(i, j);
+            Xmat << "\n";
+        }
+    }
 
 }
 
 
+
+
 #endif //SAND_MY_TOOLS_H
diff --git a/include/schur_preconditioner.h b/include/schur_preconditioner.h
index 0d6ef4e..8f06feb 100644
--- a/include/schur_preconditioner.h
+++ b/include/schur_preconditioner.h
@@ -14,11 +14,16 @@
 #include <deal.II/lac/block_sparse_matrix.h>
 #include <deal.II/lac/precondition.h>
 #include <deal.II/lac/linear_operator.h>
+#include <deal.II/lac/linear_operator_tools.h>
 #include <deal.II/lac/packaged_operation.h>
 #include <deal.II/lac/sparse_direct.h>
 #include <deal.II/lac/solver_gmres.h>
 #include <deal.II/lac/solver_cg.h>
 #include <deal.II/lac/solver_bicgstab.h>
+#include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/lac/matrix_out.h>
+#include <deal.II/lac/trilinos_sparse_matrix.h>
+#include <deal.II/lac/trilinos_block_sparse_matrix.h>
 
 #include <deal.II/grid/tria.h>
 #include <deal.II/grid/grid_generator.h>
@@ -55,6 +60,10 @@
 
 
 #include "../include/parameters_and_components.h"
+#include "../include/poly_pre.h"
+#include "matrix_free_elasticity.h"
+
+#include <deal.II/base/conditional_ostream.h>
 
 #include <iostream>
 #include <algorithm>
@@ -62,79 +71,400 @@
 
 namespace SAND
 {
+    using MatrixType  = dealii::TrilinosWrappers::SparseMatrix;
+    using VectorType  = dealii::TrilinosWrappers::MPI::Vector;
+    using PayloadType = dealii::TrilinosWrappers::internal::LinearOperatorImplementation::TrilinosPayload;
+    using PayloadVectorType = typename PayloadType::VectorType;
+    namespace LA
+    {
+        using namespace dealii::LinearAlgebraTrilinos;
+    }
     using namespace dealii;
+
+    /// Wraps a TrilinosWrappers::SolverDirect behind vmult/Tvmult declarations for two vector types.
+    /// NOTE(review): vmult presumably applies the solve prepared by initialize() - confirm in the .cc file.
+    class VmultTrilinosSolverDirect : public TrilinosWrappers::SparseMatrix {
+        public:
+            VmultTrilinosSolverDirect(SolverControl &cn,
+                                      const TrilinosWrappers::SolverDirect::AdditionalData &data);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void vmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const;
+            void initialize(LA::MPI::SparseMatrix &a_mat);
+            unsigned int m() const;
+            unsigned int n() const;
+            /// Returns the stored `size`; const so it can be called on const objects and references.
+            int get_size() const { return size; }
+        private:
+            // mutable, presumably because the const vmult/Tvmult members must call the solver - confirm.
+            mutable TrilinosWrappers::SolverDirect solver_direct;
+            int size = 0;   // in-class default so get_size() never reads an indeterminate value
+    };
+
+    class AMatWrapped : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on distributed vectors around a referenced a_mat
+        public:
+            AMatWrapped(LA::MPI::SparseMatrix &a_mat);
+            void vmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const;
+            void Tvmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const;
+            unsigned int m() const;
+            unsigned int n() const;
+            void set_exemplar_vector (const LA::MPI::Vector &exemplar_vector) // assigns a copy of the exemplar to both temporaries
+            {
+                temp_dst = exemplar_vector;
+                temp_src = exemplar_vector;
+            }
+            // a_mat below is a reference member, so the referenced matrix must outlive this object.
+        private:
+            const LA::MPI::SparseMatrix &a_mat;
+            mutable LA::MPI::Vector temp_src;
+            mutable LA::MPI::Vector temp_dst;
+            // NOTE(review): temp_src/temp_dst are presumably staging buffers for the const vmult/Tvmult - confirm in the .cc file.
+    };
+
+    template<int dim>
+    class AInvMatMFGMG : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on LA::MPI::Vector; holds a matrix-free operator and a multigrid preconditioner
+        public:
+            AInvMatMFGMG(MF_Elasticity_Operator<dim,1,double> &mf_elasticity_operator_in , PreconditionMG<dim,LinearAlgebra::distributed::Vector<double>,MGTransferMatrixFree<dim, double>>
+                         &mf_gmg_preconditioner_in,LA::MPI::SparseMatrix &a_mat, std::map<types::global_dof_index,types::global_dof_index> &displacement_to_system_dof_index_map);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            unsigned int m() const;
+            unsigned int n() const;
+            void set_tol(double tolerance_in);
+            void set_iter(unsigned int iterations_in);
+            void set_exemplar_vector (const LA::MPI::Vector &exemplar_vector) // forwards the exemplar to a_mat_wrapped
+            {
+                a_mat_wrapped.set_exemplar_vector(exemplar_vector);
+            }
+            double tolerance = Input::a_rel_tol; // public member; defaults to Input::a_rel_tol
+            unsigned int iterations = Input::a_inv_iterations; // public member; defaults to Input::a_inv_iterations
+        private:
+            AMatWrapped a_mat_wrapped;
+            MF_Elasticity_Operator<dim,1,double> &mf_elasticity_operator;
+            PreconditionMG<dim,LinearAlgebra::distributed::Vector<double>,MGTransferMatrixFree<dim, double>> &mf_gmg_preconditioner;
+            const std::map<types::global_dof_index,types::global_dof_index> displacement_to_system_dof_index_map;
+            // The map above is a by-value member (a copy); the operator and preconditioner are held by reference.
+            mutable dealii::LinearAlgebra::distributed::Vector<double> temp_src;
+            mutable dealii::LinearAlgebra::distributed::Vector<double> temp_dst;
+            // NOTE(review): temp_src/temp_dst are presumably work vectors for the const vmult/Tvmult - confirm in the .cc file.
+    };
+
+
+    class GMatrix : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on LA::MPI::Vector over f_mat, f_t_mat and d_8_mat
+        public:
+            GMatrix(const LA::MPI::SparseMatrix &f_mat_in,const LA::MPI::SparseMatrix &f_t_mat_in, LA::MPI::SparseMatrix &d_8_mat_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in);
+            unsigned int m() const;
+            unsigned int n() const;
+        private:
+            const LA::MPI::SparseMatrix &f_mat;
+            const LA::MPI::SparseMatrix &f_t_mat;
+            LA::MPI::SparseMatrix &d_8_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat;
+            mutable LA::MPI::Vector temp_vect_1;
+            mutable LA::MPI::Vector temp_vect_2;
+            // f_mat, f_t_mat and d_8_mat are reference members; d_m_inv_mat is a by-value member.
+            // NOTE(review): temp_vect_* are presumably work vectors sized in initialize() - confirm in the .cc file.
+    };
+
+    template<int dim>
+    class HMatrix : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on LA::MPI::Vector over the a, b, c, e matrices and three inverse/preconditioner objects
+        public:
+            HMatrix(LA::MPI::SparseMatrix &a_mat_in, const LA::MPI::SparseMatrix &b_mat_in, const LA::MPI::SparseMatrix &c_mat_in, const LA::MPI::SparseMatrix &e_mat_in,TrilinosWrappers::PreconditionAMG &pre_amg_in, VmultTrilinosSolverDirect &a_inv_direct_in, AInvMatMFGMG<dim> &a_inv_mf_gmg_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector,  LA::MPI::Vector &exemplar_displacement_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in);
+            unsigned int m() const;
+            unsigned int n() const;
+        private:
+            LA::MPI::SparseMatrix &a_mat;
+            const LA::MPI::SparseMatrix &b_mat;
+            const LA::MPI::SparseMatrix &c_mat;
+            const LA::MPI::SparseMatrix &e_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat;
+            TrilinosWrappers::PreconditionAMG &pre_amg;
+            VmultTrilinosSolverDirect &a_inv_direct;
+            mutable LA::MPI::Vector temp_vect_1;
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+            mutable LA::MPI::Vector temp_vect_5;
+            mutable LA::MPI::Vector temp_vect_6;
+            mutable LA::MPI::Vector temp_vect_7;
+            AInvMatMFGMG<dim> &a_inv_mf_gmg;
+            // Only d_m_inv_mat and the temp vectors are owned; every other member is a reference to an external object.
+    };
+
+    template<int dim>
+    class HMatrixDirect : public TrilinosWrappers::SparseMatrix { // same constructor arguments as HMatrix; initialize() takes no d_m_inv matrix
+        public:
+            HMatrixDirect(LA::MPI::SparseMatrix &a_mat_in, const LA::MPI::SparseMatrix &b_mat_in, const LA::MPI::SparseMatrix &c_mat_in, const LA::MPI::SparseMatrix &e_mat_in,TrilinosWrappers::PreconditionAMG &pre_amg_in, VmultTrilinosSolverDirect &a_inv_direct_in, AInvMatMFGMG<dim> &a_inv_mf_gmg_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector,  LA::MPI::Vector &exemplar_displacement_vector);
+            unsigned int m() const;
+            unsigned int n() const;
+        private:
+            LA::MPI::SparseMatrix &a_mat;
+            const LA::MPI::SparseMatrix &b_mat;
+            const LA::MPI::SparseMatrix &c_mat;
+            const LA::MPI::SparseMatrix &e_mat;
+            TrilinosWrappers::PreconditionAMG &pre_amg;
+            VmultTrilinosSolverDirect &a_inv_direct;
+            mutable LA::MPI::Vector temp_vect_1;
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+            mutable LA::MPI::Vector temp_vect_5;
+            mutable LA::MPI::Vector temp_vect_6;
+            mutable LA::MPI::Vector temp_vect_7;
+            AInvMatMFGMG<dim> &a_inv_mf_gmg;
+            // Only the temp vectors are owned; every other member is a reference to an external object.
+    };
+
+    template<int dim>
+    class KinvMatrix : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on LA::MPI::Vector over an HMatrix, a GMatrix and d_m_mat
+        public:
+            KinvMatrix(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in);
+            unsigned int m() const;
+            unsigned int n() const;
+        private: // h_mat, g_mat, d_m_mat are references; d_m_inv_mat and the temp vectors are owned
+            HMatrix<dim> &h_mat;
+            GMatrix &g_mat;
+            const LA::MPI::SparseMatrix &d_m_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat;
+            mutable LA::MPI::Vector temp_vect_1; // mutable: writable from the const vmult/Tvmult members
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+    };
+
+    template<int dim>
+    class KinvMatrixPart : public Subscriptor { // same members as KinvMatrix but derived from Subscriptor; initialize() takes only the exemplar vector
+        public:
+            KinvMatrixPart(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector);
+            unsigned int m() const;
+            unsigned int n() const;
+        private: // h_mat, g_mat, d_m_mat are references; d_m_inv_mat and the temp vectors are owned
+            HMatrix<dim> &h_mat;
+            GMatrix &g_mat;
+            const LA::MPI::SparseMatrix &d_m_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat; // NOTE(review): no initialize() argument supplies this here - confirm how it is filled
+            mutable LA::MPI::Vector temp_vect_1; // mutable: writable from the const vmult/Tvmult members
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+    };
+
+    template<int dim>
+    class KinvMatrixDirect : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on LA::MPI::Vector over an HMatrixDirect, a GMatrix and d_m_mat
+        public:
+            KinvMatrixDirect(HMatrixDirect<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector);
+            unsigned int m() const;
+            unsigned int n() const;
+        private: // h_mat, g_mat, d_m_mat are references; d_m_inv_mat and the temp vectors are owned
+            HMatrixDirect<dim> &h_mat;
+            GMatrix &g_mat;
+            const LA::MPI::SparseMatrix &d_m_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat; // NOTE(review): no initialize() argument supplies this here - confirm how it is filled
+            mutable LA::MPI::Vector temp_vect_1; // mutable: writable from the const vmult/Tvmult members
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+    };
+
+    template<int dim>
+    class JinvMatrix : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on LA::MPI::Vector over an HMatrix, a GMatrix and d_m_mat
+        public:
+            JinvMatrix(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in);
+            unsigned int m() const;
+            unsigned int n() const;
+        private: // h_mat, g_mat, d_m_mat are references; d_m_inv_mat and the temp vectors are owned
+            HMatrix<dim> &h_mat;
+            GMatrix &g_mat;
+            const LA::MPI::SparseMatrix &d_m_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat;
+            mutable LA::MPI::Vector temp_vect_1; // mutable: writable from the const vmult/Tvmult members
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+    };
+
+    template<int dim>
+    class JinvMatrixPart : public Subscriptor { // same members as JinvMatrix but derived from Subscriptor; initialize() takes only the exemplar vector
+        public:
+            JinvMatrixPart(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector);
+            unsigned int m() const;
+            unsigned int n() const;
+        private: // h_mat, g_mat, d_m_mat are references; d_m_inv_mat and the temp vectors are owned
+            HMatrix<dim> &h_mat;
+            GMatrix &g_mat;
+            const LA::MPI::SparseMatrix &d_m_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat; // NOTE(review): no initialize() argument supplies this here - confirm how it is filled
+            mutable LA::MPI::Vector temp_vect_1; // mutable: writable from the const vmult/Tvmult members
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+    };
+
+    template<int dim>
+    class JinvMatrixDirect : public TrilinosWrappers::SparseMatrix { // declares vmult/Tvmult on LA::MPI::Vector over an HMatrixDirect, a GMatrix and d_m_mat
+        public:
+            JinvMatrixDirect(HMatrixDirect<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            void initialize(LA::MPI::Vector &exemplar_density_vector);
+            unsigned int m() const;
+            unsigned int n() const;
+        private: // h_mat, g_mat, d_m_mat are references; d_m_inv_mat and the temp vectors are owned
+            HMatrixDirect<dim> &h_mat;
+            GMatrix &g_mat;
+            const LA::MPI::SparseMatrix &d_m_mat;
+            LA::MPI::SparseMatrix d_m_inv_mat; // NOTE(review): no initialize() argument supplies this here - confirm how it is filled
+            mutable LA::MPI::Vector temp_vect_1; // mutable: writable from the const vmult/Tvmult members
+            mutable LA::MPI::Vector temp_vect_2;
+            mutable LA::MPI::Vector temp_vect_3;
+            mutable LA::MPI::Vector temp_vect_4;
+    };
+
+    
+
     template<int dim>
     class TopOptSchurPreconditioner: public Subscriptor {
     public:
-        TopOptSchurPreconditioner(BlockSparseMatrix<double> &matrix_in);
-        void initialize (BlockSparseMatrix<double> &matrix, const std::map<types::global_dof_index, double> &boundary_values, const DoFHandler<dim> &dof_handler, const double barrier_size, const BlockVector<double> &state);
-        void vmult(BlockVector<double> &dst, const BlockVector<double> &src) const;
-        void Tvmult(BlockVector<double> &dst, const BlockVector<double> &src) const;
-        void vmult_add(BlockVector<double> &dst, const BlockVector<double> &src) const;
-        void Tvmult_add(BlockVector<double> &dst, const BlockVector<double> &src) const;
+        TopOptSchurPreconditioner(LA::MPI::BlockSparseMatrix &matrix_in, DoFHandler<dim> &big_dof_handler_in, MF_Elasticity_Operator<dim,1,double> &mf_elasticity_operator_in , PreconditionMG<dim,LinearAlgebra::distributed::Vector<double>,MGTransferMatrixFree<dim, double>>
+                                  &mf_gmg_preconditioner_in, std::map<types::global_dof_index,types::global_dof_index> &displacement_to_system_dof_index_map);
+        void initialize (LA::MPI::BlockSparseMatrix &matrix, const std::map<types::global_dof_index, double> &boundary_values, const DoFHandler<dim> &dof_handler, const LA::MPI::BlockVector &distributed_state);
+        void vmult(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
+        void Tvmult(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
+        void vmult_add(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
+        void Tvmult_add(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
         void clear();
         unsigned int m() const;
         unsigned int n() const;
         void get_sparsity_pattern(BlockDynamicSparsityPattern &bdsp);
 
-        void assemble_mass_matrix(const BlockVector<double> &state, const hp::FECollection<dim> &fe_system, const DoFHandler<dim> &dof_handler, const AffineConstraints<double> &constraints,   const BlockSparsityPattern &bsp);
+        void assemble_mass_matrix(const LA::MPI::BlockVector &state, const hp::FECollection<dim> &fe_system, const DoFHandler<dim> &dof_handler, const AffineConstraints<double> &constraints,   const BlockSparsityPattern &bsp);
 
-        void print_stuff(const BlockSparseMatrix<double> &matrix);
+        void print_stuff();
 
-        BlockSparseMatrix<double> &system_matrix;
+        LA::MPI::BlockSparseMatrix &system_matrix;
 
     private:
+        MPI_Comm  mpi_communicator;
         unsigned int n_rows;
         unsigned int n_columns;
         unsigned int n_block_rows;
         unsigned int n_block_columns;
-        void vmult_step_1(BlockVector<double> &dst, const BlockVector<double> &src) const;
-        void vmult_step_2(BlockVector<double> &dst, const BlockVector<double> &src) const;
-        void vmult_step_3(BlockVector<double> &dst, const BlockVector<double> &src) const;
-        void vmult_step_4(BlockVector<double> &dst, const BlockVector<double> &src) const;
-        void vmult_step_5(BlockVector<double> &dst, const BlockVector<double> &src) const;
+        void vmult_step_1(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
+        void vmult_step_2(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
+        void vmult_step_3(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
+        void vmult_step_4(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
+        void vmult_step_5(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const;
 
         BlockSparsityPattern mass_sparsity;
-        BlockSparseMatrix<double> approx_h_mat;
+        LA::MPI::BlockSparseMatrix approx_h_mat;
 
         SolverControl other_solver_control;
-        mutable SolverBicgstab<Vector<double>> other_bicgstab;
-        mutable SolverGMRES<Vector<double>> other_gmres;
-        mutable SolverCG<Vector<double>> other_cg;
-
-        SparseMatrix<double> &a_mat;
-        const SparseMatrix<double> &b_mat;
-        const SparseMatrix<double> &c_mat;
-        const SparseMatrix<double> &e_mat;
-        const SparseMatrix<double> &f_mat;
-        const SparseMatrix<double> &d_m_mat;
-        const SparseMatrix<double> &d_1_mat;
-        const SparseMatrix<double> &d_2_mat;
-        const SparseMatrix<double> &m_vect;
-
-        SparseMatrix<double> d_3_mat;
-        SparseMatrix<double> d_4_mat;
-        SparseMatrix<double> d_5_mat;
-        SparseMatrix<double> d_6_mat;
-        SparseMatrix<double> d_7_mat;
-        SparseMatrix<double> d_8_mat;
-        SparseMatrix<double> d_m_inv_mat;
-
-        FullMatrix<double> g_mat;
-        FullMatrix<double> h_mat;
-        FullMatrix<double> k_inv_mat;
-        LAPACKFullMatrix<double> k_mat;
-
-        mutable Vector<double> pre_j;
-        mutable Vector<double> pre_k;
-        mutable Vector<double> g_d_m_inv_density;
-        mutable Vector<double> k_g_d_m_inv_density;
-
-        SparseDirectUMFPACK a_inv_direct;
+        mutable SolverBicgstab<LA::MPI::Vector> other_bicgstab;
+        mutable SolverGMRES<LA::MPI::Vector> other_gmres;
+        mutable SolverCG<LA::MPI::Vector> other_cg;
+
+        LA::MPI::SparseMatrix &a_mat;
+        const LA::MPI::SparseMatrix &b_mat;
+        const LA::MPI::SparseMatrix &c_mat;
+        const LA::MPI::SparseMatrix &e_mat;
+        const LA::MPI::SparseMatrix &f_mat;
+        const LA::MPI::SparseMatrix &f_t_mat;
+        const LA::MPI::SparseMatrix &d_m_mat;
+        const LA::MPI::SparseMatrix &d_1_mat;
+        const LA::MPI::SparseMatrix &d_2_mat;
+        const LA::MPI::SparseMatrix &m_vect;
+        const DoFHandler<dim> &big_dof_handler;
+
+        LA::MPI::SparseMatrix d_3_mat;
+        LA::MPI::SparseMatrix d_4_mat;
+        LA::MPI::SparseMatrix d_5_mat;
+        LA::MPI::SparseMatrix d_6_mat;
+        LA::MPI::SparseMatrix d_7_mat;
+        LA::MPI::SparseMatrix d_8_mat;
+        LA::MPI::SparseMatrix d_m_inv_mat;
+
+        mutable LA::MPI::Vector pre_j;
+        mutable LA::MPI::Vector pre_k;
+        mutable LA::MPI::Vector g_d_m_inv_density;
+        mutable LA::MPI::Vector k_g_d_m_inv_density;
 
+        std::string solver_type;
+        TrilinosWrappers::SolverDirect::AdditionalData additional_data;
+        SolverControl direct_solver_control;
+        mutable VmultTrilinosSolverDirect a_inv_direct;
+
+        mutable AInvMatMFGMG<dim> a_inv_mf_gmg;
+        ConditionalOStream pcout;
         mutable TimerOutput timer;
 
+        mutable TrilinosWrappers::PreconditionAMG pre_amg;
+
+        mutable GMatrix g_mat;
+        HMatrix<dim> h_mat;
+
+        JinvMatrix<dim> j_inv_mat;
+        KinvMatrix<dim> k_inv_mat;
+
+        JinvMatrixPart<dim> j_inv_part;
+        KinvMatrixPart<dim> k_inv_part;
+
+        mutable int num_mults;
+
+    };
+
+        template<int dim>
+    class PolyPreJ {
+        // Declares a vmult on LA::MPI::Vector built from a referenced JinvMatrixPart and an integer degree.
+        public:
+            PolyPreJ(const JinvMatrixPart<dim> &inner_matrix_in, const int degree_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            // void vmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const;
+            // NOTE(review): presumably a polynomial preconditioner of order `degree` - confirm in the definition.
+            // inner_matrix is a reference member, so the referenced object must outlive this one.
+        private:
+            const JinvMatrixPart<dim> &inner_matrix;
+            const int degree;
+    };
+
+    template<int dim>
+    class PolyPreK {
+        // Declares a vmult on LA::MPI::Vector built from a referenced KinvMatrixPart and an integer degree.
+        public:
+            PolyPreK(const KinvMatrixPart<dim> &inner_matrix_in, const int degree_in);
+            void vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const;
+            // void vmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const;
+            // NOTE(review): presumably a polynomial preconditioner of order `degree` - confirm in the definition.
+            // inner_matrix is a reference member, so the referenced object must outlive this one.
+        private:
+            const KinvMatrixPart<dim> &inner_matrix;
+            const int degree;
     };
 
+
 }
 #endif //SAND_SCHUR_PRECONDITIONER_H
diff --git a/include/watchdog.h b/include/watchdog.h
new file mode 100644
index 0000000..3ce4dce
--- /dev/null
+++ b/include/watchdog.h
@@ -0,0 +1,69 @@
+#pragma once
+#include <deal.II/lac/block_vector.h>
+#include <deal.II/lac/packaged_operation.h>
+#include <deal.II/grid/tria.h>
+#include <deal.II/grid/grid_refinement.h>
+#include <iostream>
+#include "../include/markov_filter.h"
+#include "../include/kkt_system.h"
+#include "../include/input_information.h"
+#include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/lac/trilinos_parallel_block_vector.h>
+#include <deal.II/base/conditional_ostream.h>
+#include <deal.II/base/utilities.h>
+
+/// Above are fairly normal files to include. I also use the sparse direct package, which requires BLAS/LAPACK
+/// to perform a direct solve while I work on a fast iterative solver for this problem.
+
+namespace SAND {
+    namespace LA
+    {
+        using namespace dealii::LinearAlgebraTrilinos;
+    }
+
+
+    using namespace dealii;
+
+    /// Below is the main class for solving this problem. It handles the nonlinear solver portion of the problem,
+    /// taking information from the KKTSystem class for step directions, and calculating step lengths. This class
+    /// not only takes those steps, but handles the barrier parameter for the log barrier used.
+    template<int dim>
+    class NonlinearWatchdog {
+    public:
+        NonlinearWatchdog();
+
+        void
+        run(); // the only public member besides the constructor
+
+    private:
+        MPI_Comm  mpi_communicator;
+        std::pair<double,double> // NOTE(review): meaning of the two doubles is not visible here - confirm in the definition
+        calculate_max_step_size(const LA::MPI::BlockVector &state, const LA::MPI::BlockVector &step) const;
+
+        const LA::MPI::BlockVector // NOTE(review): const by-value return prevents moving from the result; must match the out-of-line definition
+        find_max_step(const LA::MPI::BlockVector &state);
+
+        LA::MPI::BlockVector // returns a new block vector; both arguments are read-only
+        take_scaled_step(const LA::MPI::BlockVector &state,const LA::MPI::BlockVector &max_step) const;
+
+        bool
+        check_convergence(const LA::MPI::BlockVector &state) const;
+
+        void
+        update_barrier(LA::MPI::BlockVector &current_state); // non-const: may modify members such as barrier_size - confirm
+
+        void
+        perform_initial_setup();
+
+        void // current_state, current_step and iteration_number are non-const references, i.e. in/out parameters
+        nonlinear_step(LA::MPI::BlockVector &current_state, LA::MPI::BlockVector &current_step, const unsigned int max_uphill_steps, unsigned int &iteration_number);
+
+        KktSystem<dim> kkt_system;
+        MarkovFilter markov_filter;
+        double barrier_size;
+        bool mixed_barrier_monotone_mode;
+        ConditionalOStream pcout; // NOTE(review): presumably restricted to one MPI rank - confirm in the constructor
+        TimerOutput overall_timer;
+    };
+
+} // namespace SAND
diff --git a/source/density_filter.cc b/source/density_filter.cc
index 184b4a6..4e64a56 100644
--- a/source/density_filter.cc
+++ b/source/density_filter.cc
@@ -7,101 +7,260 @@
 #include <deal.II/lac/block_sparse_matrix.h>
 #include <deal.II/lac/precondition.h>
 #include <deal.II/grid/tria.h>
+#include <deal.II/grid/cell_id.h>
 #include <deal.II/numerics/vector_tools.h>
 #include <deal.II/numerics/matrix_tools.h>
 
-namespace SAND {
+namespace SAND
+{
     using namespace dealii;
 
-    /* When initialized, this function takes the current triangulation and creates a matrix corresponding to a
-     * convolution being applied to a piecewise constant function on that triangulation  */
+    template<int dim>
+    DensityFilter<dim>::DensityFilter() :
+        mpi_communicator(MPI_COMM_WORLD),
+        pcout(std::cout,(Utilities::MPI::this_mpi_process(mpi_communicator) == 0))
+    {
+    }
+
+    /// When initialized, this function takes the DoF handler built on the current triangulation and creates a matrix
+    /// corresponding to a convolution being applied to a piecewise constant function on that triangulation.
+    ///
     template<int dim>
     void
-    DensityFilter<dim>::initialize(Triangulation<dim> &triangulation) {
-        DynamicSparsityPattern filter_dsp;
-        filter_dsp.reinit(triangulation.n_active_cells(),
-                          triangulation.n_active_cells());
+    DensityFilter<dim>::initialize(DoFHandler<dim> &dof_handler) {
+        ///Start by making vectors to fill with information about the x,y,z coords of centers of cells
+        ///
+        std::vector<unsigned int> block_component(10, 2);
+        block_component[SolutionBlocks::density] = 0;
+        block_component[SolutionBlocks::displacement] = 1;
+        const std::vector<types::global_dof_index> dofs_per_block =
+                DoFTools::count_dofs_per_fe_block(dof_handler, block_component);
+        const unsigned int n_p = dofs_per_block[0];
+        IndexSet local_owned = dof_handler.locally_owned_dofs().get_view(0, n_p);
+        x_coord.resize(n_p);
+        y_coord.resize(n_p);
+        z_coord.resize(n_p);
+        auto row_sum = z_coord;
+        auto row_sum_full = z_coord;
+        cell_m.resize(n_p);
+        x_coord_part.resize(n_p);
+        y_coord_part.resize(n_p);
+        z_coord_part.resize(n_p);
+        cell_m_part.resize(n_p);
+
+        filter_dsp.reinit(dofs_per_block[0],
+                          dofs_per_block[0]);
+        filter_sparsity_pattern.copy_from(filter_dsp);
 
+        // const auto owned_dofs = dof_handler.locally_owned_dofs().get_view(0, dofs_per_block[0]);
+
+        // filter_matrix.reinit(owned_dofs, filter_sparsity_pattern, MPI_COMM_WORLD);
+
+
+        // //identity filter
+        // for (const auto &cell : dof_handler.active_cell_iterators())
+        // {
+        //     if(cell->is_locally_owned())
+        //     {
+        //         std::vector<unsigned int> i(cell->get_fe().n_dofs_per_cell());
+        //         cell->get_dof_indices(i);
+        //         filter_matrix.add(i[cell->get_fe().component_to_system_index(0, 0)], i[cell->get_fe().component_to_system_index(0, 0)], 1.0);
+        //     }
+        // }
+       
         std::set<unsigned int> neighbor_ids;
-        std::set<typename Triangulation<dim>::cell_iterator> cells_to_check;
-        std::set<typename Triangulation<dim>::cell_iterator> cells_to_check_temp;
-
-        /*finds neighbors whose values would be relevant, and adds them to the sparsity pattern of the matrix*/
-        for (const auto &cell : triangulation.active_cell_iterators()) {
-            const unsigned int i = cell->active_cell_index();
-            for (const auto &neighbor_cell : find_relevant_neighbors(cell)) {
-                const unsigned int j = neighbor_cell->active_cell_index();
-                filter_dsp.add(i, j);
+        std::set<typename DoFHandler<dim>::cell_iterator> cells_to_check;
+        std::set<typename DoFHandler<dim>::cell_iterator> cells_to_check_temp;
+        ///finds neighbors whose values would be relevant, and adds them to the sparsity pattern of the matrix
+         for (const auto &cell : dof_handler.active_cell_iterators())
+         {
+             if(cell->is_locally_owned())
+             {
+                std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+                cell->get_dof_indices(i);
+                const unsigned int i_val = i[cell->get_fe().component_to_system_index(0, 0)];
+                x_coord_part[i_val] = cell->center()[0] ;
+                y_coord_part[i_val] = cell->center()[1] ;
+                cell_m_part[i_val] = cell->measure();
+                if (dim==3)
+                {
+                    z_coord_part[i_val] = cell->center()[2] ;
+                }
+             }
+         }
+        MPI_Allreduce(x_coord_part.data(), x_coord.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        MPI_Allreduce(y_coord_part.data(), y_coord.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        MPI_Allreduce(z_coord_part.data(), z_coord.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        MPI_Allreduce(cell_m_part.data(), cell_m.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+
+        for (const auto &cell : dof_handler.active_cell_iterators()) {
+            if(cell->is_locally_owned())
+            {
+                std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+                cell->get_dof_indices(i);
+                for (const auto &neighbor_cell_index : find_relevant_neighbors(i[cell->get_fe().component_to_system_index(0, 0)]))
+                {
+                    filter_dsp.add(i[cell->get_fe().component_to_system_index(0, 0)], neighbor_cell_index);
+                }
             }
         }
-
         filter_sparsity_pattern.copy_from(filter_dsp);
-        filter_matrix.reinit(filter_sparsity_pattern);
+        const auto owned_dofs = dof_handler.locally_owned_dofs().get_view(4 * n_p, 5 * n_p);
 
-        /*adds values to the matrix corresponding to the max radius - */
-        for (const auto &cell : triangulation.active_cell_iterators())
-        {
-            const unsigned int i = cell->active_cell_index();
-            for (const auto &neighbor_cell : find_relevant_neighbors(cell)) {
-                const unsigned int j = neighbor_cell->active_cell_index();
-                const double d =
-                        cell->center().distance(neighbor_cell->center());
-                /*value should be (max radius - distance between cells)*cell measure */
-                double value = (Input::filter_r - d)*neighbor_cell->measure();
-                filter_matrix.add(i, j, value);
-            }
-        }
+        filter_matrix.reinit(owned_dofs, filter_sparsity_pattern, MPI_COMM_WORLD);
+        filter_matrix_transpose.reinit(owned_dofs, filter_sparsity_pattern, MPI_COMM_WORLD);
 
-        //here we normalize the filter so it computes an average. Sum of values in a row should be 1
-        for (const auto &cell : triangulation.active_cell_iterators())
+        /// adds values to the matrix corresponding to the max radius - distance
+        for (const auto &cell : dof_handler.active_cell_iterators())
         {
-            const unsigned int i = cell->active_cell_index();
-            double denominator = 0;
-            typename SparseMatrix<double>::iterator iter = filter_matrix.begin(
-                    i);
-            for (; iter != filter_matrix.end(i); iter++)
+            if(cell->is_locally_owned())
             {
-                denominator = denominator + iter->value();
+                std::vector<unsigned int> i(cell->get_fe().n_dofs_per_cell());
+                cell->get_dof_indices(i);
+                auto cell_index = i[cell->get_fe().component_to_system_index(0, 0)];
+                double value_total = 0;
+                for (const auto &neighbor_cell_index : find_relevant_neighbors(cell_index))
+                {
+                    double d_x = std::abs(x_coord[cell_index]-x_coord[neighbor_cell_index]);
+                    double d_y = std::abs(y_coord[cell_index]-y_coord[neighbor_cell_index]);
+                    double d;
+                    if (dim==3)
+                    {
+                        double d_z = std::abs(z_coord[cell_index]-z_coord[neighbor_cell_index]);
+                        d = std::pow(d_x*d_x + d_y*d_y + d_z*d_z , .5);
+                    }
+                    else
+                    {
+                        d = std::pow(d_x*d_x + d_y*d_y , .5);
+                    }
+                    ///value should be (max radius - distance between cells)*cell measure
+                    double value = (Input::filter_r - d)*cell_m[neighbor_cell_index];
+                    value_total += value;
+                }
+                row_sum[cell_index] = value_total;
+                
             }
-            iter = filter_matrix.begin(i);
-            for (; iter != filter_matrix.end(i); iter++)
+        }
+        MPI_Allreduce(row_sum.data(), row_sum_full.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        for (const auto &cell : dof_handler.active_cell_iterators())
+        {
+            if(cell->is_locally_owned())
             {
-                iter->value() = iter->value() / denominator;
+                std::vector<unsigned int> i(cell->get_fe().n_dofs_per_cell());
+                cell->get_dof_indices(i);
+                auto cell_index = i[cell->get_fe().component_to_system_index(0, 0)];
+                for (const auto &neighbor_cell_index : find_relevant_neighbors(cell_index))
+                {
+                    double d_x = std::abs(x_coord[cell_index]-x_coord[neighbor_cell_index]);
+                    double d_y = std::abs(y_coord[cell_index]-y_coord[neighbor_cell_index]);
+                    double d;
+                    if (dim==3)
+                    {
+                        double d_z = std::abs(z_coord[cell_index]-z_coord[neighbor_cell_index]);
+                        d = std::pow(d_x*d_x + d_y*d_y + d_z*d_z , .5);
+                    }
+                    else
+                    {
+                        d = std::pow(d_x*d_x + d_y*d_y , .5);
+                    }
+                    ///value should be (max radius - distance between cells)*cell measure
+                    double value = (Input::filter_r - d)*cell_m[neighbor_cell_index];
+                    filter_matrix.set(cell_index, neighbor_cell_index, value/row_sum_full[cell_index]);
+                    filter_matrix_transpose.set(cell_index, neighbor_cell_index, value/row_sum_full[neighbor_cell_index]);
+                }
             }
         }
+        double sum_sum = 0;
+        double x_sum = 0;
+        double y_sum = 0;
+        double z_sum = 0;
+        for (int i=0; i< row_sum_full.size(); i++)
+        {
+            sum_sum += std::abs(row_sum_full[i]);
+            x_sum += std::abs(x_coord[i]);
+            y_sum += std::abs(y_coord[i]);
+            z_sum += std::abs(z_coord[i]);
+        }
+        filter_matrix.compress(VectorOperation::insert);
+        filter_matrix_transpose.compress(VectorOperation::insert);
+
+        /// The filter is normalized above (each entry is divided by its row sum, so the values in a row sum to 1); the iterator-based normalization below is disabled.
+        // for (const auto &cell : dof_handler.active_cell_iterators())
+        // {
+        //     if(cell->is_locally_owned())
+        //     {
+        //         std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+        //         cell->get_dof_indices(i);
+        //         const int i_ind = cell->get_fe().component_to_system_index(0, 0);
+        //         double denominator = 0;
+        //         typename LA::MPI::SparseMatrix::iterator iter = filter_matrix.begin(
+        //                 i[i_ind]);
+        //         for (; iter != filter_matrix.end(i[i_ind]); iter++)
+        //         {
+        //             denominator = denominator + iter->value();
+        //         }
+        //         iter = filter_matrix.begin(i[i_ind]);
+        //         for (; iter != filter_matrix.end(i[i_ind]); iter++)
+        //         {
+        //             iter->value() = iter->value() / denominator;
+        //         }
+        //     }
+        // }
+        // pcout << "FILTER TO 5" << std::endl;
+        // LA::MPI::Vector test_density_start;
+        // test_density_start.reinit(local_owned, mpi_communicator);
+        // LA::MPI::Vector test_density_end;
+        // test_density_end.reinit(local_owned, mpi_communicator);
+        // test_density_end = 0.;
+        // for (int i = 0; i<n_p; i++)
+        // {
+        //     if (test_density_start.in_local_range(i))
+        //     {
+        //         test_density_start[i] = i;
+        //     }
+        // }
+        // test_density_start.compress(VectorOperation::insert);
+        // filter_matrix.vmult(test_density_end,test_density_start);
+
     }
 
-    /*This function finds which neighbors are within a certain radius of the initial cell.*/
+    ///This function finds which neighbors are within a certain radius of the initial cell.
     template<int dim>
-    std::set<typename Triangulation<dim>::cell_iterator>
-    DensityFilter<dim>::find_relevant_neighbors(typename Triangulation<dim>::cell_iterator cell) const {
-        std::set<unsigned int> neighbor_ids;
-        std::set<typename Triangulation<dim>::cell_iterator> cells_to_check;
-        neighbor_ids.insert(cell->active_cell_index());
-        cells_to_check.insert(cell);
-        bool new_neighbors_found;
-        do {
-            new_neighbors_found = false;
-            for (const auto &check_cell :
-                    std::vector<typename Triangulation<dim>::cell_iterator>(
-                            cells_to_check.begin(), cells_to_check.end())) {
-                for (const auto n : check_cell->face_indices()) {
-                    if (!(check_cell->face(n)->at_boundary())) {
-                        const auto &neighbor = check_cell->neighbor(n);
-                        const double distance =
-                                cell->center().distance(neighbor->center());
-                        if ((distance < Input::filter_r) &&
-                            !(neighbor_ids.count(neighbor->active_cell_index())))
+    std::set<types::global_dof_index>
+    DensityFilter<dim>::find_relevant_neighbors(types::global_dof_index cell_index) const
+    {
+        double d_x,d_y,d_z;
+        std::set<types::global_dof_index> relevant_cells;
+            for (unsigned int i=0; i < x_coord.size(); i++)
+            {
+                d_x = std::abs(x_coord[cell_index]-x_coord[i]);
+
+                if (d_x < Input::filter_r)
+                {
+                    d_y = std::abs(y_coord[cell_index]-y_coord[i]);
+
+                    if ((d_x*d_x + d_y*d_y) < (Input::filter_r*Input::filter_r))
+                    {
+
+                        if (dim == 3)
+                        {
+                            d_z = std::abs(z_coord[cell_index]-z_coord[i]);
+
+                            if ((d_x*d_x + d_y*d_y + d_z*d_z) < (Input::filter_r*Input::filter_r))
+                            {
+                                relevant_cells.insert(i);
+                            }
+                        }
+                        else
                         {
-                            cells_to_check.insert(neighbor);
-                            neighbor_ids.insert(neighbor->active_cell_index());
-                            new_neighbors_found = true;
+                            relevant_cells.insert(i);
                         }
+
                     }
                 }
-            }
-        } while (new_neighbors_found);
-        return cells_to_check;
+        }
+        return relevant_cells;
+
     }
 
 }//SAND namespace
diff --git a/source/kkt_system.cc b/source/kkt_system.cc
index e505e36..12b5c8b 100644
--- a/source/kkt_system.cc
+++ b/source/kkt_system.cc
@@ -7,18 +7,16 @@
 #include <deal.II/base/tensor.h>
 #include <deal.II/base/timer.h>
 
-#include <deal.II/lac/block_vector.h>
 #include <deal.II/lac/full_matrix.h>
-#include <deal.II/lac/block_sparse_matrix.h>
-#include <deal.II/lac/precondition.h>
 #include <deal.II/lac/linear_operator.h>
 #include <deal.II/lac/solver_gmres.h>
+#include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/lac/trilinos_sparse_matrix.h>
+
 
 #include <deal.II/lac/matrix_out.h>
 
-#include <deal.II/grid/tria.h>
 #include <deal.II/grid/grid_generator.h>
-#include <deal.II/grid/grid_refinement.h>
 
 #include <deal.II/dofs/dof_renumbering.h>
 #include <deal.II/dofs/dof_tools.h>
@@ -37,86 +35,191 @@
 #include <deal.II/numerics/data_out.h>
 #include <deal.II/numerics/error_estimator.h>
 
+
+#include <deal.II/base/conditional_ostream.h>
+
 #include "../include/input_information.h"
-#include "../include/sand_tools.h"
+#include "../include/matrix_free_elasticity.h"
+#include "../include/poly_pre.h"
 
 #include <iostream>
 #include <algorithm>
 
-// This problem initializes with a FESystem composed of 2×dim FE_Q(1) elements, and 8 FE_DGQ(0)  elements.
-// The  piecewise  constant  functions  are  for  density-related  variables,and displacement-related variables are assigned to the FE_Q(1) elements.
+/// This problem initializes with a FESystem composed of 2×dim FE_Q(1) elements, and 8 FE_DGQ(0) elements.
+/// The piecewise constant functions are for density-related variables, and displacement-related variables are assigned to the FE_Q(1) elements.
 namespace SAND {
-    template<int dim>
-    KktSystem<dim>::KktSystem()
-            :
-            dof_handler(triangulation),
-            /*fe should have 1 FE_DGQ<dim>(0) element for density, dim FE_Q finite elements for displacement,
-             * another dim FE_Q elements for the lagrange multiplier on the FE constraint, and 2 more FE_DGQ<dim>(0)
-             * elements for the upper and lower bound constraints */
-            fe_nine(FE_DGQ<dim>(0) ^ 5,
-                    (FESystem<dim>(FE_Q<dim>(1) ^ dim)) ^ 2,
-                    FE_DGQ<dim>(0) ^ 2,
-                    FE_Nothing<dim>() ^ 1),
-            fe_ten(FE_DGQ<dim>(0) ^ 5,
-                   (FESystem<dim>(FE_Q<dim>(1) ^ dim)) ^ 2,
-                   FE_DGQ<dim>(0) ^ 2,
-                   FE_DGQ<dim>(0) ^ 1),
-            density_ratio(Input::volume_percentage),
-            density_penalty_exponent(Input::density_penalty_exponent),
-            density_filter() {
-        fe_collection.push_back(fe_nine);
-        fe_collection.push_back(fe_ten);
+
+///Necessary functions for going between Trilinos vectors and multigrid-compatible distributed vectors.
+namespace ChangeVectorTypes
+{
+template <typename number>
+void copy_from_displacement_to_system_vector(LA::MPI::Vector                                           &out,
+                                             const dealii::LinearAlgebra::distributed::Vector<number>  &in,
+                                             std::map<types::global_dof_index,types::global_dof_index>  & displacement_to_system_dof_index_map)
+{
+//    dealii::LinearAlgebra::ReadWriteVector<double> rwv(
+//                out.locally_owned_elements());
+//    rwv.import(in, VectorOperation::insert);
+    for (const auto &index_pair : displacement_to_system_dof_index_map)
+    {
+        out[index_pair.second] = in[index_pair.first];
+    }
+//    out.import(rwv, VectorOperation::insert);
+}
+
+template <typename number>
+void copy_from_system_to_displacement_vector(dealii::LinearAlgebra::distributed::Vector<number>  &out,
+                                             const LA::MPI::Vector                                           &in,
+                                             std::map<types::global_dof_index,types::global_dof_index>  & displacement_to_system_dof_index_map)
+{
+//    dealii::LinearAlgebra::ReadWriteVector<double> rwv(
+//                out.locally_owned_elements());
+//    rwv.import(in, VectorOperation::insert);
+    ConditionalOStream pcout (std::cout,(Utilities::MPI::this_mpi_process(MPI_COMM_WORLD) == 1));
+    for (const auto &index_pair : displacement_to_system_dof_index_map)
+    {
+        out[index_pair.first] = in[index_pair.second];
     }
+//    out.import(rwv, VectorOperation::insert);
+}
+
+template <typename number>
+void copy(LA::MPI::Vector &                                         out,
+          const dealii::LinearAlgebra::distributed::Vector<number> &in)
+{
+    dealii::LinearAlgebra::ReadWriteVector<double> rwv(
+                out.locally_owned_elements());
+    rwv.import(in, VectorOperation::insert);
+    out.import(rwv, VectorOperation::insert);
+}
+template <typename number>
+void copy(dealii::LinearAlgebra::distributed::Vector<number> &out,
+          const LA::MPI::Vector &                             in)
+{
+    dealii::LinearAlgebra::ReadWriteVector<double> rwv;
+    rwv.reinit(in);
+    out.import(rwv, VectorOperation::insert);
+}
+
+
+} // namespace ChangeVectorTypes
+
+///The KKTSystem class calculates the Hessian and Gradient of the Lagrangian of the system, and solves the resulting system to be used
+/// as a step direction for the overarching solver.
+template<int dim>
+KktSystem<dim>::KktSystem()
+    :
+      mpi_communicator(MPI_COMM_WORLD),
+      triangulation(mpi_communicator,
+                    Triangulation<dim>::limit_level_difference_at_vertices,
+                    parallel::distributed::Triangulation<dim>::construct_multigrid_hierarchy),
+      dof_handler(triangulation),
+      dof_handler_displacement(triangulation),
+      dof_handler_density(triangulation),
+      /*fe should have 1 FE_DGQ<dim>(0) element for density, dim FE_Q finite elements for displacement,
+                   * another dim FE_Q elements for the lagrange multiplier on the FE constraint, and 2 more FE_DGQ<dim>(0)
+                   * elements for the upper and lower bound constraints */
+      fe_nine(FE_DGQ<dim>(0) ^ 5,
+              (FESystem<dim>(FE_Q<dim>(1) ^ dim)) ^ 2,
+              FE_DGQ<dim>(0) ^ 2,
+              FE_Nothing<dim>() ^ 1),
+      fe_ten(FE_DGQ<dim>(0) ^ 5,
+             (FESystem<dim>(FE_Q<dim>(1) ^ dim)) ^ 2,
+             FE_DGQ<dim>(0) ^ 2,
+             FE_DGQ<dim>(0) ^ 1),
+      fe_displacement(FE_Q<dim>(1) ^ dim),
+      fe_density(0),
+      density_ratio(Input::volume_percentage),
+      density_penalty_exponent(Input::density_penalty_exponent),
+      density_filter(),
+      pcout(std::cout,(Utilities::MPI::this_mpi_process(mpi_communicator) == 0))
+{
+    fe_collection.push_back(fe_nine);
+    fe_collection.push_back(fe_ten);
+
+}
+
+
+/// A function used once at the beginning of the program; it creates a matrix H so that H * unfiltered density = filtered density.
+
+template<int dim>
+void
+KktSystem<dim>::setup_filter_matrix() {
+    pcout << "IN KKT FILTER SETUP FUNCTION" << std::endl;
+    density_filter.initialize(dof_handler);
+}
+
+///This triangulation matches the problem description
 
+template<int dim>
+void
+KktSystem<dim>::create_triangulation() {
 
-//A  function  used  once  at  the  beginning  of  the  program,  this  creates  a  matrix  H  so  that H* unfiltered density = filtered density
+    ///Start by defining the sub-blocks of the DoFHandler
 
-    template<int dim>
-    void
-    KktSystem<dim>::setup_filter_matrix() {
+    std::vector<unsigned int> sub_blocks(2*dim+8, 0);
 
-        density_filter.initialize(triangulation);
+    sub_blocks[0]=0;
+    sub_blocks[1]=1;
+    sub_blocks[2]=2;
+    sub_blocks[3]=3;
+    sub_blocks[4]=4;
+    for(int i=0; i<dim; i++)
+    {
+        sub_blocks[5+i]=5;
+    }
+    for(int i=0; i<dim; i++)
+    {
+        sub_blocks[5+dim+i]=6;
     }
+    sub_blocks[5+2*dim]=7;
+    sub_blocks[6+2*dim]=8;
+    sub_blocks[7+2*dim]=9;
+
+    ///MBB Beam defined here
+    if (Input::geometry_base == GeometryOptions::mbb) {
+        const double width = 6;
+        const unsigned int width_refine = 6;
+        const double height = 1;
+        const unsigned int height_refine = 1;
+        const double depth = 1;
+        const unsigned int depth_refine = 1;
+        const double downforce_y = 1;
+        const double downforce_x = 3;
+        const double downforce_size = .3;
+
+        if (dim == 2)
+        {
+            GridGenerator::subdivided_hyper_rectangle(triangulation,
+                                                      {width_refine, height_refine},
+                                                      Point<dim>(0, 0),
+                                                      Point<dim>(width, height));
 
-    //This triangulation matches the problem description -
-    // a 6-by-1 rectangle where a force will be applied in the top center.
-
-    template<int dim>
-    void
-    KktSystem<dim>::create_triangulation() {
-        if (Input::geometry_base == GeometryOptions::mbb) {
-            const double width = 6;
-            const unsigned int width_refine = 6;
-            const double height = 1;
-            const unsigned int height_refine = 1;
-            const double depth = 1;
-            const unsigned int depth_refine = 1;
-            const double downforce_y = 1;
-            const double downforce_x = 3;
-            const double downforce_size = .3;
-
-            if (dim == 2) {
-                GridGenerator::subdivided_hyper_rectangle(triangulation,
-                                                          {width_refine, height_refine},
-                                                          Point<dim>(0, 0),
-                                                          Point<dim>(width, height));
-
-                triangulation.refine_global(Input::refinements);
-
-                /*Set BCIDs   */
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
+            triangulation.refine_global(Input::refinements);
+
+            /*Set BCIDs   */
+            for (const auto &cell: dof_handler.active_cell_iterators())
+            {
+                if(cell->is_locally_owned())
+                {
                     cell->set_active_fe_index(0);
                     cell->set_material_id(MaterialIds::without_multiplier);
                     for (unsigned int face_number = 0;
                          face_number < GeometryInfo<dim>::faces_per_cell;
-                         ++face_number) {
-                        if (cell->face(face_number)->at_boundary()) {
+                         ++face_number)
+                    {
+                        if (cell->face(face_number)->at_boundary())
+                        {
                             const auto center = cell->face(face_number)->center();
 
-                            if (std::fabs(center(1) - downforce_y) < 1e-12) {
-                                if (std::fabs(center(0) - downforce_x) < downforce_size) {
+                            if (std::fabs(center(1) - downforce_y) < 1e-12)
+                            {
+                                if (std::fabs(center(0) - downforce_x) < downforce_size)
+                                {
                                     cell->face(face_number)->set_boundary_id(BoundaryIds::down_force);
-                                } else {
+                                }
+                                else
+                                {
                                     cell->face(face_number)->set_boundary_id(BoundaryIds::no_force);
                                 }
                             }
@@ -126,25 +229,27 @@ namespace SAND {
                          vertex_number < GeometryInfo<dim>::vertices_per_cell;
                          ++vertex_number) {
                         if (std::abs(cell->vertex(vertex_number)(0)) + std::abs(cell->vertex(vertex_number)(1)) <
-                            1e-10) {
+                                1e-10) {
                             cell->set_active_fe_index(1);
                             cell->set_material_id(MaterialIds::with_multiplier);
                         }
                     }
                 }
+            }
 
-                dof_handler.distribute_dofs(fe_collection);
-
-                DoFRenumbering::component_wise(dof_handler);
-            } else if (dim == 3) {
-                GridGenerator::subdivided_hyper_rectangle(triangulation,
-                                                          {width_refine, height_refine, depth_refine},
-                                                          Point<dim>(0, 0, 0),
-                                                          Point<dim>(width, height, depth));
+        }
+        else if (dim == 3)
+        {
+            GridGenerator::subdivided_hyper_rectangle(triangulation,
+                                                      {width_refine, height_refine, depth_refine},
+                                                      Point<dim>(0, 0, 0),
+                                                      Point<dim>(width, height, depth));
 
-                triangulation.refine_global(Input::refinements);
+            triangulation.refine_global(Input::refinements);
 
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
+            for (const auto &cell: dof_handler.active_cell_iterators()) {
+                if (cell->is_locally_owned())
+                {
                     cell->set_active_fe_index(0);
                     cell->set_material_id(MaterialIds::without_multiplier);
                     for (unsigned int face_number = 0;
@@ -166,43 +271,43 @@ namespace SAND {
                          vertex_number < GeometryInfo<dim>::vertices_per_cell;
                          ++vertex_number) {
                         if (std::abs(cell->vertex(vertex_number)(0)) + std::abs(cell->vertex(vertex_number)(1))
-                            + std::abs(cell->vertex(vertex_number)(2)) < 1e-10) {
+                                + std::abs(cell->vertex(vertex_number)(2)) < 1e-10) {
                             cell->set_active_fe_index(1);
                             cell->set_material_id(MaterialIds::with_multiplier);
                         }
                     }
                 }
-
-                dof_handler.distribute_dofs(fe_collection);
-
-                DoFRenumbering::component_wise(dof_handler);
-
-            } else {
-                throw;
             }
-        } else if (Input::geometry_base == GeometryOptions::l_shape) {
-            const double width = 2;
-            const unsigned int width_refine = 2;
-            const double height = 2;
-            const unsigned int height_refine = 2;
-            const double depth = 1;
-            const unsigned int depth_refine = 1;
-            const double downforce_x = 2;
-            const double downforce_y = 1;
-            const double downforce_z = .5;
-            const double downforce_size = .3;
-
-            if (dim == 2) {
-                GridGenerator::subdivided_hyper_L(triangulation,
-                                                  {width_refine, height_refine},
-                                                  Point<dim>(0, 0),
-                                                  Point<dim>(width, height),
-                                                  {-1, -1});
-
-                triangulation.refine_global(Input::refinements);
-
-                /*Set BCIDs   */
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
+
+        } else {
+            throw;
+        }
+    ///L-shaped cantilever with re-entrant corner
+    } else if (Input::geometry_base == GeometryOptions::l_shape) {
+        const double width = 2;
+        const unsigned int width_refine = 2;
+        const double height = 2;
+        const unsigned int height_refine = 2;
+        const double depth = 1;
+        const unsigned int depth_refine = 1;
+        const double downforce_x = 2;
+        const double downforce_y = 1;
+        const double downforce_z = .5;
+        const double downforce_size = .3;
+
+        if (dim == 2) {
+            GridGenerator::subdivided_hyper_L(triangulation,
+                                              {width_refine, height_refine},
+                                              Point<dim>(0, 0),
+                                              Point<dim>(width, height),
+                                              {-1, -1});
+
+            triangulation.refine_global(Input::refinements);
+
+            /*Set BCIDs   */
+            for (const auto &cell: dof_handler.active_cell_iterators()) {
+                if (cell->is_locally_owned())
+                {
                     cell->set_active_fe_index(0);
                     cell->set_material_id(MaterialIds::without_multiplier);
                     for (unsigned int face_number = 0;
@@ -224,28 +329,27 @@ namespace SAND {
                          vertex_number < GeometryInfo<dim>::vertices_per_cell;
                          ++vertex_number) {
                         if (std::abs(cell->vertex(vertex_number)(0)) + std::abs(cell->vertex(vertex_number)(1)) <
-                            1e-10) {
+                                1e-10) {
                             cell->set_active_fe_index(1);
                             cell->set_material_id(MaterialIds::with_multiplier);
                         }
                     }
                 }
+            }
 
-                dof_handler.distribute_dofs(fe_collection);
-
-                DoFRenumbering::component_wise(dof_handler);
-
-            } else if (dim == 3) {
-                GridGenerator::subdivided_hyper_L(triangulation,
-                                                  {width_refine, height_refine, depth_refine},
-                                                  Point<dim>(0, 0, 0),
-                                                  Point<dim>(width, height, depth),
-                                                  {-1, -1, depth_refine});
+        } else if (dim == 3) {
+            GridGenerator::subdivided_hyper_L(triangulation,
+                                              {width_refine, height_refine, depth_refine},
+                                              Point<dim>(0, 0, 0),
+                                              Point<dim>(width, height, depth),
+                                              {-1, -1, depth_refine});
 
-                triangulation.refine_global(Input::refinements);
+            triangulation.refine_global(Input::refinements);
 
-                /*Set BCIDs   */
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
+            /*Set BCIDs   */
+            for (const auto &cell: dof_handler.active_cell_iterators()) {
+                if(cell->is_locally_owned())
+                {
                     cell->set_active_fe_index(0);
                     cell->set_material_id(MaterialIds::without_multiplier);
                     for (unsigned int face_number = 0;
@@ -272,46 +376,62 @@ namespace SAND {
                          vertex_number < GeometryInfo<dim>::vertices_per_cell;
                          ++vertex_number) {
                         if (std::abs(cell->vertex(vertex_number)(0)) + std::abs(cell->vertex(vertex_number)(1)) <
-                            1e-10) {
+                                1e-10) {
                             cell->set_active_fe_index(1);
                             cell->set_material_id(MaterialIds::with_multiplier);
                         }
                     }
                 }
-
-                dof_handler.distribute_dofs(fe_collection);
-
-                DoFRenumbering::component_wise(dof_handler);
-            } else {
-                throw;
             }
         } else {
             throw;
         }
-
+    } else {
+        throw;
     }
 
-// The  bottom  corners  are  kept  in  place  in  the  y  direction  -  the  bottom  left  also  in  the  x direction.
-// Because deal.ii is formulated to enforce boundary conditions along regions of the boundary,
-// we do this to ensure these BCs are only enforced at points.
-    template<int dim>
-    void
-    KktSystem<dim>::setup_boundary_values() {
-        if (Input::geometry_base == GeometryOptions::mbb) {
-            if (dim == 2) {
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
+    dof_handler.distribute_dofs(fe_collection);
+    DoFRenumbering::component_wise(dof_handler, sub_blocks);
+
+    dof_handler_displacement.distribute_dofs(fe_displacement);
+    dof_handler_displacement.distribute_mg_dofs();
 
+    displacement_to_system_dof_index_map.clear();
+
+}
+
+/// Only individual points are given Dirichlet boundary conditions.
+/// For example, in the MBB case, the bottom corners are kept in place in the y direction,
+/// and the bottom-left corner is also kept in place in the x direction.
+/// Because deal.II is formulated to enforce boundary conditions along regions of the boundary,
+/// the constrained DoFs are selected vertex by vertex to ensure these BCs are only enforced at points.
+template<int dim>
+void
+KktSystem<dim>::setup_boundary_values()
+{
+    if (Input::geometry_base == GeometryOptions::mbb)
+    {
+        if (dim == 2)
+        {
+            for (const auto &cell: dof_handler.active_cell_iterators())
+            {
+                if(cell->is_locally_owned())
+                {
                     for (unsigned int face_number = 0;
                          face_number < GeometryInfo<dim>::faces_per_cell;
-                         ++face_number) {
-                        if (cell->face(face_number)->at_boundary()) {
+                         ++face_number)
+                    {
+                        if (cell->face(face_number)->at_boundary())
+                        {
                             for (unsigned int vertex_number = 0;
                                  vertex_number < GeometryInfo<dim>::vertices_per_cell;
-                                 ++vertex_number) {
+                                 ++vertex_number)
+                            {
                                 const auto vert = cell->vertex(vertex_number);
                                 /*Find bottom left corner*/
                                 if (std::fabs(vert(0) - 0) < 1e-12 && std::fabs(
-                                        vert(1) - 0) < 1e-12) {
+                                            vert(1) - 0) < 1e-12)
+                                {
 
                                     const unsigned int x_displacement =
                                             cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
@@ -329,39 +449,139 @@ namespace SAND {
                                 }
                                 /*Find bottom right corner*/
                                 if (std::fabs(vert(0) - 6) < 1e-12 && std::fabs(
-                                        vert(1) - 0) < 1e-12) {
-//                            const unsigned int x_displacement =
-//                                    cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
+                                            vert(1) - 0) < 1e-12)
+                                {
+//                                                                const unsigned int x_displacement =
+//                                                                        cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
                                     const unsigned int y_displacement =
                                             cell->vertex_dof_index(vertex_number, 1, cell->active_fe_index());
-//                            const unsigned int x_displacement_multiplier =
-//                                    cell->vertex_dof_index(vertex_number, 2, cell->active_fe_index());
+//                                                                const unsigned int x_displacement_multiplier =
+//                                                                        cell->vertex_dof_index(vertex_number, 2, cell->active_fe_index());
                                     const unsigned int y_displacement_multiplier =
                                             cell->vertex_dof_index(vertex_number, 3, cell->active_fe_index());
-//                            boundary_values[x_displacement] = 0;
+//                                    boundary_values[x_displacement] = 0;
                                     boundary_values[y_displacement] = 0;
-//                            boundary_values[x_displacement_multiplier] = 0;
+//                                    boundary_values[x_displacement_multiplier] = 0;
                                     boundary_values[y_displacement_multiplier] = 0;
                                 }
                             }
                         }
                     }
                 }
-            } else if (dim == 3) {
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
+
+            }
+            const unsigned int n_levels = triangulation.n_global_levels();
+            level_dirichlet_boundary_dofs.resize(0,n_levels-1);
+            level_boundary_values.resize(0,n_levels-1);
+            mg_level_constraints.resize(0,n_levels-1);
+
+            for(unsigned int level = 0; level < n_levels; ++level)
+            {
+                IndexSet relevant_dofs;
+                DoFTools::extract_locally_relevant_level_dofs(dof_handler_displacement,
+                                                      level,
+                                                      relevant_dofs);
+                mg_level_constraints[level].reinit(relevant_dofs);
+            }
+
+
+            for (auto cell=dof_handler_displacement.begin_active(n_levels-1); 
+                 cell!=dof_handler_displacement.end_active(n_levels-1); 
+                 ++cell)
+            {
+                if(cell->is_locally_owned())
+                {
                     for (unsigned int face_number = 0;
                          face_number < GeometryInfo<dim>::faces_per_cell;
-                         ++face_number) {
-                        if (cell->face(face_number)->at_boundary()) {
+                         ++face_number)
+                    {
+                        if (cell->face(face_number)->at_boundary())
+                        {
                             for (unsigned int vertex_number = 0;
                                  vertex_number < GeometryInfo<dim>::vertices_per_cell;
-                                 ++vertex_number) {
+                                 ++vertex_number)
+                            {
                                 const auto vert = cell->vertex(vertex_number);
                                 /*Find bottom left corner*/
                                 if (std::fabs(vert(0) - 0) < 1e-12 && std::fabs(
-                                        vert(1) - 0) < 1e-12 && ((std::fabs(
-                                        vert(2) - 0) < 1e-12) || (std::fabs(
-                                        vert(2) - 1) < 1e-12))) {
+                                        vert(1) - 0) < 1e-12)
+                                {
+                                     for (unsigned int level = 0; level < n_levels; ++level)
+                                     {
+                                         const unsigned int x_displacement =
+                                                 cell->mg_vertex_dof_index(level, vertex_number, 0, cell->active_fe_index());
+                                         const unsigned int y_displacement =
+                                                 cell->mg_vertex_dof_index(level, vertex_number, 1, cell->active_fe_index());
+                                                 
+                                        /*set bottom left BC*/
+
+                                         level_dirichlet_boundary_dofs[level].insert(x_displacement);
+                                         level_dirichlet_boundary_dofs[level].insert(y_displacement);
+
+                                         level_boundary_values[level][x_displacement] = 0;
+                                         level_boundary_values[level][y_displacement] = 0;
+                                     }
+
+                                }
+                                /*Find bottom right corner*/
+                                if (std::fabs(vert(0) - 6) < 1e-12 && std::fabs(
+                                        vert(1) - 0) < 1e-12)
+                                {
+                                    for (unsigned int level = 0; level < n_levels; ++level)
+                                    {
+
+//                                        const unsigned int x_displacement =
+//                                                cell->mg_vertex_dof_index(level, vertex_number, 0,cell->active_fe_index());
+                                        const unsigned int y_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 1, cell->active_fe_index());
+
+//                                        level_dirichlet_boundary_dofs[level].insert(x_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(y_displacement);
+                                         
+//                                        level_boundary_values[level][x_displacement] = 0;
+                                        level_boundary_values[level][y_displacement] = 0;
+                                    }
+                                }
+                            }
+                        }
+                    }
+                }
+            }
+            for (unsigned int level = 0; level < n_levels; ++level)
+            {
+                IndexSet relevant_dofs;
+                DoFTools::extract_locally_relevant_level_dofs(dof_handler_displacement,level,relevant_dofs);
+                mg_level_constraints[level].add_lines(level_dirichlet_boundary_dofs[level]);
+                mg_level_constraints[level].make_consistent_in_parallel(
+                    dof_handler_displacement.locally_owned_mg_dofs(level),
+                    relevant_dofs,
+                    mpi_communicator
+                );
+                mg_level_constraints[level].close();
+            }
+
+        } else if (dim == 3)
+        {
+            pcout << "setting up BVs" << std::endl;
+            for (const auto &cell: dof_handler.active_cell_iterators()) 
+            {
+                if(cell->is_locally_owned())
+                {
+                    for (unsigned int face_number = 0;
+                         face_number < GeometryInfo<dim>::faces_per_cell;
+                         ++face_number) 
+                    {
+                        if (cell->face(face_number)->at_boundary()) 
+                        {
+                            for (unsigned int vertex_number = 0;
+                                 vertex_number < GeometryInfo<dim>::vertices_per_cell;
+                                 ++vertex_number) {
+                                const auto vert = cell->vertex(vertex_number);
+                                /*Find bottom left corner*/
+                                if (std::fabs(vert(0) - 0) < 1e-12 && 
+                                    std::fabs(vert(1) - 0) < 1e-12 && 
+                                    ((std::fabs(vert(2) - 0) < 1e-12) || (std::fabs(vert(2) - 1) < 1e-12))) 
+                                {
 
 
                                     const unsigned int x_displacement =
@@ -385,26 +605,26 @@ namespace SAND {
                                     boundary_values[z_displacement_multiplier] = 0;
                                 }
                                 /*Find bottom right corner*/
-                                if (std::fabs(vert(0) - 6) < 1e-12 && std::fabs(
-                                        vert(1) - 0) < 1e-12 && ((std::fabs(
-                                        vert(2) - 0) < 1e-12) || (std::fabs(
-                                        vert(2) - 1) < 1e-12))) {
-//                              const unsigned int x_displacement =
-//                                    cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
+                                if (std::fabs(vert(0) - 6) < 1e-12 && 
+                                    std::fabs(vert(1) - 0) < 1e-12 && 
+                                    ((std::fabs(vert(2) - 0) < 1e-12) || (std::fabs(vert(2) - 1) < 1e-12))) 
+                                {
+                                    //                              const unsigned int x_displacement =
+                                    //                                    cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
                                     const unsigned int y_displacement =
                                             cell->vertex_dof_index(vertex_number, 1, cell->active_fe_index());
                                     const unsigned int z_displacement =
                                             cell->vertex_dof_index(vertex_number, 2, cell->active_fe_index());
-//                              const unsigned int x_displacement_multiplier =
-//                                    cell->vertex_dof_index(vertex_number, 3, cell->active_fe_index());
+                                    //                              const unsigned int x_displacement_multiplier =
+                                    //                                    cell->vertex_dof_index(vertex_number, 3, cell->active_fe_index());
                                     const unsigned int y_displacement_multiplier =
                                             cell->vertex_dof_index(vertex_number, 4, cell->active_fe_index());
                                     const unsigned int z_displacement_multiplier =
                                             cell->vertex_dof_index(vertex_number, 5, cell->active_fe_index());
-//                              boundary_values[x_displacement] = 0;
+                                    //                              boundary_values[x_displacement] = 0;
                                     boundary_values[y_displacement] = 0;
                                     boundary_values[z_displacement] = 0;
-//                              boundary_values[x_displacement_multiplier] = 0;
+                                    //                              boundary_values[x_displacement_multiplier] = 0;
                                     boundary_values[y_displacement_multiplier] = 0;
                                     boundary_values[z_displacement_multiplier] = 0;
                                 }
@@ -412,13 +632,111 @@ namespace SAND {
                         }
                     }
                 }
-            } else {
-                throw;
+
+            }
+
+            const unsigned int n_levels = triangulation.n_global_levels();
+            level_dirichlet_boundary_dofs.resize(0,n_levels-1);
+            level_boundary_values.resize(0,n_levels-1);
+            mg_level_constraints.resize(0,n_levels-1);
+
+            for(unsigned int level = 0; level < n_levels; ++level)
+            {
+                IndexSet relevant_dofs;
+                DoFTools::extract_locally_relevant_level_dofs(dof_handler_displacement,
+                                                      level,
+                                                      relevant_dofs);
+                mg_level_constraints[level].reinit(relevant_dofs);
             }
-        } else if (Input::geometry_base == GeometryOptions::l_shape) {
-            if (dim == 2) {
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
 
+            for (auto cell=dof_handler_displacement.begin_active(n_levels-1);
+                    cell!=dof_handler_displacement.end_active(n_levels-1);
+                    ++cell)
+            {
+                if(cell->is_locally_owned())
+                {
+                    for (unsigned int face_number = 0;
+                            face_number < GeometryInfo<dim>::faces_per_cell;
+                            ++face_number)
+                    {
+                        if (cell->face(face_number)->at_boundary())
+                        {
+                            for (unsigned int vertex_number = 0;
+                                    vertex_number < GeometryInfo<dim>::vertices_per_cell;
+                                    ++vertex_number)
+                            {
+                                const auto vert = cell->vertex(vertex_number);
+                                /*Find bottom left corner*/
+                                if (std::fabs(vert(0) - 0) < 1e-12 && 
+                                    std::fabs(vert(1) - 0) < 1e-12 && 
+                                    ((std::fabs(vert(2) - 0) < 1e-12) || (std::fabs(vert(2) - 1) < 1e-12)))
+                                {
+                                    for (unsigned int level = 0; level < n_levels; ++level)
+                                    {
+                                        const unsigned int x_displacement =
+                                                 cell->mg_vertex_dof_index(level, vertex_number, 0, cell->active_fe_index());
+                                        const unsigned int y_displacement =
+                                            cell->mg_vertex_dof_index(level, vertex_number, 1, cell->active_fe_index());
+                                        const unsigned int z_displacement =
+                                            cell->mg_vertex_dof_index(level, vertex_number, 2, cell->active_fe_index());
+                                        /*set bottom left BC*/
+                                        level_boundary_values[level][x_displacement] = 0;
+                                        level_boundary_values[level][y_displacement] = 0;
+                                        level_boundary_values[level][z_displacement] = 0;
+                                        level_dirichlet_boundary_dofs[level].insert(x_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(y_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(z_displacement);
+                                    }
+                                }
+                                /*Find bottom right corner*/
+                                if (std::fabs(vert(0) - 6) < 1e-12 && 
+                                    std::fabs(vert(1) - 0) < 1e-12 && 
+                                    ((std::fabs(vert(2) - 0) < 1e-12) || 
+                                     (std::fabs(vert(2) - 1) < 1e-12)))
+                                {
+                                    for (unsigned int level = 0; level < n_levels; ++level)
+                                    {
+                                        const unsigned int y_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 1, cell->active_fe_index());
+                                        const unsigned int z_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 2, cell->active_fe_index());
+                                        level_boundary_values[level][y_displacement] = 0;
+                                        level_boundary_values[level][z_displacement] = 0;
+
+                                        level_dirichlet_boundary_dofs[level].insert(y_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(z_displacement);
+                                    }
+                                }
+                            }
+                        }
+                    }
+                }
+            }
+            for (unsigned int level = 0; level < n_levels; ++level)
+            {
+                IndexSet relevant_dofs;
+                DoFTools::extract_locally_relevant_level_dofs(dof_handler_displacement,level,relevant_dofs);
+                mg_level_constraints[level].add_lines(level_dirichlet_boundary_dofs[level]);
+                mg_level_constraints[level].make_consistent_in_parallel(
+                    dof_handler_displacement.locally_owned_mg_dofs(level),
+                    relevant_dofs,
+                    mpi_communicator
+                );
+                mg_level_constraints[level].close();
+            }
+
+        }
+        else
+        {
+            throw;
+        }
+    } else if (Input::geometry_base == GeometryOptions::l_shape) {
+        if (dim == 2)
+        {
+            for (const auto &cell: dof_handler.active_cell_iterators())
+            {
+                if(cell->is_locally_owned())
+                {
                     for (unsigned int face_number = 0;
                          face_number < GeometryInfo<dim>::faces_per_cell;
                          ++face_number) {
@@ -429,7 +747,7 @@ namespace SAND {
                                 const auto vert = cell->vertex(vertex_number);
                                 /*Find top left corner*/
                                 if (std::fabs(vert(0) - 0) < 1e-12 && std::fabs(
-                                        vert(1) - 2) < 1e-12) {
+                                            vert(1) - 2) < 1e-12) {
 
                                     const unsigned int x_displacement =
                                             cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
@@ -447,7 +765,7 @@ namespace SAND {
                                 }
                                 /*Find top right corner*/
                                 if (std::fabs(vert(0) - 1) < 1e-12 && std::fabs(
-                                        vert(1) - 2) < 1e-12) {
+                                            vert(1) - 2) < 1e-12) {
                                     const unsigned int x_displacement =
                                             cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
                                     const unsigned int y_displacement =
@@ -465,8 +783,80 @@ namespace SAND {
                         }
                     }
                 }
-            } else if (dim == 3) {
-                for (const auto &cell: dof_handler.active_cell_iterators()) {
+            }
+            const unsigned int n_levels = triangulation.n_global_levels();
+            for (unsigned int level = 0; level < n_levels; ++level)
+            {
+                for (auto cell=dof_handler_displacement.begin_active(level);
+                     cell!=dof_handler.end_active(level);
+                     ++cell)
+                {
+                    if(cell->is_locally_owned())
+                    {
+                        for (unsigned int face_number = 0;
+                             face_number < GeometryInfo<dim>::faces_per_cell;
+                             ++face_number)
+                        {
+                            if (cell->face(face_number)->at_boundary())
+                            {
+                                for (unsigned int vertex_number = 0;
+                                     vertex_number < GeometryInfo<dim>::vertices_per_cell;
+                                     ++vertex_number)
+                                {
+                                    const auto vert = cell->vertex(vertex_number);
+                                    /*Find bottom left corner*/
+                                    if (std::fabs(vert(0) - 0) < 1e-12 && std::fabs(
+                                                vert(1) - 2) < 1e-12)
+                                    {
+
+                                        const unsigned int x_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 0, 0);
+                                        const unsigned int y_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 1, 0);
+                                        /*set bottom left BC*/
+                                        level_boundary_values[level][x_displacement] = 0;
+                                        level_boundary_values[level][y_displacement] = 0;
+
+                                        level_dirichlet_boundary_dofs[level].insert(x_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(y_displacement);
+
+                                    }
+                                    /*Find bottom right corner*/
+                                    if (std::fabs(vert(0) - 1) < 1e-12 && std::fabs(
+                                                vert(1) - 2) < 1e-12)
+                                    {
+                                        const unsigned int x_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 0, 0);
+                                        const unsigned int y_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 1, 0);
+                                        level_boundary_values[level][x_displacement] = 0;
+                                        level_boundary_values[level][y_displacement] = 0;
+
+                                        level_dirichlet_boundary_dofs[level].insert(x_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(y_displacement);
+                                    }
+                                }
+                            }
+                        }
+                    }
+                }
+                IndexSet relevant_dofs;
+                DoFTools::extract_locally_relevant_level_dofs(dof_handler_displacement,level,relevant_dofs);
+                mg_level_constraints[level].add_lines(level_dirichlet_boundary_dofs[level]);
+                mg_level_constraints[level].make_consistent_in_parallel(
+                    dof_handler_displacement.locally_owned_mg_dofs(level),
+                    relevant_dofs,
+                    mpi_communicator
+                );
+                mg_level_constraints[level].close();
+            }
+
+        }
+        else if (dim == 3)
+        {
+            for (const auto &cell: dof_handler.active_cell_iterators()) {
+                if(cell->is_locally_owned())
+                {
                     for (unsigned int face_number = 0;
                          face_number < GeometryInfo<dim>::faces_per_cell;
                          ++face_number) {
@@ -477,9 +867,9 @@ namespace SAND {
                                 const auto vert = cell->vertex(vertex_number);
                                 /*Find bottom left corner*/
                                 if (std::fabs(vert(0) - 0) < 1e-12 && std::fabs(
-                                        vert(1) - 2) < 1e-12 && ((std::fabs(
-                                        vert(2) - 0) < 1e-12) || (std::fabs(
-                                        vert(2) - 1) < 1e-12))) {
+                                            vert(1) - 2) < 1e-12 && ((std::fabs(
+                                                                          vert(2) - 0) < 1e-12) || (std::fabs(
+                                                                                                        vert(2) - 1) < 1e-12))) {
 
 
                                     const unsigned int x_displacement =
@@ -504,9 +894,9 @@ namespace SAND {
                                 }
                                 /*Find bottom right corner*/
                                 if (std::fabs(vert(0) - 1) < 1e-12 && std::fabs(
-                                        vert(1) - 2) < 1e-12 && ((std::fabs(
-                                        vert(2) - 0) < 1e-12) || (std::fabs(
-                                        vert(2) - 1) < 1e-12))) {
+                                            vert(1) - 2) < 1e-12 && ((std::fabs(
+                                                                          vert(2) - 0) < 1e-12) || (std::fabs(
+                                                                                                        vert(2) - 1) < 1e-12))) {
                                     const unsigned int x_displacement =
                                             cell->vertex_dof_index(vertex_number, 0, cell->active_fe_index());
                                     const unsigned int y_displacement =
@@ -530,213 +920,390 @@ namespace SAND {
                         }
                     }
                 }
-            } else {
-                throw;
             }
-        }
-
+            const unsigned int n_levels = triangulation.n_global_levels();
+            for (unsigned int level = 0; level < n_levels; ++level) // build the point constraints once per multigrid level
+            {
+                for (auto cell=dof_handler_displacement.begin_active(level);
+                     cell!=dof_handler_displacement.end_active(level); // end iterator must belong to the same DoFHandler as begin
+                     ++cell) // NOTE(review): only active cells of each level are visited; confirm refined coarse-level cells need no constraints
+                {
+                    if(cell->is_locally_owned())
+                    {
+                        for (unsigned int face_number = 0;
+                             face_number < GeometryInfo<dim>::faces_per_cell;
+                             ++face_number)
+                        {
+                            if (cell->face(face_number)->at_boundary())
+                            {
+                                for (unsigned int vertex_number = 0;
+                                     vertex_number < GeometryInfo<dim>::vertices_per_cell;
+                                     ++vertex_number)
+                                {
+                                    const auto vert = cell->vertex(vertex_number);
+                                    /*Find bottom left corner: x = 0, y = 2 and z = 0 or z = 1, each within 1e-12*/
+                                    if (std::fabs(vert(0) - 0) < 1e-12 && std::fabs(
+                                                vert(1) - 2) < 1e-12 && ((std::fabs(
+                                                vert(2) - 0) < 1e-12) || (std::fabs(
+                                                vert(2) - 1) < 1e-12)))
+                                    {
+                                        /*level DoF indices of the three displacement components at this vertex*/
+                                        const unsigned int x_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 0, 0);
+                                        const unsigned int y_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 1, 0);
+                                        const unsigned int z_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 2, 0);
+                                        /*set bottom left BC: all three displacement components are fixed to zero*/
+                                        level_boundary_values[level][x_displacement] = 0;
+                                        level_boundary_values[level][y_displacement] = 0;
+                                        level_boundary_values[level][z_displacement] = 0;
+                                        /*remember the fixed DoFs so they can be added as constraint lines below*/
+                                        level_dirichlet_boundary_dofs[level].insert(x_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(y_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(z_displacement);
+                                    }
+                                    /*Find bottom right corner: x = 1, y = 2 and z = 0 or z = 1, each within 1e-12*/
+                                    if (std::fabs(vert(0) - 1) < 1e-12 && std::fabs(
+                                                vert(1) - 2) < 1e-12 && ((std::fabs(
+                                                vert(2) - 0) < 1e-12) || (std::fabs(
+                                                vert(2) - 1) < 1e-12)))
+                                    {
+                                        const unsigned int x_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 0, 0);
+                                        const unsigned int y_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 1, 0);
+                                        const unsigned int z_displacement =
+                                                cell->mg_vertex_dof_index(level, vertex_number, 2, 0);
+                                        level_boundary_values[level][x_displacement] = 0;
+                                        level_boundary_values[level][y_displacement] = 0;
+                                        level_boundary_values[level][z_displacement] = 0;
+                                        /*remember the fixed DoFs so they can be added as constraint lines below*/
+                                        level_dirichlet_boundary_dofs[level].insert(x_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(y_displacement);
+                                        level_dirichlet_boundary_dofs[level].insert(z_displacement);
+                                    }
+                                }
+                            }
+                        }
+                    }
+                }
+                IndexSet relevant_dofs; // filled by the call below with the level DoFs relevant to this process
+                DoFTools::extract_locally_relevant_level_dofs(dof_handler_displacement,level,relevant_dofs);
+                mg_level_constraints[level].add_lines(level_dirichlet_boundary_dofs[level]); // one constraint line per fixed DoF collected above
+                mg_level_constraints[level].make_consistent_in_parallel(
+                    dof_handler_displacement.locally_owned_mg_dofs(level),
+                    relevant_dofs,
+                    mpi_communicator
+                );
+                mg_level_constraints[level].close();
+            }
 
+        } else {
+            throw;
+        }
     }
 
 
-    //This makes a giant 10-by-10 block matrix, and also sets up the necessary block vectors.  The
-    // sparsity pattern for this matrix includes the sparsity pattern for the filter matrix. It also initializes
-    // any block vectors we will use.
-    template<int dim>
-    void
-    KktSystem<dim>::setup_block_system() {
-        const FEValuesExtractors::Scalar densities(SolutionComponents::density<dim>);
-
-        //MAKE n_u and n_P*****************************************************************
-
-        /*Setup 10 by 10 block matrix*/
-
-        std::vector<unsigned int> block_component(10, 2);
-        block_component[0] = 0;
-        block_component[5] = 1;
-        const std::vector<types::global_dof_index> dofs_per_block =
-                DoFTools::count_dofs_per_fe_block(dof_handler, block_component);
-
-        const unsigned int n_p = dofs_per_block[0];
-        const unsigned int n_u = dofs_per_block[1];
-        std::cout << "n_p:  " << n_p << "   n_u:  " << n_u << std::endl;
-        const std::vector<unsigned int> block_sizes = {n_p, n_p, n_p, n_p, n_p, n_u, n_u, n_p, n_p, 1};
+}
 
-        BlockDynamicSparsityPattern dsp(10, 10);
 
-        for (unsigned int k = 0; k < 10; k++) {
-            for (unsigned int j = 0; j < 10; j++) {
-                dsp.block(j, k).reinit(block_sizes[j], block_sizes[k]);
-            }
+///This makes a giant 10-by-10 block matrix that, when assembled, will represent the 10 KKT equations that
+/// come from this problem, and also sets up the necessary block vectors.  The
+/// sparsity pattern for this matrix includes the sparsity pattern for the filter matrix. It also initializes
+/// any block vectors we will use.
+template<int dim>
+void
+KktSystem<dim>::setup_block_system() {
+
+    // Compute n_p and n_u, the DoF counts that count_dofs_per_fe_block reports for block 0 and block 5
+
+    /*Setup 10 by 10 block matrix*/
+    std::vector<unsigned int> block_component(10, 2);
+
+    block_component[0] = 0;
+    block_component[5] = 1;
+
+    const std::vector<types::global_dof_index> dofs_per_block =
+            DoFTools::count_dofs_per_fe_block(dof_handler, block_component);
+    const unsigned int n_p = dofs_per_block[0];
+    const unsigned int n_u = dofs_per_block[1];
+
+    pcout << "n_p:  " << n_p << "   n_u:  " << n_u << std::endl;
+
+    IndexSet locally_owned_dofs = dof_handler.locally_owned_dofs();
+    IndexSet locally_relevant_dofs;
+    DoFTools::extract_locally_relevant_dofs(dof_handler, locally_relevant_dofs);
+
+    dsp.reinit(10, 10);
+    owned_partitioning.resize(10);
+    owned_partitioning[0] = dof_handler.locally_owned_dofs().get_view(0, n_p);
+    owned_partitioning[1] = dof_handler.locally_owned_dofs().get_view(n_p, 2 * n_p);
+    owned_partitioning[2] = dof_handler.locally_owned_dofs().get_view(2 * n_p, 3 * n_p);
+    owned_partitioning[3] = dof_handler.locally_owned_dofs().get_view(3 * n_p, 4 * n_p);
+    owned_partitioning[4] = dof_handler.locally_owned_dofs().get_view(4 * n_p, 5 * n_p);
+    owned_partitioning[5] = dof_handler.locally_owned_dofs().get_view(5 * n_p, 5 * n_p + n_u);
+    owned_partitioning[6] = dof_handler.locally_owned_dofs().get_view(5 * n_p + n_u, 5 * n_p + 2 * n_u);
+    owned_partitioning[7] = dof_handler.locally_owned_dofs().get_view(5 * n_p + 2 * n_u, 6 * n_p + 2 * n_u);
+    owned_partitioning[8] = dof_handler.locally_owned_dofs().get_view(6 * n_p + 2 * n_u, 7 * n_p + 2 * n_u);
+    owned_partitioning[9] = dof_handler.locally_owned_dofs().get_view(7 * n_p + 2 * n_u, 7 * n_p + 2 * n_u + 1);
+    relevant_partitioning.resize(10);
+    relevant_partitioning[0] = locally_relevant_dofs.get_view(0, n_p);
+    relevant_partitioning[1] = locally_relevant_dofs.get_view(n_p, 2 * n_p);
+    relevant_partitioning[2] = locally_relevant_dofs.get_view(2 * n_p, 3 * n_p);
+    relevant_partitioning[3] = locally_relevant_dofs.get_view(3 * n_p, 4 * n_p);
+    relevant_partitioning[4] = locally_relevant_dofs.get_view(4 * n_p, 5 * n_p);
+    relevant_partitioning[5] = locally_relevant_dofs.get_view(5 * n_p, 5 * n_p + n_u);
+    relevant_partitioning[6] = locally_relevant_dofs.get_view(5 * n_p + n_u, 5 * n_p + 2 * n_u);
+    relevant_partitioning[7] = locally_relevant_dofs.get_view(5 * n_p + 2 * n_u, 6 * n_p + 2 * n_u);
+    relevant_partitioning[8] = locally_relevant_dofs.get_view(6 * n_p + 2 * n_u, 7 * n_p + 2 * n_u);
+    relevant_partitioning[9] = locally_relevant_dofs.get_view(7 * n_p + 2 * n_u, 7 * n_p + 2 * n_u + 1);
+
+    const std::vector<unsigned int> block_sizes = {n_p, n_p, n_p, n_p, n_p, n_u, n_u, n_p, n_p, 1};
+
+    for (unsigned int k = 0; k < 10; k++) {
+        for (unsigned int j = 0; j < 10; j++) {
+            dsp.block(j, k).reinit(block_sizes[j], block_sizes[k]);
         }
+    }
+    dsp.collect_sizes();
+    Table<2, DoFTools::Coupling> coupling(2 * dim + 8, 2 * dim + 8);
+    //Coupling for density
+    coupling[SolutionComponents::density<dim>][SolutionComponents::density<dim>] = DoFTools::always;
+
+    for (unsigned int i = 0; i < dim; i++) {
+        coupling[SolutionComponents::density<dim>][SolutionComponents::displacement<dim> +
+                i] = DoFTools::always;
+        coupling[SolutionComponents::displacement<dim> +
+                i][SolutionComponents::density<dim>] = DoFTools::always;
+    }
 
-        dsp.collect_sizes();
-
-        Table<2, DoFTools::Coupling> coupling(2 * dim + 8, 2 * dim + 8);
-//Coupling for density
-        coupling[SolutionComponents::density<dim>][SolutionComponents::density<dim>] = DoFTools::always;
+    coupling[SolutionComponents::density<dim>][SolutionComponents::unfiltered_density_multiplier<dim>] = DoFTools::always;
+    coupling[SolutionComponents::unfiltered_density_multiplier<dim>][SolutionComponents::density<dim>] = DoFTools::always;
 
-        for (unsigned int i = 0; i < dim; i++) {
-            coupling[SolutionComponents::density<dim>][SolutionComponents::displacement<dim> + i] = DoFTools::always;
-            coupling[SolutionComponents::displacement<dim> + i][SolutionComponents::density<dim>] = DoFTools::always;
-        }
+    for (unsigned int i = 0; i < dim; i++) {
+        coupling[SolutionComponents::density<dim>][SolutionComponents::displacement_multiplier<dim> +
+                i] = DoFTools::always;
+        coupling[SolutionComponents::displacement_multiplier<dim> +
+                i][SolutionComponents::density<dim>] = DoFTools::always;
+    }
 
-        coupling[SolutionComponents::density<dim>][SolutionComponents::unfiltered_density_multiplier<dim>] = DoFTools::always;
-        coupling[SolutionComponents::unfiltered_density_multiplier<dim>][SolutionComponents::density<dim>] = DoFTools::always;
+    //Coupling for displacement
+    for (unsigned int i = 0; i < dim; i++) {
 
-        for (unsigned int i = 0; i < dim; i++) {
-            coupling[SolutionComponents::density<dim>][SolutionComponents::displacement_multiplier<dim> +
-                                                       i] = DoFTools::always;
-            coupling[SolutionComponents::displacement_multiplier<dim> +
-                     i][SolutionComponents::density<dim>] = DoFTools::always;
+        for (unsigned int k = 0; k < dim; k++) {
+            coupling[SolutionComponents::displacement<dim> + i][
+                    SolutionComponents::displacement_multiplier<dim> +
+                    k] = DoFTools::always;
+            coupling[SolutionComponents::displacement_multiplier<dim> + k][
+                    SolutionComponents::displacement<dim> +
+                    i] = DoFTools::always;
         }
+    }
 
-//Coupling for displacement
-        for (unsigned int i = 0; i < dim; i++) {
+    // coupling for unfiltered density
+    coupling[SolutionComponents::unfiltered_density<dim>][SolutionComponents::density_lower_slack_multiplier<dim>] = DoFTools::always;
+    coupling[SolutionComponents::density_lower_slack_multiplier<dim>][SolutionComponents::unfiltered_density<dim>] = DoFTools::always;
+
+    coupling[SolutionComponents::unfiltered_density<dim>][SolutionComponents::density_upper_slack_multiplier<dim>] = DoFTools::always;
+    coupling[SolutionComponents::density_upper_slack_multiplier<dim>][SolutionComponents::unfiltered_density<dim>] = DoFTools::always;
+
+    coupling[SolutionComponents::unfiltered_density<dim>][SolutionComponents::unfiltered_density_multiplier<dim>] = DoFTools::always;
+    coupling[SolutionComponents::unfiltered_density_multiplier<dim>][SolutionComponents::unfiltered_density<dim>] = DoFTools::always;
+
+    //        Coupling for lower slack
+    coupling[SolutionComponents::density_lower_slack<dim>][SolutionComponents::density_lower_slack<dim>] = DoFTools::always;
+
+    coupling[SolutionComponents::density_lower_slack<dim>][SolutionComponents::density_lower_slack_multiplier<dim>] = DoFTools::always;
+    coupling[SolutionComponents::density_lower_slack_multiplier<dim>][SolutionComponents::density_lower_slack<dim>] = DoFTools::always;
+
+    //        Coupling for upper slack
+    coupling[SolutionComponents::density_upper_slack<dim>][SolutionComponents::density_upper_slack<dim>] = DoFTools::always;
+    coupling[SolutionComponents::density_upper_slack<dim>][SolutionComponents::density_upper_slack_multiplier<dim>] = DoFTools::always;
+    coupling[SolutionComponents::density_upper_slack_multiplier<dim>][SolutionComponents::density_upper_slack<dim>] = DoFTools::always;
+
+    coupling[SolutionComponents::density_upper_slack_multiplier<dim>][SolutionComponents::density_upper_slack_multiplier<dim>] = DoFTools::always;
+    constraints.reinit(locally_relevant_dofs);
+    constraints.clear();
+    DoFTools::make_hanging_node_constraints(dof_handler,constraints);
+    constraints.close();
+
+    system_matrix.clear();
+
+    //            DoFTools::make_sparsity_pattern(dof_handler, coupling, dsp, constraints, false);
+    DoFTools::make_sparsity_pattern(dof_handler, dsp, constraints, false);
+    SparsityTools::distribute_sparsity_pattern(dsp, dof_handler.locally_owned_dofs(), mpi_communicator,
+                                               locally_relevant_dofs);
+    //adds the row into the sparsity pattern for the total volume constraint
+    // for (const auto &cell: dof_handler.active_cell_iterators())
+    // {
+    //     if (cell->is_locally_owned())
+    //     {
+    //         std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+    //         cell->get_dof_indices(i);
+    //         dsp.block(SolutionBlocks::density, SolutionBlocks::total_volume_multiplier).add(i[cell->get_fe().component_to_system_index(0, 0)], 0);
+    //         dsp.block(SolutionBlocks::total_volume_multiplier, SolutionBlocks::density).add(0, i[cell->get_fe().component_to_system_index(0, 0)]);
+    //     }
+    // }
+    // Because of the single volume multiplier element only being on one processor, this works, and the above does not.
+    for (unsigned int i = 0; i<n_p; i++)
+    {
+        dsp.block(SolutionBlocks::density, SolutionBlocks::total_volume_multiplier).add(i,0);
+        dsp.block(SolutionBlocks::total_volume_multiplier, SolutionBlocks::density).add(0,i);
+    }
 
-            for (unsigned int k = 0; k < dim; k++) {
-                coupling[SolutionComponents::displacement<dim> + i][SolutionComponents::displacement_multiplier<dim> +
-                                                                    k] = DoFTools::always;
-                coupling[SolutionComponents::displacement_multiplier<dim> + k][SolutionComponents::displacement<dim> +
-                                                                               i] = DoFTools::always;
+    /*This finds neighbors whose values would be relevant, and adds them to the sparsity pattern of the matrix*/
+    setup_filter_matrix();
+    for (const auto &cell : dof_handler.active_cell_iterators()) {
+        if (cell->is_locally_owned())
+        {
+            std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+            cell->get_dof_indices(i);
+            const unsigned int cell_index = i[cell->get_fe().component_to_system_index(0, 0)];
+            for (const auto &neighbor_cell_index : density_filter.find_relevant_neighbors(cell_index))
+            {
+                dsp.block(SolutionBlocks::unfiltered_density_multiplier,
+                          SolutionBlocks::unfiltered_density).add(cell_index, neighbor_cell_index);
+                dsp.block(SolutionBlocks::unfiltered_density,
+                          SolutionBlocks::unfiltered_density_multiplier).add(cell_index, neighbor_cell_index);
             }
         }
+    }
+    
+    SparsityTools::distribute_sparsity_pattern(
+                dsp,
+                Utilities::MPI::all_gather(mpi_communicator,
+                                           dof_handler.locally_owned_dofs()),
+                mpi_communicator,
+                locally_relevant_dofs);
+    DoFTools::extract_locally_relevant_dofs(dof_handler, locally_relevant_dofs);
+    system_matrix.reinit(owned_partitioning, dsp, mpi_communicator);
+
+    locally_relevant_solution.reinit(owned_partitioning, relevant_partitioning, mpi_communicator);
+    distributed_solution.reinit(owned_partitioning, mpi_communicator);
+    system_rhs.reinit(owned_partitioning, mpi_communicator);
+
+    locally_relevant_solution.collect_sizes();
+    distributed_solution.collect_sizes();
+    system_rhs.collect_sizes();
+    system_matrix.collect_sizes();
+    IndexSet locally_owned_displacement_dofs = dof_handler_displacement.locally_owned_dofs();
+    std::vector<types::global_dof_index> displacement_dof_indices;
+    std::vector<types::global_dof_index> system_dof_indices;
+    for (const auto &displacement_cell : dof_handler_displacement.active_cell_iterators())
+        if (displacement_cell->is_locally_owned())
+        {
+            typename DoFHandler<dim>::active_cell_iterator system_cell (&displacement_cell->get_triangulation(),
+                                                                        displacement_cell->level(),
+                                                                        displacement_cell->index(),
+                                                                        &dof_handler);
 
-// coupling for unfiltered density
-        coupling[SolutionComponents::unfiltered_density<dim>][SolutionComponents::density_lower_slack_multiplier<dim>] = DoFTools::always;
-        coupling[SolutionComponents::density_lower_slack_multiplier<dim>][SolutionComponents::unfiltered_density<dim>] = DoFTools::always;
-
-        coupling[SolutionComponents::unfiltered_density<dim>][SolutionComponents::density_upper_slack_multiplier<dim>] = DoFTools::always;
-        coupling[SolutionComponents::density_upper_slack_multiplier<dim>][SolutionComponents::unfiltered_density<dim>] = DoFTools::always;
-
-        coupling[SolutionComponents::unfiltered_density<dim>][SolutionComponents::unfiltered_density_multiplier<dim>] = DoFTools::always;
-        coupling[SolutionComponents::unfiltered_density_multiplier<dim>][SolutionComponents::unfiltered_density<dim>] = DoFTools::always;
-
-
-
-
-//        Coupling for lower slack
-        coupling[SolutionComponents::density_lower_slack<dim>][SolutionComponents::density_lower_slack<dim>] = DoFTools::always;
-
-        coupling[SolutionComponents::density_lower_slack<dim>][SolutionComponents::density_lower_slack_multiplier<dim>] = DoFTools::always;
-        coupling[SolutionComponents::density_lower_slack_multiplier<dim>][SolutionComponents::density_lower_slack<dim>] = DoFTools::always;
-
-//
-        coupling[SolutionComponents::density_upper_slack<dim>][SolutionComponents::density_upper_slack<dim>] = DoFTools::always;
-        coupling[SolutionComponents::density_upper_slack<dim>][SolutionComponents::density_upper_slack_multiplier<dim>] = DoFTools::always;
-        coupling[SolutionComponents::density_upper_slack_multiplier<dim>][SolutionComponents::density_upper_slack<dim>] = DoFTools::always;
-
-        coupling[SolutionComponents::density_upper_slack_multiplier<dim>][SolutionComponents::density_upper_slack_multiplier<dim>] = DoFTools::always;
-
-        constraints.clear();
-        constraints.close();
+            displacement_dof_indices.resize (displacement_cell->get_fe().dofs_per_cell);
+            system_dof_indices.resize (system_cell->get_fe().dofs_per_cell);
 
-        DoFTools::make_sparsity_pattern(dof_handler, coupling, dsp, constraints);
+            displacement_cell->get_dof_indices (displacement_dof_indices);
+            system_cell->get_dof_indices (system_dof_indices);
 
-        //adds the row into the sparsity pattern for the total volume constraint
-        for (const auto &cell: dof_handler.active_cell_iterators()) {
-            const unsigned int i = cell->active_cell_index();
-            dsp.block(SolutionBlocks::density, SolutionBlocks::total_volume_multiplier).add(i, 0);
-            dsp.block(SolutionBlocks::total_volume_multiplier, SolutionBlocks::density).add(0, i);
+            for (unsigned int i=0; i<displacement_dof_indices.size(); ++i)
+            {
+                if(locally_owned_displacement_dofs.is_element(displacement_dof_indices[i]))
+                {
+                        displacement_to_system_dof_index_map[displacement_dof_indices[i]]
+                            = system_dof_indices[system_cell->get_fe().component_to_system_index(
+                            displacement_cell->get_fe().system_to_component_index(i).first+SolutionComponents::displacement<dim>,
+                            displacement_cell->get_fe().system_to_component_index(i).second
+                            )];
+                }
+                
+            }
         }
-
-        constraints.condense(dsp);
-        sparsity_pattern.copy_from(dsp);
-
-        //adds the row into the sparsity pattern for the total volume constraint
-        sparsity_pattern.block(SolutionBlocks::unfiltered_density,
-                               SolutionBlocks::unfiltered_density_multiplier).copy_from(
-                density_filter.filter_sparsity_pattern);
-        sparsity_pattern.block(SolutionBlocks::unfiltered_density_multiplier,
-                               SolutionBlocks::unfiltered_density).copy_from(density_filter.filter_sparsity_pattern);
-
-        std::ofstream out("sparsity.plt");
-        sparsity_pattern.print_gnuplot(out);
-
-        system_matrix.reinit(sparsity_pattern);
-
-
-        linear_solution.reinit(block_sizes);
-        system_rhs.reinit(block_sizes);
-
-        for (unsigned int j = 0; j < 10; j++) {
-            linear_solution.block(j).reinit(block_sizes[j]);
-            system_rhs.block(j).reinit(block_sizes[j]);
+    const types::global_dof_index disp_start_index = system_matrix.get_row_indices().block_start(
+            SolutionBlocks::displacement);
+    for (auto &index_pair : displacement_to_system_dof_index_map)
+        index_pair.second -=disp_start_index;
+    for (auto &index_pair : displacement_to_system_dof_index_map)
+    {
+        if(index_pair.first != index_pair.second)
+        {
+            std::cout << "inexact matching for index: " << index_pair.first << " and " << index_pair.second << std::endl;
         }
-
-        linear_solution.collect_sizes();
-        system_rhs.collect_sizes();
     }
+    
 
-    ///This  is  where  the  magic  happens.   The  equations  describing  the newtons method for finding 0s in the KKT conditions are implemented here.
-
-
-    template<int dim>
-    void
-    KktSystem<dim>::assemble_block_system(const BlockVector<double> &state, const double barrier_size) {
-        /*Remove any values from old iterations*/
-        system_matrix.reinit(sparsity_pattern);
-        linear_solution = 0;
-        system_rhs = 0;
-
-        QGauss<dim> nine_quadrature(fe_nine.degree + 1);
-        QGauss<dim> ten_quadrature(fe_ten.degree + 1);
-
-        hp::QCollection<dim> q_collection;
-        q_collection.push_back(nine_quadrature);
-        q_collection.push_back(ten_quadrature);
-
-        hp::FEValues<dim> hp_fe_values(fe_collection,
-                                       q_collection,
-                                       update_values | update_quadrature_points |
-                                       update_JxW_values | update_gradients);
-
-        QGauss<dim - 1> common_face_quadrature(fe_ten.degree + 1);
-
-        FEFaceValues<dim> fe_nine_face_values(fe_nine,
-                                              common_face_quadrature,
-                                              update_JxW_values |
-                                              update_gradients | update_values);
-        FEFaceValues<dim> fe_ten_face_values(fe_ten,
-                                             common_face_quadrature,
-                                             update_normal_vectors |
-                                             update_values);
-
-        FullMatrix<double> cell_matrix;
-        Vector<double> cell_rhs;
-        std::vector<types::global_dof_index> local_dof_indices;
-
-        const FEValuesExtractors::Scalar densities(SolutionComponents::density<dim>);
-        const FEValuesExtractors::Vector displacements(SolutionComponents::displacement<dim>);
-        const FEValuesExtractors::Scalar unfiltered_densities(SolutionComponents::unfiltered_density<dim>);
-        const FEValuesExtractors::Vector displacement_multipliers(SolutionComponents::displacement_multiplier<dim>);
-        const FEValuesExtractors::Scalar unfiltered_density_multipliers(
+}
+
+///The equations describing Newton's method for finding zeros of the KKT conditions are implemented here.
+template<int dim>
+void
+KktSystem<dim>::assemble_block_system(const LA::MPI::BlockVector &distributed_state, const double barrier_size) {
+    /*Remove any values from old iterations*/
+
+    LA::MPI::BlockVector relevant_state(owned_partitioning, relevant_partitioning, mpi_communicator);
+    relevant_state = distributed_state;
+
+    system_matrix.reinit(owned_partitioning, dsp, mpi_communicator);
+    locally_relevant_solution = 0;
+    system_rhs = 0;
+
+    QGauss<dim> nine_quadrature(fe_nine.degree + 1);
+    QGauss<dim> ten_quadrature(fe_ten.degree + 1);
+
+    hp::QCollection<dim> q_collection;
+    q_collection.push_back(nine_quadrature);
+    q_collection.push_back(ten_quadrature);
+
+    hp::FEValues<dim> hp_fe_values(fe_collection,
+                                   q_collection,
+                                   update_values | update_quadrature_points |
+                                   update_JxW_values | update_gradients);
+
+    QGauss<dim - 1> common_face_quadrature(fe_ten.degree + 1);
+
+    FEFaceValues<dim> fe_nine_face_values(fe_nine,
+                                          common_face_quadrature,
+                                          update_JxW_values |
+                                          update_gradients | update_values);
+    FEFaceValues<dim> fe_ten_face_values(fe_ten,
+                                         common_face_quadrature,
+                                         update_normal_vectors |
+                                         update_values);
+
+    FullMatrix<double> cell_matrix;
+    Vector<double> cell_rhs;
+    std::vector<types::global_dof_index> local_dof_indices;
+
+    const FEValuesExtractors::Scalar densities(SolutionComponents::density<dim>);
+    const FEValuesExtractors::Vector displacements(SolutionComponents::displacement<dim>);
+    const FEValuesExtractors::Scalar unfiltered_densities(SolutionComponents::unfiltered_density<dim>);
+    const FEValuesExtractors::Vector displacement_multipliers(SolutionComponents::displacement_multiplier<dim>);
+    const FEValuesExtractors::Scalar unfiltered_density_multipliers(
                 SolutionComponents::unfiltered_density_multiplier<dim>);
-        const FEValuesExtractors::Scalar density_lower_slacks(SolutionComponents::density_lower_slack<dim>);
-        const FEValuesExtractors::Scalar density_lower_slack_multipliers(
+    const FEValuesExtractors::Scalar density_lower_slacks(SolutionComponents::density_lower_slack<dim>);
+    const FEValuesExtractors::Scalar density_lower_slack_multipliers(
                 SolutionComponents::density_lower_slack_multiplier<dim>);
-        const FEValuesExtractors::Scalar density_upper_slacks(SolutionComponents::density_upper_slack<dim>);
-        const FEValuesExtractors::Scalar density_upper_slack_multipliers(
+    const FEValuesExtractors::Scalar density_upper_slacks(SolutionComponents::density_upper_slack<dim>);
+    const FEValuesExtractors::Scalar density_upper_slack_multipliers(
                 SolutionComponents::density_upper_slack_multiplier<dim>);
-        const FEValuesExtractors::Scalar total_volume_multiplier(
+    const FEValuesExtractors::Scalar total_volume_multiplier(
                 SolutionComponents::total_volume_multiplier<dim>);
 
-        const Functions::ConstantFunction<dim> lambda(1.), mu(1.);
-
-        BlockVector<double> filtered_unfiltered_density_solution = state;
-        BlockVector<double> filter_adjoint_unfiltered_density_multiplier_solution = state;
-        filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density) = 0;
-        filter_adjoint_unfiltered_density_multiplier_solution.block(SolutionBlocks::unfiltered_density_multiplier) = 0;
-
-        density_filter.filter_matrix.vmult(
-                filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density),
-                state.block(SolutionBlocks::unfiltered_density));
-        density_filter.filter_matrix.Tvmult(filter_adjoint_unfiltered_density_multiplier_solution.block(
-                                                    SolutionBlocks::unfiltered_density_multiplier),
-                                            state.block(SolutionBlocks::unfiltered_density_multiplier));
-
-
-        for (const auto &cell: dof_handler.active_cell_iterators()) {
+    const Functions::ConstantFunction<dim> lambda(Input::material_lambda), mu(Input::material_mu);
+
+    distributed_solution = distributed_state;
+    LA::MPI::BlockVector filtered_unfiltered_density_solution = distributed_solution;
+    LA::MPI::BlockVector filter_adjoint_unfiltered_density_multiplier_solution = distributed_solution;
+    filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density) = 0;
+    filter_adjoint_unfiltered_density_multiplier_solution.block(SolutionBlocks::unfiltered_density_multiplier) = 0;
+    density_filter.filter_matrix.vmult(filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density),distributed_solution.block(SolutionBlocks::unfiltered_density));
+    density_filter.filter_matrix_transpose.vmult(filter_adjoint_unfiltered_density_multiplier_solution.block(SolutionBlocks::unfiltered_density_multiplier),distributed_solution.block(SolutionBlocks::unfiltered_density_multiplier));
+
+    LA::MPI::BlockVector relevant_filtered_unfiltered_density_solution = locally_relevant_solution;
+    LA::MPI::BlockVector relevant_filter_adjoint_unfiltered_density_multiplier_solution = locally_relevant_solution;
+    relevant_filtered_unfiltered_density_solution =filtered_unfiltered_density_solution;
+    relevant_filter_adjoint_unfiltered_density_multiplier_solution = filter_adjoint_unfiltered_density_multiplier_solution;
+    for (const auto &cell: dof_handler.active_cell_iterators()) {
+        if(cell->is_locally_owned())
+        {
             hp_fe_values.reinit(cell);
             const FEValues<dim> &fe_values = hp_fe_values.get_present_fe_values();
             cell_matrix.reinit(cell->get_fe().n_dofs_per_cell(),
@@ -749,12 +1316,12 @@ namespace SAND {
             std::vector<Tensor<1, dim>> old_displacement_values(n_q_points);
             std::vector<double> old_displacement_divs(n_q_points);
             std::vector<SymmetricTensor<2, dim>> old_displacement_symmgrads(
-                    n_q_points);
+                        n_q_points);
             std::vector<Tensor<1, dim>> old_displacement_multiplier_values(
-                    n_q_points);
+                        n_q_points);
             std::vector<double> old_displacement_multiplier_divs(n_q_points);
             std::vector<SymmetricTensor<2, dim>> old_displacement_multiplier_symmgrads(
-                    n_q_points);
+                        n_q_points);
             std::vector<double> old_lower_slack_multiplier_values(n_q_points);
             std::vector<double> old_upper_slack_multiplier_values(n_q_points);
             std::vector<double> old_lower_slack_values(n_q_points);
@@ -776,37 +1343,37 @@ namespace SAND {
             lambda.value_list(fe_values.get_quadrature_points(), lambda_values);
             mu.value_list(fe_values.get_quadrature_points(), mu_values);
 
-            fe_values[densities].get_function_values(state,
+            fe_values[densities].get_function_values(relevant_state,
                                                      old_density_values);
-            fe_values[displacements].get_function_values(state,
+            fe_values[displacements].get_function_values(relevant_state,
                                                          old_displacement_values);
-            fe_values[displacements].get_function_divergences(state,
+            fe_values[displacements].get_function_divergences(relevant_state,
                                                               old_displacement_divs);
             fe_values[displacements].get_function_symmetric_gradients(
-                    state, old_displacement_symmgrads);
+                        relevant_state, old_displacement_symmgrads);
             fe_values[displacement_multipliers].get_function_values(
-                    state, old_displacement_multiplier_values);
+                        relevant_state, old_displacement_multiplier_values);
             fe_values[displacement_multipliers].get_function_divergences(
-                    state, old_displacement_multiplier_divs);
+                        relevant_state, old_displacement_multiplier_divs);
             fe_values[displacement_multipliers].get_function_symmetric_gradients(
-                    state, old_displacement_multiplier_symmgrads);
+                        relevant_state, old_displacement_multiplier_symmgrads);
             fe_values[density_lower_slacks].get_function_values(
-                    state, old_lower_slack_values);
+                        relevant_state, old_lower_slack_values);
             fe_values[density_lower_slack_multipliers].get_function_values(
-                    state, old_lower_slack_multiplier_values);
+                        relevant_state, old_lower_slack_multiplier_values);
             fe_values[density_upper_slacks].get_function_values(
-                    state, old_upper_slack_values);
+                        relevant_state, old_upper_slack_values);
             fe_values[density_upper_slack_multipliers].get_function_values(
-                    state, old_upper_slack_multiplier_values);
+                        relevant_state, old_upper_slack_multiplier_values);
             fe_values[unfiltered_densities].get_function_values(
-                    state, old_unfiltered_density_values);
+                        relevant_state, old_unfiltered_density_values);
             fe_values[unfiltered_density_multipliers].get_function_values(
-                    state, old_unfiltered_density_multiplier_values);
+                        relevant_state, old_unfiltered_density_multiplier_values);
             fe_values[unfiltered_densities].get_function_values(
-                    filtered_unfiltered_density_solution, filtered_unfiltered_density_values);
+                        relevant_filtered_unfiltered_density_solution, filtered_unfiltered_density_values);
             fe_values[unfiltered_density_multipliers].get_function_values(
-                    filter_adjoint_unfiltered_density_multiplier_solution,
-                    filter_adjoint_unfiltered_density_multiplier_values);
+                        relevant_filter_adjoint_unfiltered_density_multiplier_solution,
+                        filter_adjoint_unfiltered_density_multiplier_values);
 
             Tensor<1, dim> traction;
             traction[1] = -1;
@@ -832,7 +1399,7 @@ namespace SAND {
                     const double unfiltered_density_phi_i = fe_values[unfiltered_densities].value(i,
                                                                                                   q_point);
                     const double unfiltered_density_multiplier_phi_i = fe_values[unfiltered_density_multipliers].value(
-                            i, q_point);
+                                i, q_point);
 
                     const double lower_slack_multiplier_phi_i =
                             fe_values[density_lower_slack_multipliers].value(i,
@@ -858,18 +1425,18 @@ namespace SAND {
 
                         const SymmetricTensor<2, dim> displacement_multiplier_phi_j_symmgrad =
                                 fe_values[displacement_multipliers].symmetric_gradient(
-                                        j, q_point);
+                                    j, q_point);
                         const double displacement_multiplier_phi_j_div =
                                 fe_values[displacement_multipliers].divergence(j,
                                                                                q_point);
 
                         const double density_phi_j = fe_values[densities].value(
-                                j, q_point);
+                                    j, q_point);
 
                         const double unfiltered_density_phi_j = fe_values[unfiltered_densities].value(j,
                                                                                                       q_point);
                         const double unfiltered_density_multiplier_phi_j = fe_values[unfiltered_density_multipliers].value(
-                                j, q_point);
+                                    j, q_point);
 
 
                         const double lower_slack_phi_j =
@@ -890,91 +1457,91 @@ namespace SAND {
                         cell_matrix(i, j) +=
                                 fe_values.JxW(q_point) *
                                 (
-                                        -density_phi_i * unfiltered_density_multiplier_phi_j
-
-                                        - density_penalty_exponent * (density_penalty_exponent - 1)
-                                          * std::pow(
-                                                old_density_values[q_point],
-                                                density_penalty_exponent - 2)
-                                          * density_phi_i
-                                          * density_phi_j
-                                          * (old_displacement_multiplier_divs[q_point] * old_displacement_divs[q_point]
-                                             * lambda_values[q_point]
-                                             + 2 * mu_values[q_point]
-                                               * (old_displacement_symmgrads[q_point] *
-                                                  old_displacement_multiplier_symmgrads[q_point]))
-
-                                        - density_penalty_exponent * std::pow(
-                                                old_density_values[q_point],
-                                                density_penalty_exponent - 1)
-                                          * density_phi_i
-                                          * (displacement_multiplier_phi_j_div * old_displacement_divs[q_point]
-                                             * lambda_values[q_point]
-                                             + 2 * mu_values[q_point]
-                                               *
-                                               (old_displacement_symmgrads[q_point] *
-                                                displacement_multiplier_phi_j_symmgrad))
-
-                                        - density_penalty_exponent * std::pow(
-                                                old_density_values[q_point],
-                                                density_penalty_exponent - 1)
-                                          * density_phi_i
-                                          * (displacement_phi_j_div * old_displacement_multiplier_divs[q_point]
-                                             * lambda_values[q_point]
-                                             + 2 * mu_values[q_point]
-                                               * (old_displacement_multiplier_symmgrads[q_point] *
-                                                  displacement_phi_j_symmgrad)));
+                                    -density_phi_i * unfiltered_density_multiplier_phi_j
+
+                                    - density_penalty_exponent * (density_penalty_exponent - 1)
+                                    * std::pow(
+                                        old_density_values[q_point],
+                                        density_penalty_exponent - 2)
+                                    * density_phi_i
+                                    * density_phi_j
+                                    * (old_displacement_multiplier_divs[q_point] * old_displacement_divs[q_point]
+                                       * lambda_values[q_point]
+                                       + 2 * mu_values[q_point]
+                                       * (old_displacement_symmgrads[q_point] *
+                                          old_displacement_multiplier_symmgrads[q_point]))
+
+                                    - density_penalty_exponent * std::pow(
+                                        old_density_values[q_point],
+                                        density_penalty_exponent - 1)
+                                    * density_phi_i
+                                    * (displacement_multiplier_phi_j_div * old_displacement_divs[q_point]
+                                       * lambda_values[q_point]
+                                       + 2 * mu_values[q_point]
+                                       *
+                                       (old_displacement_symmgrads[q_point] *
+                                        displacement_multiplier_phi_j_symmgrad))
+
+                                    - density_penalty_exponent * std::pow(
+                                        old_density_values[q_point],
+                                        density_penalty_exponent - 1)
+                                    * density_phi_i
+                                    * (displacement_phi_j_div * old_displacement_multiplier_divs[q_point]
+                                       * lambda_values[q_point]
+                                       + 2 * mu_values[q_point]
+                                       * (old_displacement_multiplier_symmgrads[q_point] *
+                                          displacement_phi_j_symmgrad)));
                         //Equation 1
 
                         cell_matrix(i, j) +=
                                 fe_values.JxW(q_point) * (
-                                        -density_penalty_exponent * std::pow(
-                                                old_density_values[q_point],
-                                                density_penalty_exponent - 1)
-                                        * density_phi_j
-                                        * (old_displacement_multiplier_divs[q_point] * displacement_phi_i_div
-                                           * lambda_values[q_point]
-                                           + 2 * mu_values[q_point]
-                                             * (old_displacement_multiplier_symmgrads[q_point] *
-                                                displacement_phi_i_symmgrad))
-
-                                        - std::pow(old_density_values[q_point],
-                                                   density_penalty_exponent)
-                                          * (displacement_multiplier_phi_j_div * displacement_phi_i_div
-                                             * lambda_values[q_point]
-                                             + 2 * mu_values[q_point]
-                                               * (displacement_multiplier_phi_j_symmgrad * displacement_phi_i_symmgrad))
+                                    -density_penalty_exponent * std::pow(
+                                        old_density_values[q_point],
+                                        density_penalty_exponent - 1)
+                                    * density_phi_j
+                                    * (old_displacement_multiplier_divs[q_point] * displacement_phi_i_div
+                                       * lambda_values[q_point]
+                                       + 2 * mu_values[q_point]
+                                       * (old_displacement_multiplier_symmgrads[q_point] *
+                                          displacement_phi_i_symmgrad))
 
-                                );
+                                    - std::pow(old_density_values[q_point],
+                                               density_penalty_exponent)
+                                    * (displacement_multiplier_phi_j_div * displacement_phi_i_div
+                                       * lambda_values[q_point]
+                                       + 2 * mu_values[q_point]
+                                       * (displacement_multiplier_phi_j_symmgrad * displacement_phi_i_symmgrad))
+
+                                    );
 
                         //Equation 2 has to do with the filter, which is calculated elsewhere.
                         cell_matrix(i, j) +=
                                 fe_values.JxW(q_point) * (
-                                        -1 * unfiltered_density_phi_i * lower_slack_multiplier_phi_j
-                                        + unfiltered_density_phi_i * upper_slack_multiplier_phi_j);
+                                    -1 * unfiltered_density_phi_i * lower_slack_multiplier_phi_j
+                                    + unfiltered_density_phi_i * upper_slack_multiplier_phi_j);
 
                         //Equation 3 - Primal Feasibility
 
                         cell_matrix(i, j) +=
                                 fe_values.JxW(q_point) * (
 
-                                        -1 * density_penalty_exponent * std::pow(
-                                                old_density_values[q_point],
-                                                density_penalty_exponent - 1)
-                                        * density_phi_j
-                                        * (old_displacement_divs[q_point] * displacement_multiplier_phi_i_div
-                                           * lambda_values[q_point]
-                                           + 2 * mu_values[q_point]
-                                             * (old_displacement_symmgrads[q_point] *
-                                                displacement_multiplier_phi_i_symmgrad))
-
-                                        + -1 * std::pow(old_density_values[q_point],
-                                                        density_penalty_exponent)
-                                          * (displacement_phi_j_div * displacement_multiplier_phi_i_div
-                                             * lambda_values[q_point]
-                                             + 2 * mu_values[q_point]
-                                               *
-                                               (displacement_phi_j_symmgrad * displacement_multiplier_phi_i_symmgrad)));
+                                    -1 * density_penalty_exponent * std::pow(
+                                        old_density_values[q_point],
+                                        density_penalty_exponent - 1)
+                                    * density_phi_j
+                                    * (old_displacement_divs[q_point] * displacement_multiplier_phi_i_div
+                                       * lambda_values[q_point]
+                                       + 2 * mu_values[q_point]
+                                       * (old_displacement_symmgrads[q_point] *
+                                          displacement_multiplier_phi_i_symmgrad))
+
+                                    + -1 * std::pow(old_density_values[q_point],
+                                                    density_penalty_exponent)
+                                    * (displacement_phi_j_div * displacement_multiplier_phi_i_div
+                                       * lambda_values[q_point]
+                                       + 2 * mu_values[q_point]
+                                       *
+                                       (displacement_phi_j_symmgrad * displacement_multiplier_phi_i_symmgrad)));
 
                         //Equation 4 - more primal feasibility
                         cell_matrix(i, j) +=
@@ -984,102 +1551,144 @@ namespace SAND {
                         //Equation 5 - more primal feasibility
                         cell_matrix(i, j) +=
                                 -1 * fe_values.JxW(q_point) * upper_slack_multiplier_phi_i * (
-                                        -1 * unfiltered_density_phi_j - upper_slack_phi_j);
+                                    -1 * unfiltered_density_phi_j - upper_slack_phi_j);
 
                         //Equation 6 - more primal feasibility - part with filter added later
                         cell_matrix(i, j) +=
                                 -1 * fe_values.JxW(q_point) * unfiltered_density_multiplier_phi_i * (
-                                        density_phi_j);
+                                    density_phi_j);
 
                         //Equation 7 - complementary slackness
                         cell_matrix(i, j) += fe_values.JxW(q_point) *
-                                             (lower_slack_phi_i * lower_slack_multiplier_phi_j
-                                              + lower_slack_phi_i * lower_slack_phi_j *
-                                                old_lower_slack_multiplier_values[q_point] /
-                                                old_lower_slack_values[q_point]);
+                                (lower_slack_phi_i * lower_slack_multiplier_phi_j
+                                 + lower_slack_phi_i * lower_slack_phi_j *
+                                 old_lower_slack_multiplier_values[q_point] /
+                                 old_lower_slack_values[q_point]);
                         //Equation 8 - complementary slackness
                         cell_matrix(i, j) += fe_values.JxW(q_point) *
-                                             (upper_slack_phi_i * upper_slack_multiplier_phi_j
-                                              + upper_slack_phi_i * upper_slack_phi_j *
-                                                old_upper_slack_multiplier_values[q_point] /
-                                                old_upper_slack_values[q_point]);
+                                (upper_slack_phi_i * upper_slack_multiplier_phi_j
+                                 + upper_slack_phi_i * upper_slack_phi_j *
+                                 old_upper_slack_multiplier_values[q_point] /
+                                 old_upper_slack_values[q_point]);
                     }
 
                 }
-
             }
 
 
             MatrixTools::local_apply_boundary_values(boundary_values, local_dof_indices,
                                                      cell_matrix, cell_rhs, true);
 
+
             constraints.distribute_local_to_global(
-                    cell_matrix, cell_rhs, local_dof_indices, system_matrix, system_rhs);
+                        cell_matrix, cell_rhs, local_dof_indices, system_matrix, system_rhs);
 
         }
-        system_rhs = calculate_rhs(state, barrier_size);
 
-        for (const auto &cell: dof_handler.active_cell_iterators()) {
-            const unsigned int i = cell->active_cell_index();
+    }
+    // MPI_BARRIER(MPI_COMM_WORLD);
+    system_matrix.compress(VectorOperation::add);
+    system_rhs = calculate_rhs(distributed_state, barrier_size);
+    double cell_measure;
+    for (const auto &cell: dof_handler.active_cell_iterators()) 
+    {
+        if(cell->is_locally_owned())
+        {
+            std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+            cell->get_dof_indices(i);
+            const unsigned int cell_i = i[cell->get_fe().component_to_system_index(0, 0)];
 
-            typename SparseMatrix<double>::iterator iter = density_filter.filter_matrix.begin(
-                    i);
-            for (; iter != density_filter.filter_matrix.end(i); iter++) {
-                unsigned int j = iter->column();
-                double value = iter->value() * cell->measure();
+            // typename LA::MPI::SparseMatrix::iterator iter = density_filter.filter_matrix.begin(cell_i);
+            for (const unsigned int j : density_filter.find_relevant_neighbors(cell_i)) 
+            {
+                // unsigned int j = iter->column();
+                double value = density_filter.filter_matrix(cell_i,j) * cell->measure();
+                double value_transpose = density_filter.filter_matrix_transpose(cell_i,j) * cell->measure();
 
                 system_matrix.block(SolutionBlocks::unfiltered_density_multiplier,
-                                    SolutionBlocks::unfiltered_density).add(i, j, value);
+                                    SolutionBlocks::unfiltered_density).set(cell_i, j, value);
                 system_matrix.block(SolutionBlocks::unfiltered_density,
-                                    SolutionBlocks::unfiltered_density_multiplier).add(j, i, value);
+                                    SolutionBlocks::unfiltered_density_multiplier).set(cell_i, j, value_transpose);
             }
 
-            system_matrix.block(SolutionBlocks::total_volume_multiplier, SolutionBlocks::density).add(0, i,
-                                                                                                      cell->measure());
-            system_matrix.block(SolutionBlocks::density, SolutionBlocks::total_volume_multiplier).add(i, 0,
-                                                                                                      cell->measure());
+            cell_measure = cell->measure();
+
+            system_matrix.block(SolutionBlocks::density, SolutionBlocks::total_volume_multiplier).set(cell_i, 0,
+                    cell->measure());
+            system_matrix.block(SolutionBlocks::total_volume_multiplier,SolutionBlocks::density).set(0,cell_i,
+                    cell->measure());
         }
-        std::cout << "assembled" << std::endl;
     }
+    system_matrix.compress(VectorOperation::insert);
+    // for (const auto &cell: dof_handler.active_cell_iterators()) 
+    // {
+    //     if(cell->is_locally_owned())
+    //     {
+    //         std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+    //         cell->get_dof_indices(i);
+    //         const unsigned int cell_i = i[cell->get_fe().component_to_system_index(0, 0)];
+
+    //         for (const unsigned int j : density_filter.find_relevant_neighbors(cell_i)) {
+    //             double value = system_matrix.block(SolutionBlocks::unfiltered_density_multiplier,
+    //                                 SolutionBlocks::unfiltered_density).el(j,cell_i);
+
+    //             system_matrix.block(SolutionBlocks::unfiltered_density,
+    //                                 SolutionBlocks::unfiltered_density_multiplier).set(j, cell_i, value);
+    //         }
+    //     }
+    // }
+    // system_matrix.compress(VectorOperation::insert);
+
+
+    pcout << "assembled " << std::endl;
+
+}
+
+/// For use in the filter: calculates the objective value that we are working to minimize.
+template<int dim>
+double
+KktSystem<dim>::calculate_objective_value(const LA::MPI::BlockVector &distributed_state) const {
+    /*Remove any values from old iterations*/
 
-    template<int dim>
-    double
-    KktSystem<dim>::calculate_objective_value(const BlockVector<double> &state) const {
-        /*Remove any values from old iterations*/
+    locally_relevant_solution = distributed_state;
 
-        QGauss<dim> nine_quadrature(fe_nine.degree + 1);
-        QGauss<dim> ten_quadrature(fe_ten.degree + 1);
 
-        hp::QCollection<dim> q_collection;
-        q_collection.push_back(nine_quadrature);
-        q_collection.push_back(ten_quadrature);
+    QGauss<dim> nine_quadrature(fe_nine.degree + 1);
+    QGauss<dim> ten_quadrature(fe_ten.degree + 1);
 
-        hp::FEValues<dim> hp_fe_values(fe_collection,
-                                       q_collection,
-                                       update_values | update_quadrature_points |
-                                       update_JxW_values | update_gradients);
+    hp::QCollection<dim> q_collection;
+    q_collection.push_back(nine_quadrature);
+    q_collection.push_back(ten_quadrature);
 
-        QGauss<dim - 1> common_face_quadrature(fe_ten.degree + 1);
+    hp::FEValues<dim> hp_fe_values(fe_collection,
+                                   q_collection,
+                                   update_values | update_quadrature_points |
+                                   update_JxW_values | update_gradients);
 
-        FEFaceValues<dim> fe_nine_face_values(fe_nine,
-                                              common_face_quadrature,
-                                              update_JxW_values |
-                                              update_gradients | update_values);
-        FEFaceValues<dim> fe_ten_face_values(fe_ten,
-                                             common_face_quadrature,
-                                             update_normal_vectors |
-                                             update_values);
+    QGauss<dim - 1> common_face_quadrature(fe_ten.degree + 1);
 
-        FullMatrix<double> cell_matrix;
-        Vector<double> cell_rhs;
+    FEFaceValues<dim> fe_nine_face_values(fe_nine,
+                                          common_face_quadrature,
+                                          update_JxW_values |
+                                          update_gradients | update_values);
+    FEFaceValues<dim> fe_ten_face_values(fe_ten,
+                                         common_face_quadrature,
+                                         update_normal_vectors |
+                                         update_values);
 
-        const FEValuesExtractors::Vector displacements(SolutionComponents::displacement<dim>);
+    FullMatrix<double> cell_matrix;
+    Vector<double> cell_rhs;
 
-        Tensor<1, dim> traction;
-        traction[1] = -1;
+    const FEValuesExtractors::Vector displacements(SolutionComponents::displacement<dim>);
 
-        double objective_value = 0;
-        for (const auto &cell: dof_handler.active_cell_iterators()) {
+    Tensor<1, dim> traction;
+    traction[1] = -1;
+    distributed_solution = distributed_state;
+    double objective_value = 0;
+    for (const auto &cell: dof_handler.active_cell_iterators())
+    {
+        if(cell->is_locally_owned())
+        {
             hp_fe_values.reinit(cell);
             const FEValues<dim> &fe_values = hp_fe_values.get_present_fe_values();
             const unsigned int dofs_per_cell = cell->get_fe().n_dofs_per_cell();
@@ -1088,209 +1697,262 @@ namespace SAND {
 
             std::vector<Tensor<1, dim>> old_displacement_values(n_q_points);
             fe_values[displacements].get_function_values(
-                    state, old_displacement_values);
+                        locally_relevant_solution, old_displacement_values);
 
             for (unsigned int face_number = 0;
                  face_number < GeometryInfo<dim>::faces_per_cell;
-                 ++face_number) {
+                 ++face_number)
+            {
                 if (cell->face(face_number)->at_boundary() && cell->face(face_number)->boundary_id()
-                                                              == BoundaryIds::down_force) {
-
-
+                        == BoundaryIds::down_force)
+                {
                     for (unsigned int face_q_point = 0;
                          face_q_point < n_face_q_points; ++face_q_point) {
                         for (unsigned int i = 0; i < dofs_per_cell; ++i) {
                             if (cell->material_id() == MaterialIds::without_multiplier) {
                                 fe_nine_face_values.reinit(cell, face_number);
                                 objective_value += traction
-                                                   * fe_nine_face_values[displacements].value(i,
-                                                                                              face_q_point)
-                                                   * fe_nine_face_values.JxW(face_q_point);
+                                        * fe_nine_face_values[displacements].value(i,
+                                                                                   face_q_point)
+                                        * fe_nine_face_values.JxW(face_q_point);
                             } else {
                                 fe_ten_face_values.reinit(cell, face_number);
                                 objective_value += traction
-                                                   * fe_ten_face_values[displacements].value(i,
-                                                                                             face_q_point)
-                                                   * fe_ten_face_values.JxW(face_q_point);
+                                        * fe_ten_face_values[displacements].value(i,
+                                                                                  face_q_point)
+                                        * fe_ten_face_values.JxW(face_q_point);
                             }
                         }
                     }
                 }
-
             }
         }
-        return objective_value;
     }
+    // Each rank integrated only over its locally owned cells, so sum the per-rank partial values and return the global objective on every rank.
+    double objective_value_out = 0;
+    MPI_Allreduce(&objective_value, &objective_value_out, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+    return objective_value_out;
+}
 
 
-    //As the KKT System know which vectors correspond to the slack variables, the sum of the logs of the slacks is computed here for use in the filter.
-    template<int dim>
-    double
-    KktSystem<dim>::calculate_barrier_distance(const BlockVector<double> &state) const {
-        double barrier_distance_log_sum = 0;
-        unsigned int vect_size = state.block(SolutionBlocks::density_lower_slack).size();
-        for (unsigned int k = 0; k < vect_size; k++) {
+/// Returns the sum of log(lower slack) + log(upper slack) over all slack entries, reduced across MPI ranks. As the KKT system knows which blocks hold the slack variables, the sum of the logs of the slacks is computed here for use in the filter.
+template<int dim>
+double
+KktSystem<dim>::calculate_barrier_distance(const LA::MPI::BlockVector &state) const {
     double barrier_distance_log_sum = 0;
     unsigned int vect_size = state.block(SolutionBlocks::density_lower_slack).size();
+    distributed_solution = state; // copy into the member vector whose in_local_range() is queried below
+    for (unsigned int k = 0; k < vect_size; k++) {
+        if (distributed_solution.block(SolutionBlocks::density_lower_slack).in_local_range(k)) // each rank adds only the entries in its local range
             barrier_distance_log_sum += std::log(state.block(SolutionBlocks::density_lower_slack)[k]);
-        }
-        for (unsigned int k = 0; k < vect_size; k++) {
+    }
+    for (unsigned int k = 0; k < vect_size; k++) { // NOTE(review): reuses the lower-slack block size; assumes both slack blocks have equal size - confirm
+        if (distributed_solution.block(SolutionBlocks::density_upper_slack).in_local_range(k))
             barrier_distance_log_sum += std::log(state.block(SolutionBlocks::density_upper_slack)[k]);
-        }
-        return barrier_distance_log_sum;
     }
+    double out_barrier_distance_log_sum;
+    MPI_Allreduce(&barrier_distance_log_sum, &out_barrier_distance_log_sum, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD); // add up the per-rank partial sums
+
+    return out_barrier_distance_log_sum;
+}
+
+/// l2 norm of the right-hand side assembled by calculate_rhs() for @p state and @p barrier_size. This is not the KKT norm, but it is likewise expected to be 0 at a minimum.
+template<int dim>
+double KktSystem<dim>::calculate_rhs_norm(const LA::MPI::BlockVector &state, const double barrier_size) const {
+    const LA::MPI::BlockVector assembled_rhs = calculate_rhs(state, barrier_size);
+    return assembled_rhs.l2_norm();
+}
 
-    template<int dim>
-    double
-    KktSystem<dim>::calculate_rhs_norm(const BlockVector<double> &state, const double barrier_size) const {
-        return calculate_rhs(state, barrier_size).l2_norm();
-    }
 
+/// Returns a squared feasibility measure: the sum over k of (slack_k * multiplier_k)^2 for the upper and lower density slacks, plus the squared l2 norms of eight blocks of the RHS (no square root is taken). Feasibility conditions appear on the RHS of the linear system, so the RHS is computed via calculate_rhs(state, barrier_size) to find it. Could probably be combined with the objective value computation to make it faster.
+template<int dim>
+double
+KktSystem<dim>::calculate_feasibility(const LA::MPI::BlockVector &state, const double barrier_size) const {
+    LA::MPI::BlockVector test_rhs = calculate_rhs(state, barrier_size);
 
-    //Feasibility conditions appear on the RHS of the linear system, so I compute the RHS to find it. Could probably be combined with the objective value finding part to make it faster.
-    template<int dim>
-    double
-    KktSystem<dim>::calculate_feasibility(const BlockVector<double> &state, const double barrier_size) const {
-        BlockVector<double> test_rhs = calculate_rhs(state, barrier_size);
-//        double feasibility = 0;
-//        feasibility +=
-//                test_rhs.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm() +
-//                test_rhs.block(SolutionBlocks::density_lower_slack_multiplier).l2_norm() +
-//                test_rhs.block(SolutionBlocks::density_upper_slack_multiplier).l2_norm() +
-//                test_rhs.block(SolutionBlocks::displacement_multiplier).l2_norm() +
-//                test_rhs.block(SolutionBlocks::density_lower_slack).l2_norm() +
-//                test_rhs.block(SolutionBlocks::density_upper_slack).l2_norm() +
-//                test_rhs.block(SolutionBlocks::total_volume_multiplier).l2_norm()+
-//                test_rhs.block(SolutionBlocks::density).l2_norm()+
-//                test_rhs.block(SolutionBlocks::unfiltered_density).l2_norm()+
-//                test_rhs.block(SolutionBlocks::displacement).l2_norm();
-//        return feasibility;
-
-        double norm = 0;
-        norm += std::pow(test_rhs.block(SolutionBlocks::displacement).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::density).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::displacement_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::total_volume_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::density_upper_slack_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::density_lower_slack_multiplier).l2_norm(), 2);
-        for (unsigned int k = 0; k < state.block(SolutionBlocks::density_upper_slack).size(); k++) {
-            norm += state.block(SolutionBlocks::density_upper_slack)[k] *
-                    state.block(SolutionBlocks::density_upper_slack_multiplier)[k]
-                    * state.block(SolutionBlocks::density_upper_slack)[k] *
-                    state.block(SolutionBlocks::density_upper_slack_multiplier)[k];
+    double norm = 0;
+
+    distributed_solution = state; // NOTE(review): distributed_solution is not read again in this function; the loop below queries state directly
+    double full_prod1 =1;
+    double full_prod2 = 1;
+
+    for (unsigned int k = 0; k < state.block(SolutionBlocks::density_upper_slack).size(); k++) {
+        double prod1 = 1; // upper-slack product for index k; stays at 1 (neutral for MPI_PROD) on ranks holding neither factor
+        double prod2 = 1; // lower-slack product for index k, same convention
+        if(state.block(SolutionBlocks::density_upper_slack).in_local_range(k))
+        {
+            prod1 = prod1 * state.block(SolutionBlocks::density_upper_slack)[k]
+                    * state.block(SolutionBlocks::density_upper_slack)[k];
         }
-        for (unsigned int k = 0; k < state.block(SolutionBlocks::density_lower_slack).size(); k++) {
-            norm += state.block(SolutionBlocks::density_lower_slack)[k] *
-                    state.block(SolutionBlocks::density_lower_slack_multiplier)[k]
-                    * state.block(SolutionBlocks::density_lower_slack)[k] *
-                    state.block(SolutionBlocks::density_lower_slack_multiplier)[k];
+        if(state.block(SolutionBlocks::density_lower_slack).in_local_range(k))
+        {
+            prod2 = prod2 *  state.block(SolutionBlocks::density_lower_slack)[k]
+                    * state.block(SolutionBlocks::density_lower_slack)[k];
         }
-        return norm;
+        if(state.block(SolutionBlocks::density_upper_slack_multiplier).in_local_range(k))
+        {
+            prod1 = prod1 * state.block(SolutionBlocks::density_upper_slack_multiplier)[k]
+                    * state.block(SolutionBlocks::density_upper_slack_multiplier)[k];
+        }
+        if(state.block(SolutionBlocks::density_lower_slack_multiplier).in_local_range(k))
+        {
+            prod2 = prod2 *  state.block(SolutionBlocks::density_lower_slack_multiplier)[k]
+                    * state.block(SolutionBlocks::density_lower_slack_multiplier)[k];
+        }
+        MPI_Allreduce(&prod1, &full_prod1, 1, MPI_DOUBLE, MPI_PROD, MPI_COMM_WORLD); // multiplies the per-rank factors into slack^2 * multiplier^2, presumably with each index in exactly one rank's local range - confirm
+        MPI_Allreduce(&prod2, &full_prod2, 1, MPI_DOUBLE, MPI_PROD, MPI_COMM_WORLD); // NOTE(review): two collectives per index k, i.e. 2 * size() reductions per call
+        norm = norm + full_prod1 + full_prod2;
     }
 
-    template<int dim>
-    double
-    KktSystem<dim>::calculate_convergence(const BlockVector<double> &state) const {
-        BlockVector<double> test_rhs = calculate_rhs(state, Input::min_barrier_size);
-        double norm = 0;
-
-        norm += std::pow(test_rhs.block(SolutionBlocks::displacement).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::density).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::displacement_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::total_volume_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::density_upper_slack_multiplier).l2_norm(), 2);
-        norm += std::pow(test_rhs.block(SolutionBlocks::density_lower_slack_multiplier).l2_norm(), 2);
-
-        for (unsigned int k = 0; k < state.block(SolutionBlocks::density_upper_slack).size(); k++) {
-            norm += state.block(SolutionBlocks::density_upper_slack)[k] *
-                    state.block(SolutionBlocks::density_upper_slack_multiplier)[k]
-                    * state.block(SolutionBlocks::density_upper_slack)[k] *
-                    state.block(SolutionBlocks::density_upper_slack_multiplier)[k];
+    norm += std::pow(test_rhs.block(SolutionBlocks::displacement).l2_norm(), 2); // add the squared l2 norm of each listed RHS block
+    norm += std::pow(test_rhs.block(SolutionBlocks::density).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::displacement_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::total_volume_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::density_upper_slack_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::density_lower_slack_multiplier).l2_norm(), 2);
+
+    return norm;
+}
+
+/// Calculates the KKT norm of the system, representing how close the program is to convergence: the square root of the sum over k of (slack_k * multiplier_k)^2 for both density slacks plus the squared l2 norms of eight blocks of the RHS evaluated at Input::min_barrier_size. The value is printed through pcout and returned.
+template<int dim>
+double
+KktSystem<dim>::calculate_convergence(const LA::MPI::BlockVector &state) const {
+    LA::MPI::BlockVector test_rhs = calculate_rhs(state, Input::min_barrier_size);
+    double norm = 0;
+
+    distributed_solution = state; // NOTE(review): distributed_solution is not read again in this function; the loop below queries state directly
+    double full_prod1 =1;
+    double full_prod2 = 1;
+
+    for (unsigned int k = 0; k < state.block(SolutionBlocks::density_upper_slack).size(); k++) {
+        double prod1 = 1; // upper-slack product for index k; stays at 1 (neutral for MPI_PROD) on ranks holding neither factor
+        double prod2 = 1; // lower-slack product for index k, same convention
+        if(state.block(SolutionBlocks::density_upper_slack).in_local_range(k))
+        {
+            prod1 = prod1 * state.block(SolutionBlocks::density_upper_slack)[k]
+                    * state.block(SolutionBlocks::density_upper_slack)[k];
         }
-        for (unsigned int k = 0; k < state.block(SolutionBlocks::density_lower_slack).size(); k++) {
-            norm += state.block(SolutionBlocks::density_lower_slack)[k] *
-                    state.block(SolutionBlocks::density_lower_slack_multiplier)[k]
-                    * state.block(SolutionBlocks::density_lower_slack)[k] *
-                    state.block(SolutionBlocks::density_lower_slack_multiplier)[k];
+        if(state.block(SolutionBlocks::density_lower_slack).in_local_range(k))
+        {
+            prod2 = prod2 *  state.block(SolutionBlocks::density_lower_slack)[k]
+                    * state.block(SolutionBlocks::density_lower_slack)[k];
         }
-        norm = std::pow(norm, .5);
-
-        std::cout << "l2 norm: " << system_rhs.l2_norm() << std::endl;
-        std::cout << "KKT norm: " << norm << std::endl;
-        return norm;
+        if(state.block(SolutionBlocks::density_upper_slack_multiplier).in_local_range(k))
+        {
+            prod1 = prod1 * state.block(SolutionBlocks::density_upper_slack_multiplier)[k]
+                    * state.block(SolutionBlocks::density_upper_slack_multiplier)[k];
+        }
+        if(state.block(SolutionBlocks::density_lower_slack_multiplier).in_local_range(k))
+        {
+            prod2 = prod2 *  state.block(SolutionBlocks::density_lower_slack_multiplier)[k]
+                    * state.block(SolutionBlocks::density_lower_slack_multiplier)[k];
+        }
+        MPI_Allreduce(&prod1, &full_prod1, 1, MPI_DOUBLE, MPI_PROD, MPI_COMM_WORLD); // multiplies the per-rank factors into slack^2 * multiplier^2, presumably with each index in exactly one rank's local range - confirm
+        MPI_Allreduce(&prod2, &full_prod2, 1, MPI_DOUBLE, MPI_PROD, MPI_COMM_WORLD); // NOTE(review): two collectives per index k, i.e. 2 * size() reductions per call
+        norm = norm + full_prod1 + full_prod2;
     }
 
-    template<int dim>
-    BlockVector<double>
-    KktSystem<dim>::calculate_rhs(const BlockVector<double> &state, const double barrier_size) const {
-        BlockVector<double> test_rhs;
-        test_rhs = system_rhs;
-        test_rhs = 0;
-
-
-        QGauss<dim> nine_quadrature(fe_nine.degree + 1);
-        QGauss<dim> ten_quadrature(fe_ten.degree + 1);
-
-        hp::QCollection<dim> q_collection;
-        q_collection.push_back(nine_quadrature);
-        q_collection.push_back(ten_quadrature);
-
-        hp::FEValues<dim> hp_fe_values(fe_collection,
-                                       q_collection,
-                                       update_values | update_quadrature_points |
-                                       update_JxW_values | update_gradients);
-
-        QGauss<dim - 1> common_face_quadrature(fe_ten.degree + 1);
-
-        FEFaceValues<dim> fe_nine_face_values(fe_nine,
-                                              common_face_quadrature,
-                                              update_JxW_values |
-                                              update_gradients | update_values);
-        FEFaceValues<dim> fe_ten_face_values(fe_ten,
-                                             common_face_quadrature,
-                                             update_normal_vectors |
-                                             update_values);
-
-        FullMatrix<double> cell_matrix;
-        Vector<double> cell_rhs;
-        std::vector<types::global_dof_index> local_dof_indices;
-
-        const FEValuesExtractors::Scalar densities(SolutionComponents::density<dim>);
-        const FEValuesExtractors::Vector displacements(SolutionComponents::displacement<dim>);
-        const FEValuesExtractors::Scalar unfiltered_densities(SolutionComponents::unfiltered_density<dim>);
-        const FEValuesExtractors::Vector displacement_multipliers(SolutionComponents::displacement_multiplier<dim>);
-        const FEValuesExtractors::Scalar unfiltered_density_multipliers(
+
+    norm += std::pow(test_rhs.block(SolutionBlocks::displacement).l2_norm(), 2); // add the squared l2 norm of each listed RHS block
+    norm += std::pow(test_rhs.block(SolutionBlocks::density).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::displacement_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::total_volume_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::density_upper_slack_multiplier).l2_norm(), 2);
+    norm += std::pow(test_rhs.block(SolutionBlocks::density_lower_slack_multiplier).l2_norm(), 2);
+
+    norm = std::pow(norm, .5); // square root of the accumulated sum of squares
+
+    pcout << "KKT norm: " << norm << std::endl;
+    return norm;
+}
+
+/// Makes the RHS of the KKT equations
+template<int dim>
+LA::MPI::BlockVector
+KktSystem<dim>::calculate_rhs(const LA::MPI::BlockVector &distributed_state, const double barrier_size) const {
+    LA::MPI::BlockVector test_rhs (system_rhs);
+    LA::MPI::BlockVector state (locally_relevant_solution);
+    state = distributed_state;
+    test_rhs = 0.;
+
+    QGauss<dim> nine_quadrature(fe_nine.degree + 1);
+    QGauss<dim> ten_quadrature(fe_ten.degree + 1);
+
+    hp::QCollection<dim> q_collection;
+    q_collection.push_back(nine_quadrature);
+    q_collection.push_back(ten_quadrature);
+
+    hp::FEValues<dim> hp_fe_values(fe_collection,
+                                   q_collection,
+                                   update_values | update_quadrature_points |
+                                   update_JxW_values | update_gradients);
+
+    QGauss<dim - 1> common_face_quadrature(fe_ten.degree + 1);
+
+    FEFaceValues<dim> fe_nine_face_values(fe_nine,
+                                          common_face_quadrature,
+                                          update_JxW_values |
+                                          update_gradients | update_values);
+    FEFaceValues<dim> fe_ten_face_values(fe_ten,
+                                         common_face_quadrature,
+                                         update_normal_vectors |
+                                         update_values);
+
+    FullMatrix<double> cell_matrix;
+    Vector<double> cell_rhs;
+    std::vector<types::global_dof_index> local_dof_indices;
+
+    const FEValuesExtractors::Scalar densities(SolutionComponents::density<dim>);
+    const FEValuesExtractors::Vector displacements(SolutionComponents::displacement<dim>);
+    const FEValuesExtractors::Scalar unfiltered_densities(SolutionComponents::unfiltered_density<dim>);
+    const FEValuesExtractors::Vector displacement_multipliers(SolutionComponents::displacement_multiplier<dim>);
+    const FEValuesExtractors::Scalar unfiltered_density_multipliers(
                 SolutionComponents::unfiltered_density_multiplier<dim>);
-        const FEValuesExtractors::Scalar density_lower_slacks(SolutionComponents::density_lower_slack<dim>);
-        const FEValuesExtractors::Scalar density_lower_slack_multipliers(
+    const FEValuesExtractors::Scalar density_lower_slacks(SolutionComponents::density_lower_slack<dim>);
+    const FEValuesExtractors::Scalar density_lower_slack_multipliers(
                 SolutionComponents::density_lower_slack_multiplier<dim>);
-        const FEValuesExtractors::Scalar density_upper_slacks(SolutionComponents::density_upper_slack<dim>);
-        const FEValuesExtractors::Scalar density_upper_slack_multipliers(
+    const FEValuesExtractors::Scalar density_upper_slacks(SolutionComponents::density_upper_slack<dim>);
+    const FEValuesExtractors::Scalar density_upper_slack_multipliers(
                 SolutionComponents::density_upper_slack_multiplier<dim>);
-        const FEValuesExtractors::Scalar total_volume_multiplier(
+    const FEValuesExtractors::Scalar total_volume_multiplier(
                 SolutionComponents::total_volume_multiplier<dim>);
 
 
-        const unsigned int n_face_q_points = common_face_quadrature.size();
+    const unsigned int n_face_q_points = common_face_quadrature.size();
+
+    const Functions::ConstantFunction<dim> lambda(1.), mu(1.);
 
-        const Functions::ConstantFunction<dim> lambda(1.), mu(1.);
+    locally_relevant_solution = state;
+    distributed_solution = state;
+    LA::MPI::BlockVector filtered_unfiltered_density_solution (distributed_solution);
+    LA::MPI::BlockVector filter_adjoint_unfiltered_density_multiplier_solution (distributed_solution);
+    filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density) = 0;
+    filter_adjoint_unfiltered_density_multiplier_solution.block(SolutionBlocks::unfiltered_density_multiplier) = 0;
 
-        BlockVector<double> filtered_unfiltered_density_solution = state;
-        BlockVector<double> filter_adjoint_unfiltered_density_multiplier_solution = state;
-        filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density) = 0;
-        filter_adjoint_unfiltered_density_multiplier_solution.block(SolutionBlocks::unfiltered_density_multiplier) = 0;
+    density_filter.filter_matrix.vmult(filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density),distributed_solution.block(SolutionBlocks::unfiltered_density));
+    density_filter.filter_matrix_transpose.vmult(filter_adjoint_unfiltered_density_multiplier_solution.block(SolutionBlocks::unfiltered_density_multiplier),distributed_solution.block(SolutionBlocks::unfiltered_density_multiplier));
 
-        density_filter.filter_matrix.vmult(
-                filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density),
-                state.block(SolutionBlocks::unfiltered_density));
-        density_filter.filter_matrix.Tvmult(filter_adjoint_unfiltered_density_multiplier_solution.block(
-                                                    SolutionBlocks::unfiltered_density_multiplier),
-                                            state.block(SolutionBlocks::unfiltered_density_multiplier));
-        const double old_volume_multiplier = state.block(SolutionBlocks::total_volume_multiplier)[0];
+    LA::MPI::BlockVector relevant_filtered_unfiltered_density_solution (locally_relevant_solution);
+    LA::MPI::BlockVector relevant_filter_adjoint_unfiltered_density_multiplier_solution (locally_relevant_solution);
+    relevant_filtered_unfiltered_density_solution = filtered_unfiltered_density_solution;
+    relevant_filter_adjoint_unfiltered_density_multiplier_solution = filter_adjoint_unfiltered_density_multiplier_solution;
 
-        for (const auto &cell: dof_handler.active_cell_iterators()) {
+    double old_volume_multiplier_temp = 0;
+    double old_volume_multiplier;
+    if(distributed_state.block(SolutionBlocks::total_volume_multiplier).in_local_range(0))
+    {
+        old_volume_multiplier_temp = state.block(SolutionBlocks::total_volume_multiplier)[0];
+    }
+    MPI_Allreduce(&old_volume_multiplier_temp, &old_volume_multiplier, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+
+    for (const auto &cell: dof_handler.active_cell_iterators()) {
+        if(cell->is_locally_owned())
+        {
             hp_fe_values.reinit(cell);
             const FEValues<dim> &fe_values = hp_fe_values.get_present_fe_values();
             cell_matrix.reinit(cell->get_fe().n_dofs_per_cell(),
@@ -1303,12 +1965,12 @@ namespace SAND {
             std::vector<Tensor<1, dim>> old_displacement_values(n_q_points);
             std::vector<double> old_displacement_divs(n_q_points);
             std::vector<SymmetricTensor<2, dim>> old_displacement_symmgrads(
-                    n_q_points);
+                        n_q_points);
             std::vector<Tensor<1, dim>> old_displacement_multiplier_values(
-                    n_q_points);
+                        n_q_points);
             std::vector<double> old_displacement_multiplier_divs(n_q_points);
             std::vector<SymmetricTensor<2, dim>> old_displacement_multiplier_symmgrads(
-                    n_q_points);
+                        n_q_points);
             std::vector<double> old_lower_slack_multiplier_values(n_q_points);
             std::vector<double> old_upper_slack_multiplier_values(n_q_points);
             std::vector<double> old_lower_slack_values(n_q_points);
@@ -1338,30 +2000,30 @@ namespace SAND {
             fe_values[displacements].get_function_divergences(state,
                                                               old_displacement_divs);
             fe_values[displacements].get_function_symmetric_gradients(
-                    state, old_displacement_symmgrads);
+                        state, old_displacement_symmgrads);
             fe_values[displacement_multipliers].get_function_values(
-                    state, old_displacement_multiplier_values);
+                        state, old_displacement_multiplier_values);
             fe_values[displacement_multipliers].get_function_divergences(
-                    state, old_displacement_multiplier_divs);
+                        state, old_displacement_multiplier_divs);
             fe_values[displacement_multipliers].get_function_symmetric_gradients(
-                    state, old_displacement_multiplier_symmgrads);
+                        state, old_displacement_multiplier_symmgrads);
             fe_values[density_lower_slacks].get_function_values(
-                    state, old_lower_slack_values);
+                        state, old_lower_slack_values);
             fe_values[density_lower_slack_multipliers].get_function_values(
-                    state, old_lower_slack_multiplier_values);
+                        state, old_lower_slack_multiplier_values);
             fe_values[density_upper_slacks].get_function_values(
-                    state, old_upper_slack_values);
+                        state, old_upper_slack_values);
             fe_values[density_upper_slack_multipliers].get_function_values(
-                    state, old_upper_slack_multiplier_values);
+                        state, old_upper_slack_multiplier_values);
             fe_values[unfiltered_densities].get_function_values(
-                    state, old_unfiltered_density_values);
+                        state, old_unfiltered_density_values);
             fe_values[unfiltered_density_multipliers].get_function_values(
-                    state, old_unfiltered_density_multiplier_values);
+                        state, old_unfiltered_density_multiplier_values);
             fe_values[unfiltered_densities].get_function_values(
-                    filtered_unfiltered_density_solution, filtered_unfiltered_density_values);
+                        relevant_filtered_unfiltered_density_solution, filtered_unfiltered_density_values);
             fe_values[unfiltered_density_multipliers].get_function_values(
-                    filter_adjoint_unfiltered_density_multiplier_solution,
-                    filter_adjoint_unfiltered_density_multiplier_values);
+                        relevant_filter_adjoint_unfiltered_density_multiplier_solution,
+                        filter_adjoint_unfiltered_density_multiplier_values);
 
 
             Tensor<1, dim> traction;
@@ -1388,7 +2050,7 @@ namespace SAND {
                     const double unfiltered_density_phi_i = fe_values[unfiltered_densities].value(i,
                                                                                                   q_point);
                     const double unfiltered_density_multiplier_phi_i = fe_values[unfiltered_density_multipliers].value(
-                            i, q_point);
+                                i, q_point);
 
                     const double lower_slack_multiplier_phi_i =
                             fe_values[density_lower_slack_multipliers].value(i,
@@ -1404,72 +2066,75 @@ namespace SAND {
                             fe_values[density_upper_slack_multipliers].value(i,
                                                                              q_point);
 
-
                     //rhs eqn 0
                     cell_rhs(i) +=
                             -1 * fe_values.JxW(q_point) * (
-                                    -1 * density_penalty_exponent *
-                                    std::pow(old_density_values[q_point], density_penalty_exponent - 1) * density_phi_i
-                                    * (old_displacement_multiplier_divs[q_point] * old_displacement_divs[q_point]
-                                       * lambda_values[q_point]
-                                       + 2 * mu_values[q_point] * (old_displacement_symmgrads[q_point]
-                                                                   * old_displacement_multiplier_symmgrads[q_point]))
-                                    - density_phi_i * old_unfiltered_density_multiplier_values[q_point]
-                                    + old_volume_multiplier * density_phi_i
-                            );
+                                -1 * density_penalty_exponent *
+                                std::pow(old_density_values[q_point], density_penalty_exponent - 1) * density_phi_i
+                                * (old_displacement_multiplier_divs[q_point] * old_displacement_divs[q_point]
+                                   * lambda_values[q_point]
+                                   + 2 * mu_values[q_point] * (old_displacement_symmgrads[q_point]
+                                                               * old_displacement_multiplier_symmgrads[q_point]))
+                                - density_phi_i * old_unfiltered_density_multiplier_values[q_point]
+                                + old_volume_multiplier * density_phi_i
+                                );
 
                     //rhs eqn 1 - boundary terms counted later
                     cell_rhs(i) +=
-                            -1 * fe_values.JxW(q_point) * (
-                                    -1 * std::pow(old_density_values[q_point], density_penalty_exponent)
-                                    * (old_displacement_multiplier_divs[q_point] * displacement_phi_i_div
-                                       * lambda_values[q_point]
-                                       + 2 * mu_values[q_point] * (old_displacement_multiplier_symmgrads[q_point]
-                                                                   * displacement_phi_i_symmgrad))
-                            );
+                            -1 * fe_values.JxW(q_point)
+                            * (
+                                -1 * std::pow(old_density_values[q_point], density_penalty_exponent)
+                                * (
+                                    old_displacement_multiplier_divs[q_point] * displacement_phi_i_div
+                                    * lambda_values[q_point]
+                                    + 2 * mu_values[q_point] * (old_displacement_multiplier_symmgrads[q_point]
+                                                               * displacement_phi_i_symmgrad)
+                                   )
+                                );
 
                     //rhs eqn 2
                     cell_rhs(i) +=
                             -1 * fe_values.JxW(q_point) * (
-                                    unfiltered_density_phi_i *
-                                    filter_adjoint_unfiltered_density_multiplier_values[q_point]
-                                    + unfiltered_density_phi_i * old_upper_slack_multiplier_values[q_point]
-                                    + -1 * unfiltered_density_phi_i * old_lower_slack_multiplier_values[q_point]
-                            );
-
-
-
+                                unfiltered_density_phi_i *
+                                filter_adjoint_unfiltered_density_multiplier_values[q_point]
+                                + unfiltered_density_phi_i * old_upper_slack_multiplier_values[q_point]
+                                + -1 * unfiltered_density_phi_i * old_lower_slack_multiplier_values[q_point]
+                                );
 
                     //rhs eqn 3 - boundary terms counted later
                     cell_rhs(i) +=
                             -1 * fe_values.JxW(q_point) * (
-                                    -1 * std::pow(old_density_values[q_point], density_penalty_exponent)
-                                    * (old_displacement_divs[q_point] * displacement_multiplier_phi_i_div
-                                       * lambda_values[q_point]
-                                       + 2 * mu_values[q_point] * (displacement_multiplier_phi_i_symmgrad
-                                                                   * old_displacement_symmgrads[q_point]))
-                            );
+                                -1 * std::pow(old_density_values[q_point], density_penalty_exponent)
+                                * (old_displacement_divs[q_point] * displacement_multiplier_phi_i_div
+                                   * lambda_values[q_point]
+                                   + 2 * mu_values[q_point] * (displacement_multiplier_phi_i_symmgrad
+                                                               * old_displacement_symmgrads[q_point]))
+                                );
 
                     //rhs eqn 4
                     cell_rhs(i) +=
                             -1 * fe_values.JxW(q_point) *
                             (-1 * lower_slack_multiplier_phi_i
                              * (old_unfiltered_density_values[q_point] - old_lower_slack_values[q_point])
-                            );
+                             );
 
                     //rhs eqn 5
                     cell_rhs(i) +=
                             -1 * fe_values.JxW(q_point) * (
-                                    -1 * upper_slack_multiplier_phi_i
-                                    * (1 - old_unfiltered_density_values[q_point]
-                                       - old_upper_slack_values[q_point]));
+                                -1 * upper_slack_multiplier_phi_i
+                                * (1 - old_unfiltered_density_values[q_point]
+                                   - old_upper_slack_values[q_point]));
 
                     //rhs eqn 6
-                    cell_rhs(i) +=
+                    if (std::abs(old_density_values[q_point] - filtered_unfiltered_density_values[q_point])>1e-12)
+                    {
+                        cell_rhs(i) +=
                             -1 * fe_values.JxW(q_point) * (
-                                    -1 * unfiltered_density_multiplier_phi_i
-                                    * (old_density_values[q_point] - filtered_unfiltered_density_values[q_point])
-                            );
+                                -1 * unfiltered_density_multiplier_phi_i
+                                * (old_density_values[q_point] - filtered_unfiltered_density_values[q_point])
+                                );
+                    }
+
 
                     //rhs eqn 7
                     cell_rhs(i) +=
@@ -1489,39 +2154,38 @@ namespace SAND {
 
             }
 
-
             for (unsigned int face_number = 0;
                  face_number < GeometryInfo<dim>::faces_per_cell;
                  ++face_number) {
                 if (cell->face(face_number)->at_boundary() && cell->face(
-                        face_number)->boundary_id() == BoundaryIds::down_force) {
+                            face_number)->boundary_id() == BoundaryIds::down_force) {
                     for (unsigned int face_q_point = 0;
                          face_q_point < n_face_q_points; ++face_q_point) {
                         for (unsigned int i = 0; i < dofs_per_cell; ++i) {
                             if (cell->material_id() == MaterialIds::without_multiplier) {
                                 fe_nine_face_values.reinit(cell, face_number);
                                 cell_rhs(i) += -1
-                                               * traction
-                                               * fe_nine_face_values[displacements].value(i,
-                                                                                          face_q_point)
-                                               * fe_nine_face_values.JxW(face_q_point);
+                                        * traction
+                                        * fe_nine_face_values[displacements].value(i,
+                                                                                   face_q_point)
+                                        * fe_nine_face_values.JxW(face_q_point);
 
                                 cell_rhs(i) += -1 * traction
-                                               * fe_nine_face_values[displacement_multipliers].value(
-                                        i, face_q_point)
-                                               * fe_nine_face_values.JxW(face_q_point);
+                                        * fe_nine_face_values[displacement_multipliers].value(
+                                            i, face_q_point)
+                                        * fe_nine_face_values.JxW(face_q_point);
                             } else {
                                 fe_ten_face_values.reinit(cell, face_number);
                                 cell_rhs(i) += -1
-                                               * traction
-                                               * fe_ten_face_values[displacements].value(i,
-                                                                                         face_q_point)
-                                               * fe_ten_face_values.JxW(face_q_point);
+                                        * traction
+                                        * fe_ten_face_values[displacements].value(i,
+                                                                                  face_q_point)
+                                        * fe_ten_face_values.JxW(face_q_point);
 
                                 cell_rhs(i) += -1 * traction
-                                               * fe_ten_face_values[displacement_multipliers].value(
-                                        i, face_q_point)
-                                               * fe_ten_face_values.JxW(face_q_point);
+                                        * fe_ten_face_values[displacement_multipliers].value(
+                                            i, face_q_point)
+                                        * fe_ten_face_values.JxW(face_q_point);
                             }
                         }
                     }
@@ -1531,321 +2195,818 @@ namespace SAND {
 
             MatrixTools::local_apply_boundary_values(boundary_values, local_dof_indices,
                                                      cell_matrix, cell_rhs, true);
-
             constraints.distribute_local_to_global(
-                    cell_rhs, local_dof_indices, test_rhs);
-
+                        cell_rhs, local_dof_indices, test_rhs);
         }
+    }
+
+    test_rhs.compress(VectorOperation::add);
+    double total_volume_temp = 0;
+    double goal_volume_temp = 0;
+    double total_volume, goal_volume;
 
-        double total_volume = 0;
-        double goal_volume = 0;
-        for (const auto &cell: dof_handler.active_cell_iterators()) {
-            total_volume += cell->measure() * state.block(SolutionBlocks::density)[cell->active_cell_index()];
-            goal_volume += cell->measure() * Input::volume_percentage;
+    distributed_solution = state;
+    for (const auto &cell: dof_handler.active_cell_iterators()) {
+        if(cell->is_locally_owned())
+        {
+            std::vector<unsigned int> i(cell->get_fe().n_dofs_per_cell());
+            cell->get_dof_indices(i);
+            if (distributed_solution.block(SolutionBlocks::density).in_local_range(i[cell->get_fe().component_to_system_index(0, 0)]))
+            {
+                total_volume_temp += cell->measure() * state.block(SolutionBlocks::density)[i[cell->get_fe().component_to_system_index(0, 0)]];
+                goal_volume_temp += cell->measure() * Input::volume_percentage;
+            }
         }
+    }
 
-        test_rhs.block(SolutionBlocks::total_volume_multiplier)[0] = goal_volume - total_volume;
+    MPI_Allreduce(&total_volume_temp, &total_volume, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+    MPI_Allreduce(&goal_volume_temp, &goal_volume, 1, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
 
-        return test_rhs;
 
+    if (test_rhs.block(SolutionBlocks::total_volume_multiplier).in_local_range(0))
+    {
+        test_rhs.block(SolutionBlocks::total_volume_multiplier)[0] = goal_volume - total_volume;
     }
+    test_rhs.compress(VectorOperation::insert);
+
+    return test_rhs;
 
+}
 
-    ///A  direct solver, for now. The complexity of the system means that an iterative solver algorithm will take some more work in the future.
-    template<int dim>
-    BlockVector<double>
-    KktSystem<dim>::solve(const BlockVector<double> &state, double barrier_size) {
-        constraints.condense(system_matrix);
-        double gmres_tolerance;
-        if (Input::use_eisenstat_walker) {
-            gmres_tolerance = std::max(
+///Solves the full KKT linear system to obtain the Newton step
+template<int dim>
+LA::MPI::BlockVector
+KktSystem<dim>::solve(const LA::MPI::BlockVector &state) {
+    double gmres_tolerance;
+    if (Input::use_eisenstat_walker) {
+        gmres_tolerance = std::max(
                     std::min(
-                            .1 * system_rhs.l2_norm() / (initial_rhs_error),
-                            .001
-                    ),
+                        .1 * system_rhs.l2_norm() / (initial_rhs_error),
+                        .001
+                        ),
                     Input::default_gmres_tolerance);
-        } else {
-            gmres_tolerance = Input::default_gmres_tolerance;
+    }
+    else {
+        gmres_tolerance = Input::default_gmres_tolerance*system_rhs.l2_norm();
+    }
+
+
+    locally_relevant_solution=state;
+    distributed_solution = state;
+
+    SolverControl solver_control(10000, gmres_tolerance);
+
+    // ************ BEGIN MAKING MF GMG ELASTICITY PRECONDITIONER ***************************
+    using SystemMFMatrixType = MF_Elasticity_Operator<dim, 1, double>;
+    using LevelMFMatrixType = MF_Elasticity_Operator<dim, 1, double>;
+
+    elasticity_matrix_mf.clear();
+    mg_matrices.clear_elements();
+
+    std::map< types::global_dof_index, Point< dim > > support_points;
+    std::map< types::global_dof_index, Point< dim > > support_points_displacement;
+
+    MappingQGeneric<dim,dim> generic_map_displacement(1);
+    MappingQGeneric<dim,dim> generic_map_1(1);
+    MappingQGeneric<dim,dim> generic_map_2(1);
+
+    hp::MappingCollection< dim, dim > hp_generic_map;
+
+    hp_generic_map.push_back(generic_map_1);
+    hp_generic_map.push_back(generic_map_2);
+
+    DoFTools::map_dofs_to_support_points(generic_map_displacement, dof_handler_displacement, support_points_displacement);
+    DoFTools::map_dofs_to_support_points(hp_generic_map, dof_handler, support_points);
+
+
+    const types::global_dof_index disp_mult_start_index = system_matrix.get_row_indices().block_start(SolutionBlocks::displacement_multiplier);
+
+    for (const auto &support_points_displacement_pair : support_points_displacement)
+    {
+        if (support_points_displacement_pair.second != support_points[support_points_displacement_pair.first+disp_mult_start_index])
+            pcout << "d = " << support_points_displacement_pair.first << ", points are " << support_points_displacement_pair.second << " and " << support_points[support_points_displacement_pair.first+disp_mult_start_index] << std::endl;
+    }
+
+    MPI_Barrier(MPI_COMM_WORLD);
+
+    std::vector<IndexSet> locally_owned_dofs = Utilities::MPI::all_gather(mpi_communicator, dof_handler_displacement.locally_owned_dofs());
+    IndexSet locally_active_dofs;
+    DoFTools::extract_locally_active_dofs(dof_handler_displacement, locally_active_dofs);
+    IndexSet locally_relevant_dofs;
+    DoFTools::extract_locally_relevant_dofs(dof_handler_displacement, locally_relevant_dofs);
+   // AffineConstraints<double> temp_displacement_constraints;
+    
+    
+
+    displacement_constraints.clear();
+    displacement_constraints.reinit(locally_relevant_dofs); //FIXME SHOULD THIS BE RELEVANT???
+    displacement_constraints.copy_from(mg_level_constraints[triangulation.n_global_levels()-1]);
+    std::cout << "displacement constraint number: " << displacement_constraints.n_constraints() <<std::endl;
+    displacement_constraints.close();
+    {
+        typename MatrixFree<dim, double>::AdditionalData additional_data;
+        additional_data.tasks_parallel_scheme =
+                MatrixFree<dim, double>::AdditionalData::none;
+        additional_data.mapping_update_flags =
+                (update_gradients | update_JxW_values | update_quadrature_points);
+        std::shared_ptr<MatrixFree<dim, double>> system_mf_storage(
+                    new MatrixFree<dim, double>());
+        system_mf_storage->reinit(generic_map_1,
+                                  dof_handler_displacement,
+                                  displacement_constraints,
+                                  QGauss<1>(fe_displacement.degree + 1),
+                                  additional_data);
+        elasticity_matrix_mf.initialize(system_mf_storage);
+    }
+
+
+    LinearAlgebra::distributed::Vector<double> distributed_displacement_sol;
+    LinearAlgebra::distributed::Vector<double> distributed_displacement_rhs;
+
+    elasticity_matrix_mf.initialize_dof_vector(distributed_displacement_sol);
+    elasticity_matrix_mf.initialize_dof_vector(distributed_displacement_rhs);
+
+    ChangeVectorTypes::copy_from_system_to_displacement_vector<double>(distributed_displacement_sol,distributed_solution.block(SolutionBlocks::displacement),displacement_to_system_dof_index_map);
+
+    ChangeVectorTypes::copy_from_system_to_displacement_vector<double>(distributed_displacement_rhs,system_rhs.block(SolutionBlocks::displacement),displacement_to_system_dof_index_map);
+
+    const unsigned int n_levels = triangulation.n_global_levels();
+    mg_matrices.resize(0, n_levels - 1);
+
+    mg_constrained_dofs.clear();
+    mg_constrained_dofs.initialize(dof_handler_displacement);
+    const std::set<types::boundary_id> empty_boundary_set;
+    // mg_constrained_dofs.make_zero_boundary_constraints(dof_handler_displacement,empty_boundary_set);
+
+
+    for (unsigned int level = 0; level < n_levels; ++level)
+    {
+        mg_constrained_dofs.add_user_constraints(level, mg_level_constraints[level]);
+    }
+
+    // for (unsigned int level = 0; level < n_levels; ++level)
+    // {
+    //     mg_level_constraints[level].print(std::cout);
+    // }
+
+    for (unsigned int level = 0; level < n_levels; ++level)
+    {
+        IndexSet relevant_dofs;
+        DoFTools::extract_locally_relevant_level_dofs(dof_handler_displacement,
+                                                      level,
+                                                      relevant_dofs);
+
+        typename MatrixFree<dim, double>::AdditionalData additional_data;
+        additional_data.tasks_parallel_scheme =
+                MatrixFree<dim, double>::AdditionalData::none;
+        additional_data.mapping_update_flags =
+                (update_gradients | update_JxW_values | update_quadrature_points);
+        additional_data.mg_level = level;
+
+        std::shared_ptr<MatrixFree<dim, double>> mg_mf_storage_level(
+                    new MatrixFree<dim, double>());
+        mg_mf_storage_level->reinit(generic_map_1,
+                                    dof_handler_displacement,
+                                    mg_level_constraints[level],
+                                    QGauss<1>(fe_displacement.degree + 1),
+                                    additional_data);
+
+        mg_matrices[level].clear();
+        mg_matrices[level].initialize(mg_mf_storage_level,
+                                      mg_constrained_dofs,
+                                      level);
+    }
+
+
+    //+++++++++++++++++++++++++EVALUATE MATRIX LEVEL DENSITIES HERE +++++++++++++++++++++++++++++++++++++
+
+
+    dof_handler_density.distribute_dofs(fe_density);
+
+    DoFRenumbering::component_wise(dof_handler_density);
+    DoFRenumbering::hierarchical(dof_handler_density);
+
+    dof_handler_density.distribute_mg_dofs();
+
+    active_density_vector.reinit(dof_handler_density.locally_owned_dofs(),triangulation.get_communicator());
+
+    ChangeVectorTypes::copy(active_density_vector,distributed_solution.block(SolutionBlocks::density));
+
+
+    const unsigned int n_cells = elasticity_matrix_mf.get_matrix_free()->n_cell_batches();
+    // {
+        
+
+    //     QGauss<dim> nine_quadrature(2);
+    //     QGauss<dim> ten_quadrature(2);
+
+    //     hp::QCollection<dim> q_collection;
+    //     q_collection.push_back(nine_quadrature);
+    //     q_collection.push_back(ten_quadrature);
+
+    //     hp::FEValues<dim> hp_fe_values(fe_collection,
+    //                                    q_collection,
+    //                                    update_values | update_quadrature_points |
+    //                                    update_JxW_values | update_gradients);
+
+
+
+    //     for (const auto &cell : dof_handler.active_cell_iterators())
+    //         if (cell->is_locally_owned())
+    //         {
+
+    //             hp_fe_values.reinit(cell);
+    //             const FEValues<dim> &fe_values = hp_fe_values.get_present_fe_values();
+
+    //             const unsigned int dofs_per_cell = fe_values.dofs_per_cell;
+    //             const unsigned int n_q_points = fe_values.n_quadrature_points;
+
+    //             std::vector<types::global_dof_index> local_dof_indices (dofs_per_cell);
+    //             cell->get_dof_indices (local_dof_indices);
+    //             Vector<double> cell_vector (dofs_per_cell);
+    //             Vector<double> local_projection (dofs_per_cell);
+    //             FullMatrix<double> local_mass_matrix (dofs_per_cell, dofs_per_cell);
+
+    //             std::vector<double> rhs_values(n_q_points);
+    //             std::vector<double> old_density_values(n_q_points);
+
+    //             const FEValuesExtractors::Scalar densities(SolutionComponents::density<dim>);
+    //             fe_values[densities].get_function_values(locally_relevant_solution, old_density_values);
+    //             double cell_density = old_density_values[0];
+
+    //             for (unsigned int i=0; i<rhs_values.size(); ++i)
+    //             {
+    //                 rhs_values[i] = cell_density;
+    //             }
+
+    //             local_projection = cell_density;
+
+    //             std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+    //             cell->get_dof_indices(i);
+    //             const unsigned int i_val = i[cell->get_fe().component_to_system_index(0, 0)];
+    //             active_density_vector[i_val] = cell_density;
+
+
+    //         }
+
+    //     // active_density_vector.compress(VectorOperation::insert);
+    // }
+    // MAKE ACTIVE_CELL_DATA
+    std::vector<types::global_dof_index> local_dof_indices(fe_density.dofs_per_cell);
+    active_cell_data.density.reinit(TableIndices<2>(n_cells, 1));
+    for (unsigned int cell=0; cell<n_cells; ++cell)
+    {
+        const unsigned int n_components_filled = elasticity_matrix_mf.get_matrix_free()->n_active_entries_per_cell_batch(cell);
+
+        for (unsigned int i=0; i<n_components_filled; ++i)
+        {
+            typename DoFHandler<dim>::active_cell_iterator FEQ_cell =elasticity_matrix_mf.get_matrix_free()->get_cell_iterator(cell,i);
+            typename DoFHandler<dim>::active_cell_iterator DG_cell(&(triangulation),
+                                                                   FEQ_cell->level(),
+                                                                   FEQ_cell->index(),
+                                                                   &dof_handler_density);
+
+            DG_cell->get_active_or_mg_dof_indices(local_dof_indices);
+
+            active_cell_data.density(cell, 0)[i] = active_density_vector(local_dof_indices[0]);
         }
-        SolverControl solver_control(10000, gmres_tolerance * system_rhs.l2_norm());
-
-        TopOptSchurPreconditioner<dim> preconditioner(system_matrix);
-        switch (Input::solver_choice) {
-            case SolverOptions::direct_solve: {
-                SparseDirectUMFPACK A_direct;
-                A_direct.initialize(system_matrix);
-                A_direct.vmult(linear_solution, system_rhs);
-                break;
-            }
-            case SolverOptions::exact_preconditioner_with_gmres: {
-                preconditioner.initialize(system_matrix, boundary_values, dof_handler, barrier_size, state);
-                SolverFGMRES<BlockVector<double>> A_fgmres(solver_control);
-                A_fgmres.solve(system_matrix, linear_solution, system_rhs, preconditioner);
-                std::cout << solver_control.last_step() << " steps to solve with GMRES" << std::endl;
-                break;
-            }
-            case SolverOptions::inexact_K_with_exact_A_gmres: {
-                preconditioner.initialize(system_matrix, boundary_values, dof_handler, barrier_size, state);
-                SolverFGMRES<BlockVector<double>> B_fgmres(solver_control);
-                B_fgmres.solve(system_matrix, linear_solution, system_rhs, preconditioner);
-                std::cout << solver_control.last_step() << " steps to solve with GMRES" << std::endl;
-                break;
-            }
-            case SolverOptions::inexact_K_with_inexact_A_gmres: {
-                preconditioner.initialize(system_matrix, boundary_values, dof_handler, barrier_size, state);
-                SolverFGMRES<BlockVector<double>> C_fgmres(solver_control);
-                C_fgmres.solve(system_matrix, linear_solution, system_rhs, preconditioner);
-                std::cout << solver_control.last_step() << " steps to solve with GMRES" << std::endl;
-                break;
+    }
+    
+    elasticity_matrix_mf.set_cell_data(active_cell_data);
+
+    //MAKE LEVEL DENSITY VECTOR
+
+    level_cell_data.resize(0,n_levels-1);
+    level_density_vector = 0.;
+    level_density_vector.resize(0,n_levels-1);
+
+    transfer.build(dof_handler_density);
+
+    transfer.interpolate_to_mg(dof_handler_density,
+                               level_density_vector,
+                               active_density_vector);
+
+    // MAKE LEVEL_CELL_DATA
+    for (unsigned int level=0; level<n_levels; ++level)
+    {
+        const unsigned int n_cells = mg_matrices[level].get_matrix_free()->n_cell_batches();
+
+        level_cell_data[level].density.reinit(TableIndices<2>(n_cells, 1));
+        for (unsigned int cell=0; cell<n_cells; ++cell)
+        {
+            const unsigned int n_components_filled = mg_matrices[level].get_matrix_free()->n_active_entries_per_cell_batch(cell);
+            for (unsigned int i=0; i<n_components_filled; ++i)
+            {
+
+                typename DoFHandler<dim>::level_cell_iterator FEQ_cell = mg_matrices[level].get_matrix_free()->get_cell_iterator(cell,i);
+                typename DoFHandler<dim>::level_cell_iterator DG_cell(&(triangulation),
+                                                                      FEQ_cell->level(),
+                                                                      FEQ_cell->index(),
+                                                                      &dof_handler_density);
+                DG_cell->get_active_or_mg_dof_indices(local_dof_indices);
+
+
+                level_cell_data[level].density(cell, 0)[i] = level_density_vector[level](local_dof_indices[0]);
             }
-            default:
-                throw;
-        }
-        constraints.distribute(linear_solution);
 
-        if (Input::output_parts_of_matrix) {
-            preconditioner.print_stuff(system_matrix);
         }
 
-        if (Input::output_full_preconditioned_matrix) {
-//            FullMatrix<double> preconditioned_full_mat(system_matrix.n(), system_matrix.n());
-//            const auto op_preconditioned_full_mat = linear_operator(preconditioner) * linear_operator(system_matrix);
-//            build_matrix_element_by_element(op_preconditioned_full_mat, preconditioned_full_mat);
-//            print_matrix("preconditioned_full_block_matrix.csv",preconditioned_full_mat);
-        }
+        // Store density tables and other data into the multigrid level matrix-free objects.
+
+        mg_matrices[level].set_cell_data (level_cell_data[level]);
+
+    }
+
+
+
 
-        if (Input::output_full_matrix) {
-//            const unsigned int vec_size = system_matrix.n();
-//            FullMatrix<double> full_mat(vec_size, vec_size);
-//            build_matrix_element_by_element(system_matrix,full_mat);
-//            std::ofstream Mat("full_block_matrix.csv");
-//            for (unsigned int i = 0; i < vec_size; i++) {
-//                Mat << full_mat(i, 0);
-//                for (unsigned int j = 1; j < vec_size; j++) {
-//                    Mat << "," << full_mat(i, j);
-//                }
-//                Mat << "\n";
-//            }
-//            Mat.close();
+    //+++++++++++++++++++++++++++++++++++++++++++++++++++++++++
+
+
+    mg_transfer.initialize_constraints(mg_constrained_dofs);
+    mg_transfer.build(dof_handler_displacement);
+
+    smoother_data.resize(0, triangulation.n_global_levels() - 1);
+
+    for (unsigned int level = 0; level < triangulation.n_global_levels();
+         ++level)
+    {
+        if (level > 0)
+        {
+            smoother_data[level].smoothing_range     = 15.;
+            smoother_data[level].degree              = 10;
+            smoother_data[level].eig_cg_n_iterations = 10;
         }
-        return linear_solution;
+        else
+        {
+            smoother_data[0].smoothing_range = 1e-3;
+            smoother_data[0].degree          = numbers::invalid_unsigned_int;
+            smoother_data[0].eig_cg_n_iterations = mg_matrices[0].m();
+        }
+        mg_matrices[level].compute_diagonal();
+        smoother_data[level].preconditioner =
+                mg_matrices[level].get_matrix_diagonal_inverse();
     }
 
-    template<int dim>
-    void
-    KktSystem<dim>::calculate_initial_rhs_error() {
-        initial_rhs_error = system_rhs.l2_norm();
+    mg_smoother.initialize(mg_matrices, smoother_data);
+
+    mg_coarse.initialize(mg_smoother);
+    mg::Matrix<LinearAlgebra::distributed::Vector<double>> mg_matrix(mg_matrices);
+
+    mg_interface_matrices.resize(0, triangulation.n_global_levels() - 1);
+    for (unsigned int level = 0; level < triangulation.n_global_levels();
+         ++level)
+    {
+        mg_interface_matrices[level].initialize(mg_matrices[level]);
     }
+    mg::Matrix<LinearAlgebra::distributed::Vector<double>> mg_interface(mg_interface_matrices);
+
+    Multigrid<LinearAlgebra::distributed::Vector<double>> mg(
+                mg_matrix, mg_coarse, mg_transfer, mg_smoother, mg_smoother);
+    mg.set_edge_matrices(mg_interface, mg_interface);
+    mg.set_cycle(Multigrid<LinearAlgebra::distributed::Vector<double>>::v_cycle);
+    mg.set_minlevel(0);
+    PreconditionMG<dim,LinearAlgebra::distributed::Vector<double>,MGTransferMatrixFree<dim, double>>
+            mf_gmg_preconditioner(dof_handler_displacement, mg, mg_transfer);
+
+
+// *************TEST SOLVE*************************
+// time the solve
+
+//    output(distributed_solution, 66);
+
+//    TimerOutput t(pcout, TimerOutput::never, TimerOutput::wall_times);
+//    {
+//    TimerOutput::Scope t_scope(t, "Solve_mfgmg");
+//    elasticity_matrix_mf.initialize_dof_vector(distributed_displacement_sol);
+//    elasticity_matrix_mf.initialize_dof_vector(distributed_displacement_rhs);
 
-    template<int dim>
-    BlockVector<double>
-    KktSystem<dim>::get_initial_state() {
+//    locally_relevant_solution = system_rhs;
+//    ChangeVectorTypes::copy_from_system_to_displacement_vector<double>(distributed_displacement_rhs,locally_relevant_solution.block(SolutionBlocks::displacement),displacement_to_system_dof_index_map);
 
-        std::vector<unsigned int> block_component(10, 2);
-        block_component[0] = 0;
-        block_component[5] = 1;
-        const std::vector<types::global_dof_index> dofs_per_block =
-                DoFTools::count_dofs_per_fe_block(dof_handler, block_component);
-        const unsigned int n_p = dofs_per_block[0];
-        const unsigned int n_u = dofs_per_block[1];
-        const std::vector<unsigned int> block_sizes = {n_p, n_p, n_p, n_p, n_p, n_u, n_u, n_p, n_p, 1};
+//     pcout << "real rhs norm: " << system_rhs.block(SolutionBlocks::displacement).l2_norm() << std::endl;
 
-        BlockVector<double> state(block_sizes);
-        {
-            using namespace SolutionBlocks;
-            state.block(density).add(density_ratio);
-            state.block(unfiltered_density).add(density_ratio);
-            state.block(unfiltered_density_multiplier)
-                    .add(density_ratio);
-            state.block(density_lower_slack).add(density_ratio);
-            state.block(density_lower_slack_multiplier).add(50);
-            state.block(density_upper_slack).add(1 - density_ratio);
-            state.block(density_upper_slack_multiplier).add(50);
-            state.block(total_volume_multiplier).add(1);
-            state.block(displacement).add(0);
-            state.block(displacement_multiplier).add(0);
+//    locally_relevant_solution = distributed_solution;
+//    ChangeVectorTypes::copy_from_system_to_displacement_vector<double>(distributed_displacement_sol,locally_relevant_solution.block(SolutionBlocks::displacement),displacement_to_system_dof_index_map);
+   
+//    SolverControl test_solver_control_1(20, 1e-6);
+//    SolverCG<LinearAlgebra::distributed::Vector<double>> CG_Solve_1(test_solver_control_1);
+
+//    pcout << "pre norm: " << distributed_displacement_rhs.l2_norm() << std::endl;
+
+//    try
+//    {
+//         // mf_gmg_preconditioner.vmult(distributed_displacement_sol, distributed_displacement_rhs);
+// //        CG_Solve.solve(elasticity_matrix_mf, distributed_displacement_sol, -1* distributed_displacement_rhs,    );
+//        CG_Solve_1.solve(elasticity_matrix_mf, distributed_displacement_sol, -1* distributed_displacement_rhs, mf_gmg_preconditioner);
+//    }
+//    catch(std::exception &exc)
+//    {
+//        pcout << "mfgmg diff: " << solver_control.initial_value()/solver_control.last_value() << std::endl;
+//    }
+
+//    pcout << "mfgmg solved in " << test_solver_control_1.last_step() <<  " steps" << std::endl;
+// //    try
+// //    {
+// // //        CG_Solve.solve(elasticity_matrix_mf, distributed_displacement_sol, -1* distributed_displacement_rhs,    PreconditionIdentity());
+// //        CG_Solve_2.solve(system_matrix.block(SolutionBlocks::displacement,SolutionBlocks::displacement_multiplier), distributed_solution.block(SolutionBlocks::displacement_multiplier), system_rhs.block(SolutionBlocks::displacement), PreconditionIdentity()  );
+// //    }
+// //    catch(std::exception &exc)
+// //    {
+// //        std::cout << "solve failed in " << test_solver_control_2.last_step() <<  " steps" << std::endl;
+// //        throw;
+// //    }
+
+// //    std::cout << "solved in " << test_solver_control_2.last_step() <<  " steps" << std::endl;
+
+
+//    }
+//    ChangeVectorTypes::copy_from_displacement_to_system_vector<double>(distributed_solution.block(SolutionBlocks::displacement), distributed_displacement_sol,displacement_to_system_dof_index_map);
+//    displacement_constraints.distribute(distributed_solution.block(SolutionBlocks::displacement));
+
+//     pcout << distributed_displacement_sol.linfty_norm() << "+++++++++++++" << std::endl;
+
+//     int a = Utilities::MPI::n_mpi_processes(mpi_communicator);
+
+//     ChangeVectorTypes::copy(distributed_solution.block(SolutionBlocks::density),active_density_vector);
+
+
+
+//     TrilinosWrappers::PreconditionAMG amg_pre;
+//     amg_pre.initialize(system_matrix.block(SolutionBlocks::displacement,SolutionBlocks::displacement_multiplier));
+//    {
+//     TimerOutput::Scope t_scope(t, "Solve_AMG");
+    
+//     SolverControl test_solver_control_2(50000, 1e-6);
+//     SolverCG<LA::MPI::Vector> CG_Solve_2(test_solver_control_2);
+
+//     distributed_solution.block(SolutionBlocks::displacement_multiplier) = 0.;
+
+//      try
+//    {
+//        CG_Solve_2.solve(system_matrix.block(SolutionBlocks::displacement,SolutionBlocks::displacement_multiplier), distributed_solution.block(SolutionBlocks::displacement_multiplier), system_rhs.block(SolutionBlocks::displacement), amg_pre);
+//    }
+//    catch(std::exception &exc)
+//    {
+//        std::cout << "solve failed in " << test_solver_control_2.last_step() <<  " steps" << std::endl;
+//        throw;
+//    }
+
+//    std::cout << "amg solved in " << test_solver_control_2.last_step() <<  " steps" << std::endl;
+
+//    }
+//     distributed_solution.block(SolutionBlocks::displacement_multiplier)=0;
+//    {
+//     TimerOutput::Scope t_scope(t, "Solve_CG");
+//     SolverControl test_solver_control_3(50000, 1e-6);
+//     SolverCG<LA::MPI::Vector> CG_Solve_3(test_solver_control_3);
+//      try
+//    {
+//        CG_Solve_3.solve(system_matrix.block(SolutionBlocks::displacement,SolutionBlocks::displacement_multiplier), distributed_solution.block(SolutionBlocks::displacement), system_rhs.block(SolutionBlocks::displacement), PreconditionIdentity());
+//    }
+//    catch(std::exception &exc)
+//    {
+//        std::cout << "solve failed in " << test_solver_control_3.last_step() <<  " steps" << std::endl;
+//        throw;
+//    }
+
+//     std::cout << "CG solved in " << test_solver_control_3.last_step() <<  " steps" << std::endl;
+
+//    }
+
+
+//    t.print_summary();
+//    MPI_Abort(mpi_communicator, 1);
+
+//    ***************END TEST SOLVE*************************
+
+
+
+    TopOptSchurPreconditioner<dim> preconditioner(system_matrix, dof_handler, elasticity_matrix_mf, mf_gmg_preconditioner, displacement_to_system_dof_index_map);
+    // pcout << "about to solve" << std::endl;
+    // preconditioner.initialize(system_matrix, boundary_values, dof_handler, distributed_solution);
+    // FullMatrix<double> out;
+    // out.reinit(system_matrix.m(),system_matrix.n());
+    // LA::MPI::BlockVector e_j (system_rhs);
+    // LA::MPI::BlockVector r_j (system_rhs);
+    // LA::MPI::BlockVector r2_j (system_rhs);
+    // for (unsigned int j=0; j<out.n(); ++j)
+    // {
+    //     e_j = 0.;
+    //     e_j(j) = 1;
+    //     system_matrix.vmult(system_rhs,e_j);
+    //     preconditioner.vmult(r2_j,system_rhs);
+
+    //     for (unsigned int i=0; i<out.m(); ++i)
+    //         out(i,j) = r2_j(i);
+    // }
+
+    // const unsigned int n = out.n();
+    // const unsigned int m = out.m();
+    // std::ofstream Xmat("preconditioned_mat.csv");
+    // for (unsigned int i = 0; i < m; i++)
+    // {
+    //     Xmat << out(i, 0);
+    //     for (unsigned int j = 1; j < n; j++)
+    //     {
+    //         Xmat << "," << out(i, j);
+    //     }
+    //     Xmat << "\n";
+    // }
+    // Xmat.close();
+    
+
+    
+
+    switch (Input::solver_choice)
+    {
+
+        // case SolverOptions::inexact_K_with_exact_A_gmres: {
+
+
+        //     preconditioner.initialize(system_matrix, boundary_values, dof_handler, distributed_solution);
+        //     pcout << "preconditioner initialized" << std::endl;
+        //     SolverFGMRES<LA::MPI::BlockVector> B_fgmres(solver_control);
+        //     B_fgmres.solve(system_matrix, distributed_solution, system_rhs, preconditioner);
+        //     pcout << solver_control.last_step() << " steps to solve with GMRES" << std::endl;
+        //     break;
+        // }
+        case SolverOptions::inexact_K_with_inexact_A_gmres: {
+            pcout << "size of rhs block 0 :  " << system_rhs.block(0).l1_norm()<< std::endl;
+            pcout << "size of rhs block 1 :  " << system_rhs.block(1).l1_norm()<< std::endl;
+            pcout << "size of rhs block 2 :  " << system_rhs.block(2).l1_norm()<< std::endl;
+            pcout << "size of rhs block 3 :  " << system_rhs.block(3).l1_norm()<< std::endl;
+            pcout << "size of rhs block 4 :  " << system_rhs.block(4).l1_norm()<< std::endl;
+            pcout << "size of rhs block 5 :  " << system_rhs.block(5).l1_norm()<< std::endl;
+            pcout << "size of rhs block 6 :  " << system_rhs.block(6).l1_norm()<< std::endl;
+            pcout << "size of rhs block 7 :  " << system_rhs.block(7).l1_norm()<< std::endl;
+            pcout << "size of rhs block 8 :  " << system_rhs.block(8).l1_norm()<< std::endl;
+            pcout << "size of rhs block 9 :  " << system_rhs.block(9).l1_norm()<< std::endl;
+
+            preconditioner.initialize(system_matrix, boundary_values, dof_handler, distributed_solution);
+            pcout << "preconditioner initialized" << std::endl;
+            distributed_solution = 0.;
+            SolverFGMRES<LA::MPI::BlockVector> C_fgmres(solver_control);
+            C_fgmres.solve(system_matrix, distributed_solution, system_rhs, preconditioner);
+            pcout << solver_control.last_step() << " steps to solve with FGMRES" << std::endl;
+            break;
         }
-        return state;
+        default:
+            throw;
+        
+    }
+
+    constraints.distribute(distributed_solution);
+    pcout << "size of distributed solution block 0 :  " << distributed_solution.block(0).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 1 :  " << distributed_solution.block(1).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 2 :  " << distributed_solution.block(2).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 3 :  " << distributed_solution.block(3).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 4 :  " << distributed_solution.block(4).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 5 :  " << distributed_solution.block(5).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 6 :  " << distributed_solution.block(6).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 7 :  " << distributed_solution.block(7).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 8 :  " << distributed_solution.block(8).l1_norm()<< std::endl;
+    pcout << "size of distributed solution block 9 :  " << distributed_solution.block(9).l1_norm()<< std::endl;
+    output(distributed_solution,100);
+    return distributed_solution;
+}
+
+/// Stores the l2 norm of the current system_rhs in initial_rhs_error; presumably the baseline that later RHS norms are compared against (the comparison itself is not in this function).
+template<int dim>
+void
+KktSystem<dim>::calculate_initial_rhs_error() {
+    initial_rhs_error = system_rhs.l2_norm(); // overwrites whatever value was stored before
+}
+
+/// Builds and returns the initial state block vector (initial guess for the nonlinear solver): each block is filled with one constant value, then the vector is compressed.
+template<int dim>
+LA::MPI::BlockVector
+KktSystem<dim>::get_initial_state() {
+
+    std::vector<unsigned int> block_component(10, 2); // ten entries, all 2 except the two set below
+    block_component[SolutionBlocks::density] = 0;
+    block_component[SolutionBlocks::displacement] = 1;
+    const std::vector<types::global_dof_index> dofs_per_block =
+            DoFTools::count_dofs_per_fe_block(dof_handler, block_component);
+    const unsigned int n_p = dofs_per_block[0];
+    const unsigned int n_u = dofs_per_block[1];
+    const std::vector<unsigned int> block_sizes = {n_p, n_p, n_p, n_p, n_p, n_u, n_u, n_p, n_p, 1}; // NOTE(review): never read below; n_p appears only in the commented-out random initialisation - confirm whether this size bookkeeping is still needed
+
+    LA::MPI::BlockVector state(owned_partitioning, mpi_communicator); // layout comes from owned_partitioning, not from block_sizes
+    {
+        using namespace SolutionBlocks;
+        state.block(density).add(density_ratio); // add(scalar) on each block: assumes the freshly constructed vector starts at zero - TODO confirm
+        state.block(unfiltered_density).add(density_ratio);
+        state.block(unfiltered_density_multiplier)
+                .add(density_ratio);
+        state.block(density_lower_slack).add(density_ratio);
+        state.block(density_lower_slack_multiplier).add(50);
+        state.block(density_upper_slack).add(1 - density_ratio);
+        state.block(density_upper_slack_multiplier).add(50);
+        state.block(total_volume_multiplier).add(1);
+        state.block(displacement).add(0); // adding 0 leaves the displacement blocks unchanged
+        state.block(displacement_multiplier).add(0);
+        // state.compress(VectorOperation::add);
+
+        // RANDOM PART HERE
+        // for(unsigned int k = 0; k<n_p; ++k)
+        // {
+        //     // std::rand(001);
+        //     // assign random values to the density
+        //     double r = std::rand()/double(RAND_MAX);
+        //     state.block(density)[k] = r;
+        //     state.block(unfiltered_density)[k] = r;
+        // }
 
     }
+    state.compress(VectorOperation::add); // single compress after all blocks have been filled
+    return state;
+}
 
-    template<int dim>
-    void
-    KktSystem<dim>::output(const BlockVector<double> &state, const unsigned int j) const {
-        std::vector<std::string> solution_names(1, "low_slack_multiplier");
-        std::vector<DataComponentInterpretation::DataComponentInterpretation> data_component_interpretation(
+/// Writes `state` to "solution<j>.vtu" via DataOut::write_vtu_in_parallel; the vector is first copied into locally_relevant_solution, which is the vector DataOut is given. `j` only selects the file name.
+template<int dim>
+void
+KktSystem<dim>::output(const LA::MPI::BlockVector &state, const unsigned int j) const {
+    locally_relevant_solution = state; // DataOut below reads this member copy, not state itself
+    std::vector<std::string> solution_names(1, "low_slack_multiplier"); // names and interpretations are appended pairwise, in the same order
+    std::vector<DataComponentInterpretation::DataComponentInterpretation> data_component_interpretation(
                 1, DataComponentInterpretation::component_is_scalar);
-        solution_names.emplace_back("upper_slack_multiplier");
-        data_component_interpretation.push_back(
+    solution_names.emplace_back("upper_slack_multiplier");
+    data_component_interpretation.push_back(
                 DataComponentInterpretation::component_is_scalar);
-        solution_names.emplace_back("low_slack");
-        data_component_interpretation.push_back(
+    solution_names.emplace_back("low_slack");
+    data_component_interpretation.push_back(
                 DataComponentInterpretation::component_is_scalar);
-        solution_names.emplace_back("upper_slack");
-        data_component_interpretation.push_back(
+    solution_names.emplace_back("upper_slack");
+    data_component_interpretation.push_back(
                 DataComponentInterpretation::component_is_scalar);
-        solution_names.emplace_back("unfiltered_density");
-        data_component_interpretation.push_back(
+    solution_names.emplace_back("unfiltered_density");
+    data_component_interpretation.push_back(
                 DataComponentInterpretation::component_is_scalar);
-        for (unsigned int i = 0; i < dim; i++) {
-            solution_names.emplace_back("displacement");
-            data_component_interpretation.push_back(
-                    DataComponentInterpretation::component_is_part_of_vector);
-        }
-        for (unsigned int i = 0; i < dim; i++) {
-            solution_names.emplace_back("displacement_multiplier");
-            data_component_interpretation.push_back(
+    for (unsigned int i = 0; i < dim; i++) { // dim entries sharing one name, each marked as part of a vector
+        solution_names.emplace_back("displacement");
+        data_component_interpretation.push_back(
                     DataComponentInterpretation::component_is_part_of_vector);
-        }
-        solution_names.emplace_back("density_multiplier");
+    }
+    for (unsigned int i = 0; i < dim; i++) {
+        solution_names.emplace_back("displacement_multiplier");
         data_component_interpretation.push_back(
+                    DataComponentInterpretation::component_is_part_of_vector);
+    }
+    solution_names.emplace_back("density_multiplier");
+    data_component_interpretation.push_back(
                 DataComponentInterpretation::component_is_scalar);
-        solution_names.emplace_back("density");
-        data_component_interpretation.push_back(
+    solution_names.emplace_back("density");
+    data_component_interpretation.push_back(
                 DataComponentInterpretation::component_is_scalar);
-        solution_names.emplace_back("volume_multiplier");
-        data_component_interpretation.push_back(
+    solution_names.emplace_back("volume_multiplier");
+    data_component_interpretation.push_back(
                 DataComponentInterpretation::component_is_scalar);
-        DataOut<dim> data_out;
-        data_out.attach_dof_handler(dof_handler);
-        data_out.add_data_vector(state, solution_names,
-                                 DataOut<dim>::type_dof_data, data_component_interpretation);
-        data_out.build_patches();
-        std::ofstream output("solution" + std::to_string(j) + ".vtk");
-        data_out.write_vtk(output);
+    DataOut<dim> data_out;
+    data_out.attach_dof_handler(dof_handler);
+    data_out.add_data_vector(locally_relevant_solution,
+                             solution_names,
+                             DataOut<dim>::type_dof_data,
+                             data_component_interpretation);
+    data_out.build_patches();
+    const std::string filename("solution" + std::to_string(j) + ".vtu"); // local no longer shadows the method name
+    data_out.write_vtu_in_parallel(filename, mpi_communicator); // same communicator the class builds its vectors on
 
-    }
+}
 
-    template<>
-    void
-    KktSystem<2>::output_stl(const BlockVector<double> &state) {
-        double height = .25;
-        const int dim = 2;
-        std::ofstream stlfile;
-        stlfile.open("bridge.stl");
-        stlfile << "solid bridge\n" << std::scientific;
-
-        for (const auto &cell: dof_handler.active_cell_iterators()) {
-            if (state.block(
-                    SolutionBlocks::density)[cell->active_cell_index()] > 0.5) {
-                const Tensor<1, dim> edge_directions[2] = {cell->vertex(1) -
-                                                           cell->vertex(0),
-                                                           cell->vertex(2) -
-                                                           cell->vertex(0)};
-                const Tensor<2, dim> edge_tensor(
+
+
+/// Writes the design as an ASCII STL solid to "bridge.stl" for 3D printing. Not yet usable in parallel.
+template<>
+void
+KktSystem<2>::output_stl(const LA::MPI::BlockVector &state) {
+    double height = .25;
+    const int dim = 2;
+    std::ofstream stlfile;
+    stlfile.open("bridge.stl");
+    stlfile << "solid bridge\n" << std::scientific;
+
+    for (const auto &cell: dof_handler.active_cell_iterators()) {
+        if (state.block(
+                    SolutionBlocks::density)[cell->get_fe().component_to_system_index(0, 0)] > 0.5) {
+            const Tensor<1, dim> edge_directions[2] = {cell->vertex(1) -
+                                                       cell->vertex(0),
+                                                       cell->vertex(2) -
+                                                       cell->vertex(0)};
+            const Tensor<2, dim> edge_tensor(
                         {{edge_directions[0][0], edge_directions[0][1]},
                          {edge_directions[1][0], edge_directions[1][1]}});
-                const bool is_right_handed_cell = (determinant(edge_tensor) > 0);
-                if (is_right_handed_cell) {
-                    /* Write one side at z = 0. */
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+            const bool is_right_handed_cell = (determinant(edge_tensor) > 0);
+            if (is_right_handed_cell) {
+                /* Write one side at z = 0. */
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << -1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(0)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(0)[0] << " "
                             << cell->vertex(0)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << -1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(3)[0] << " "
+                stlfile << "         vertex " << cell->vertex(3)[0] << " "
                             << cell->vertex(3)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                    /* Write one side at z = height. */
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+                /* Write one side at z = height. */
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << 1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(0)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(0)[0] << " "
                             << cell->vertex(0)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << height << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << 1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(3)[0] << " "
+                stlfile << "         vertex " << cell->vertex(3)[0] << " "
                             << cell->vertex(3)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << height << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                } else /* The cell has a left-handed set up */
-                {
-                    /* Write one side at z = 0. */
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+            } else /* The cell has a left-handed set up */
+            {
+                /* Write one side at z = 0. */
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << -1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(0)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(0)[0] << " "
                             << cell->vertex(0)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << -1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(3)[0] << " "
+                stlfile << "         vertex " << cell->vertex(3)[0] << " "
                             << cell->vertex(3)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << 0.000000e+00 << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                    /* Write one side at z = height. */
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+                /* Write one side at z = height. */
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << 1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(0)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(0)[0] << " "
                             << cell->vertex(0)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << height << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                    stlfile << "   facet normal " << 0.000000e+00 << " "
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+                stlfile << "   facet normal " << 0.000000e+00 << " "
                             << 0.000000e+00 << " " << 1.000000e+00 << "\n";
-                    stlfile << "      outer loop\n";
-                    stlfile << "         vertex " << cell->vertex(1)[0] << " "
+                stlfile << "      outer loop\n";
+                stlfile << "         vertex " << cell->vertex(1)[0] << " "
                             << cell->vertex(1)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(2)[0] << " "
+                stlfile << "         vertex " << cell->vertex(2)[0] << " "
                             << cell->vertex(2)[1] << " " << height << "\n";
-                    stlfile << "         vertex " << cell->vertex(3)[0] << " "
+                stlfile << "         vertex " << cell->vertex(3)[0] << " "
                             << cell->vertex(3)[1] << " " << height << "\n";
-                    stlfile << "      endloop\n";
-                    stlfile << "   endfacet\n";
-                }
-                for (unsigned int face_number = 0;
-                     face_number < GeometryInfo<dim>::faces_per_cell;
-                     ++face_number) {
-                    const typename DoFHandler<dim>::face_iterator face =
-                            cell->face(face_number);
-                    if ((face->at_boundary()) ||
+                stlfile << "      endloop\n";
+                stlfile << "   endfacet\n";
+            }
+            for (unsigned int face_number = 0;
+                 face_number < GeometryInfo<dim>::faces_per_cell;
+                 ++face_number) {
+                const typename DoFHandler<dim>::face_iterator face =
+                        cell->face(face_number);
+                if ((face->at_boundary()) ||
                         (!face->at_boundary() &&
                          (state.block(
-                                 SolutionBlocks::density)[cell->neighbor(face_number)->active_cell_index()] <
+                              SolutionBlocks::density)[cell->neighbor(face_number)->get_fe().component_to_system_index(0, 0)] <
                           0.5))) {
-                        const Tensor<1, dim> normal_vector =
-                                (face->center() - cell->center());
-                        const double normal_norm = normal_vector.norm();
-                        if ((face->vertex(0)[0] - face->vertex(0)[0]) *
+                    const Tensor<1, dim> normal_vector =
+                            (face->center() - cell->center());
+                    const double normal_norm = normal_vector.norm();
+                    if ((face->vertex(0)[0] - face->vertex(0)[0]) *
                             (face->vertex(1)[1] - face->vertex(0)[1]) *
                             0.000000e+00 +
                             (face->vertex(0)[1] - face->vertex(0)[1]) * (0 - 0) *
@@ -1861,199 +3022,199 @@ namespace SAND {
                             (height - 0) *
                             (face->vertex(1)[1] - face->vertex(0)[1]) * 0 >
                             0) {
-                            stlfile << "   facet normal "
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " " << height
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " "
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " " << height
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                            stlfile << "   facet normal "
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " " << height
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " " << height
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " " << height
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " " << height
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                        } else {
-                            stlfile << "   facet normal "
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
+                    } else {
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " "
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " " << height
-                                    << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                            stlfile << "   facet normal "
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " " << height
+                                << "\n";
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " " << height
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " " << height
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " "
                                     << 0.000000e+00 << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " " << height
-                                    << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                        }
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " " << height
+                                << "\n";
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
                     }
                 }
             }
         }
-        stlfile << "endsolid bridge";
     }
+    stlfile << "endsolid bridge";
+}
 
-
-    template<>
-    void
-    KktSystem<3>::output_stl(const BlockVector<double> &state)
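+///Writes the 3D design to the ASCII STL file "bridge.stl" (3d-printable), two triangles per exposed cell face, using a 0.5 density threshold. Not yet usable in parallel. NOTE(review): the density index component_to_system_index(0, 0) appears not to depend on the cell - confirm it is the intended lookup.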
+template<>
+void
+KktSystem<3>::output_stl(const LA::MPI::BlockVector &state)
+{
+    std::ofstream stlfile;
+    stlfile.open("bridge.stl");
+    stlfile << "solid bridge\n" << std::scientific;
+    const int dim = 3;
+    for (const auto &cell : dof_handler.active_cell_iterators())
     {
-        std::ofstream stlfile;
-        stlfile.open("bridge.stl");
-        stlfile << "solid bridge\n" << std::scientific;
-        const int dim = 3;
-        for (const auto &cell : dof_handler.active_cell_iterators())
+        if (state.block(
+                    SolutionBlocks::unfiltered_density)[cell->get_fe().component_to_system_index(0, 0)] > 0.5)
         {
-            if (state.block(
-                    SolutionBlocks::unfiltered_density)[cell->active_cell_index()] > 0.5)
+            for (const auto n : cell->face_indices())
             {
-                for (const auto n : cell->face_indices())
+                bool create_boundary = false;
+                if (cell->at_boundary(n))
                 {
-                    bool create_boundary = false;
-                    if (cell->at_boundary(n))
-                    {
-                        create_boundary = true;
-                    }
-                    else if (state.block(
-                            SolutionBlocks::unfiltered_density)[cell->neighbor(n)->active_cell_index()] <= 0.5)
-                    {
-                        create_boundary = true;
-                    }
+                    create_boundary = true;
+                }
+                else if (state.block(
+                             SolutionBlocks::unfiltered_density)[cell->neighbor(n)->get_fe().component_to_system_index(0, 0)] <= 0.5)
+                {
+                    create_boundary = true;
+                }
 
-                    if (create_boundary)
-                    {
-                        const auto face = cell->face(n);
-                        const Tensor<1,dim> normal_vector = face->center() -
-                                                          cell->center();
-                        double normal_norm = normal_vector.norm();
-                        const Tensor<1,dim> edge_vectors_1 = face->vertex(1) - face->vertex(0);
-                        const Tensor<1,dim> edge_vectors_2 = face->vertex(2) - face->vertex(0);
-
-                        const Tensor<2, dim> edge_tensor (
-                                 {{edge_vectors_1[0], edge_vectors_1[1],edge_vectors_1[2]},
+                if (create_boundary)
+                {
+                    const auto face = cell->face(n);
+                    const Tensor<1,dim> normal_vector = face->center() -
+                            cell->center();
+                    double normal_norm = normal_vector.norm();
+                    const Tensor<1,dim> edge_vectors_1 = face->vertex(1) - face->vertex(0);
+                    const Tensor<1,dim> edge_vectors_2 = face->vertex(2) - face->vertex(0);
+
+                    const Tensor<2, dim> edge_tensor (
+                                {{edge_vectors_1[0], edge_vectors_1[1],edge_vectors_1[2]},
                                  {edge_vectors_2[0], edge_vectors_2[1],edge_vectors_2[2]},
                                  {normal_vector[0], normal_vector[1], normal_vector[2]}});
-                        const bool is_right_handed_cell = (determinant(edge_tensor) > 0);
+                    const bool is_right_handed_cell = (determinant(edge_tensor) > 0);
 
-                        if (is_right_handed_cell)
-                        {
-                            stlfile << "   facet normal "
+                    if (is_right_handed_cell)
+                    {
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << normal_vector[2] / normal_norm << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " "
                                     << face->vertex(0)[2] << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " "
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " "
                                     << face->vertex(1)[2] << "\n";
-                            stlfile << "         vertex " << face->vertex(2)[0]
-                                    << " " << face->vertex(2)[1] << " "
+                        stlfile << "         vertex " << face->vertex(2)[0]
+                                << " " << face->vertex(2)[1] << " "
                                     << face->vertex(2)[2] << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                            stlfile << "   facet normal "
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << normal_vector[2] / normal_norm << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " " << face->vertex(1)[2]
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(3)[0]
-                                    << " " << face->vertex(3)[1] << " " << face->vertex(3)[2]
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(2)[0]
-                                    << " " << face->vertex(2)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " " << face->vertex(1)[2]
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(3)[0]
+                                << " " << face->vertex(3)[1] << " " << face->vertex(3)[2]
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(2)[0]
+                                << " " << face->vertex(2)[1] << " "
                                     << face->vertex(2)[2] << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                        }
-                        else
-                        {
-                            stlfile << "   facet normal "
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
+                    }
+                    else
+                    {
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << normal_vector[2] / normal_norm << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(0)[0]
-                                    << " " << face->vertex(0)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(0)[0]
+                                << " " << face->vertex(0)[1] << " "
                                     << face->vertex(0)[2] << "\n";
-                            stlfile << "         vertex " << face->vertex(2)[0]
-                                    << " " << face->vertex(2)[1] << " "
+                        stlfile << "         vertex " << face->vertex(2)[0]
+                                << " " << face->vertex(2)[1] << " "
                                     << face->vertex(2)[2] << "\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " "
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " "
                                     << face->vertex(1)[2] << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                            stlfile << "   facet normal "
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
+                        stlfile << "   facet normal "
                                     << normal_vector[0] / normal_norm << " "
                                     << normal_vector[1] / normal_norm << " "
                                     << normal_vector[2] / normal_norm << "\n";
-                            stlfile << "      outer loop\n";
-                            stlfile << "         vertex " << face->vertex(1)[0]
-                                    << " " << face->vertex(1)[1] << " " << face->vertex(1)[2]
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(2)[0]
-                                    << " " << face->vertex(2)[1] << " " << face->vertex(2)[2]
-                                    << "\n";
-                            stlfile << "         vertex " << face->vertex(3)[0]
-                                    << " " << face->vertex(3)[1] << " "
+                        stlfile << "      outer loop\n";
+                        stlfile << "         vertex " << face->vertex(1)[0]
+                                << " " << face->vertex(1)[1] << " " << face->vertex(1)[2]
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(2)[0]
+                                << " " << face->vertex(2)[1] << " " << face->vertex(2)[2]
+                                << "\n";
+                        stlfile << "         vertex " << face->vertex(3)[0]
+                                << " " << face->vertex(3)[1] << " "
                                     << face->vertex(3)[2] << "\n";
-                            stlfile << "      endloop\n";
-                            stlfile << "   endfacet\n";
-                        }
-
+                        stlfile << "      endloop\n";
+                        stlfile << "   endfacet\n";
                     }
 
                 }
+
             }
         }
     }
 }
+}
 
 template class SAND::KktSystem<2>;
-template class SAND::KktSystem<3>;
\ No newline at end of file
+template class SAND::KktSystem<3>;
diff --git a/source/main.cc b/source/main.cc
new file mode 100644
index 0000000..f73c0af
--- /dev/null
+++ b/source/main.cc
@@ -0,0 +1,49 @@
+#include "../include/watchdog.h"
+#include "../include/input_information.h"
+#include <cstdlib>
+
+///Above are fairly normal files to include. I also use the sparse direct package, which requires BLAS/LAPACK
+/// to perform a direct solve while I work on a fast iterative solver for this problem.
+
+namespace SAND{
+    namespace Input{
+        unsigned int refinements;  // set in main() from argv[1]
+        unsigned int a_inv_iterations;  // set in main() from argv[2]
+        unsigned int k_inv_iterations;  // set in main() from argv[3]
+    }
+}
+
+
+///Program entry point. Usage: <program> <refinements> <a_inv_iterations> <k_inv_iterations>. Returns 0 on success, 1 on error.
+int main(int argc, char *argv[]) {
+    try {
+        Utilities::MPI::MPI_InitFinalize mpi_initialization(argc, argv, 1);
+        // argv[1..3] are read below; without this check a missing argument hands atoi a null/out-of-range pointer.
+        if (argc < 4) {
+            std::cerr << "Usage: " << (argc > 0 ? argv[0] : "program") << " <refinements> <a_inv_iterations> <k_inv_iterations>" << std::endl;
+            return 1;
+        }
+        {
+            using namespace SAND::Input;
+            refinements = atoi(argv[1]);
+            a_inv_iterations = atoi(argv[2]);
+            k_inv_iterations = atoi(argv[3]);
+        }
+        SAND::NonlinearWatchdog<SAND::Input::dim> elastic_problem;
+        elastic_problem.run();
+    }
+    catch (std::exception &exc) {
+        std::cerr << std::endl << std::endl << "----------------------------------------------------" << std::endl
+                  << "Exception on processing: " << std::endl << exc.what()
+                  << std::endl << "Aborting!" << std::endl
+                  << "----------------------------------------------------" << std::endl;
+        return 1;
+    }
+    catch (...) {
+        std::cerr << std::endl << std::endl << "----------------------------------------------------" << std::endl
+                  << "Unknown exception!" << std::endl << "Aborting!" << std::endl
+                  << "----------------------------------------------------" << std::endl;
+        return 1;
+    }
+    return 0;
+}
diff --git a/source/markov_filter.cc b/source/markov_filter.cc
index f5d2c5c..b367f20 100644
--- a/source/markov_filter.cc
+++ b/source/markov_filter.cc
@@ -5,6 +5,7 @@
 
 using namespace dealii;
 
+///Initializes the Markov filter with its initial values.
 void
 MarkovFilter::setup(const double objective_value_input, const double barrier_distance_input,
                                         const double feasibility_input, const double barrier_value_input) {
@@ -16,6 +17,7 @@ MarkovFilter::setup(const double objective_value_input, const double barrier_dis
     filter_barrier_function_value = feasibility + barrier_value * barrier_distance;
 }
 
+///Adds new information to the markov filter
 void
 MarkovFilter::add_point(const double objective_value_input, const  double barrier_distance_input,
                                     const double feasibility_input)
@@ -27,6 +29,8 @@ MarkovFilter::add_point(const double objective_value_input, const  double barrie
     filter_barrier_function_value = objective_value + barrier_value * barrier_distance;
 }
 
+///As the barrier always changes, this needs to be taken into account when accepting/rejecting a step.
+/// This allows each point to be viewed in comparison to the current barrier value.
 void
 MarkovFilter::update_barrier_value(const double barrier_value_input)
 {
@@ -34,6 +38,7 @@ MarkovFilter::update_barrier_value(const double barrier_value_input)
     filter_barrier_function_value = objective_value + barrier_value * barrier_distance;
 }
 
+///Checks if a new point passes the filter.
 bool
 MarkovFilter::check_filter(const double objective_value_input, const  double barrier_distance_input,
                                        const double feasibility_input) const
@@ -47,4 +52,4 @@ MarkovFilter::check_filter(const double objective_value_input, const  double bar
     {
         return false;
     }
-}
\ No newline at end of file
+}
diff --git a/source/matrix_free_elasticity.cc b/source/matrix_free_elasticity.cc
new file mode 100644
index 0000000..6da06dc
--- /dev/null
+++ b/source/matrix_free_elasticity.cc
@@ -0,0 +1,213 @@
+//
+// Created by justin on 2/17/21.
+//
+#include "../include/matrix_free_elasticity.h"
+#include "../include/input_information.h"
+#include "../include/parameters_and_components.h"
+namespace SAND {
+using namespace dealii;
+
+///Constructor. Uses MPI_COMM_WORLD as communicator; pcout is enabled only on MPI process 0.
+template <int dim, int fe_degree, typename number>
+MF_Elasticity_Operator<dim, fe_degree, number>::MF_Elasticity_Operator()
+    : MatrixFreeOperators::Base<dim,LinearAlgebra::distributed::Vector<number>>(),
+    mpi_communicator(MPI_COMM_WORLD),
+    pcout(std::cout,(Utilities::MPI::this_mpi_process(mpi_communicator) == 0))
+{
+}
+
+///Drops the pointer to the cell (density) data, then clears the base-class operator state.
+template <int dim, int fe_degree, typename number>
+void MF_Elasticity_Operator<dim, fe_degree, number>::clear()
+{
+    cell_data = nullptr;
+    this->MatrixFreeOperators::Base<dim, LinearAlgebra::distributed::Vector<number>>::clear();
+}
+
+///Computes the operator diagonal (diagonal_entries) and its entrywise inverse (inverse_diagonal_entries),
+/// e.g. for use in a preconditioner; constrained entries are set to one in both.
+template <int dim, int fe_degree, typename number>
+void
+MF_Elasticity_Operator<dim,fe_degree,number>::compute_diagonal ()
+{
+    using DistributedVector = dealii::LinearAlgebra::distributed::Vector<number>;
+
+    this->inverse_diagonal_entries.reset(new DiagonalMatrix<DistributedVector>());
+    this->diagonal_entries.reset(new DiagonalMatrix<DistributedVector>());
+
+    DistributedVector &inverse_diagonal = this->inverse_diagonal_entries->get_vector();
+    DistributedVector &diagonal = this->diagonal_entries->get_vector();
+
+    this->data->initialize_dof_vector(inverse_diagonal);
+    this->data->initialize_dof_vector(diagonal);
+
+    // cell_loop needs a source argument; local_compute_diagonal ignores it.
+    unsigned int dummy = 0;
+
+    // One pass over the cells suffices: the inverse starts as a copy of the finished
+    // diagonal (a second, identical cell loop would only integrate the same values again).
+    // Constrained entries are set to one before the copy, so both vectors carry them.
+    this->data->cell_loop (&MF_Elasticity_Operator::local_compute_diagonal, this,
+                           diagonal, dummy);
+    this->set_constrained_entries_to_one(diagonal);
+    inverse_diagonal = diagonal;
+
+    // Invert entrywise. NOTE(review): zero entries are not guarded against (the positivity
+    // assertion below is disabled) - confirm whether zero diagonal entries can occur.
+    for (auto &local_element : inverse_diagonal)
+      {
+//        Assert(local_element > 0.,
+//               ExcMessage("No diagonal entry in a positive definite operator "
+//                          "should be zero or negative."));
+        local_element = 1./local_element;
+      }
+
+    pcout << "diag size: " << diagonal.size() << " with l2 norm " << diagonal.l2_norm() << std::endl;
+}
+
+///Computes the contributions of a range of cell batches to the operator diagonal and adds them into dst.
+/// For every local dof i, the i-th unit vector is pushed through the cell operator and entry i of the result is kept.
+template <int dim, int fe_degree, typename number>
+void
+MF_Elasticity_Operator<dim,fe_degree,number>
+::local_compute_diagonal (const MatrixFree<dim,number>                     &data,
+                          dealii::LinearAlgebra::distributed::Vector<number>  &dst,
+                          const unsigned int &,
+                          const std::pair<unsigned int,unsigned int>       &cell_range) const
+{
+  FEEvaluation<dim,fe_degree,fe_degree+1,dim,number> displacement (data, 0);
+  AlignedVector<VectorizedArray<number>> diagonal(displacement.dofs_per_cell);
+
+  for (unsigned int cell=cell_range.first; cell<cell_range.second; ++cell)
+    {
+      // NOTE(review): only lane 0 of the vectorized density is read, so one value is used for
+      // the whole cell batch - confirm that all lanes of density(cell, 0) hold the same value.
+      const VectorizedArray<number> cell_density = cell_data->density(cell, 0);
+      const number penalized_density = std::pow(cell_density[0],Input::density_penalty_exponent);
+      // Material factors are constant over the batch: 2*mu*rho^p and lambda*rho^p.
+      const number shear_factor  = penalized_density * 2.0 * Input::material_mu;
+      const number lambda_factor = penalized_density * Input::material_lambda;
+
+      displacement.reinit(cell);
+
+      for (unsigned int i=0; i<displacement.dofs_per_cell; ++i)
+        {
+          // Load the i-th unit vector into the local dof values.
+          for (unsigned int j=0; j<displacement.dofs_per_cell; ++j)
+            displacement.begin_dof_values()[j] = VectorizedArray<number>();
+          displacement.begin_dof_values()[i] = make_vectorized_array<number> (1.);
+
+          displacement.evaluate (EvaluationFlags::gradients);
+
+          for (unsigned int q=0; q<displacement.n_q_points; ++q)
+            {
+              // Integrand: 2*mu*rho^p*eps(u) + lambda*rho^p*tr(eps(u))*I; eps(u) is fetched once per point.
+              const SymmetricTensor<2, dim, VectorizedArray<number>> symgrad = displacement.get_symmetric_gradient(q);
+              SymmetricTensor<2, dim, VectorizedArray<number>> symgrad_term = shear_factor * symgrad;
+              const VectorizedArray<number> div_term = lambda_factor * trace(symgrad);
+
+              for (unsigned int d = 0; d < dim; ++d)
+                symgrad_term[d][d] += div_term;
+
+              displacement.submit_symmetric_gradient( symgrad_term , q);
+            }
+          displacement.integrate (EvaluationFlags::gradients);
+          diagonal[i] = displacement.begin_dof_values()[i];
+        }
+
+      // Put the collected diagonal entries back into the dof values and add them into the global vector.
+      for (unsigned int i=0; i<displacement.dofs_per_cell; ++i)
+        displacement.begin_dof_values()[i] = diagonal[i];
+      displacement.distribute_local_to_global (dst);
+    }
+}
+
+///Applies the elasticity operator on a range of cell batches, reading from src and accumulating into dst.
+/// Integrand: rho^p * (2*mu*eps(u) + lambda*tr(eps(u))*I). Per the author, this matches what happens in KKT System.
+template <int dim, int fe_degree, typename number>
+void
+MF_Elasticity_Operator<dim, fe_degree, number>::local_apply(
+        const MatrixFree<dim, number> &                   data,
+        LinearAlgebra::distributed::Vector<number> &      dst,
+        const LinearAlgebra::distributed::Vector<number> &src,
+        const std::pair<unsigned int, unsigned int> &     cell_range) const
+{
+    // Use the class template parameters (degree, number type) rather than hard-coded <1, 2, double>,
+    // so the evaluator always agrees with the one used in local_compute_diagonal.
+    FEEvaluation<dim, fe_degree, fe_degree+1, dim, number> displacement(data,0);
+
+    for (unsigned int cell=cell_range.first; cell<cell_range.second; ++cell)
+    {
+        // NOTE(review): only lane 0 of the vectorized density is read, so one value is used for
+        // the whole cell batch - confirm that all lanes of density(cell, 0) hold the same value.
+        const VectorizedArray<number> cell_density = cell_data->density(cell, 0);
+        const number penalized_density = std::pow(cell_density[0],Input::density_penalty_exponent);
+        const number shear_factor  = penalized_density * 2.0 * Input::material_mu;
+        const number lambda_factor = penalized_density * Input::material_lambda;
+
+        displacement.reinit(cell);
+        displacement.gather_evaluate(src, EvaluationFlags::gradients);
+
+        for (unsigned int q = 0; q < displacement.n_q_points; ++q)
+        {
+            const SymmetricTensor<2, dim, VectorizedArray<number>> symgrad = displacement.get_symmetric_gradient(q);
+            SymmetricTensor<2, dim, VectorizedArray<number>> symgrad_term = shear_factor * symgrad;
+            const VectorizedArray<number> div_term = lambda_factor * trace(symgrad);
+
+            for (unsigned int d = 0; d < dim; ++d)
+                symgrad_term[d][d] += div_term;
+
+            displacement.submit_symmetric_gradient(symgrad_term, q);
+        }
+        displacement.integrate_scatter(EvaluationFlags::gradients, dst);
+    }
+}
+
+///Interior-face contribution: intentionally empty, since nothing is applied on a face on the LHS.
+template <int dim, int fe_degree, typename number>
+void
+MF_Elasticity_Operator<dim, fe_degree, number>
+::local_apply_face(const dealii::MatrixFree<dim, number> &,
+                   dealii::LinearAlgebra::distributed::Vector<number> &,
+                   const dealii::LinearAlgebra::distributed::Vector<number> &,
+                   const std::pair<unsigned int, unsigned int> &) const
+{
+}
+
+///Boundary-face contribution: intentionally empty, since nothing is applied on a boundary face on the LHS.
+template <int dim, int fe_degree, typename number>
+void
+MF_Elasticity_Operator<dim, fe_degree, number>
+::local_apply_boundary_face(const dealii::MatrixFree<dim, number> &,
+                            dealii::LinearAlgebra::distributed::Vector<number> &,
+                            const dealii::LinearAlgebra::distributed::Vector<number> &,
+                            const std::pair<unsigned int, unsigned int> &) const
+{
+}
+
+///Loops over all cells, applying the elasticity operator (local_apply) to src and accumulating into dst.
+template <int dim, int fe_degree, typename number>
+void
+MF_Elasticity_Operator<dim,fe_degree,number>
+::apply_add (dealii::LinearAlgebra::distributed::Vector<number> &dst,
+             const dealii::LinearAlgebra::distributed::Vector<number> &src) const
+{
+    this->data->cell_loop(&MF_Elasticity_Operator::local_apply, this,
+                          dst, src);
+}
+
+///Stores a pointer to the given cell data (density); only the address is kept, so data must outlive its use here.
+template <int dim, int fe_degree, typename number>
+void
+MF_Elasticity_Operator<dim,fe_degree,number>::set_cell_data (const OperatorCellData<dim,number> &data)
+{
+    cell_data = &data;
+}
+
+
+
+}
+
+template class SAND::MF_Elasticity_Operator<2,1,double>;
+template class SAND::MF_Elasticity_Operator<3,1,double>;
+
diff --git a/source/poly_pre.cc b/source/poly_pre.cc
new file mode 100644
index 0000000..c5dad82
--- /dev/null
+++ b/source/poly_pre.cc
@@ -0,0 +1,7 @@
+#include "../include/poly_pre.h"
+#include "../include/schur_preconditioner.h"
+
+namespace SAND
+{
+
+}
diff --git a/source/schur_preconditioner.cc b/source/schur_preconditioner.cc
index 5711bd1..7582898 100644
--- a/source/schur_preconditioner.cc
+++ b/source/schur_preconditioner.cc
@@ -6,742 +6,1429 @@
 #include <deal.II/lac/sparse_matrix.h>
 #include <deal.II/base/timer.h>
 #include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/lac/trilinos_solver.h>
+#include <deal.II/lac/trilinos_precondition.h>
+#include <deal.II/base/thread_management.h>
 #include "../include/schur_preconditioner.h"
 #include "../include/input_information.h"
 #include "../include/sand_tools.h"
-#include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/base/config.h>
+#include <deal.II/base/array_view.h>
+#include <deal.II/base/index_set.h>
+#include <deal.II/base/mpi_tags.h>
+#include <deal.II/base/numbers.h>
+#include <deal.II/base/template_constraints.h>
 #include <fstream>
 
 namespace SAND {
-    using namespace dealii;
+using MatrixType  = dealii::TrilinosWrappers::SparseMatrix;
+using VectorType  = dealii::TrilinosWrappers::MPI::Vector;
+using PayloadType = dealii::TrilinosWrappers::internal::LinearOperatorImplementation::TrilinosPayload;
+using PayloadVectorType = typename PayloadType::VectorType;
+using size_type         = dealii::types::global_dof_index;
+
+namespace ChangeVectorTypes
+{
+/// Scatters a displacement vector into a system vector: for every (displacement index, system index) pair of the map,
+/// out[system index] is overwritten with in[displacement index]. Entries of out that the map does not mention are left untouched.
+template <typename number>
+void copy_from_displacement_to_system_vector(LA::MPI::Vector                                           &out,
+                                             const dealii::LinearAlgebra::distributed::Vector<number>  &in,
+                                             const std::map<types::global_dof_index,types::global_dof_index>  & displacement_to_system_dof_index_map)
+{
+    for (const auto &dof_pair : displacement_to_system_dof_index_map)
+    {
+        const auto displacement_index = dof_pair.first;
+        const auto system_index       = dof_pair.second;
+        out[system_index] = in[displacement_index];
+    }
+}
+
+/// Gathers displacement entries out of a system vector: for every (displacement index, system index) pair of the map,
+/// out[displacement index] is overwritten with in[system index]. Entries of out that the map does not mention are left untouched.
+template <typename number>
+void copy_from_system_to_displacement_vector(dealii::LinearAlgebra::distributed::Vector<number>  &out,
+                                             const LA::MPI::Vector                                           &in,
+                                             const std::map<types::global_dof_index,types::global_dof_index>  & displacement_to_system_dof_index_map)
+{
+    for (const auto &dof_pair : displacement_to_system_dof_index_map)
+    {
+        const auto displacement_index = dof_pair.first;
+        const auto system_index       = dof_pair.second;
+        out[displacement_index] = in[system_index];
+    }
+}
+
+/// Copies in into out by staging the values in a ReadWriteVector built on out's locally owned elements (both imports use VectorOperation::insert).
+template <typename number>
+void copy(LA::MPI::Vector &                                         out,
+          const dealii::LinearAlgebra::distributed::Vector<number> &in)
+{
+    dealii::LinearAlgebra::ReadWriteVector<double> staging(out.locally_owned_elements());
+    staging.import(in, VectorOperation::insert);
+    out.import(staging, VectorOperation::insert);
+}
+/// Copies in into out by staging the values in a ReadWriteVector that is reinit-ed from in and then imported into out (VectorOperation::insert).
+template <typename number>
+void copy(dealii::LinearAlgebra::distributed::Vector<number> &out, const LA::MPI::Vector &in)
+{
+    dealii::LinearAlgebra::ReadWriteVector<double> staging;
+    staging.reinit(in);
+    out.import(staging, VectorOperation::insert);
+}
+
+
+} // namespace ChangeVectorTypes
+
+
+
+using namespace dealii;
+
+    ///Stores the polynomial degree and the inner matrix part handed in; the constructor body does no other work.
+    template<int dim>
+    PolyPreJ<dim>::PolyPreJ(const JinvMatrixPart<dim> &inner_matrix_in, const int degree_in):
+    degree(degree_in),
+    inner_matrix(inner_matrix_in)
+    {
+    }
+
     template<int dim>
-    TopOptSchurPreconditioner<dim>::TopOptSchurPreconditioner(BlockSparseMatrix<double> &matrix_in)
-            :
-            system_matrix(matrix_in),
-            n_rows(0),
-            n_columns(0),
-            n_block_rows(0),
-            n_block_columns(0),
-            other_solver_control(100000, 1e-10),
-            other_bicgstab(other_solver_control),
-            other_gmres(other_solver_control),
-            other_cg(other_solver_control),
-            a_mat(matrix_in.block(SolutionBlocks::displacement, SolutionBlocks::displacement_multiplier)),
-            b_mat(matrix_in.block(SolutionBlocks::density, SolutionBlocks::density)),
-            c_mat(matrix_in.block(SolutionBlocks::displacement,SolutionBlocks::density)),
-            e_mat(matrix_in.block(SolutionBlocks::displacement_multiplier,SolutionBlocks::density)),
-            f_mat(matrix_in.block(SolutionBlocks::unfiltered_density_multiplier,SolutionBlocks::unfiltered_density)),
-            d_m_mat(matrix_in.block(SolutionBlocks::density_upper_slack_multiplier, SolutionBlocks::density_upper_slack)),
-            d_1_mat(matrix_in.block(SolutionBlocks::density_lower_slack, SolutionBlocks::density_lower_slack)),
-            d_2_mat(matrix_in.block(SolutionBlocks::density_upper_slack, SolutionBlocks::density_upper_slack)),
-            m_vect(matrix_in.block(SolutionBlocks::density, SolutionBlocks::total_volume_multiplier)),
-            timer(std::cout, TimerOutput::summary,
-                  TimerOutput::wall_times)
+    void
+    PolyPreJ<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
     {
+        LA::MPI::Vector temp_vec_1 = src;
+        LA::MPI::Vector temp_vec_2 = src;
+        for(int k=0; k<degree; k++)
+        {
+            temp_vec_2 = 0;
+            inner_matrix.vmult(temp_vec_2,temp_vec_1);
+            temp_vec_1 = temp_vec_2 + src;
+        }
+        dst = temp_vec_1;
+    }
 
+    template<int dim>
+    PolyPreK<dim>::PolyPreK(const KinvMatrixPart<dim> &inner_matrix_in, const int degree_in):
+    degree(degree_in),
+    inner_matrix(inner_matrix_in)
+    {
     }
 
     template<int dim>
-    void TopOptSchurPreconditioner<dim>::initialize(BlockSparseMatrix<double> &matrix, const std::map<types::global_dof_index, double> &boundary_values,const DoFHandler<dim> &dof_handler, const double barrier_size, const BlockVector<double> &state)
+    void
+    PolyPreK<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
     {
-        TimerOutput::Scope t(timer, "initialize");
+        LA::MPI::Vector temp_vec_1 = src;
+        LA::MPI::Vector temp_vec_2 = src;
+        for(int k=0; k<degree; k++)
         {
-            TimerOutput::Scope t(timer, "diag stuff");
-            for (auto&[dof_index, boundary_value]: boundary_values) {
-                const types::global_dof_index disp_start_index = system_matrix.get_row_indices().block_start(
-                        SolutionBlocks::displacement);
-                const types::global_dof_index disp_mult_start_index = system_matrix.get_row_indices().block_start(
-                        SolutionBlocks::displacement_multiplier);
-                const types::global_dof_index n_u = system_matrix.block(SolutionBlocks::displacement,
-                                                                        SolutionBlocks::displacement).m();
-                if ((dof_index >= disp_start_index) && (dof_index < disp_start_index + n_u)) {
-                    double diag_val = system_matrix.block(SolutionBlocks::displacement,
-                                                          SolutionBlocks::displacement).el(
+            temp_vec_2 = 0;
+            inner_matrix.vmult(temp_vec_2,temp_vec_1);
+            temp_vec_1 = temp_vec_2 + src;
+        }
+        dst = temp_vec_1;
+    }
+
+///Constructor: initializes the block members (a_mat ... m_vect) from blocks of matrix_in, sets up the solver controls/solvers, and wires the helper operators (g_mat, h_mat, j_inv_*, k_inv_*) together; the body is empty.
+template<int dim>
+TopOptSchurPreconditioner<dim>::TopOptSchurPreconditioner(LA::MPI::BlockSparseMatrix &matrix_in, DoFHandler<dim> &big_dof_handler_in, MF_Elasticity_Operator<dim,1,double> &mf_elasticity_operator_in , PreconditionMG<dim,LinearAlgebra::distributed::Vector<double> ,MGTransferMatrixFree<dim, double>>
+                                                          &mf_gmg_preconditioner_in, std::map<types::global_dof_index,types::global_dof_index> &displacement_to_system_dof_index_map)
+    :
+      system_matrix(matrix_in),
+      mpi_communicator(MPI_COMM_WORLD), // always the world communicator
+      n_rows(0),
+      n_columns(0),
+      n_block_rows(0),
+      n_block_columns(0),
+      other_solver_control(1000000, 1e-6), // shared by the three iterative solvers below
+      other_bicgstab(other_solver_control),
+      other_gmres(other_solver_control),
+      other_cg(other_solver_control),
+      a_mat(matrix_in.block(SolutionBlocks::displacement, SolutionBlocks::displacement_multiplier)),
+      b_mat(matrix_in.block(SolutionBlocks::density, SolutionBlocks::density)),
+      c_mat(matrix_in.block(SolutionBlocks::displacement,SolutionBlocks::density)),
+      e_mat(matrix_in.block(SolutionBlocks::displacement_multiplier,SolutionBlocks::density)),
+      f_mat(matrix_in.block(SolutionBlocks::unfiltered_density_multiplier,SolutionBlocks::unfiltered_density)),
+      f_t_mat(matrix_in.block(SolutionBlocks::unfiltered_density,SolutionBlocks::unfiltered_density_multiplier)),
+      d_m_mat(matrix_in.block(SolutionBlocks::density_upper_slack_multiplier, SolutionBlocks::density_upper_slack)),
+      d_1_mat(matrix_in.block(SolutionBlocks::density_lower_slack, SolutionBlocks::density_lower_slack)),
+      d_2_mat(matrix_in.block(SolutionBlocks::density_upper_slack, SolutionBlocks::density_upper_slack)),
+      m_vect(matrix_in.block(SolutionBlocks::density, SolutionBlocks::total_volume_multiplier)),
+      solver_type("Amesos_Klu"), // solver name handed to additional_data on the next line
+      additional_data(false, solver_type),
+      direct_solver_control(1, 0),
+      a_inv_direct(direct_solver_control, additional_data),
+      a_inv_mf_gmg(mf_elasticity_operator_in, mf_gmg_preconditioner_in, a_mat, displacement_to_system_dof_index_map),
+      pcout(std::cout,(Utilities::MPI::this_mpi_process(mpi_communicator) == 0)), // output is enabled on MPI rank 0 only
+      timer(pcout, TimerOutput::summary, TimerOutput::wall_times),
+      g_mat(f_mat, f_t_mat, d_8_mat),
+      h_mat(a_mat, b_mat, c_mat, e_mat, pre_amg, a_inv_direct, a_inv_mf_gmg),
+      j_inv_mat(h_mat, g_mat, d_m_mat),
+      k_inv_mat(h_mat, g_mat, d_m_mat),
+      j_inv_part(h_mat, g_mat, d_m_mat),
+      k_inv_part(h_mat, g_mat, d_m_mat),
+      big_dof_handler(big_dof_handler_in)
+{
+    // Intentionally empty: every member is set up in the initializer list above.
+    // NOTE(review): g_mat receives d_8_mat and h_mat receives pre_amg, neither of which appears in this initializer list - presumably default-constructed members; confirm against the class declaration order.
+}
+
+///Initializes the preconditioner with information about the boundary values and DoF Handler.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::initialize(LA::MPI::BlockSparseMatrix &matrix, const std::map<types::global_dof_index, double> &boundary_values,const DoFHandler<dim> &dof_handler, const LA::MPI::BlockVector &distributed_state)
+{
+
+    a_inv_mf_gmg.set_exemplar_vector(distributed_state.block(SolutionBlocks::displacement));
+
+    TimerOutput::Scope t(timer, "initialize");
+    {
+        TimerOutput::Scope t(timer, "diag stuff");
+        const types::global_dof_index disp_start_index = system_matrix.get_row_indices().block_start(
+                    SolutionBlocks::displacement);
+        const types::global_dof_index disp_mult_start_index = system_matrix.get_row_indices().block_start(
+                    SolutionBlocks::displacement_multiplier);
+
+        for (auto &pair: boundary_values) {
+            const auto dof_index=pair.first;
+            const types::global_dof_index n_u = system_matrix.block(SolutionBlocks::displacement,
+                                                                    SolutionBlocks::displacement).m();
+            if ((dof_index >= disp_start_index) && (dof_index < disp_start_index + n_u)) {
+                double diag_val = system_matrix.block(SolutionBlocks::displacement,
+                                                      SolutionBlocks::displacement).el(
                             dof_index - disp_start_index, dof_index - disp_start_index);
-                    system_matrix.block(SolutionBlocks::displacement, SolutionBlocks::displacement_multiplier).set(
+
+                system_matrix.block(SolutionBlocks::displacement, SolutionBlocks::displacement_multiplier).set(
                             dof_index - disp_start_index, dof_index - disp_start_index, diag_val);
-                } else if ((dof_index >= disp_mult_start_index) && (dof_index < disp_mult_start_index + n_u)) {
-                    double diag_val = system_matrix.block(SolutionBlocks::displacement_multiplier,
-                                                          SolutionBlocks::displacement_multiplier).el(
+
+            }
+            else if ((dof_index >= disp_mult_start_index) && (dof_index < disp_mult_start_index + n_u))
+            {
+                double diag_val = system_matrix.block(SolutionBlocks::displacement_multiplier,
+                                                      SolutionBlocks::displacement_multiplier).el(
                             dof_index - disp_mult_start_index, dof_index - disp_mult_start_index);
-                    system_matrix.block(SolutionBlocks::displacement_multiplier, SolutionBlocks::displacement).set(
+                system_matrix.block(SolutionBlocks::displacement_multiplier, SolutionBlocks::displacement).set(
                             dof_index - disp_mult_start_index, dof_index - disp_mult_start_index, diag_val);
-                }
             }
+        }
 
 
-            //set diagonal to 0?
-            for (auto&[dof_index, boundary_value]: boundary_values) {
-                const types::global_dof_index disp_start_index = system_matrix.get_row_indices().block_start(
+        //set diagonal to 0?
+        for (auto &pair: boundary_values) {
+            const auto dof_index=pair.first;
+            const types::global_dof_index disp_start_index = system_matrix.get_row_indices().block_start(
                         SolutionBlocks::displacement);
-                const types::global_dof_index disp_mult_start_index = system_matrix.get_row_indices().block_start(
+            const types::global_dof_index disp_mult_start_index = system_matrix.get_row_indices().block_start(
                         SolutionBlocks::displacement_multiplier);
-                const types::global_dof_index n_u = system_matrix.block(SolutionBlocks::displacement,
-                                                                        SolutionBlocks::displacement).m();
-                if ((dof_index >= disp_start_index) && (dof_index < disp_start_index + n_u)) {
-                    system_matrix.block(SolutionBlocks::displacement, SolutionBlocks::displacement).set(
+            const types::global_dof_index n_u = system_matrix.block(SolutionBlocks::displacement,
+                                                                    SolutionBlocks::displacement).m();
+            if ((dof_index >= disp_start_index) && (dof_index < disp_start_index + n_u)) {
+                system_matrix.block(SolutionBlocks::displacement, SolutionBlocks::displacement).set(
                             dof_index - disp_start_index, dof_index - disp_start_index, 0);
-                } else if ((dof_index >= disp_mult_start_index) && (dof_index < disp_mult_start_index + n_u)) {
-                    system_matrix.block(SolutionBlocks::displacement_multiplier,
-                                        SolutionBlocks::displacement_multiplier).set(
+            } else if ((dof_index >= disp_mult_start_index) && (dof_index < disp_mult_start_index + n_u)) {
+                system_matrix.block(SolutionBlocks::displacement_multiplier,
+                                    SolutionBlocks::displacement_multiplier).set(
                             dof_index - disp_mult_start_index, dof_index - disp_mult_start_index, 0);
-                }
             }
         }
-        if (Input::solver_choice==SolverOptions::inexact_K_with_inexact_A_gmres)
-        {
 
-        }
-        else
-        {
-            TimerOutput::Scope t(timer, "build A inv");
-            a_inv_direct.initialize(a_mat);
-        }
-        {
-            TimerOutput::Scope t(timer, "reinit diag matrices");
-            d_3_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density).get_sparsity_pattern());
-            d_4_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density).get_sparsity_pattern());
-            d_5_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density).get_sparsity_pattern());
-            d_6_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density).get_sparsity_pattern());
-            d_7_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density).get_sparsity_pattern());
-            d_8_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density).get_sparsity_pattern());
-            d_m_inv_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density).get_sparsity_pattern());
-        }
+
+        system_matrix.compress(VectorOperation::insert);
+    }
+
+    {
+        TimerOutput::Scope t(timer, "reinit diag matrices");
+        d_3_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density));
+        d_4_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density));
+        d_5_mat.reinit(matrix.block(SolutionBlocks::density_lower_slack_multiplier, SolutionBlocks::density_lower_slack_multiplier));
+        d_6_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density));
+        d_7_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density));
+        d_8_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density));
+        d_m_inv_mat.reinit(matrix.block(SolutionBlocks::density, SolutionBlocks::density));
+
+
+        d_3_mat=0;
+        d_4_mat=0;
+        d_5_mat=0;
+        d_6_mat=0;
+        d_7_mat=0;
+        d_8_mat=0;
+        d_m_inv_mat=0;
+    }
+    {
+        const types::global_dof_index n_p = system_matrix.block(SolutionBlocks::density,
+                                                                SolutionBlocks::density).m();
+
+        std::vector<double> l_global(n_p);
+        std::vector<double> lm_global(n_p);
+        std::vector<double> u_global(n_p);
+        std::vector<double> um_global(n_p);
+        std::vector<double> m_global(n_p);
+
+        std::vector<double> l(n_p);
+        std::vector<double> lm(n_p);
+        std::vector<double> u(n_p);
+        std::vector<double> um(n_p);
+        std::vector<double> m(n_p);
+
+        TimerOutput::Scope t(timer, "build diag matrices");
+        for (const auto cell: dof_handler.active_cell_iterators())
         {
-            TimerOutput::Scope t(timer, "build diag matrices");
-            for (const auto cell: dof_handler.active_cell_iterators())
+            if(cell->is_locally_owned())
             {
-                const double i = cell->active_cell_index();
-                const double m = cell->measure();
-                double d_3_value = -1 * state.block(SolutionBlocks::density_lower_slack_multiplier)[i] /
-                                   (m * state.block(SolutionBlocks::density_lower_slack)[i]);
-                double d_4_value = -1 * state.block(SolutionBlocks::density_upper_slack_multiplier)[i] /
-                                   (m * state.block(SolutionBlocks::density_upper_slack)[i]);
-                double d_5_value = state.block(SolutionBlocks::density_lower_slack_multiplier)[i] /
-                                   (state.block(SolutionBlocks::density_lower_slack)[i]);
-                double d_6_value = state.block(SolutionBlocks::density_upper_slack_multiplier)[i] /
-                                   (state.block(SolutionBlocks::density_upper_slack)[i]);
-                double d_7_value = (m * (state.block(SolutionBlocks::density_lower_slack_multiplier)[i] *
-                                         state.block(SolutionBlocks::density_upper_slack)[i] +
-                                         state.block(SolutionBlocks::density_upper_slack_multiplier)[i] *
-                                         state.block(SolutionBlocks::density_lower_slack)[i]))
-                                   / (state.block(SolutionBlocks::density_lower_slack)[i] *
-                                      state.block(SolutionBlocks::density_upper_slack)[i]);
-                double d_8_value = (state.block(SolutionBlocks::density_lower_slack)[i] *
-                                    state.block(SolutionBlocks::density_upper_slack)[i])
-                                   / (m * (state.block(SolutionBlocks::density_lower_slack_multiplier)[i] *
-                                           state.block(SolutionBlocks::density_upper_slack)[i] +
-                                           state.block(SolutionBlocks::density_upper_slack_multiplier)[i] *
-                                           state.block(SolutionBlocks::density_lower_slack)[i]));
-                d_3_mat.set(i, i, d_3_value);
-                d_4_mat.set(i, i, d_4_value);
-                d_5_mat.set(i, i, d_5_value);
-                d_6_mat.set(i, i, d_6_value);
-                d_7_mat.set(i, i, d_7_value);
-                d_8_mat.set(i, i, d_8_value);
-                d_m_inv_mat.set(i, i, 1 / m);
+                std::vector<types::global_dof_index> i(cell->get_fe().n_dofs_per_cell());
+                cell->get_dof_indices(i);
 
-            }
-        }
+                const int i_ind = cell->get_fe().component_to_system_index(0,0);
 
-        pre_j.reinit(matrix.block(SolutionBlocks::density,SolutionBlocks::density).n());
-        pre_k.reinit(matrix.block(SolutionBlocks::density,SolutionBlocks::density).n());
-        g_d_m_inv_density.reinit(matrix.block(SolutionBlocks::density,SolutionBlocks::density).n());
-        k_g_d_m_inv_density.reinit(matrix.block(SolutionBlocks::density,SolutionBlocks::density).n());
+                if(distributed_state.block(SolutionBlocks::density_lower_slack_multiplier).in_local_range(i[i_ind]))
+                {
+                    lm[i[i_ind]] = distributed_state.block(SolutionBlocks::density_lower_slack_multiplier)[i[i_ind]];
+                    m[i[i_ind]] = cell->measure();
+                }
 
-        auto op_g = linear_operator(f_mat) * linear_operator(d_8_mat) *
-                    transpose_operator(linear_operator(f_mat));
+                if(distributed_state.block(SolutionBlocks::density_lower_slack).in_local_range(i[i_ind]))
+                {
+                    l[i[i_ind]] =  distributed_state.block(SolutionBlocks::density_lower_slack)[i[i_ind]];
+                }
 
-        auto op_h = op_g;
-        PreconditionSSOR<SparseMatrix<double>> preconditioner;
-        preconditioner.initialize(a_mat, 1.2);
-        SolverControl            solver_control(1000, 1e-12);
-        SolverCG<Vector<double>> a_solver_cg(solver_control);
-        auto a_inv_op = inverse_operator(linear_operator(a_mat),a_solver_cg,preconditioner);
+                if(distributed_state.block(SolutionBlocks::density_upper_slack_multiplier).in_local_range(i[i_ind]))
+                {
+                    um[i[i_ind]]= distributed_state.block(SolutionBlocks::density_upper_slack_multiplier)[i[i_ind]];
+                }
 
-        if (Input::solver_choice==SolverOptions::inexact_K_with_inexact_A_gmres)
-        {
-            op_h = linear_operator(b_mat)
-                   - transpose_operator(linear_operator(c_mat)) * a_inv_op * linear_operator(e_mat)
-                   - transpose_operator(linear_operator(e_mat)) * a_inv_op * linear_operator(c_mat);
-        }
-        else
-        {
-            op_h = linear_operator(b_mat)
-                   - transpose_operator(linear_operator(c_mat)) * linear_operator(a_inv_direct) * linear_operator(e_mat)
-                   - transpose_operator(linear_operator(e_mat)) * linear_operator(a_inv_direct) * linear_operator(c_mat);
+                if(distributed_state.block(SolutionBlocks::density_upper_slack).in_local_range(i[i_ind]))
+                {
+                    u[i[i_ind]] = distributed_state.block(SolutionBlocks::density_upper_slack)[i[i_ind]];
+                }
+            }
         }
 
-        if(Input::solver_choice == SolverOptions::inexact_K_with_inexact_A_gmres || Input::solver_choice == SolverOptions::inexact_K_with_exact_A_gmres)
-        {
+        MPI_Allreduce(lm.data(), lm_global.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        MPI_Allreduce(l.data(), l_global.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        MPI_Allreduce(um.data(), um_global.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        MPI_Allreduce(u.data(), u_global.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
+        MPI_Allreduce(m.data(), m_global.data(), n_p, MPI_DOUBLE, MPI_SUM, MPI_COMM_WORLD);
 
-        }
-        else
+        for (unsigned int k=0; k< n_p; k++)
         {
+            if(distributed_state.block(0).in_local_range(k))
             {
-                TimerOutput::Scope t(timer, "build g_mat");
-                g_mat.reinit(b_mat.n(), b_mat.n());
-                build_matrix_element_by_element(op_g, g_mat);
+                d_3_mat.set(k, k, -1 * lm_global[k]/(m_global[k]*l_global[k]));
+                d_4_mat.set(k, k, -1 * um_global[k]/(m_global[k]*u_global[k]));
+                d_5_mat.set(k, k, lm_global[k]/l_global[k]);
+                d_6_mat.set(k, k, um_global[k]/u_global[k]);
+                d_7_mat.set(k, k, m_global[k]*(lm_global[k]*u_global[k] + um_global[k]*l_global[k])/(l_global[k]*u_global[k]));
+                d_8_mat.set(k, k, l_global[k]*u_global[k]/(m_global[k]*(lm_global[k]*u_global[k] + um_global[k]*l_global[k])));
+                d_m_inv_mat.set(k, k, 1 / m_global[k]);
             }
+        }
+    }
+    d_3_mat.compress(VectorOperation::insert);
+    d_4_mat.compress(VectorOperation::insert);
+    d_5_mat.compress(VectorOperation::insert);
+    d_6_mat.compress(VectorOperation::insert);
+    d_7_mat.compress(VectorOperation::insert);
+    d_8_mat.compress(VectorOperation::insert);
+    d_m_inv_mat.compress(VectorOperation::insert);
+
+    pre_j=distributed_state.block(SolutionBlocks::density);
+    pre_k=distributed_state.block(SolutionBlocks::density);
+    g_d_m_inv_density=distributed_state.block(SolutionBlocks::density);
+    k_g_d_m_inv_density=distributed_state.block(SolutionBlocks::density);
+
+    LA::MPI::Vector density_exemplar = distributed_state.block(SolutionBlocks::density);
+    LA::MPI::Vector displacement_exemplar = distributed_state.block(SolutionBlocks::displacement);
+
+    density_exemplar = 0.;
+    displacement_exemplar = 0.;
+    g_mat.initialize(density_exemplar, d_m_inv_mat);
+    h_mat.initialize(density_exemplar, displacement_exemplar,d_m_inv_mat);
+    j_inv_mat.initialize(density_exemplar,d_m_inv_mat);
+    k_inv_mat.initialize(density_exemplar,d_m_inv_mat);
+    // j_inv_part.initialize(density_exemplar);
+    // k_inv_part.initialize(density_exemplar);
+
+    num_mults = 0;
+}
 
+///Application of the preconditioner, broken up into 5 parts.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::vmult(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
 
-            {
-                TimerOutput::Scope t(timer, "build h_mat");
-                h_mat.reinit(b_mat.n(), b_mat.n());
-                build_matrix_element_by_element(op_h, h_mat);
-            }
+    LA::MPI::BlockVector dst_tmp = dst;
+    dst_tmp = 0.;
+     LA::MPI::BlockVector src_temp = src;
 
-            {
-                TimerOutput::Scope t(timer, "build k_inv_mat");
-                auto op_k_inv = -1 * op_g * linear_operator(d_m_inv_mat) * op_h -
-                                linear_operator(d_m_mat);
-                k_inv_mat.reinit(b_mat.n(), b_mat.n());
-                build_matrix_element_by_element(op_k_inv, k_inv_mat);
-            }
-        }
+    // pcout << "size of matrix block:  " << system_matrix.block(9,8).linfty_norm() << "   " << system_matrix.block(5,6).linfty_norm() << std::endl;
+    LA::MPI::BlockVector temp_src;
+    {
+        dst = 0.;
+        TimerOutput::Scope t(timer, "part 1");
+        vmult_step_1(dst, src);
+        temp_src = dst;
+        pcout << "step 1 done: " << dst.l2_norm() << std::endl;
+    }
 
+    {
+        dst = 0.;
+        TimerOutput::Scope t(timer, "part 2");
+        vmult_step_2(dst, temp_src);
+        temp_src = dst;
+        pcout << "step 2 done: " << dst.l2_norm() << std::endl;
+    }
 
+    {
+        dst = 0.;
+        TimerOutput::Scope t(timer, "part 3");
+        vmult_step_3(dst, temp_src);
+        temp_src = dst;
+        pcout << "step 3 done: " << dst.l2_norm() << std::endl;
+    }
 
-        if (Input::solver_choice == SolverOptions::exact_preconditioner_with_gmres)
-        {
-            TimerOutput::Scope t(timer, "invert k_mat");
-            k_mat.copy_from(k_inv_mat);
-            k_mat.invert();
-        }
+    {
+        dst = 0.;
+        TimerOutput::Scope t(timer, "part 4");
+        vmult_step_4(dst, temp_src);
+        temp_src = dst;
+        pcout << "step 4 done: " << dst.l2_norm() << std::endl;
+    }
+
+    dst = 0.;
+    vmult_step_5(dst, temp_src);
+    pcout << "step 5 done: " << dst.l2_norm() << std::endl;
+    num_mults++;
 
+}
+
+///Transpose application is not implemented: this placeholder simply copies src into dst (i.e. it acts as the identity).
+template<int dim>
+void TopOptSchurPreconditioner<dim>::Tvmult(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
+    dst = src;
+}
+///Adds the preconditioner applied to src onto dst: vmult() is evaluated into a scratch copy of dst, which is then added to dst.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::vmult_add(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
+    LA::MPI::BlockVector increment(dst);
+    vmult(increment, src);
+    dst += increment;
+}
+
+///Not implemented: despite the _add suffix this placeholder overwrites dst with a copy of src instead of adding anything to it.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::Tvmult_add(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
+    dst = src;
+}
+///Step 1: dst = src, except that the unfiltered_density block becomes src_unfiltered_density - d_5*src_lower_slack_multiplier + d_6*src_upper_slack_multiplier + src_lower_slack - src_upper_slack.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::vmult_step_1(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
+    dst = src;
+    // Only two block-sized scratch vectors are needed. They are copied from the matching src blocks to get the
+    // right layout, instead of duplicating the whole block vector three times on every application.
+    auto lower_slack_term = src.block(SolutionBlocks::density_lower_slack_multiplier);
+    auto upper_slack_term = src.block(SolutionBlocks::density_upper_slack_multiplier);
+    d_5_mat.vmult(lower_slack_term, src.block(SolutionBlocks::density_lower_slack_multiplier));
+    d_6_mat.vmult(upper_slack_term, src.block(SolutionBlocks::density_upper_slack_multiplier));
+
+    dst.block(SolutionBlocks::unfiltered_density) = src.block(SolutionBlocks::unfiltered_density)
+            - lower_slack_term
+            + upper_slack_term
+            + src.block(SolutionBlocks::density_lower_slack)
+            - src.block(SolutionBlocks::density_upper_slack);
+}
+///Step 2: dst = src, except that the unfiltered_density_multiplier block becomes src_unfiltered_density_multiplier - f_mat * (d_8_mat * src_unfiltered_density).
+template<int dim>
+void TopOptSchurPreconditioner<dim>::vmult_step_2(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
+    dst = src;
+    // Two block-sized scratch vectors, copied from the src block for their layout, replace three copies of the whole block vector.
+    auto scaled_unfiltered = src.block(SolutionBlocks::unfiltered_density);
+    auto filtered_term = src.block(SolutionBlocks::unfiltered_density);
+    d_8_mat.vmult(scaled_unfiltered, src.block(SolutionBlocks::unfiltered_density));
+    f_mat.vmult(filtered_term, scaled_unfiltered);
+    dst.block(SolutionBlocks::unfiltered_density_multiplier) = src.block(SolutionBlocks::unfiltered_density_multiplier) - filtered_term;
+
+}
+///Step 3: dst = src, except that the density block is combined with c_mat^T and e_mat^T applied to the a_inv_* results for the two displacement blocks.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::vmult_step_3(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
+    // Start from a copy of src; only the density block of dst is changed below.
+    dst = src;
+    auto dst_temp = dst;
+    // dst_temp is scratch: its displacement blocks receive the a_inv_* results, its two slack blocks the Tvmult products.
+    if (Input::solver_choice==SolverOptions::inexact_K_with_inexact_A_gmres)
+    {
+        // Temporarily override the matrix-free GMG solver settings (tolerance 0, 100 iterations) for these two applications.
+        a_inv_mf_gmg.set_tol(0);
+        a_inv_mf_gmg.set_iter(100);
+
+        a_inv_mf_gmg.vmult(dst_temp.block(SolutionBlocks::displacement_multiplier),src.block(SolutionBlocks::displacement_multiplier));
+        a_inv_mf_gmg.vmult(dst_temp.block(SolutionBlocks::displacement),src.block(SolutionBlocks::displacement));
+        // Put the settings back to the values configured in Input.
+        a_inv_mf_gmg.set_tol(Input::a_rel_tol);
+        a_inv_mf_gmg.set_iter(Input::a_inv_iterations);
+
+        c_mat.Tvmult(dst_temp.block(SolutionBlocks::density_upper_slack),dst_temp.block(SolutionBlocks::displacement_multiplier));
+        e_mat.Tvmult(dst_temp.block(SolutionBlocks::density_lower_slack),dst_temp.block(SolutionBlocks::displacement));
+        // NOTE(review): the two terms are ADDED here but SUBTRACTED in the direct-solver branch below - confirm the sign difference is intended.
+        dst.block(SolutionBlocks::density) = dst_temp.block(SolutionBlocks::density) + dst_temp.block(SolutionBlocks::density_upper_slack) + dst_temp.block(SolutionBlocks::density_lower_slack);
+
+    }
+    else
+    {
+        a_inv_direct.vmult(dst_temp.block(SolutionBlocks::displacement_multiplier),src.block(SolutionBlocks::displacement_multiplier));
+        a_inv_direct.vmult(dst_temp.block(SolutionBlocks::displacement),src.block(SolutionBlocks::displacement));
+        c_mat.Tvmult(dst_temp.block(SolutionBlocks::density_upper_slack),dst_temp.block(SolutionBlocks::displacement_multiplier));
+        e_mat.Tvmult(dst_temp.block(SolutionBlocks::density_lower_slack),dst_temp.block(SolutionBlocks::displacement));
+        dst.block(SolutionBlocks::density) = dst_temp.block(SolutionBlocks::density) - dst_temp.block(SolutionBlocks::density_upper_slack) - dst_temp.block(SolutionBlocks::density_lower_slack);
     }
 
+}
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::vmult(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        BlockVector<double> temp_src;
-        {
-            TimerOutput::Scope t(timer, "part 1");
-            vmult_step_1(dst, src);
-            temp_src = dst;
-        }
+template<int dim>
+void TopOptSchurPreconditioner<dim>::vmult_step_4(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const {
+    dst = src;
+    auto dst_temp = dst;
+    auto k_density_mult =  src.block(SolutionBlocks::density);
+    // Step 4: dst is a copy of src except total_volume_multiplier, which is corrected using two FGMRES solves with k_inv_mat.
+    // g_d_m_inv_density and k_g_d_m_inv_density are not declared in this function (presumably class members - confirm).
+    TrilinosWrappers::PreconditionIdentity preconditioner; // NOTE(review): initialized below but never passed to a solver in this function
+    preconditioner.initialize(b_mat);
+
+    // PolyPreK<dim> poly_pre_k(k_inv_part,0);
+    // PolyPreJ<dim> poly_pre_j(j_inv_part,0);
+    // Right-hand side of the first solve: g_d_m_inv_density = g_mat * (d_m_inv_mat * src.density).
+    auto d_m_inv_density = g_d_m_inv_density;
+    d_m_inv_mat.vmult(d_m_inv_density,src.block(SolutionBlocks::density));
+    g_mat.vmult(g_d_m_inv_density,d_m_inv_density);
+    // Both solves stop at Input::k_inv_iterations or at a residual of Input::k_rel_tol times the right-hand-side norm.
+    SolverControl step_4_gmres_control_1 (Input::k_inv_iterations, g_d_m_inv_density.l2_norm()*Input::k_rel_tol);
+    SolverFGMRES<LA::MPI::Vector> step_4_gmres_1 (step_4_gmres_control_1);
+    try {
+        pcout << "SOLVE 1" << std::endl;
+        k_g_d_m_inv_density = 0.; // zero the vector this solve writes to, so it does not start from the previous call's result
+        step_4_gmres_1.solve(k_inv_mat,k_g_d_m_inv_density,g_d_m_inv_density, PreconditionIdentity() );
+    }
+    catch (std::exception &exc)
+    {
+        pcout << "Failure of linear solver 4-1 with convergence of " << step_4_gmres_control_1.last_value()/step_4_gmres_control_1.initial_value()<< std::endl;
+        //                throw;
+    }
+    SolverControl step_4_gmres_control_2 (Input::k_inv_iterations, src.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm()*Input::k_rel_tol);
+    SolverFGMRES<LA::MPI::Vector> step_4_gmres_2 (step_4_gmres_control_2);
+    try {
+        pcout << "SOLVE 2" << std::endl;
+        k_density_mult = 0.;
+        step_4_gmres_2.solve(k_inv_mat,k_density_mult,src.block(SolutionBlocks::unfiltered_density_multiplier), PreconditionIdentity());
+    } catch (std::exception &exc)
+    {
 
-        {
-            TimerOutput::Scope t(timer, "part 2");
-            vmult_step_2(dst, temp_src);
-            temp_src = dst;
-        }
+        pcout << "Failure of linear solver 4-2 with convergence of " << step_4_gmres_control_2.last_value()/step_4_gmres_control_2.initial_value()<< std::endl;
+        //                throw;
+    }
 
+    if (num_mults == -10) // diagnostic branch: its solution goes to dst_temp.density, which the final expression below does not read
+    {
+        TimerOutput::Scope t(timer, "k_mult");
+        SolverControl step_5_gmres_control_4 (100000, 1e-12*g_d_m_inv_density.l2_norm());
+        step_5_gmres_control_4.enable_history_data();
+        SolverFGMRES<LA::MPI::Vector> step_5_gmres_4(step_5_gmres_control_4);
+        try {
+            TimerOutput::Scope t(timer, "actual inverse 5.3");
+            pcout << "SOLVE TEST" << std::endl;
+            dst_temp.block(SolutionBlocks::density) = 0.;
+            step_5_gmres_4.solve(k_inv_mat,dst_temp.block(SolutionBlocks::density), g_d_m_inv_density , PreconditionIdentity());
+        } catch (std::exception &exc)
         {
-            TimerOutput::Scope t(timer, "part 3");
-            vmult_step_3(dst, temp_src);
-            temp_src = dst;
+            pcout << "Failure of linear solver step_5_gmres_4" << std::endl;
+            pcout << "first residual: " << step_5_gmres_control_4.initial_value() << std::endl;
+            pcout << "last residual: " << step_5_gmres_control_4.last_value() << std::endl;
+            //                    throw;
         }
+        auto history = step_5_gmres_control_4.get_history_data();
+        for (int i=0; i< step_5_gmres_control_4.last_step()+1; ++i)
         {
-            TimerOutput::Scope t(timer, "part 4");
-            vmult_step_4(dst, temp_src);
-            temp_src = dst;
+            pcout << i << "   " << history[i]/step_5_gmres_control_4.initial_value() << std::endl;
         }
-        vmult_step_5(dst, temp_src);
-    }
-
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::Tvmult(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        dst = src;
-    }
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::vmult_add(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        BlockVector<double> dst_temp = dst;
-        vmult(dst_temp, src);
-        dst += dst_temp;
+        
     }
+    dst.block(SolutionBlocks::total_volume_multiplier) = transpose_operator<VectorType, VectorType, PayloadType>(m_vect)*k_g_d_m_inv_density
+            - transpose_operator<VectorType, VectorType, PayloadType>(m_vect)*k_density_mult
+            +dst_temp.block(SolutionBlocks::total_volume_multiplier);
+    
+}
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::Tvmult_add(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        dst = src;
+/// Step 5, described by the author as the only non-triangular vmult step: applies inverses down the block diagonal, one scoped section per block group.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::vmult_step_5(LA::MPI::BlockVector &dst, const LA::MPI::BlockVector &src) const 
+{
+    {
+        // First block inverse: the slack and slack-multiplier blocks, built from d_3_mat, d_4_mat and d_m_inv_mat.
+        TimerOutput::Scope t(timer, "inverse 1");
+        dst.block(SolutionBlocks::density_lower_slack_multiplier) = linear_operator<VectorType,VectorType,PayloadType>(d_3_mat) * src.block(SolutionBlocks::density_lower_slack_multiplier) +
+                linear_operator<VectorType,VectorType,PayloadType>(d_m_inv_mat) * src.block(SolutionBlocks::density_lower_slack);
+        dst.block(SolutionBlocks::density_upper_slack_multiplier) = linear_operator<VectorType,VectorType,PayloadType>(d_4_mat) * src.block(SolutionBlocks::density_upper_slack_multiplier) +
+                linear_operator<VectorType,VectorType,PayloadType>(d_m_inv_mat) * src.block(SolutionBlocks::density_upper_slack);
+        dst.block(SolutionBlocks::density_lower_slack) = linear_operator<VectorType,VectorType,PayloadType>(d_m_inv_mat) * src.block(SolutionBlocks::density_lower_slack_multiplier);
+        dst.block(SolutionBlocks::density_upper_slack) = linear_operator<VectorType,VectorType,PayloadType>(d_m_inv_mat) * src.block(SolutionBlocks::density_upper_slack_multiplier);
     }
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::vmult_step_1(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        dst = src;
-        dst.block(SolutionBlocks::unfiltered_density) += -1 * linear_operator(d_5_mat)*src.block(SolutionBlocks::density_lower_slack_multiplier) +
-                linear_operator(d_6_mat) * src.block(SolutionBlocks::density_upper_slack_multiplier) + src.block(SolutionBlocks::density_lower_slack)
-                - src.block(SolutionBlocks::density_upper_slack);
+    {
+        // Second block inverse: unfiltered_density is d_8_mat applied to the same block of src.
+        TimerOutput::Scope t(timer, "inverse 2");
+        dst.block(SolutionBlocks::unfiltered_density) =
+                linear_operator<VectorType,VectorType,PayloadType>(d_8_mat) * src.block(SolutionBlocks::unfiltered_density);
     }
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::vmult_step_2(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        dst = src;
-        dst.block(SolutionBlocks::unfiltered_density_multiplier) += -1 * linear_operator(f_mat) * linear_operator(d_8_mat) * src.block(SolutionBlocks::unfiltered_density);
-    }
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::vmult_step_3(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        dst = src;
-        if (Input::solver_choice == SolverOptions::inexact_K_with_inexact_A_gmres)
+    {
+        // Third block inverse: displacement and displacement_multiplier; each is computed from the other's src block.
+        TimerOutput::Scope t(timer, "inverse 3");
+        if (Input::solver_choice==SolverOptions::inexact_K_with_inexact_A_gmres)
         {
-            PreconditionSSOR<SparseMatrix<double>> preconditioner;
-            preconditioner.initialize(a_mat, 1.2);
-            SolverControl            solver_control(1000, 1e-12);
-            SolverCG<Vector<double>> a_solver_cg(solver_control);
-            auto a_inv_op = inverse_operator(linear_operator(a_mat),a_solver_cg,preconditioner);
-            dst.block(SolutionBlocks::density)+= -1 * transpose_operator(linear_operator(e_mat)) * a_inv_op * src.block(SolutionBlocks::displacement)
-                                                 - transpose_operator(linear_operator(c_mat)) * a_inv_op * src.block(SolutionBlocks::displacement_multiplier);
+            LA::MPI::BlockVector dst_temp = dst;
+            // dst_temp receives the raw a_inv_mf_gmg results before they are scaled into dst.
+            //                SolverControl            solver_control(100000, 1e-6);
+            //                SolverCG<LA::MPI::Vector> a_solver_cg(solver_control);
+
+            //                auto a_inv_op = inverse_operator(linear_operator<VectorType,VectorType,PayloadType>(a_mat),a_solver_cg, pre_amg);
+
+            //                dst.block(SolutionBlocks::displacement) = a_inv_op * src.block(SolutionBlocks::displacement_multiplier);
+            //                dst.block(SolutionBlocks::displacement_multiplier) = a_inv_op * src.block(SolutionBlocks::displacement);
+            // Tolerance 0 with 100 iterations is used for these two applications; the Input:: settings are restored afterwards.
+            a_inv_mf_gmg.set_tol(0);
+            a_inv_mf_gmg.set_iter(100);
+            a_inv_mf_gmg.vmult( dst_temp.block(SolutionBlocks::displacement), src.block(SolutionBlocks::displacement_multiplier));
+            a_inv_mf_gmg.vmult( dst_temp.block(SolutionBlocks::displacement_multiplier), src.block(SolutionBlocks::displacement));
+            a_inv_mf_gmg.set_tol(Input::a_rel_tol);
+            a_inv_mf_gmg.set_iter(Input::a_inv_iterations);
+            // The a_inv_mf_gmg results are stored with a factor of -1; the direct branch below stores a_inv_direct's output unscaled.
+            dst.block(SolutionBlocks::displacement) = -1 * dst_temp.block(SolutionBlocks::displacement);
+            dst.block(SolutionBlocks::displacement_multiplier) = -1 * dst_temp.block(SolutionBlocks::displacement_multiplier);
         }
         else
         {
-            dst.block(SolutionBlocks::density)+= -1 * transpose_operator(linear_operator(e_mat)) * linear_operator(a_inv_direct) * src.block(SolutionBlocks::displacement)
-                                                 - transpose_operator(linear_operator(c_mat)) * linear_operator(a_inv_direct) * src.block(SolutionBlocks::displacement_multiplier);
+            a_inv_direct.vmult( dst.block(SolutionBlocks::displacement), src.block(SolutionBlocks::displacement_multiplier));
+            a_inv_direct.vmult( dst.block(SolutionBlocks::displacement_multiplier), src.block(SolutionBlocks::displacement));
         }
 
-    }
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::vmult_step_4(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        dst = src;
-        Vector<double> k_density_mult;
-        k_density_mult.reinit(src.block(SolutionBlocks::density).size());
+    }
+    {
+        // Fourth (ugly) block inverse: density and unfiltered_density_multiplier via FGMRES solves with k_inv_mat and j_inv_mat.
+        TimerOutput::Scope t(timer, "inverse 4"); // NOTE(review): the exact_preconditioner_with_gmres branch below holds only commented-out code, so this function assigns neither block in that case.
 
 
 
         if (Input::solver_choice == SolverOptions::exact_preconditioner_with_gmres)
         {
-            g_d_m_inv_density = linear_operator(g_mat) * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density);
-            k_g_d_m_inv_density = linear_operator(k_mat) * g_d_m_inv_density;
-            k_density_mult = linear_operator(k_mat) * src.block(SolutionBlocks::unfiltered_density_multiplier);
+            //                pre_j = src.block(SolutionBlocks::density) + linear_operator<VectorType,VectorType,PayloadType>(h_mat) * linear_operator<VectorType,VectorType,PayloadType>(d_m_inv_mat) * src.block(SolutionBlocks::unfiltered_density_multiplier);
+            //                pre_k = -1* linear_operator<VectorType,VectorType,PayloadType>(g_mat) * linear_operator<VectorType,VectorType,PayloadType>(d_m_inv_mat) * src.block(SolutionBlocks::density) + src.block(SolutionBlocks::unfiltered_density_multiplier);
+            //                dst.block(SolutionBlocks::unfiltered_density_multiplier) = transpose_operator<VectorType, VectorType, PayloadType>(k_mat) * pre_j;
+            //                dst.block(SolutionBlocks::density) = linear_operator<VectorType,VectorType,PayloadType>(k_mat) * pre_k;
         }
 
-        else if (Input::solver_choice == SolverOptions::inexact_K_with_exact_A_gmres)
+        else if (Input::solver_choice == SolverOptions::inexact_K_with_inexact_A_gmres)
         {
-            auto op_g = linear_operator(f_mat) * linear_operator(d_8_mat) *
-                    transpose_operator(linear_operator(f_mat));
-
-            auto op_h = linear_operator(b_mat)
-                   - transpose_operator(linear_operator(c_mat)) * linear_operator(a_inv_direct) * linear_operator(e_mat)
-                   - transpose_operator(linear_operator(e_mat)) * linear_operator(a_inv_direct) * linear_operator(c_mat);
 
-            auto op_k_inv = -1 * op_g * linear_operator(d_m_inv_mat) * op_h - linear_operator(d_m_mat);
+            // TrilinosWrappers::PreconditionIdentity preconditioner;
+            // preconditioner.initialize(b_mat);
+            auto pre_pre_k = pre_k;
+            auto pre_pre_pre_k = pre_k;
+            auto d_m_inv_unfil_density_mult = pre_k;
+            auto h_d_m_inv_unfil_density_mult = pre_k;
 
-            g_d_m_inv_density = op_g * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density);
-
-            SolverControl step_4_gmres_control_1 (10000, g_d_m_inv_density.l2_norm()*1e-6);
-            SolverGMRES<Vector<double>> step_4_gmres_1 (step_4_gmres_control_1);
+            {
+                TimerOutput::Scope t(timer, "not inverse 5.1");
+                d_m_inv_mat.vmult(d_m_inv_unfil_density_mult, src.block(SolutionBlocks::unfiltered_density_multiplier));
+                h_mat.vmult(h_d_m_inv_unfil_density_mult,d_m_inv_unfil_density_mult);
+                pre_j = src.block(SolutionBlocks::density) + h_d_m_inv_unfil_density_mult;
+                d_m_inv_mat.vmult(pre_pre_pre_k,src.block(SolutionBlocks::density));
+                g_mat.vmult(pre_pre_k,pre_pre_pre_k);
+                pre_k =  -1 * pre_pre_k + src.block(SolutionBlocks::unfiltered_density_multiplier);
+            }
+            SolverControl step_5_gmres_control_1 (Input::k_inv_iterations, Input::k_rel_tol*pre_j.l2_norm());
+            SolverFGMRES<LA::MPI::Vector> step_5_gmres_1 (step_5_gmres_control_1);
             try {
-                k_g_d_m_inv_density = inverse_operator(op_k_inv, step_4_gmres_1, PreconditionIdentity()) *
-                                      g_d_m_inv_density;
+                TimerOutput::Scope t(timer, "actual inverse 5.1");
+                dst.block(SolutionBlocks::unfiltered_density_multiplier) = 0.;
+                step_5_gmres_1.solve(j_inv_mat, dst.block(SolutionBlocks::unfiltered_density_multiplier), pre_j , PreconditionIdentity());
             } catch (std::exception &exc)
             {
-                std::cerr << "Failure of linear solver step_4_gmres_1" << std::endl;
-                std::cout << "first residual: " << step_4_gmres_control_1.initial_value() << std::endl;
-                std::cout << "last residual: " << step_4_gmres_control_1.last_value() << std::endl;
-                throw;
+                pcout << "Failure of linear solver 5-1 with convergence of " << step_5_gmres_control_1.last_value()/step_5_gmres_control_1.initial_value()<< std::endl;
+                //                    throw;
             }
 
-            SolverControl step_4_gmres_control_2 (10000, src.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm()*1e-6);
-            SolverGMRES<Vector<double>> step_4_gmres_2 (step_4_gmres_control_2);
+            // Second solve: the density block from k_inv_mat with right-hand side pre_k.
+            SolverControl step_5_gmres_control_2 (Input::k_inv_iterations, Input::k_rel_tol*pre_k.l2_norm());
+            SolverFGMRES<LA::MPI::Vector> step_5_gmres_2 (step_5_gmres_control_2);
             try {
-                k_density_mult = inverse_operator(op_k_inv,step_4_gmres_2, PreconditionIdentity()) *
-                                 src.block(SolutionBlocks::unfiltered_density_multiplier);
+                TimerOutput::Scope t(timer, "actual inverse 5.2");
+                dst.block(SolutionBlocks::density) = 0.;
+                step_5_gmres_2.solve(k_inv_mat,dst.block(SolutionBlocks::density), pre_k , PreconditionIdentity());
             } catch (std::exception &exc)
             {
-                std::cerr << "Failure of linear solver step_4_gmres_2" << std::endl;
-                std::cout << "first residual: " << step_4_gmres_control_2.initial_value() << std::endl;
-                std::cout << "last residual: " << step_4_gmres_control_2.last_value() << std::endl;
-                throw;
+                pcout << "Failure of linear solver 5-2 with convergence of " << step_5_gmres_control_2.last_value()/step_5_gmres_control_2.initial_value()<< std::endl;
+                //                    throw;
             }
         }
-        else if (Input::solver_choice == SolverOptions::inexact_K_with_inexact_A_gmres)
+        else if (Input::solver_choice == SolverOptions::inexact_K_with_exact_A_gmres)
         {
-            PreconditionSSOR<SparseMatrix<double>> preconditioner;
-            preconditioner.initialize(a_mat, 1.2);
-            SolverControl            solver_control(1000, 1e-12);
-            SolverCG<Vector<double>> a_solver_cg(solver_control);
-            auto a_inv_op = inverse_operator(linear_operator(a_mat),a_solver_cg,preconditioner);
 
-            auto op_g = linear_operator(f_mat) * linear_operator(d_8_mat) *
-                        transpose_operator(linear_operator(f_mat));
+            // TrilinosWrappers::PreconditionIdentity preconditioner;
+            // preconditioner.initialize(b_mat);
+            auto pre_pre_k = pre_k;
+            auto pre_pre_pre_k = pre_k;
+            auto d_m_inv_unfil_density_mult = pre_k;
+            auto h_d_m_inv_unfil_density_mult = pre_k;
 
-            auto op_h = linear_operator(b_mat)
-                        - transpose_operator(linear_operator(c_mat)) * a_inv_op * linear_operator(e_mat)
-                        - transpose_operator(linear_operator(e_mat)) * a_inv_op * linear_operator(c_mat);
-
-            auto op_k_inv = -1 * op_g * linear_operator(d_m_inv_mat) * op_h - linear_operator(d_m_mat);
-
-            g_d_m_inv_density = op_g * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density);
-
-            SolverControl step_4_gmres_control_1 (10000, g_d_m_inv_density.l2_norm()*1e-6);
-            SolverGMRES<Vector<double>> step_4_gmres_1 (step_4_gmres_control_1);
+            {
+                TimerOutput::Scope t(timer, "not inverse 5.1");
+                d_m_inv_mat.vmult(d_m_inv_unfil_density_mult, src.block(SolutionBlocks::unfiltered_density_multiplier));
+                h_mat.vmult(h_d_m_inv_unfil_density_mult,d_m_inv_unfil_density_mult);
+                pre_j = src.block(SolutionBlocks::density) + h_d_m_inv_unfil_density_mult;
+                d_m_inv_mat.vmult(pre_pre_pre_k,src.block(SolutionBlocks::density));
+                g_mat.vmult(pre_pre_k,pre_pre_pre_k);
+                pre_k =  -1 * pre_pre_k + src.block(SolutionBlocks::unfiltered_density_multiplier);
+            }
+            SolverControl step_5_gmres_control_1 (Input::k_inv_iterations, Input::k_rel_tol*pre_j.l2_norm());
+            SolverFGMRES<LA::MPI::Vector> step_5_gmres_1 (step_5_gmres_control_1);
             try {
-                k_g_d_m_inv_density = inverse_operator(op_k_inv, step_4_gmres_1, PreconditionIdentity()) *
-                                      g_d_m_inv_density;
+                TimerOutput::Scope t(timer, "actual inverse 5.1");
+                dst.block(SolutionBlocks::unfiltered_density_multiplier) = 0.;
+                pcout << "SOLVE 3" << std::endl;
+                step_5_gmres_1.solve(j_inv_mat, dst.block(SolutionBlocks::unfiltered_density_multiplier), pre_j , PreconditionIdentity());
             } catch (std::exception &exc)
             {
-                std::cerr << "Failure of linear solver step_4_gmres_1" << std::endl;
-                std::cout << "first residual: " << step_4_gmres_control_1.initial_value() << std::endl;
-                std::cout << "last residual: " << step_4_gmres_control_1.last_value() << std::endl;
-                throw;
+                pcout << "Failure of linear solver step_5_gmres_1" << std::endl;
+                pcout << "first residual: " << step_5_gmres_control_1.initial_value() << std::endl;
+                pcout << "last residual: " << step_5_gmres_control_1.last_value() << std::endl;
+                //                    throw;
             }
 
-            SolverControl step_4_gmres_control_2 (10000, src.block(SolutionBlocks::unfiltered_density_multiplier).l2_norm()*1e-6);
-            SolverGMRES<Vector<double>> step_4_gmres_2 (step_4_gmres_control_2);
+            // Second solve: the density block from k_inv_mat with right-hand side pre_k.
+            SolverControl step_5_gmres_control_2 (Input::k_inv_iterations, Input::k_rel_tol*pre_k.l2_norm());
+            SolverFGMRES<LA::MPI::Vector> step_5_gmres_2 (step_5_gmres_control_2);
             try {
-                k_density_mult = inverse_operator(op_k_inv,step_4_gmres_2, PreconditionIdentity()) *
-                                 src.block(SolutionBlocks::unfiltered_density_multiplier);
+                TimerOutput::Scope t(timer, "actual inverse 5.2");
+                dst.block(SolutionBlocks::density) = 0.;
+                pcout << "SOLVE 4" << std::endl;
+                step_5_gmres_2.solve(k_inv_mat,dst.block(SolutionBlocks::density), pre_k , PreconditionIdentity());
             } catch (std::exception &exc)
             {
-                std::cerr << "Failure of linear solver step_4_gmres_2" << std::endl;
-                std::cout << "first residual: " << step_4_gmres_control_2.initial_value() << std::endl;
-                std::cout << "last residual: " << step_4_gmres_control_2.last_value() << std::endl;
-                throw;
+                pcout << "Failure of linear solver step_5_gmres_2" << std::endl;
+                pcout << "first residual: " << step_5_gmres_control_2.initial_value() << std::endl;
+                pcout << "last residual: " << step_5_gmres_control_2.last_value() << std::endl;
+                //                    throw;
             }
         }
         else
         {
-            std::cout << "shouldn't get here";
+            pcout << "shouldn't get here"; // NOTE(review): the bare `throw;` that follows has no active exception to rethrow, so it calls std::terminate; consider throwing a concrete exception.
             throw;
         }
 
+    }
+    {
+        // Fifth block: total_volume_multiplier is copied from src unchanged.
+        dst.block(SolutionBlocks::total_volume_multiplier) = src.block(SolutionBlocks::total_volume_multiplier);
 
-        dst.block(SolutionBlocks::total_volume_multiplier) += transpose_operator(linear_operator(m_vect))*k_g_d_m_inv_density;
-        dst.block(SolutionBlocks::total_volume_multiplier) -= transpose_operator(linear_operator(m_vect))*k_density_mult;
 
     }
+    
+}
 
+/// Debugging hook with an empty body; per the original author it was formerly used to output parts of the preconditioner.
+template<int dim>
+void TopOptSchurPreconditioner<dim>::print_stuff()
+{
 
 
+}
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::vmult_step_5(BlockVector<double> &dst, const BlockVector<double> &src) const {
-        {
-            //First Block Inverse
-            TimerOutput::Scope t(timer, "inverse 1");
-            dst.block(SolutionBlocks::density_lower_slack_multiplier) = linear_operator(d_3_mat) * src.block(SolutionBlocks::density_lower_slack_multiplier) +
-                    linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density_lower_slack);
-            dst.block(SolutionBlocks::density_upper_slack_multiplier) = linear_operator(d_4_mat) * src.block(SolutionBlocks::density_upper_slack_multiplier) +
-                    linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density_upper_slack);
-            dst.block(SolutionBlocks::density_lower_slack) = linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density_lower_slack_multiplier);
-            dst.block(SolutionBlocks::density_upper_slack) = linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density_upper_slack_multiplier);
-        }
+//******************************* Direct Trilinos Solver ***********************************
 
+/// Constructor: forwards the solver control `cn` and the additional data `data` to the wrapped solver_direct member.
+VmultTrilinosSolverDirect::VmultTrilinosSolverDirect(SolverControl &cn,
+                                                     const TrilinosWrappers::SolverDirect::AdditionalData &data)
+    : solver_direct(cn, data)
+{
+   
+}
 
-        {
-            //Second Block Inverse
-            TimerOutput::Scope t(timer, "inverse 2");
-            dst.block(SolutionBlocks::unfiltered_density) =
-                    linear_operator(d_8_mat) * src.block(SolutionBlocks::unfiltered_density);
-        }
+/// Initializes the direct solver for `a_mat`. Author's note: works well up to a point of refinement, and then refuses to solve.
+void VmultTrilinosSolverDirect::initialize(LA::MPI::SparseMatrix &a_mat)
+{
+    reinit(a_mat); // reinit is not defined in this view (presumably inherited - confirm)
+    solver_direct.initialize(a_mat); // hand the matrix to the wrapped direct solver
+    size = a_mat.n(); // record the matrix dimension returned by n()
+}
 
+/// Exposes the direct solve as a vmult: dst receives the result of solver_direct.solve(dst, src). Overload for LinearAlgebra::distributed::Vector<double>.
+void
+VmultTrilinosSolverDirect::vmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const
+{
+    solver_direct.solve(dst, src);
+}
 
-        {
-            //Third Block Inverse
-            TimerOutput::Scope t(timer, "inverse 3");
-            if(Input::solver_choice == SolverOptions::inexact_K_with_inexact_A_gmres)
-            {
-                PreconditionSSOR<SparseMatrix<double>> preconditioner;
-                preconditioner.initialize(a_mat, 1.2);
-                SolverControl            solver_control(1000, 1e-12);
-                SolverCG<Vector<double>> a_solver_cg(solver_control);
-                auto a_inv_op = inverse_operator(linear_operator(a_mat),a_solver_cg,preconditioner);
-                dst.block(SolutionBlocks::displacement) = a_inv_op * src.block(SolutionBlocks::displacement_multiplier);
-                dst.block(SolutionBlocks::displacement_multiplier) = a_inv_op * src.block(SolutionBlocks::displacement);
-            } else
-            {
-                dst.block(SolutionBlocks::displacement) = linear_operator(a_inv_direct) * src.block(SolutionBlocks::displacement_multiplier);
-                dst.block(SolutionBlocks::displacement_multiplier) = linear_operator(a_inv_direct) * src.block(SolutionBlocks::displacement);
-            }
+/// Exposes the direct solve as a vmult: dst receives the result of solver_direct.solve(dst, src). Overload for LA::MPI::Vector.
+void VmultTrilinosSolverDirect::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    solver_direct.solve(dst, src);
+}
 
-        }
+/// Transpose application; performs the same solve as vmult (the author notes the matrix is symmetric). Overload for LinearAlgebra::distributed::Vector<double>.
+void
+VmultTrilinosSolverDirect::Tvmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const
+{
+    solver_direct.solve(dst, src);
+}
 
+/// Transpose application; performs the same solve as vmult (the author notes the matrix is symmetric). Overload for LA::MPI::Vector.
+void VmultTrilinosSolverDirect::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    solver_direct.solve(dst, src);
+}
 
-        {
-            //Fourth (ugly) Block Inverse
-            TimerOutput::Scope t(timer, "inverse 4");
 
 
+// **************** A inv MF GMG **********************
 
-            if (Input::solver_choice == SolverOptions::exact_preconditioner_with_gmres)
-            {
-                pre_j = src.block(SolutionBlocks::density) + linear_operator(h_mat) * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::unfiltered_density_multiplier);
-                pre_k = -1* linear_operator(g_mat) * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density) + src.block(SolutionBlocks::unfiltered_density_multiplier);
-                dst.block(SolutionBlocks::unfiltered_density_multiplier) = transpose_operator(linear_operator(k_mat)) * pre_j;
-                dst.block(SolutionBlocks::density) = linear_operator(k_mat) * pre_k;
-            }
+/// Constructs the object that performs the A-inverse operation using matrix-free GMG: stores the operator, preconditioner, matrix and dof-index map, then sizes the two work vectors.
+template<int dim>
+AInvMatMFGMG<dim>::AInvMatMFGMG(MF_Elasticity_Operator<dim,1,double> &mf_elasticity_operator_in , PreconditionMG<dim, LinearAlgebra::distributed::Vector<double>, MGTransferMatrixFree<dim, double> > &mf_gmg_preconditioner_in, LA::MPI::SparseMatrix &a_mat, std::map<types::global_dof_index,types::global_dof_index> &displacement_to_system_dof_index_map_in)
+    : mf_elasticity_operator(mf_elasticity_operator_in),
+      mf_gmg_preconditioner(mf_gmg_preconditioner_in),
+      a_mat_wrapped(a_mat),
+      displacement_to_system_dof_index_map(displacement_to_system_dof_index_map_in)
 
-            else if (Input::solver_choice == SolverOptions::inexact_K_with_exact_A_gmres)
-            {
-                auto op_g = linear_operator(f_mat) * linear_operator(d_8_mat) *
-                            transpose_operator(linear_operator(f_mat));
+{
+    mf_elasticity_operator.initialize_dof_vector(temp_dst); // work vectors are laid out by the matrix-free operator
+    mf_elasticity_operator.initialize_dof_vector(temp_src);
+}
 
-                auto op_h = linear_operator(b_mat)
-                            - transpose_operator(linear_operator(c_mat)) * linear_operator(a_inv_direct) * linear_operator(e_mat)
-                            - transpose_operator(linear_operator(e_mat)) * linear_operator(a_inv_direct) * linear_operator(c_mat);
+///Applies an approximate inverse of A: a CG solve with mf_elasticity_operator, preconditioned by mf_gmg_preconditioner, whose result is copied into dst.
+template<int dim>
+void AInvMatMFGMG<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
 
-                auto op_k_inv = -1 * op_g * linear_operator(d_m_inv_mat) * op_h - linear_operator(d_m_mat);
+    SolverControl            solver_control(iterations, src.l2_norm()*tolerance); // iteration cap `iterations`; tolerance scaled by the norm of src
+    SolverCG<LinearAlgebra::distributed::Vector<double>> a_solver_cg(solver_control);
 
-                pre_j = src.block(SolutionBlocks::density) + op_h * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::unfiltered_density_multiplier);
-                pre_k = -1* op_g * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density) + src.block(SolutionBlocks::unfiltered_density_multiplier);
+    ChangeVectorTypes::copy_from_system_to_displacement_vector<double>(temp_src, src, displacement_to_system_dof_index_map); // fill temp_src from src using the dof index map
+    try{
+        temp_dst = 0.; // start the CG iteration from a zero initial guess
+        a_solver_cg.solve(mf_elasticity_operator,temp_dst,temp_src, mf_gmg_preconditioner);
+    }
+    catch (std::exception &exc)
+    {
+        // Exceptions thrown by the solve are swallowed here; temp_dst is used as-is below. Debug aid: std::cout << "failed with a reduction of: " << solver_control.initial_value()/solver_control.last_value() << std::endl;
+    }
 
-                SolverControl step_5_gmres_control_1 (10000, pre_j.l2_norm()*1e-6);
-                SolverGMRES<Vector<double>> step_5_gmres_1 (step_5_gmres_control_1);
-                try {
-                    dst.block(SolutionBlocks::unfiltered_density_multiplier) = inverse_operator(transpose_operator(op_k_inv), step_5_gmres_1, PreconditionIdentity()) *
-                                          pre_j;
-                } catch (std::exception &exc)
-                {
-                    std::cerr << "Failure of linear solver step_5_gmres_1" << std::endl;
-                    std::cout << "first residual: " << step_5_gmres_control_1.initial_value() << std::endl;
-                    std::cout << "last residual: " << step_5_gmres_control_1.last_value() << std::endl;
-                    throw;
-                }
+    ChangeVectorTypes::copy_from_displacement_to_system_vector<double>(dst,temp_dst, displacement_to_system_dof_index_map); // write the solve result back into dst
+    dst.compress(VectorOperation::insert); // finalize the element-wise writes into dst
 
-                SolverControl step_5_gmres_control_2 (10000, pre_k.l2_norm()*1e-6);
-                SolverGMRES<Vector<double>> step_5_gmres_2 (step_5_gmres_control_2);
-                try {
-                    dst.block(SolutionBlocks::density) = inverse_operator(op_k_inv, step_5_gmres_2, PreconditionIdentity()) *
-                                                                               pre_k;
-                } catch (std::exception &exc)
-                {
-                    std::cerr << "Failure of linear solver step_5_gmres_2" << std::endl;
-                    std::cout << "first residual: " << step_5_gmres_control_2.initial_value() << std::endl;
-                    std::cout << "last residual: " << step_5_gmres_control_2.last_value() << std::endl;
-                    throw;
-                }
-            }
-            else if (Input::solver_choice == SolverOptions::inexact_K_with_inexact_A_gmres)
-            {
-                PreconditionSSOR<SparseMatrix<double>> preconditioner;
-                preconditioner.initialize(a_mat, 1.2);
-                SolverControl            solver_control(1000, 1e-12);
-                SolverCG<Vector<double>> a_solver_cg(solver_control);
-                auto a_inv_op = inverse_operator(linear_operator(a_mat),a_solver_cg,preconditioner);
-
-                auto op_g = linear_operator(f_mat) * linear_operator(d_8_mat) *
-                            transpose_operator(linear_operator(f_mat));
-
-                auto op_h = linear_operator(b_mat)
-                            - transpose_operator(linear_operator(c_mat)) * a_inv_op * linear_operator(e_mat)
-                            - transpose_operator(linear_operator(e_mat)) * a_inv_op * linear_operator(c_mat);
-
-                auto op_k_inv = -1 * op_g * linear_operator(d_m_inv_mat) * op_h - linear_operator(d_m_mat);
-
-                pre_j = src.block(SolutionBlocks::density) + op_h * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::unfiltered_density_multiplier);
-                pre_k = -1* op_g * linear_operator(d_m_inv_mat) * src.block(SolutionBlocks::density) + src.block(SolutionBlocks::unfiltered_density_multiplier);
-
-                SolverControl step_5_gmres_control_1 (10000, pre_j.l2_norm()*1e-6);
-                SolverGMRES<Vector<double>> step_5_gmres_1 (step_5_gmres_control_1);
-                try {
-                    dst.block(SolutionBlocks::unfiltered_density_multiplier) = inverse_operator(transpose_operator(op_k_inv), step_5_gmres_1, PreconditionIdentity()) *
-                                                                               pre_j;
-                } catch (std::exception &exc)
-                {
-                    std::cerr << "Failure of linear solver step_5_gmres_1" << std::endl;
-                    std::cout << "first residual: " << step_5_gmres_control_1.initial_value() << std::endl;
-                    std::cout << "last residual: " << step_5_gmres_control_1.last_value() << std::endl;
-                    throw;
-                }
+}
 
-                SolverControl step_5_gmres_control_2 (10000, pre_k.l2_norm()*1e-6);
-                SolverGMRES<Vector<double>> step_5_gmres_2 (step_5_gmres_control_2);
-                try {
-                    dst.block(SolutionBlocks::density) = inverse_operator(op_k_inv, step_5_gmres_2, PreconditionIdentity()) *
-                                                         pre_k;
-                } catch (std::exception &exc)
-                {
-                    std::cerr << "Failure of linear solver step_5_gmres_2" << std::endl;
-                    std::cout << "first residual: " << step_5_gmres_control_2.initial_value() << std::endl;
-                    std::cout << "last residual: " << step_5_gmres_control_2.last_value() << std::endl;
-                    throw;
-                }
-            }
-            else
-            {
-                std::cout << "shouldn't get here";
-                throw;
-            }
+///Performs the transposed A inverse operation. A is symmetric, so this forwards to vmult().
+template<int dim>
+void AInvMatMFGMG<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    // dst: receives the approximate solution of A*dst = src.
+    // src: right-hand side, given as an LA::MPI::Vector.
+    // Forwarding keeps both entry points consistent. The former stand-alone copy of the
+    // CG solve let solver exceptions escape although vmult() swallows them, and it
+    // skipped the dst.compress(VectorOperation::insert) that vmult() performs after
+    // copying the displacement result into dst.
+    vmult(dst, src);
+}
+///Overrides the tolerance factor; the CG stopping tolerance is src.l2_norm() times this value.
+template<int dim>
+void AInvMatMFGMG<dim>::set_tol(double tol_in)
+{
+    this->tolerance = tol_in;
+}
+
+///Overrides the iteration cap that is handed to SolverControl for the CG solve.
+template<int dim>
+void AInvMatMFGMG<dim>::set_iter(unsigned int iterations_in)
+{
+    this->iterations = iterations_in;
+}
+
+
+// ******************     GMATRIX     ***********************
+/// Builds the G operator from the three matrices that vmult() applies in the order f_t_mat, d_8_mat, f_mat.
+GMatrix::GMatrix(const LA::MPI::SparseMatrix &f_mat_in, const LA::MPI::SparseMatrix &f_t_mat_in, LA::MPI::SparseMatrix &d_8_mat_in)
+    :
+      f_mat(f_mat_in), // applied last in vmult()
+      f_t_mat(f_t_mat_in), // applied first in vmult(); presumably the transpose of f_mat - TODO confirm
+      d_8_mat(d_8_mat_in) // applied between the two
+{
+    // Nothing else to do here; the scratch vectors are set up in initialize().
+}
+/// Copies exemplar_density_vector into both scratch vectors, zeroes them, and copies d_m_inv_mat_in into d_m_inv_mat.
+void
+GMatrix::initialize(LA::MPI::Vector &exemplar_density_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in)
+{
+    // Each scratch vector is first copied from the exemplar and then cleared.
+    temp_vect_1 = exemplar_density_vector;
+    temp_vect_1 = 0.;
+    temp_vect_2 = exemplar_density_vector;
+    temp_vect_2 = 0.;
+    d_m_inv_mat.copy_from(d_m_inv_mat_in);
+}
+
+/// Computes dst = f_mat * d_8_mat * f_t_mat * src, using the two scratch vectors for the intermediate products.
+void GMatrix::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    temp_vect_1 = 0.;
+    temp_vect_2 = 0.;
+    dst = 0.;
+    f_t_mat.vmult(temp_vect_1,src); // temp_vect_1 = f_t_mat * src
+    d_8_mat.vmult(temp_vect_2, temp_vect_1); // temp_vect_2 = d_8_mat * temp_vect_1
+    f_mat.vmult(dst,temp_vect_2); // dst = f_mat * temp_vect_2
+}
+
+/// Computes dst = (f_mat * d_8_mat * f_t_mat)^T * src, the exact transpose of vmult(): the factors are applied
+/// in reverse order, each transposed. (The former code applied f_t_mat^T, d_8_mat, f_mat, which is not that transpose.)
+void GMatrix::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    temp_vect_1 = 0.;
+    temp_vect_2 = 0.;
+    dst = 0.;
+    f_mat.Tvmult(temp_vect_1,src); // temp_vect_1 = f_mat^T * src
+    d_8_mat.Tvmult(temp_vect_2, temp_vect_1); // temp_vect_2 = d_8_mat^T * temp_vect_1
+    f_t_mat.Tvmult(dst,temp_vect_2); // dst = f_t_mat^T * temp_vect_2
+}
+
+
+// ******************     HMatrix     ***********************
+/// Builds the H operator from the system matrices and the two A-inverse operators that vmult()/Tvmult() choose between.
+template<int dim>
+HMatrix<dim>::HMatrix(LA::MPI::SparseMatrix &a_mat_in, const LA::MPI::SparseMatrix &b_mat_in, const LA::MPI::SparseMatrix &c_mat_in, const LA::MPI::SparseMatrix &e_mat_in,TrilinosWrappers::PreconditionAMG &pre_amg_in,VmultTrilinosSolverDirect &a_inv_direct_in, AInvMatMFGMG<dim> &a_inv_mf_gmg_in)
+    :
+      a_mat(a_mat_in), // not referenced by the vmult()/Tvmult() bodies in this file
+      b_mat(b_mat_in),
+      c_mat(c_mat_in),
+      e_mat(e_mat_in),
+      pre_amg(pre_amg_in), // not referenced by the vmult()/Tvmult() bodies in this file
+      a_inv_direct(a_inv_direct_in), // A-inverse used when solver_choice is not inexact_K_with_inexact_A_gmres
+      a_inv_mf_gmg(a_inv_mf_gmg_in) // A-inverse used when solver_choice is inexact_K_with_inexact_A_gmres
+{
+    // Nothing else to do here; the scratch vectors are set up in initialize().
+}
+/// Copies the exemplar vectors into the seven scratch vectors, zeroes them, and copies d_m_inv_mat_in into d_m_inv_mat.
+template<int dim>
+void
+HMatrix<dim>::initialize(LA::MPI::Vector &exemplar_density_vector,  LA::MPI::Vector &exemplar_displacement_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in)
+{
+    // Scratch vectors 1-4 are copied from the displacement exemplar and then cleared.
+    temp_vect_1 = exemplar_displacement_vector;
+    temp_vect_1 = 0.;
+    temp_vect_2 = exemplar_displacement_vector;
+    temp_vect_2 = 0.;
+    temp_vect_3 = exemplar_displacement_vector;
+    temp_vect_3 = 0.;
+    temp_vect_4 = exemplar_displacement_vector;
+    temp_vect_4 = 0.;
+
+    // Scratch vectors 5-7 are copied from the density exemplar and then cleared.
+    temp_vect_5 = exemplar_density_vector;
+    temp_vect_5 = 0.;
+    temp_vect_6 = exemplar_density_vector;
+    temp_vect_6 = 0.;
+    temp_vect_7 = exemplar_density_vector;
+    temp_vect_7 = 0.;
+
+    d_m_inv_mat.copy_from(d_m_inv_mat_in);
+}
+/// Applies H to src: dst = b_mat*src combined with c_mat^T*Ainv*e_mat*src and e_mat^T*Ainv*c_mat*src (added in the first branch, subtracted in the second).
+template<int dim>
+void HMatrix<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    if (Input::solver_choice==SolverOptions::inexact_K_with_inexact_A_gmres)
+    {
+        c_mat.vmult(temp_vect_1,src); // temp_vect_1 = c_mat * src
+        e_mat.vmult(temp_vect_2,src); // temp_vect_2 = e_mat * src
+
+        try
+        {
+            a_inv_mf_gmg.vmult(temp_vect_3,temp_vect_1); // temp_vect_3 = Ainv * c_mat * src
+        } catch (std::exception &exc)
+        { // any exception from the A-inverse is ignored and temp_vect_3 is used as-is
 
         }
+        try
         {
-            dst.block(SolutionBlocks::total_volume_multiplier) = src.block(SolutionBlocks::total_volume_multiplier);
+            a_inv_mf_gmg.vmult(temp_vect_4,temp_vect_2); // temp_vect_4 = Ainv * e_mat * src
+        } catch (std::exception &exc)
+        {
+            // any exception from the A-inverse is ignored and temp_vect_4 is used as-is
         }
+
+        c_mat.Tvmult(temp_vect_6,temp_vect_4); // temp_vect_6 = c_mat^T * Ainv * e_mat * src
+        e_mat.Tvmult(temp_vect_5,temp_vect_3); // temp_vect_5 = e_mat^T * Ainv * c_mat * src
+
+        b_mat.vmult(temp_vect_7,src); // temp_vect_7 = b_mat * src
+        dst =  temp_vect_7 + temp_vect_6 + temp_vect_5; // NOTE(review): terms are added here but subtracted in the else branch - confirm the sign convention of a_inv_mf_gmg
     }
+    else
+    {
+        c_mat.vmult(temp_vect_1,src); // temp_vect_1 = c_mat * src
+        e_mat.vmult(temp_vect_2,src); // temp_vect_2 = e_mat * src
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::get_sparsity_pattern(BlockDynamicSparsityPattern &bdsp) {
-        mass_sparsity.copy_from(bdsp);
+        a_inv_direct.vmult(temp_vect_3,temp_vect_1); // temp_vect_3 = Ainv * c_mat * src, with the direct A-inverse
+        a_inv_direct.vmult(temp_vect_4,temp_vect_2); // temp_vect_4 = Ainv * e_mat * src
+
+        c_mat.Tvmult(temp_vect_6,temp_vect_4); // temp_vect_6 = c_mat^T * Ainv * e_mat * src
+        e_mat.Tvmult(temp_vect_5,temp_vect_3); // temp_vect_5 = e_mat^T * Ainv * c_mat * src
+
+        b_mat.vmult(temp_vect_7,src); // temp_vect_7 = b_mat * src
+        dst =  temp_vect_7 - temp_vect_6 - temp_vect_5;
     }
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::assemble_mass_matrix(const BlockVector<double> &state,
-                                                              const hp::FECollection<dim> &fe_collection,
-                                                              const DoFHandler<dim> &dof_handler,
-                                                              const AffineConstraints<double> &constraints,
-                                                              const BlockSparsityPattern &bsp) {
-        timer.reset();
-
-        approx_h_mat.reinit(bsp);
-
-        /*Remove any values from old iterations*/
-        QGauss<dim> nine_quadrature(fe_collection[0].degree + 1);
-        QGauss<dim> ten_quadrature(fe_collection[1].degree + 1);
-
-        hp::QCollection<dim> q_collection;
-        q_collection.push_back(nine_quadrature);
-        q_collection.push_back(ten_quadrature);
-
-        hp::FEValues<dim> hp_fe_values(fe_collection,
-                                       q_collection,
-                                       update_values | update_quadrature_points |
-                                       update_JxW_values | update_gradients);
-        FullMatrix<double> cell_matrix;
-        Vector<double>     cell_rhs;
-        std::vector<types::global_dof_index> local_dof_indices;
-
-        const FEValuesExtractors::Scalar densities(SolutionComponents::density<dim>);
-        const FEValuesExtractors::Vector displacements(SolutionComponents::displacement<dim>);
-        const FEValuesExtractors::Scalar unfiltered_densities(SolutionComponents::unfiltered_density<dim>);
-        const FEValuesExtractors::Vector displacement_multipliers(SolutionComponents::displacement_multiplier<dim>);
-        const FEValuesExtractors::Scalar unfiltered_density_multipliers(
-                SolutionComponents::unfiltered_density_multiplier<dim>);
-        const FEValuesExtractors::Scalar density_lower_slacks(SolutionComponents::density_lower_slack<dim>);
-        const FEValuesExtractors::Scalar density_lower_slack_multipliers(
-                SolutionComponents::density_lower_slack_multiplier<dim>);
-        const FEValuesExtractors::Scalar density_upper_slacks(SolutionComponents::density_upper_slack<dim>);
-        const FEValuesExtractors::Scalar density_upper_slack_multipliers(
-                SolutionComponents::density_upper_slack_multiplier<dim>);
-        const FEValuesExtractors::Scalar total_volume_multiplier(
-                SolutionComponents::total_volume_multiplier<dim>);
-
-        const Functions::ConstantFunction<dim> lambda(1.), mu(1.);
-
-        BlockVector<double> filtered_unfiltered_density_solution = state;
-        BlockVector<double> filter_adjoint_unfiltered_density_multiplier_solution = state;
-        filtered_unfiltered_density_solution.block(SolutionBlocks::unfiltered_density) = 0;
-        filter_adjoint_unfiltered_density_multiplier_solution.block(SolutionBlocks::unfiltered_density_multiplier) = 0;
-
-
-        for (const auto &cell : dof_handler.active_cell_iterators()) {
-            hp_fe_values.reinit(cell);
-            const FEValues<dim> &fe_values = hp_fe_values.get_present_fe_values();
-            cell_matrix.reinit(cell->get_fe().n_dofs_per_cell(),
-                               cell->get_fe().n_dofs_per_cell());
-            cell_rhs.reinit(cell->get_fe().n_dofs_per_cell());
-
-            const unsigned int n_q_points = fe_values.n_quadrature_points;
-
-            std::vector<double> old_density_values(n_q_points);
-            std::vector<double> old_displacement_divs(n_q_points);
-            std::vector<SymmetricTensor<2, dim>> old_displacement_symmgrads(
-                    n_q_points);
-            std::vector<double> old_displacement_multiplier_divs(n_q_points);
-            std::vector<SymmetricTensor<2, dim>> old_displacement_multiplier_symmgrads(
-                    n_q_points);
-            std::vector<double> lambda_values(n_q_points);
-            std::vector<double> mu_values(n_q_points);
-
-            const unsigned int dofs_per_cell = cell->get_fe().n_dofs_per_cell();
-
-            cell_matrix = 0;
-            cell_rhs = 0;
-            local_dof_indices.resize(cell->get_fe().n_dofs_per_cell());
-            cell->get_dof_indices(local_dof_indices);
-
-            lambda.value_list(fe_values.get_quadrature_points(), lambda_values);
-            mu.value_list(fe_values.get_quadrature_points(), mu_values);
-
-            fe_values[densities].get_function_values(state,
-                                                     old_density_values);
-            fe_values[displacements].get_function_divergences(state,
-                                                              old_displacement_divs);
-            fe_values[displacements].get_function_symmetric_gradients(
-                    state, old_displacement_symmgrads);
-            fe_values[displacement_multipliers].get_function_divergences(
-                    state, old_displacement_multiplier_divs);
-            fe_values[displacement_multipliers].get_function_symmetric_gradients(
-                    state, old_displacement_multiplier_symmgrads);
-
-            Tensor<1, dim> traction;
-            traction[1] = -1;
-
-            for (unsigned int q_point = 0; q_point < n_q_points; ++q_point) {
-
-                for (unsigned int i = 0; i < dofs_per_cell; ++i) {
-
-                    const double unfiltered_density_phi_i = fe_values[unfiltered_densities].value(i,
-                                                                                                  q_point);
-                    const double density_phi_i = fe_values[densities].value(i,q_point);
-
-                    for (unsigned int j = 0; j < dofs_per_cell; ++j) {
-
-                        const double unfiltered_density_phi_j = fe_values[unfiltered_densities].value(j,
-                                                                                                      q_point);
-                        const double density_phi_j = fe_values[densities].value(j,q_point);
-
-
-
-                        double value =   unfiltered_density_phi_i
-                                       * unfiltered_density_phi_j
-                                       * (-1 * Input::density_penalty_exponent * Input::density_penalty_exponent - Input::density_penalty_exponent)
-                                       * std::pow(old_density_values[q_point],Input::density_penalty_exponent - 2)
-                                       *
-                                       (old_displacement_divs[q_point] * old_displacement_multiplier_divs[q_point]
-                                        * lambda_values[q_point]
-                                        +
-                                        2 * mu_values[q_point] * (old_displacement_symmgrads[q_point] *
-                                                                  old_displacement_multiplier_symmgrads[q_point]));
-
-
-                        value +=   density_phi_i
-                                * density_phi_j
-                                * (-2 * Input::density_penalty_exponent * Input::density_penalty_exponent)
-                                * std::pow(old_density_values[q_point],Input::density_penalty_exponent - 2)
-                                * old_displacement_symmgrads[q_point].norm() *
-                                old_displacement_multiplier_symmgrads[q_point].norm();
-
-                        if (value != 0)
-                        {
-                            cell_matrix(i, j) +=
-                                    fe_values.JxW(q_point) * value ;
-                        }
-                    }
+}
 
-                }
 
-            }
+template<int dim>
+void HMatrix<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{ // Transposed apply; issues exactly the same calls as vmult() (no transposed b_mat or A-inverse), i.e. H is treated as symmetric.
+    if (Input::solver_choice==SolverOptions::inexact_K_with_inexact_A_gmres)
+    {
+        c_mat.vmult(temp_vect_1,src); // temp_vect_1 = c_mat * src
+        e_mat.vmult(temp_vect_2,src); // temp_vect_2 = e_mat * src
+
+        // Exceptions thrown by either A-inverse application below are ignored.
+        try
+        {
+            a_inv_mf_gmg.vmult(temp_vect_3,temp_vect_1); // temp_vect_3 = Ainv * c_mat * src
+
+        } catch (std::exception &exc)
+        {
 
-            constraints.distribute_local_to_global(cell_matrix, local_dof_indices, approx_h_mat);
         }
+        try
+        {
+            a_inv_mf_gmg.vmult(temp_vect_4,temp_vect_2); // temp_vect_4 = Ainv * e_mat * src
 
-    }
+        } catch (std::exception &exc)
+        {
 
+        }
 
-    template<int dim>
-    void TopOptSchurPreconditioner<dim>::print_stuff(const BlockSparseMatrix<double> &matrix)
+        c_mat.Tvmult(temp_vect_6,temp_vect_4); // temp_vect_6 = c_mat^T * Ainv * e_mat * src
+        e_mat.Tvmult(temp_vect_5,temp_vect_3); // temp_vect_5 = e_mat^T * Ainv * c_mat * src
+
+        b_mat.vmult(temp_vect_7,src); // temp_vect_7 = b_mat * src
+        dst =  temp_vect_7 + temp_vect_6 + temp_vect_5; // NOTE(review): added here, subtracted in the else branch - confirm intended
+    }
+    else
     {
+        c_mat.vmult(temp_vect_1,src); // temp_vect_1 = c_mat * src
+        e_mat.vmult(temp_vect_2,src); // temp_vect_2 = e_mat * src
 
-//        print_matrix("OAmat.csv",a_mat);
-//        print_matrix("OBmat.csv",b_mat);
-//        print_matrix("OCmat.csv",c_mat);
-//        print_matrix("OEmat.csv",e_mat);
-//        print_matrix("OFmat.csv",f_mat);
-        FullMatrix<double> g_mat;
-        FullMatrix<double> h_mat;
-        FullMatrix<double> k_inv_mat;
-        g_mat.reinit(b_mat.m(),b_mat.n());
-        h_mat.reinit(b_mat.m(),b_mat.n());
-        k_inv_mat.reinit(b_mat.m(),b_mat.n());
-        auto op_g = linear_operator(f_mat) * linear_operator(d_8_mat) *
-                    transpose_operator(linear_operator(f_mat));
-
-        auto op_h = linear_operator(b_mat)
-                    - transpose_operator(linear_operator(c_mat)) * linear_operator(a_inv_direct) * linear_operator(e_mat)
-                    - transpose_operator(linear_operator(e_mat)) * linear_operator(a_inv_direct) * linear_operator(c_mat);
-
-        auto op_k_inv = -1 * op_g * linear_operator(d_m_inv_mat) * op_h - linear_operator(d_m_mat);
-        build_matrix_element_by_element(op_g,g_mat);
-        build_matrix_element_by_element(op_h,h_mat);
-        build_matrix_element_by_element(op_k_inv,k_inv_mat);
-//        print_matrix("OGmat.csv",g_mat);
-//        print_matrix("OHmat.csv",h_mat);
-//        print_matrix("OKinvmat.csv",k_inv_mat);
+        a_inv_direct.vmult(temp_vect_3,temp_vect_1); // temp_vect_3 = Ainv * c_mat * src, with the direct A-inverse
+        a_inv_direct.vmult(temp_vect_4,temp_vect_2); // temp_vect_4 = Ainv * e_mat * src
 
+        c_mat.Tvmult(temp_vect_6,temp_vect_4); // temp_vect_6 = c_mat^T * Ainv * e_mat * src
+        e_mat.Tvmult(temp_vect_5,temp_vect_3); // temp_vect_5 = e_mat^T * Ainv * c_mat * src
 
+        b_mat.vmult(temp_vect_7,src); // temp_vect_7 = b_mat * src
+        dst =  temp_vect_7 - temp_vect_6 - temp_vect_5;
     }
+
+}
+
+
+// ******************     HMatrixDirect     ***********************
+/// Builds the H operator variant whose vmult()/Tvmult() always use a_inv_direct as the A-inverse.
+template<int dim>
+HMatrixDirect<dim>::HMatrixDirect(LA::MPI::SparseMatrix &a_mat_in, const LA::MPI::SparseMatrix &b_mat_in, const LA::MPI::SparseMatrix &c_mat_in, const LA::MPI::SparseMatrix &e_mat_in,TrilinosWrappers::PreconditionAMG &pre_amg_in,VmultTrilinosSolverDirect &a_inv_direct_in, AInvMatMFGMG<dim> &a_inv_mf_gmg_in)
+    :
+      a_mat(a_mat_in), // not referenced by the vmult()/Tvmult() bodies in this file
+      b_mat(b_mat_in),
+      c_mat(c_mat_in),
+      e_mat(e_mat_in),
+      pre_amg(pre_amg_in), // not referenced by the vmult()/Tvmult() bodies in this file
+      a_inv_direct(a_inv_direct_in), // the A-inverse that vmult()/Tvmult() apply
+      a_inv_mf_gmg(a_inv_mf_gmg_in) // not referenced by the vmult()/Tvmult() bodies in this file
+{
+    // Nothing else to do here; the scratch vectors are set up in initialize().
+}
+/// Copies the exemplar vectors into the seven scratch vectors used by vmult()/Tvmult().
+template<int dim>
+void
+HMatrixDirect<dim>::initialize(LA::MPI::Vector &exemplar_density_vector,  LA::MPI::Vector &exemplar_displacement_vector)
+{
+    temp_vect_1 = exemplar_displacement_vector; // scratch vectors 1-4 are copies of the displacement exemplar
+    temp_vect_2 = exemplar_displacement_vector;
+    temp_vect_3 = exemplar_displacement_vector;
+    temp_vect_4 = exemplar_displacement_vector;
+    temp_vect_5 = exemplar_density_vector; // scratch vectors 5-7 are copies of the density exemplar
+    temp_vect_6 = exemplar_density_vector;
+    temp_vect_7 = exemplar_density_vector;
+    // Unlike HMatrix::initialize(), the copies are not zeroed afterwards;
+    // vmult()/Tvmult() overwrite every scratch vector before reading it.
+}
+/// Computes dst = b_mat*src - c_mat^T*Ainv*e_mat*src - e_mat^T*Ainv*c_mat*src with Ainv = a_inv_direct.
+template<int dim>
+void HMatrixDirect<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+
+        c_mat.vmult(temp_vect_1,src); // temp_vect_1 = c_mat * src
+        e_mat.vmult(temp_vect_2,src); // temp_vect_2 = e_mat * src
+
+        a_inv_direct.vmult(temp_vect_3,temp_vect_1); // temp_vect_3 = Ainv * c_mat * src
+        a_inv_direct.vmult(temp_vect_4,temp_vect_2); // temp_vect_4 = Ainv * e_mat * src
+
+        c_mat.Tvmult(temp_vect_6,temp_vect_4); // temp_vect_6 = c_mat^T * Ainv * e_mat * src
+        e_mat.Tvmult(temp_vect_5,temp_vect_3); // temp_vect_5 = e_mat^T * Ainv * c_mat * src
+
+        b_mat.vmult(temp_vect_7,src); // temp_vect_7 = b_mat * src
+        dst =  temp_vect_7 - temp_vect_6 - temp_vect_5;
+
+
+
+}
+
+/// Transposed apply; issues exactly the same calls as vmult(), i.e. the operator is treated as symmetric.
+template<int dim>
+void HMatrixDirect<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+
+        c_mat.vmult(temp_vect_1,src); // temp_vect_1 = c_mat * src
+        e_mat.vmult(temp_vect_2,src); // temp_vect_2 = e_mat * src
+
+        a_inv_direct.vmult(temp_vect_3,temp_vect_1); // temp_vect_3 = Ainv * c_mat * src
+        a_inv_direct.vmult(temp_vect_4,temp_vect_2); // temp_vect_4 = Ainv * e_mat * src
+
+        c_mat.Tvmult(temp_vect_6,temp_vect_4); // temp_vect_6 = c_mat^T * Ainv * e_mat * src
+        e_mat.Tvmult(temp_vect_5,temp_vect_3); // temp_vect_5 = e_mat^T * Ainv * c_mat * src
+
+        b_mat.vmult(temp_vect_7,src); // temp_vect_7 = b_mat * src
+        dst =  temp_vect_7 - temp_vect_6 - temp_vect_5;
+
+}
+
+
+// ******************     JinvMatrix     ***********************
+template<int dim>
+JinvMatrix<dim>::JinvMatrix(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in)
+    :
+      h_mat(h_mat_in), // H operator applied in vmult()/Tvmult()
+      g_mat(g_mat_in), // G operator applied in vmult()/Tvmult()
+      d_m_mat(d_m_mat_in) // matrix applied directly to src in vmult()/Tvmult()
+{
+    // Only stores the three operators; scratch vectors and d_m_inv_mat are set in initialize().
+}
+/// Copies exemplar_density_vector into the four scratch vectors and copies d_m_inv_mat_in into d_m_inv_mat.
+template<int dim>
+void
+JinvMatrix<dim>::initialize(LA::MPI::Vector &exemplar_density_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in)
+{
+    temp_vect_1 = exemplar_density_vector;
+    temp_vect_2 = exemplar_density_vector;
+    temp_vect_3 = exemplar_density_vector;
+    temp_vect_4 = exemplar_density_vector;
+    d_m_inv_mat.copy_from(d_m_inv_mat_in); // own copy of the matrix applied between g_mat and h_mat
+    // The scratch vectors are not zeroed; vmult()/Tvmult() overwrite each one before reading it.
+}
+/// Computes dst = -d_m_mat*src - h_mat*d_m_inv_mat*g_mat*src.
+template<int dim>
+void JinvMatrix<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    g_mat.vmult(temp_vect_1,src); // temp_vect_1 = G * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * G * src
+    h_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = H * d_m_inv_mat * G * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+/// Computes dst = -d_m_mat*src - g_mat*d_m_inv_mat*h_mat*src: the factor order of vmult() reversed, using only vmult() of each factor.
+template<int dim>
+void JinvMatrix<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    h_mat.vmult(temp_vect_1,src); // temp_vect_1 = H * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * H * src
+    g_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = G * d_m_inv_mat * H * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+
+// ******************     JinvMatrixPart     ***********************
+template<int dim>
+JinvMatrixPart<dim>::JinvMatrixPart(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in)
+    :
+      h_mat(h_mat_in), // H operator applied in vmult()/Tvmult()
+      g_mat(g_mat_in), // G operator applied in vmult()/Tvmult()
+      d_m_mat(d_m_mat_in) // stored, but not referenced by the vmult()/Tvmult() bodies in this file
+{ // only stores the three operators
+}
+/// Copies exemplar_density_vector into the four scratch vectors used by vmult()/Tvmult().
+template<int dim>
+void
+JinvMatrixPart<dim>::initialize(LA::MPI::Vector &exemplar_density_vector)
+{
+    temp_vect_1 = exemplar_density_vector;
+    temp_vect_2 = exemplar_density_vector;
+    temp_vect_3 = exemplar_density_vector;
+    temp_vect_4 = exemplar_density_vector;
+    // NOTE(review): vmult()/Tvmult() use d_m_inv_mat, but neither the constructor nor this function fills it in the code shown here - confirm where it is set.
+}
+/// Computes dst = -d_m_inv_mat*h_mat*d_m_inv_mat*g_mat*src.
+template<int dim>
+void JinvMatrixPart<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    g_mat.vmult(temp_vect_1,src); // temp_vect_1 = G * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * G * src
+    h_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = H * d_m_inv_mat * G * src
+    d_m_inv_mat.vmult(temp_vect_4,temp_vect_3); // temp_vect_4 = d_m_inv_mat * H * d_m_inv_mat * G * src
+    dst = -1 * temp_vect_4;
+}
+/// Computes dst = -d_m_inv_mat*g_mat*d_m_inv_mat*h_mat*src, i.e. vmult() with the roles of g_mat and h_mat swapped.
+template<int dim>
+void JinvMatrixPart<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    h_mat.vmult(temp_vect_1,src); // temp_vect_1 = H * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * H * src
+    g_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = G * d_m_inv_mat * H * src
+    d_m_inv_mat.vmult(temp_vect_4,temp_vect_3); // temp_vect_4 = d_m_inv_mat * G * d_m_inv_mat * H * src
+    dst = -1 * temp_vect_4;
+}
+
+// ******************     JinvMatrixDirect     ***********************
+template<int dim>
+JinvMatrixDirect<dim>::JinvMatrixDirect(HMatrixDirect<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in)
+    :
+      h_mat(h_mat_in), // H operator (HMatrixDirect variant) applied in vmult()/Tvmult()
+      g_mat(g_mat_in), // G operator applied in vmult()/Tvmult()
+      d_m_mat(d_m_mat_in) // matrix applied directly to src in vmult()/Tvmult()
+{
+    // Only stores the three operators; the scratch vectors are set up in initialize().
+}
+/// Copies exemplar_density_vector into the four scratch vectors used by vmult()/Tvmult().
+template<int dim>
+void
+JinvMatrixDirect<dim>::initialize(LA::MPI::Vector &exemplar_density_vector)
+{
+    temp_vect_1 = exemplar_density_vector;
+    temp_vect_2 = exemplar_density_vector;
+    temp_vect_3 = exemplar_density_vector;
+    temp_vect_4 = exemplar_density_vector;
+    // NOTE(review): vmult()/Tvmult() use d_m_inv_mat, but neither the constructor nor this function fills it in the code shown here - confirm where it is set.
+}
+/// Computes dst = -d_m_mat*src - h_mat*d_m_inv_mat*g_mat*src.
+template<int dim>
+void JinvMatrixDirect<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    g_mat.vmult(temp_vect_1,src); // temp_vect_1 = G * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * G * src
+    h_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = H * d_m_inv_mat * G * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+/// Computes dst = -d_m_mat*src - g_mat*d_m_inv_mat*h_mat*src: the factor order of vmult() reversed, using only vmult() of each factor.
+template<int dim>
+void JinvMatrixDirect<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    h_mat.vmult(temp_vect_1,src); // temp_vect_1 = H * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * H * src
+    g_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = G * d_m_inv_mat * H * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+
+
+// ******************     KinvMatrix     ***********************
+template<int dim>
+KinvMatrix<dim>::KinvMatrix(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in)
+    :
+      h_mat(h_mat_in), // H operator applied in vmult()/Tvmult()
+      g_mat(g_mat_in), // G operator applied in vmult()/Tvmult()
+      d_m_mat(d_m_mat_in) // matrix applied directly to src in vmult()/Tvmult()
+{
+    // Only stores the three operators; scratch vectors and d_m_inv_mat are set in initialize().
+}
+/// Copies exemplar_density_vector into the four scratch vectors, zeroes them, and copies d_m_inv_mat_in into d_m_inv_mat.
+template<int dim>
+void
+KinvMatrix<dim>::initialize(LA::MPI::Vector &exemplar_density_vector, LA::MPI::SparseMatrix &d_m_inv_mat_in)
+{
+    // Each scratch vector is first copied from the exemplar and then cleared.
+    temp_vect_1 = exemplar_density_vector;
+    temp_vect_1 = 0.;
+    temp_vect_2 = exemplar_density_vector;
+    temp_vect_2 = 0.;
+    temp_vect_3 = exemplar_density_vector;
+    temp_vect_3 = 0.;
+    temp_vect_4 = exemplar_density_vector;
+    temp_vect_4 = 0.;
+
+    // Keep an own copy of the matrix that vmult()/Tvmult() apply between h_mat and g_mat.
+    d_m_inv_mat.copy_from(d_m_inv_mat_in);
+
 }
+/// Computes dst = -d_m_mat*src - g_mat*d_m_inv_mat*h_mat*src.
+template<int dim>
+void KinvMatrix<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    h_mat.vmult(temp_vect_1,src); // temp_vect_1 = H * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * H * src
+    g_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = G * d_m_inv_mat * H * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+/// Computes dst = -d_m_mat*src - h_mat*d_m_inv_mat*g_mat*src: the factor order of vmult() reversed, using only vmult() of each factor.
+template<int dim>
+void KinvMatrix<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    g_mat.vmult(temp_vect_1,src); // temp_vect_1 = G * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * G * src
+    h_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = H * d_m_inv_mat * G * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+
+// ******************     KinvMatrixPart    ***********************
+template<int dim>
+KinvMatrixPart<dim>::KinvMatrixPart(HMatrix<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in)
+    :
+      h_mat(h_mat_in), // H operator applied in vmult()/Tvmult()
+      g_mat(g_mat_in), // G operator applied in vmult()/Tvmult()
+      d_m_mat(d_m_mat_in) // stored, but not referenced by the vmult()/Tvmult() bodies in this file
+{
+    // Only stores the three operators; the scratch vectors are set up in initialize().
+}
+/// Copies exemplar_density_vector into the four scratch vectors used by vmult()/Tvmult().
+template<int dim>
+void
+KinvMatrixPart<dim>::initialize(LA::MPI::Vector &exemplar_density_vector)
+{
+    temp_vect_1 = exemplar_density_vector;
+    temp_vect_2 = exemplar_density_vector;
+    temp_vect_3 = exemplar_density_vector;
+    temp_vect_4 = exemplar_density_vector;
+    // NOTE(review): vmult()/Tvmult() use d_m_inv_mat, but neither the constructor nor this function fills it in the code shown here - confirm where it is set.
+}
+/// Computes dst = d_m_inv_mat*g_mat*d_m_inv_mat*h_mat*src (no sign flip, unlike JinvMatrixPart).
+template<int dim>
+void KinvMatrixPart<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+
+    h_mat.vmult(temp_vect_1,src); // temp_vect_1 = H * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = Dminv * H * src
+    g_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = G * Dminv * H * src
+    d_m_inv_mat.vmult(temp_vect_4,temp_vect_3); // temp_vect_4 = Dminv * G * Dminv * H * src
+
+    dst = temp_vect_4;
+    //KinvMatrix::vmult applies -Dm - G Dminv H
+    //scaled by -Dminv that would be I + Dminv G Dminv H (taking Dminv as the inverse of Dm)
+    //this operator returns only the second term, Dminv G Dminv H src (the earlier note here read "-DminvGDmH")
+
+}
+/// Computes dst = d_m_inv_mat*h_mat*d_m_inv_mat*g_mat*src, i.e. vmult() with the roles of g_mat and h_mat swapped.
+template<int dim>
+void KinvMatrixPart<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    g_mat.vmult(temp_vect_1,src); // temp_vect_1 = G * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = Dminv * G * src
+    h_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = H * Dminv * G * src
+    d_m_inv_mat.vmult(temp_vect_4,temp_vect_3); // temp_vect_4 = Dminv * H * Dminv * G * src
+
+    dst = temp_vect_4;
+    //KinvMatrix::Tvmult applies -Dm - H Dminv G
+    //scaled by -Dminv that would be I + Dminv H Dminv G (taking Dminv as the inverse of Dm)
+    //this operator returns only the second term, Dminv H Dminv G src (the earlier note here read "-DminvGDmH")
+}
+
+// ******************     KinvMatrixDirect     ***********************
+template<int dim>
+KinvMatrixDirect<dim>::KinvMatrixDirect(HMatrixDirect<dim> &h_mat_in, GMatrix &g_mat_in, const LA::MPI::SparseMatrix &d_m_mat_in)
+    :
+      h_mat(h_mat_in), // H operator (HMatrixDirect variant) applied in vmult()/Tvmult()
+      g_mat(g_mat_in), // G operator applied in vmult()/Tvmult()
+      d_m_mat(d_m_mat_in) // matrix applied directly to src in vmult()/Tvmult()
+{
+    // Only stores the three operators; the scratch vectors are set up in initialize().
+}
+/// Copies exemplar_density_vector into the four scratch vectors used by vmult()/Tvmult().
+template<int dim>
+void
+KinvMatrixDirect<dim>::initialize(LA::MPI::Vector &exemplar_density_vector)
+{
+    temp_vect_1 = exemplar_density_vector;
+    temp_vect_2 = exemplar_density_vector;
+    temp_vect_3 = exemplar_density_vector;
+    temp_vect_4 = exemplar_density_vector;
+    // NOTE(review): vmult()/Tvmult() use d_m_inv_mat, but neither the constructor nor this function fills it in the code shown here - confirm where it is set.
+}
+/// Computes dst = -d_m_mat*src - g_mat*d_m_inv_mat*h_mat*src.
+template<int dim>
+void KinvMatrixDirect<dim>::vmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    h_mat.vmult(temp_vect_1,src); // temp_vect_1 = H * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * H * src
+    g_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = G * d_m_inv_mat * H * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+/// Computes dst = -d_m_mat*src - h_mat*d_m_inv_mat*g_mat*src: the factor order of vmult() reversed, using only vmult() of each factor.
+template<int dim>
+void KinvMatrixDirect<dim>::Tvmult(LA::MPI::Vector &dst, const LA::MPI::Vector &src) const
+{
+    g_mat.vmult(temp_vect_1,src); // temp_vect_1 = G * src
+    d_m_inv_mat.vmult(temp_vect_2,temp_vect_1); // temp_vect_2 = d_m_inv_mat * G * src
+    h_mat.vmult(temp_vect_3,temp_vect_2); // temp_vect_3 = H * d_m_inv_mat * G * src
+    d_m_mat.vmult(temp_vect_4,src); // temp_vect_4 = d_m_mat * src
+
+    dst = -1*temp_vect_4 - temp_vect_3;
+}
+
+
+
+
+//**************************************************
+
+/// Wraps a_mat_in so it can be applied to LinearAlgebra::distributed::Vector<double> arguments via vmult()/Tvmult().
+AMatWrapped::AMatWrapped(LA::MPI::SparseMatrix &a_mat_in)
+    :
+      a_mat(a_mat_in) // the matrix whose vmult()/Tvmult() this wrapper forwards to
+{
+}
+void AMatWrapped::vmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const
+{ // dst = a_mat * src, converting through the members temp_src / temp_dst. NOTE(review): nothing shown here sizes those two vectors - confirm where they are set up.
+    ChangeVectorTypes::copy(temp_src, src); // convert src into the vector type a_mat works with
+    a_mat.vmult(temp_dst,temp_src);
+    ChangeVectorTypes::copy(dst, temp_dst); // convert the product back into dst
+}
+void AMatWrapped::Tvmult(LinearAlgebra::distributed::Vector<double> &dst, const LinearAlgebra::distributed::Vector<double> &src) const
+{ // dst = a_mat^T * src, converting through the members temp_src / temp_dst. NOTE(review): nothing shown here sizes those two vectors - confirm where they are set up.
+    ChangeVectorTypes::copy(temp_src, src); // convert src into the vector type a_mat works with
+    a_mat.Tvmult(temp_dst,temp_src);
+    ChangeVectorTypes::copy(dst, temp_dst); // convert the product back into dst
+}
+}
+
+
+
 template class SAND::TopOptSchurPreconditioner<2>;
-template class SAND::TopOptSchurPreconditioner<3>;
\ No newline at end of file
+template class SAND::TopOptSchurPreconditioner<3>;
+// Explicit instantiations for dim = 2 and 3. NOTE(review): HMatrixDirect, JinvMatrixPart, JinvMatrixDirect, KinvMatrixPart and KinvMatrixDirect are not in this list - confirm they are instantiated elsewhere or unused.
+template class SAND::AInvMatMFGMG<2>;
+template class SAND::AInvMatMFGMG<3>;
+
+template class SAND::JinvMatrix<2>;
+template class SAND::JinvMatrix<3>;
+
+template class SAND::KinvMatrix<2>;
+template class SAND::KinvMatrix<3>;
+
+template class SAND::HMatrix<2>;
+template class SAND::HMatrix<3>;
+
diff --git a/source/watchdog.cc b/source/watchdog.cc
new file mode 100644
index 0000000..8ba8657
--- /dev/null
+++ b/source/watchdog.cc
@@ -0,0 +1,478 @@
+#include <deal.II/lac/block_vector.h>
+#include <deal.II/lac/packaged_operation.h>
+#include <deal.II/grid/tria.h>
+#include <deal.II/grid/grid_refinement.h>
+#include <iostream>
+#include <vector>
+#include "../include/markov_filter.h"
+#include "../include/kkt_system.h"
+#include "../include/input_information.h"
+#include "../include/watchdog.h"
+#include <deal.II/lac/generic_linear_algebra.h>
+#include <deal.II/lac/trilinos_parallel_block_vector.h>
+#include <deal.II/base/conditional_ostream.h>
+#include <deal.II/base/utilities.h>
+
+///Above are fairly normal files to include.  I also use the sparse direct package, which requires BLAS/LAPACK
+/// to perform a direct solve while I work on a fast iterative solver for this problem.
+
+namespace SAND {
+    namespace LA
+    {
+        using namespace dealii::LinearAlgebraTrilinos;
+    }
+
+
+    using namespace dealii;
+
+    ///Constructor
+    template<int dim>
+    NonlinearWatchdog<dim>::NonlinearWatchdog()
+        : mpi_communicator(MPI_COMM_WORLD)
+        // pcout wraps std::cout and is switched on only where this process is rank 0 of mpi_communicator
+        , pcout(std::cout, (Utilities::MPI::this_mpi_process(mpi_communicator) == 0))
+        // the timer writes through pcout, never prints on its own, and records wall times
+        , overall_timer(pcout, TimerOutput::never, TimerOutput::wall_times)
+    {}
+
+    ///A binary search figures out the maximum step that meets the dual feasibility - that s>0 and z>0. The fraction to boundary increases as the barrier size decreases.
+
+    template<int dim>
+    std::pair<double,double>
+    NonlinearWatchdog<dim>::calculate_max_step_size(const LA::MPI::BlockVector &state, const LA::MPI::BlockVector &step) const {
+        // Two independent bisections on [0,1]: one for the slack ("s") blocks, one for the slack-multiplier ("z") blocks.
+        // A trial length a is accepted when Input::fraction_to_boundary*state + a*step is non-negative in both the
+        // lower and the upper block of its group.  Returns the lower bracket ends {s, z} (0 if nothing was accepted).
+        double step_size_s_low = 0;
+        double step_size_z_low = 0;
+        double step_size_s_high = 1;
+        double step_size_z_high = 1;
+
+        // Trial vectors are created inside the loop only, so nothing has to be copied or zeroed up front.
+        // 50 halvings shrink each bracket to a width of 2^-50.
+        for (unsigned int k = 0; k < 50; k++)
+        {
+            // Midpoints of the current brackets.
+            const double step_size_s = (step_size_s_low + step_size_s_high) / 2;
+            const double step_size_z = (step_size_z_low + step_size_z_high) / 2;
+            const LA::MPI::BlockVector state_test_s =
+                    (Input::fraction_to_boundary * state) + (step_size_s * step);
+
+            const LA::MPI::BlockVector state_test_z =
+                    (Input::fraction_to_boundary * state) + (step_size_z * step);
+
+            const bool accept_s = (state_test_s.block(SolutionBlocks::density_lower_slack).is_non_negative())
+                                  && (state_test_s.block(SolutionBlocks::density_upper_slack).is_non_negative());
+            const bool accept_z = (state_test_z.block(SolutionBlocks::density_lower_slack_multiplier).is_non_negative())
+                                  && (state_test_z.block(SolutionBlocks::density_upper_slack_multiplier).is_non_negative());
+
+            if (accept_s) {
+                step_size_s_low = step_size_s;
+            } else {
+                step_size_s_high = step_size_s;
+            }
+            if (accept_z) {
+                step_size_z_low = step_size_z;
+            } else {
+                step_size_z_high = step_size_z;
+            }
+        }
+        pcout << "s step : " << step_size_s_low << " z size : " << step_size_z_low << std::endl;
+        return {step_size_s_low, step_size_z_low};
+    }
+
+    ///Assembles the KKT system at the given state, solves it for a step, and scales that step: the density, displacement, unfiltered density and slack blocks by the largest admissible slack step size, and all multiplier blocks by the largest admissible multiplier step size.
+
+    template<int dim>
+    const LA::MPI::BlockVector
+    NonlinearWatchdog<dim>::find_max_step(const LA::MPI::BlockVector &state)
+    {
+        TimerOutput::Scope find_step_timer(overall_timer, "find step");
+        {
+            TimerOutput::Scope assemble_timer(overall_timer, "assemble");
+            kkt_system.assemble_block_system(state, barrier_size);
+        }
+
+        pcout << "pre" << std::endl;
+        LA::MPI::BlockVector step;
+        {
+            TimerOutput::Scope solve_timer(overall_timer, "solve");
+            step = kkt_system.solve(state);
+        }
+
+        pcout << "post" << std::endl;
+        const auto max_step_sizes= calculate_max_step_size(state,step);
+        const double step_size_s = max_step_sizes.first;
+        const double step_size_z = max_step_sizes.second;
+        // Start from a copy of the solved step so the result has the same block count, block sizes and index
+        // table as `step`, instead of a hard-coded number of initially empty blocks; then scale block by block.
+        LA::MPI::BlockVector max_step = step;
+        max_step.block(SolutionBlocks::density) *= step_size_s;
+        max_step.block(SolutionBlocks::displacement) *= step_size_s;
+        max_step.block(SolutionBlocks::unfiltered_density) *= step_size_s;
+        max_step.block(SolutionBlocks::density_lower_slack) *= step_size_s;
+        max_step.block(SolutionBlocks::density_upper_slack) *= step_size_s;
+        max_step.block(SolutionBlocks::unfiltered_density_multiplier) *= step_size_z;
+        max_step.block(SolutionBlocks::density_lower_slack_multiplier) *= step_size_z;
+        max_step.block(SolutionBlocks::density_upper_slack_multiplier) *= step_size_z;
+        max_step.block(SolutionBlocks::displacement_multiplier) *= step_size_z;
+        max_step.block(SolutionBlocks::total_volume_multiplier) *= step_size_z;
+        pcout << "here" << std::endl;
+        return max_step;
+    }
+
+    ///This is a simple back-stepping algorithm for a line search - keeps shrinking step size until it finds a step where the markov filter requirement is met.
+
+    template<int dim>
+    LA::MPI::BlockVector
+    NonlinearWatchdog<dim>::take_scaled_step(const LA::MPI::BlockVector &state,const LA::MPI::BlockVector &max_step) const
+    {
+        // Backtracking: halve the step length until the TRIAL state state + step_size*max_step passes the filter.
+        // Testing the unchanged starting state instead would give the same answer on every pass.
+        double step_size = 1;
+        LA::MPI::BlockVector trial_state = state + (step_size * max_step);
+        for(unsigned int k = 0; k<10; k++)
+        {
+            if(markov_filter.check_filter(kkt_system.calculate_objective_value(trial_state), kkt_system.calculate_barrier_distance(trial_state), kkt_system.calculate_feasibility(trial_state,barrier_size)))
+            {
+                break;
+            }
+            step_size = step_size/2;
+            trial_state = state + (step_size * max_step);
+        }
+        return trial_state; // if all 10 trials were rejected this is state + max_step/1024
+    }
+
+
+
+    ///Checks to see if the KKT conditions are sufficiently met to lower barrier size.
+    template<int dim>
+    bool
+    NonlinearWatchdog<dim>::check_convergence(const LA::MPI::BlockVector &state) const
+    {
+        // Converged means: the measure reported by kkt_system.calculate_convergence() for this state
+        // lies strictly below the Input::required_norm tolerance.
+        //
+        // @param state  iterate to be tested
+        // @return true when the measure is below the tolerance, false otherwise (including equality)
+        const bool tolerance_met = kkt_system.calculate_convergence(state) < Input::required_norm;
+
+        return tolerance_met;
+    }
+
+    namespace
+    {
+        /// Global statistics of the complementarity products (slack times slack multiplier) used by the
+        /// LOQO barrier heuristic.
+        struct LoqoStatistics
+        {
+            double min;      ///< smallest product over both bounds; the search starts at 1000, so never above that
+            double average;  ///< (lower slack . lower multiplier + upper slack . upper multiplier) / (2 * entries)
+        };
+
+        /// Computes the LOQO statistics of @p current_state.  Collective: every rank of @p communicator must call it.
+        ///
+        /// For each global index a rank contributes the factors for which in_local_range() is true and the
+        /// neutral element 1 otherwise, so an MPI_PROD reduction leaves the full slack*multiplier product on
+        /// all ranks.  All entries go through ONE MPI_Allreduce; reducing entry by entry would cost two
+        /// collectives per density entry on every barrier update.
+        ///
+        /// NOTE(review): each rank holds 2*size doubles temporarily, and the MPI element count is an int.
+        LoqoStatistics
+        compute_loqo_statistics(const LA::MPI::BlockVector &current_state, const MPI_Comm communicator)
+        {
+            const auto &lower_slack = current_state.block(SolutionBlocks::density_lower_slack);
+            const auto &lower_multiplier = current_state.block(SolutionBlocks::density_lower_slack_multiplier);
+            const auto &upper_slack = current_state.block(SolutionBlocks::density_upper_slack);
+            const auto &upper_multiplier = current_state.block(SolutionBlocks::density_upper_slack_multiplier);
+            const unsigned int vect_size = lower_slack.size();
+            const std::size_t upper_offset = vect_size;
+
+            // products[k] is the lower-bound product, products[upper_offset+k] the upper-bound product.
+            std::vector<double> products(2*upper_offset, 1.);
+            for (unsigned int k = 0; k < vect_size; k++)
+            {
+                if (lower_slack.in_local_range(k))
+                    products[k] *= lower_slack[k];
+                if (lower_multiplier.in_local_range(k))
+                    products[k] *= lower_multiplier[k];
+                if (upper_slack.in_local_range(k))
+                    products[upper_offset+k] *= upper_slack[k];
+                if (upper_multiplier.in_local_range(k))
+                    products[upper_offset+k] *= upper_multiplier[k];
+            }
+            MPI_Allreduce(MPI_IN_PLACE, products.data(), static_cast<int>(products.size()), MPI_DOUBLE, MPI_PROD, communicator);
+
+            LoqoStatistics statistics;
+            statistics.min = 1000;
+            for (const double product : products)
+            {
+                if (product < statistics.min)
+                    statistics.min = product;
+            }
+            statistics.average = (lower_slack*lower_multiplier + upper_slack*upper_multiplier)/(2*vect_size);
+            return statistics;
+        }
+    } // namespace
+
+    ///This updates the barrier value using the selected barrier scheme - more work could be done to optimize
+    /// the performance of the mixed method
+    ///
+    /// @param current_state  current iterate; its slack and slack-multiplier blocks are read, and it is passed to kkt_system.calculate_rhs_norm()
+    template<int dim>
+    void
+    NonlinearWatchdog<dim>::update_barrier(LA::MPI::BlockVector &current_state)
+    {
+        ///The LOQO scheme uses information about the similarity of the slack/slack multiplier product as a
+        /// heuristic for decreasing barrier value
+        if (Input::barrier_reduction == BarrierOptions::loqo)
+        {
+            const LoqoStatistics loqo = compute_loqo_statistics(current_state, mpi_communicator);
+            const double loqo_complimentarity_deviation = loqo.min/loqo.average;
+            pcout << "loqo cd: " << loqo_complimentarity_deviation << std::endl;
+            // The same ratio feeds both the threshold test and the cubic below.
+            const double deviation_ratio = .05 * (1-loqo_complimentarity_deviation)/loqo_complimentarity_deviation;
+            double loqo_multiplier;
+            if(deviation_ratio<2)
+            {
+                loqo_multiplier = .1*std::pow(deviation_ratio,3);
+            }
+            else
+            {
+                loqo_multiplier = .8;
+            }
+            pcout << "loqo mult: " << loqo_multiplier << std::endl;
+            // A negative multiplier is applied with its sign dropped.
+            if (loqo_multiplier< 0)
+            {
+                barrier_size = std::abs(loqo_multiplier) * loqo.average;
+            }
+            else
+            {
+                barrier_size = loqo_multiplier * loqo.average;
+            }
+            // Never go below the configured minimum barrier value.
+            if (barrier_size < Input::min_barrier_size)
+            {
+                barrier_size=Input::min_barrier_size;
+            }
+        }
+
+        ///The monotone scheme fully solves the problem with one barrier size before decreasing the
+        /// barrier and starting again
+        if (Input::barrier_reduction == BarrierOptions::monotone)
+        {
+            if (kkt_system.calculate_rhs_norm(current_state,barrier_size) < barrier_size * 1e-3)
+            {
+                barrier_size = barrier_size * .7;
+            }
+            if (barrier_size < Input::min_barrier_size)
+            {
+                barrier_size=Input::min_barrier_size;
+            }
+        }
+
+        ///The mixed method uses LOQO unless it gets stuck, at which point it switches to monotone, allowing for an adaptive method
+        /// that still globally converges the barrier value to 0.
+        if (Input::barrier_reduction == BarrierOptions::mixed)
+        {
+            if (mixed_barrier_monotone_mode)
+            {
+                // Monotone mode ends, with one barrier reduction, once the rhs norm drops below the barrier value.
+                if (kkt_system.calculate_rhs_norm(current_state,barrier_size) < barrier_size)
+                {
+                    barrier_size = barrier_size * .8;
+                    mixed_barrier_monotone_mode=false;
+                    pcout << "monotone mode turned off" << std::endl;
+                }
+            }
+            else
+            {
+                const LoqoStatistics loqo = compute_loqo_statistics(current_state, mpi_communicator);
+                const double loqo_complimentarity_deviation = loqo.min/loqo.average;
+                const double deviation_ratio = .05 * (1-loqo_complimentarity_deviation)/loqo_complimentarity_deviation;
+                double loqo_multiplier;
+                if(deviation_ratio<2)
+                {
+                    loqo_multiplier = .1*std::pow(deviation_ratio,3);
+                }
+                else
+                {
+                    // Ratio at or above the threshold: raise the barrier once and switch to monotone mode.
+                    loqo_multiplier = 1/.8;
+                    mixed_barrier_monotone_mode = true;
+                    pcout << "monotone mode turned on" << std::endl;
+                }
+                // The multiplier is floored at .01.
+                if (loqo_multiplier<.01)
+                {
+                    barrier_size = .01 * loqo.average;
+                }
+                else
+                {
+                    barrier_size = loqo_multiplier * loqo.average;
+                }
+                // Never go below the configured minimum barrier value.
+                if (barrier_size < Input::min_barrier_size)
+                {
+                    barrier_size=Input::min_barrier_size;
+                }
+            }
+        }
+
+    }
+
+    template<int dim>
+    void
+    NonlinearWatchdog<dim>::perform_initial_setup()
+    {
+        // Scalar solver state first: the starting barrier value and, for the mixed scheme only, the mode flag.
+        barrier_size = Input::initial_barrier_size;
+        if (Input::barrier_reduction==BarrierOptions::mixed)
+            mixed_barrier_monotone_mode = false;
+
+        // Then build the KKT system; the same message is printed before and after setup_block_system().
+        kkt_system.create_triangulation();
+        kkt_system.setup_boundary_values();
+        pcout << "setup kkt system" << std::endl;
+        kkt_system.setup_block_system();
+        pcout << "setup kkt system" << std::endl;
+    }
+
+
+    template<int dim>
+    void
+    NonlinearWatchdog<dim>::nonlinear_step(LA::MPI::BlockVector &current_state, LA::MPI::BlockVector &current_step, const unsigned int max_uphill_steps, unsigned int &iteration_number)
+    {
+        // Runs watchdog cycles on current_state until check_convergence() succeeds or iteration_number reaches Input::max_steps; all four arguments except max_uphill_steps are updated in place.
+        bool converged = false;
+        // Each pass of this loop is one watchdog cycle, followed by output, a barrier update and a timer report.
+        while(!converged && iteration_number < Input::max_steps)
+        {
+            bool found_step = false;
+            // Snapshot of the iterate at the start of the cycle (the "watchdog state"); watchdog_step
+            // receives the first step computed in the loop below.
+            const LA::MPI::BlockVector watchdog_state = current_state;
+            LA::MPI::BlockVector watchdog_step;
+            // Take up to max_uphill_steps steps without backtracking; the first iterate the filter accepts ends the loop.
+            for(unsigned int k = 0; k<max_uphill_steps; k++)
+            {
+
+                // step returned by find_max_step() for the current iterate
+                current_step = find_max_step(current_state);
+
+                // remember the first step of the cycle; on the very first iteration also call calculate_initial_rhs_error()
+                if(k==0)
+                {
+                    watchdog_step = current_step;
+                    if (iteration_number == 0)
+                    {
+                        kkt_system.calculate_initial_rhs_error();
+                    }
+                }
+
+                // add the whole step returned by find_max_step(); rejected iterates are NOT rolled back, they accumulate
+                current_state=current_state+current_step;
+
+
+                // accept as soon as the new iterate passes the filter
+                if(markov_filter.check_filter(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size)))
+                {
+                    // Accept current state:
+                    // advance the iteration counter by the k+1 steps taken in this cycle
+                    iteration_number = iteration_number + k + 1;
+                    found_step = true;
+                    pcout << "found workable step after " << k+1 << " iterations"<<std::endl;
+                    // register the accepted iterate with the filter, then leave the for loop
+                    markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
+                    break;
+                    //end if
+                }
+                //end for
+            }
+            // no iterate of the cycle was accepted: fall back to scaled steps
+            if (!found_step)
+            {
+                // step from the iterate reached after max_uphill_steps unaccepted steps
+                current_step = find_max_step(current_state);
+                // "stretch state": what take_scaled_step() returns for that iterate and step.
+                // NOTE(review): older comments here described a merit-function descent test; the code only consults the filter.
+                const LA::MPI::BlockVector stretch_state = take_scaled_step(current_state, current_step);
+                // NOTE(review): this tests current_state, not stretch_state -- confirm which state was intended.
+                if(markov_filter.check_filter(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size)))
+                {
+                    current_state = stretch_state;
+                    iteration_number = iteration_number + max_uphill_steps + 1;
+                    markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
+                }
+                else
+                {
+                    // NOTE(review): identical condition to the enclosing if whose else-branch this is; if check_filter() is deterministic and side-effect free, the branch below cannot run -- TODO confirm intent.
+                    if (markov_filter.check_filter(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size)))
+                    {
+                        // restart from the watchdog snapshot with a scaled version of the cycle's first step
+                        current_state = take_scaled_step(watchdog_state, watchdog_step);
+                        //update iteration count
+                        iteration_number = iteration_number +  max_uphill_steps + 1;
+                        markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
+
+                    }
+                    else
+                    {
+                        // compute a new step from the stretch state
+                        const LA::MPI::BlockVector stretch_step = find_max_step(stretch_state);
+                        // and apply it, scaled, to the stretch state
+                        current_state = take_scaled_step(stretch_state, stretch_step);
+                        // counts one step more than the other branches, presumably for the extra find_max_step() call
+                        iteration_number = iteration_number + max_uphill_steps + 2;
+                        markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
+                    }
+                }
+            }
+            //output current state
+            kkt_system.output(current_state,iteration_number);
+            // convergence is tested with the barrier value of this cycle, before the barrier is updated
+            converged = check_convergence(current_state);
+            update_barrier(current_state);
+            markov_filter.update_barrier_value(barrier_size);
+            pcout << "barrier size is now " << barrier_size << " on iteration number " << iteration_number << std::endl;
+
+            // Close the running timer section, print the summary, and reopen "Total Time" (presumably the section closed is the "Total Time" one opened by the caller -- confirm).
+            overall_timer.leave_subsection();
+            overall_timer.print_summary();
+            overall_timer.enter_subsection("Total Time");
+
+        }//end while
+    }
+
+    ///Contains watchdog algorithm
+    template<int dim>
+    void
+    NonlinearWatchdog<dim>::run() {
+        // Open the "Total Time" timer section before any work is done.
+        overall_timer.enter_subsection("Total Time");
+        perform_initial_setup();
+
+        const unsigned int uphill_budget = 8;   // passed to nonlinear_step() as max_uphill_steps
+        unsigned int steps_taken = 0;
+        LA::MPI::BlockVector iterate = kkt_system.get_initial_state();
+        LA::MPI::BlockVector latest_step;
+
+        // Seed the filter with the initial iterate's objective, barrier distance and feasibility.
+        markov_filter.setup(kkt_system.calculate_objective_value(iterate), kkt_system.calculate_barrier_distance(iterate), kkt_system.calculate_feasibility(iterate,barrier_size), barrier_size);
+
+        // Keep stepping while the barrier is above its minimum or the iterate is unconverged, within the step limit.
+        while (true)
+        {
+            const bool unfinished = (barrier_size > Input::min_barrier_size) || !check_convergence(iterate);
+            if (!(unfinished && steps_taken < Input::max_steps))
+                break;
+            nonlinear_step(iterate, latest_step, uphill_budget, steps_taken);
+        }
+    }   // (STL export via kkt_system.output_stl() is currently disabled)
+
+} // namespace SAND
+
+
+template class SAND::NonlinearWatchdog<2>;
+template class SAND::NonlinearWatchdog<3>;
diff --git a/source/watchdog_main.cc b/source/watchdog_main.cc
deleted file mode 100644
index e2134cd..0000000
--- a/source/watchdog_main.cc
+++ /dev/null
@@ -1,442 +0,0 @@
-#include <deal.II/lac/block_vector.h>
-#include <deal.II/lac/packaged_operation.h>
-#include <deal.II/grid/tria.h>
-#include <deal.II/grid/grid_refinement.h>
-#include <iostream>
-#include "../include/markov_filter.h"
-#include "../include/kkt_system.h"
-#include "../include/input_information.h"
-#include <deal.II/lac/generic_linear_algebra.h>
-
-///Above are fairly normal files to include.  I also use the sparse direct package, which requiresBLAS/LAPACK
-/// to  perform  a  direct  solve  while  I  work  on  a  fast  iterative  solver  for  this problem.
-/// Below is the main class for this problem.
-
-namespace SAND {
-    namespace LA
-    {
-        using namespace dealii::LinearAlgebraPETSc;
-    }
-
-
-    using namespace dealii;
-
-    template<int dim>
-    class SANDTopOpt {
-    public:
-        SANDTopOpt();
-
-        void
-        run();
-
-    private:
-
-        std::pair<double,double>
-        calculate_max_step_size(const BlockVector<double> &state, const BlockVector<double> &step) const;
-
-        const BlockVector<double>
-        find_max_step(const BlockVector<double> &state);
-
-        BlockVector<double>
-        take_scaled_step(const BlockVector<double> &state,const BlockVector<double> &max_step) const;
-
-        bool
-        check_convergence(const BlockVector<double> &state) const;
-
-        void
-        update_barrier(BlockVector<double> &current_state);
-
-        KktSystem<dim> kkt_system;
-        MarkovFilter markov_filter;
-        double barrier_size;
-        TimerOutput overall_timer;
-        bool mixed_barrier_monotone_mode;
-    };
-
-    template<int dim>
-    SANDTopOpt<dim>::SANDTopOpt()
-            :overall_timer(std::cout, TimerOutput::never, TimerOutput::wall_times)
-    {
-    }
-
-    ///A binary search figures out the maximum step that meets the dual feasibility - that s>0 and z>0. The fraction to boundary increases as the barrier size decreases.
-
-    template<int dim>
-    std::pair<double,double>
-    SANDTopOpt<dim>::calculate_max_step_size(const BlockVector<double> &state, const BlockVector<double> &step) const {
-
-        double step_size_s_low = 0;
-        double step_size_z_low = 0;
-        double step_size_s_high = 1;
-        double step_size_z_high = 1;
-        double step_size_s, step_size_z;
-
-
-        for (unsigned int k = 0; k < 50; k++)
-        {
-
-            step_size_s = (step_size_s_low + step_size_s_high) / 2;
-            step_size_z = (step_size_z_low + step_size_z_high) / 2;
-            const BlockVector<double> state_test_s =
-                    (Input::fraction_to_boundary * state) + (step_size_s * step);
-
-            const BlockVector<double> state_test_z =
-                    (Input::fraction_to_boundary * state) + (step_size_z * step);
-
-            const bool accept_s = (state_test_s.block(SolutionBlocks::density_lower_slack).is_non_negative())
-                                  && (state_test_s.block(SolutionBlocks::density_upper_slack).is_non_negative());
-            const bool accept_z = (state_test_z.block(SolutionBlocks::density_lower_slack_multiplier).is_non_negative())
-                                  && (state_test_z.block(SolutionBlocks::density_upper_slack_multiplier).is_non_negative());
-
-            if (accept_s) {
-                step_size_s_low = step_size_s;
-            } else {
-                step_size_s_high = step_size_s;
-            }
-            if (accept_z) {
-                step_size_z_low = step_size_z;
-            } else {
-                step_size_z_high = step_size_z;
-            }
-        }
-        return {step_size_s_low, step_size_z_low};
-    }
-
-///Creates a rhs vector that we can use to look at the magnitude of the KKT conditions.  This is then used for testing the convergence before shrinking barrier size, as well as in the calculation of the l1 merit.
-
-    template<int dim>
-    const BlockVector<double>
-    SANDTopOpt<dim>::find_max_step(const BlockVector<double> &state)
-    {
-        kkt_system.assemble_block_system(state, barrier_size);
-        const BlockVector<double> step = kkt_system.solve(state,barrier_size);
-
-        const auto max_step_sizes= calculate_max_step_size(state,step);
-        const double step_size_s = max_step_sizes.first;
-        const double step_size_z = max_step_sizes.second;
-        BlockVector<double> max_step(10);
-
-        max_step.block(SolutionBlocks::density) = step_size_s * step.block(SolutionBlocks::density);
-        max_step.block(SolutionBlocks::displacement) = step_size_s * step.block(SolutionBlocks::displacement);
-        max_step.block(SolutionBlocks::unfiltered_density) = step_size_s * step.block(SolutionBlocks::unfiltered_density);
-        max_step.block(SolutionBlocks::density_lower_slack) = step_size_s * step.block(SolutionBlocks::density_lower_slack);
-        max_step.block(SolutionBlocks::density_upper_slack) = step_size_s * step.block(SolutionBlocks::density_upper_slack);
-        max_step.block(SolutionBlocks::unfiltered_density_multiplier) = step_size_z * step.block(SolutionBlocks::unfiltered_density_multiplier);
-        max_step.block(SolutionBlocks::density_lower_slack_multiplier) = step_size_z * step.block(SolutionBlocks::density_lower_slack_multiplier);
-        max_step.block(SolutionBlocks::density_upper_slack_multiplier) = step_size_z * step.block(SolutionBlocks::density_upper_slack_multiplier);
-        max_step.block(SolutionBlocks::displacement_multiplier) = step_size_z * step.block(SolutionBlocks::displacement_multiplier);
-        max_step.block(SolutionBlocks::total_volume_multiplier) = step_size_z * step.block(SolutionBlocks::total_volume_multiplier);
-
-        return max_step;
-    }
-
-    ///This is my back-stepping algorithm for a line search - keeps shrinking step size until it finds a step where the merit is decreased.
-
-    template<int dim>
-    BlockVector<double>
-    SANDTopOpt<dim>::take_scaled_step(const BlockVector<double> &state,const BlockVector<double> &max_step) const
-    {
-        double step_size = 1;
-            for(unsigned int k = 0; k<10; k++)
-            {
-                if(markov_filter.check_filter(kkt_system.calculate_objective_value(state), kkt_system.calculate_barrier_distance(state), kkt_system.calculate_feasibility(state,barrier_size)))
-                {
-                    break;
-                }
-                else
-                {
-                    step_size = step_size/2;
-                }
-            }
-        return state + (step_size * max_step);
-
-    }
-
-
-
-    ///Checks to see if the KKT conditions are sufficiently met to lower barrier size.
-    template<int dim>
-    bool
-    SANDTopOpt<dim>::check_convergence(const BlockVector<double> &state) const
-    {
-              if (kkt_system.calculate_convergence(state) < Input::required_norm)
-              {
-                  return true;
-              }
-              else
-              {
-                  return false;
-              }
-    }
-
-    template<int dim>
-    void
-    SANDTopOpt<dim>::update_barrier(BlockVector<double> &current_state)
-    {
-        if (Input::barrier_reduction == BarrierOptions::loqo)
-        {
-            double loqo_min = 1000;
-            double loqo_average;
-            unsigned int vect_size = current_state.block(SolutionBlocks::density_lower_slack).size();
-            for(unsigned int k = 0; k < vect_size; k++)
-            {
-                if (current_state.block(SolutionBlocks::density_lower_slack)[k]*current_state.block(SolutionBlocks::density_lower_slack_multiplier)[k] < loqo_min)
-                {
-                    loqo_min = current_state.block(SolutionBlocks::density_lower_slack)[k]*current_state.block(SolutionBlocks::density_lower_slack_multiplier)[k];
-                }
-                if (current_state.block(SolutionBlocks::density_upper_slack)[k]*current_state.block(SolutionBlocks::density_upper_slack_multiplier)[k] < loqo_min)
-                {
-                    loqo_min = current_state.block(SolutionBlocks::density_upper_slack)[k]*current_state.block(SolutionBlocks::density_upper_slack_multiplier)[k];
-                }
-            }
-            loqo_average = (current_state.block(SolutionBlocks::density_lower_slack)*current_state.block(SolutionBlocks::density_lower_slack_multiplier)
-                            + current_state.block(SolutionBlocks::density_upper_slack)*current_state.block(SolutionBlocks::density_upper_slack_multiplier)
-                           )/(2*vect_size);
-            double loqo_complimentarity_deviation = loqo_min/loqo_average;
-            double loqo_multiplier;
-            if((.05 * (1-loqo_complimentarity_deviation)/loqo_complimentarity_deviation)<2)
-            {
-                loqo_multiplier = .1*std::pow((.05 * (1-loqo_complimentarity_deviation)/loqo_complimentarity_deviation),3);
-            }
-            else
-            {
-                loqo_multiplier = .8;
-            }
-            if (loqo_multiplier< 0)
-            {
-                barrier_size = .2 * loqo_average;
-            }
-            else
-            {
-                barrier_size = loqo_multiplier * loqo_average;
-            }
-            if (barrier_size < Input::min_barrier_size)
-            {
-                barrier_size=Input::min_barrier_size;
-            }
-        }
-
-        if (Input::barrier_reduction == BarrierOptions::monotone)
-        {
-            if (kkt_system.calculate_rhs_norm(current_state,barrier_size) < barrier_size * 1e-3)
-            {
-                barrier_size = barrier_size * .7;
-            }
-            if (barrier_size < Input::min_barrier_size)
-            {
-                barrier_size=Input::min_barrier_size;
-            }
-        }
-
-        if (Input::barrier_reduction == BarrierOptions::mixed)
-        {
-            if (mixed_barrier_monotone_mode)
-            {
-                if (kkt_system.calculate_rhs_norm(current_state,barrier_size) < barrier_size)
-                {
-                    barrier_size = barrier_size * .8;
-                    mixed_barrier_monotone_mode=false;
-                    std::cout << "monotone mode turned off" << std::endl;
-                }
-            }
-            else
-            {
-                double loqo_min = 1000;
-                double loqo_average;
-                unsigned int vect_size = current_state.block(SolutionBlocks::density_lower_slack).size();
-                for(unsigned int k = 0; k < vect_size; k++)
-                {
-                    if (current_state.block(SolutionBlocks::density_lower_slack)[k]*current_state.block(SolutionBlocks::density_lower_slack_multiplier)[k] < loqo_min)
-                    {
-                        loqo_min = current_state.block(SolutionBlocks::density_lower_slack)[k]*current_state.block(SolutionBlocks::density_lower_slack_multiplier)[k];
-                    }
-                    if (current_state.block(SolutionBlocks::density_upper_slack)[k]*current_state.block(SolutionBlocks::density_upper_slack_multiplier)[k] < loqo_min)
-                    {
-                        loqo_min = current_state.block(SolutionBlocks::density_upper_slack)[k]*current_state.block(SolutionBlocks::density_upper_slack_multiplier)[k];
-                    }
-                }
-                loqo_average = (current_state.block(SolutionBlocks::density_lower_slack)*current_state.block(SolutionBlocks::density_lower_slack_multiplier)
-                                + current_state.block(SolutionBlocks::density_upper_slack)*current_state.block(SolutionBlocks::density_upper_slack_multiplier)
-                               )/(2*vect_size);
-                double loqo_complimentarity_deviation = loqo_min/loqo_average;
-                double loqo_multiplier;
-                if((.05 * (1-loqo_complimentarity_deviation)/loqo_complimentarity_deviation)<2)
-                {
-                    loqo_multiplier = .1*std::pow((.05 * (1-loqo_complimentarity_deviation)/loqo_complimentarity_deviation),3);
-                }
-                else
-                {
-                    loqo_multiplier = 1/.8;
-                    mixed_barrier_monotone_mode = true;
-                    std::cout << "monotone mode turned on" << std::endl;
-                }
-                if (loqo_multiplier<.01)
-                {
-                    barrier_size = .01 * loqo_average;
-                }
-                else
-                {
-                    barrier_size = loqo_multiplier * loqo_average;
-                }
-                if (barrier_size < Input::min_barrier_size)
-                {
-                    barrier_size=Input::min_barrier_size;
-                }
-            }
-        }
-
-    }
-
-    ///Contains watchdog algorithm
-    template<int dim>
-    void
-    SANDTopOpt<dim>::run() {
-        overall_timer.enter_subsection("Total Time");
-        barrier_size = Input::initial_barrier_size;
-        kkt_system.create_triangulation();
-        kkt_system.setup_boundary_values();
-        kkt_system.setup_filter_matrix();
-        kkt_system.setup_block_system();
-
-        if (Input::barrier_reduction==BarrierOptions::mixed)
-        {
-            mixed_barrier_monotone_mode = false;
-        }
-
-        const unsigned int max_uphill_steps = 8;
-        unsigned int iteration_number = 0;
-        //while barrier value above minimal value and total iterations under some value
-        BlockVector<double> current_state = kkt_system.get_initial_state();
-        BlockVector<double> current_step;
-        markov_filter.setup(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size), barrier_size);
-
-        while((barrier_size > Input::min_barrier_size || !check_convergence(current_state)) && iteration_number < Input::max_steps)
-        {
-            bool converged = false;
-            //while not converged
-            while(!converged && iteration_number < Input::max_steps)
-            {
-                bool found_step = false;
-                //save current state as watchdog state
-
-                const BlockVector<double> watchdog_state = current_state;
-                BlockVector<double> watchdog_step;
-                //for 1-8 steps - this is the number of steps away we will let it go uphill before demanding downhill
-                for(unsigned int k = 0; k<max_uphill_steps; k++)
-                {
-
-                    //compute step from current state  - function from kktSystem
-                    current_step = find_max_step(current_state);
-
-                    // save the first of these as the watchdog step
-                    if(k==0)
-                    {
-                        watchdog_step = current_step;
-                        if (iteration_number == 0)
-                        {
-                            kkt_system.calculate_initial_rhs_error();
-                        }
-                    }
-                    //apply full step to current state
-                    current_state=current_state+current_step;
-
-
-                    //if new state passes filter
-                    if(markov_filter.check_filter(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size)))
-                    {
-                        //Accept current state
-                        //iterate number of steps by number of steps taken in this process
-                        iteration_number = iteration_number + k + 1;
-                        found_step = true;
-                        std::cout << "found workable step after " << k+1 << " iterations"<<std::endl;
-                        //break for loop
-                        markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
-                        break;
-                        //end if
-                    }
-                    //end for
-                }
-                //if found step = false
-                if (!found_step)
-                {
-                    //Compute step from current state
-                    current_step = find_max_step(current_state);
-                    //find step length so that merit of stretch state - sized step from current length - is less than merit of (current state + descent requirement * linear derivative of merit of current state in direction of current step)
-                    //update stretch state with found step length
-                    const BlockVector<double> stretch_state = take_scaled_step(current_state, current_step);
-                    //if current merit is less than watchdog merit, or if stretch merit is less than earlier goal merit
-                    if(markov_filter.check_filter(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size)))
-                    {
-                        current_state = stretch_state;
-                        iteration_number = iteration_number + max_uphill_steps + 1;
-                        markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
-                    }
-                    else
-                    {
-                        //if merit of stretch state is bigger than watchdog merit
-                        if (markov_filter.check_filter(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size)))
-                        {
-                            //find step length from watchdog state that meets descent requirement
-                            current_state = take_scaled_step(watchdog_state, watchdog_step);
-                            //update iteration count
-                            iteration_number = iteration_number +  max_uphill_steps + 1;
-                            markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
-
-                        }
-                        else
-                        {
-                            //calculate direction from stretch state
-                            const BlockVector<double> stretch_step = find_max_step(stretch_state);
-                            //find step length from stretch state that meets descent requirement
-                            current_state = take_scaled_step(stretch_state, stretch_step);
-                            //update iteration count
-                            iteration_number = iteration_number + max_uphill_steps + 2;
-                            markov_filter.add_point(kkt_system.calculate_objective_value(current_state), kkt_system.calculate_barrier_distance(current_state), kkt_system.calculate_feasibility(current_state,barrier_size));
-                        }
-                    }
-                }
-                //output current state
-                kkt_system.output(current_state,iteration_number);
-
-                converged = check_convergence(current_state);
-                update_barrier(current_state);
-                markov_filter.update_barrier_value(barrier_size);
-                std::cout << "barrier size is now " << barrier_size << " on iteration number " << iteration_number << std::endl;
-
-                overall_timer.leave_subsection();
-                overall_timer.print_summary();
-                overall_timer.enter_subsection("Total Time");
-                //end while
-            }
-
-        }
-        kkt_system.output_stl(current_state);
-    }
-
-} // namespace SAND
-
-int
-main() {
-    try {
-        SAND::SANDTopOpt<SAND::Input::dim> elastic_problem_2d;
-        elastic_problem_2d.run();
-    }
-    catch (std::exception &exc) {
-        std::cerr << std::endl << std::endl
-                  << "----------------------------------------------------" << std::endl;
-        std::cerr << "Exception on processing: " << std::endl << exc.what()
-                  << std::endl << "Aborting!" << std::endl
-                  << "----------------------------------------------------" << std::endl;
-
-        return 1;
-    }
-    catch (...) {
-        std::cerr << std::endl << std::endl
-                  << "----------------------------------------------------" << std::endl;
-        std::cerr << "Unknown exception!" << std::endl << "Aborting!" << std::endl
-                  << "----------------------------------------------------" << std::endl;
-        return 1;
-    }
-
-    return 0;
-}