17 files changed, 424 insertions, 80 deletions
diff --git a/gnuradio-core/src/lib/general/CMakeLists.txt b/gnuradio-core/src/lib/general/CMakeLists.txt
index 399e07599..b671c963b 100644
--- a/gnuradio-core/src/lib/general/CMakeLists.txt
+++ b/gnuradio-core/src/lib/general/CMakeLists.txt
@@ -292,6 +292,7 @@ set(gr_core_general_triple_threats
     gr_annotator_raw
     gr_burst_tagger
     gr_correlate_access_code_tag_bb
+    gr_tag_debug
 )
 
 foreach(file_tt ${gr_core_general_triple_threats})
diff --git a/gnuradio-core/src/lib/general/general.i b/gnuradio-core/src/lib/general/general.i
index fe2cbdb82..c0ce65527 100644
--- a/gnuradio-core/src/lib/general/general.i
+++ b/gnuradio-core/src/lib/general/general.i
@@ -141,6 +141,7 @@
 #include <gr_correlate_access_code_tag_bb.h>
 #include <gr_add_ff.h>
 #include <gr_vector_map.h>
+#include <gr_tag_debug.h>
 %}
 
 %include "gri_control_loop.i"
@@ -262,3 +263,4 @@
 %include "gr_correlate_access_code_tag_bb.i"
 %include "gr_add_ff.i"
 %include "gr_vector_map.i"
+%include "gr_tag_debug.i"
diff --git a/gnuradio-core/src/lib/general/gr_tag_debug.cc b/gnuradio-core/src/lib/general/gr_tag_debug.cc
new file mode 100644
index 000000000..c4031f438
--- /dev/null
+++ b/gnuradio-core/src/lib/general/gr_tag_debug.cc
@@ -0,0 +1,100 @@
+/* -*- c++ -*- */
+/*
+ * Copyright 2012 Free Software Foundation, Inc.
+ *
+ * This file is part of GNU Radio
+ *
+ * GNU Radio is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 3, or (at your option)
+ * any later version.
+ *
+ * GNU Radio is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with GNU Radio; see the file COPYING.  If not, write to
+ * the Free Software Foundation, Inc., 51 Franklin Street,
+ * Boston, MA 02110-1301, USA.
+ */
+
+#ifdef HAVE_CONFIG_H
+#include "config.h"
+#endif
+
+#include <gr_tag_debug.h>
+#include <gr_io_signature.h>
+#include <iostream>
+#include <iomanip>
+
+gr_tag_debug_sptr
+gr_make_tag_debug(size_t sizeof_stream_item, const std::string &name)
+{
+  // Wrap the new block in a shared pointer; the constructor itself is private.
+  return gnuradio::get_initial_sptr(new gr_tag_debug(sizeof_stream_item, name));
+}
+
+// Sync sink: inputs carry items of sizeof_stream_item, no outputs; display starts on.
+gr_tag_debug::gr_tag_debug(size_t sizeof_stream_item, const std::string &name)
+  : gr_sync_block("tag_debug",
+		  gr_make_io_signature(1, -1, sizeof_stream_item),
+		  gr_make_io_signature(0, 0, 0)),
+    d_name(name), d_display(true)
+{}
+
+std::vector<gr_tag_t>
+gr_tag_debug::current_tags()
+{
+  gruel::scoped_lock guard(d_mutex);     // work() rewrites d_tags under this mutex
+  return std::vector<gr_tag_t>(d_tags);  // hand back a copy, never a reference
+}
+
+void
+gr_tag_debug::set_display(bool d)
+{
+  gruel::scoped_lock guard(d_mutex);  // work() reads d_display under this mutex
+  d_display = d;                      // true: work() prints tags; false: it stays quiet
+}
+
+// Collects the tags on every input for this call into d_tags and, when display
+// is on, prints them to stdout. Stream items are ignored; returns noutput_items.
+int
+gr_tag_debug::work(int noutput_items,
+		   gr_vector_const_void_star &input_items,
+		   gr_vector_void_star &output_items)
+{
+  gruel::scoped_lock l(d_mutex);
+  const char *const rule =
+    "----------------------------------------------------------------------";
+  if(d_display)
+    std::cout << std::endl << rule << std::endl << "Tag Debug: " << d_name << std::endl;
+
+  // d_tags accumulates the tags of all ports; each port is fetched through a
+  // scratch vector so the fetch cannot disturb what is already stored.
+  d_tags.clear();
+  std::vector<gr_tag_t> port_tags;
+  for(size_t i = 0; i < input_items.size(); i++) {
+    const uint64_t abs_N = nitems_read(i);
+    const uint64_t end_N = abs_N + (uint64_t)(noutput_items);
+    port_tags.clear();
+    get_tags_in_range(port_tags, i, abs_N, end_N);
+    d_tags.insert(d_tags.end(), port_tags.begin(), port_tags.end());
+    if(!d_display) continue;  // storing is unconditional, printing is optional
+    std::cout << "Input Stream: " << i << std::endl;
+    for(size_t t = 0; t < port_tags.size(); t++) {
+      const gr_tag_t &tag = port_tags[t];
+      // srcid need not be a symbol; pmt_symbol_to_string() would throw on it.
+      std::cout << std::setw(10) << "Offset: " << tag.offset
+                << std::setw(10) << "Source: "
+                << (pmt::pmt_is_symbol(tag.srcid) ? pmt::pmt_symbol_to_string(tag.srcid) : "n/a")
+                << std::setw(10) << "Key: " << pmt::pmt_symbol_to_string(tag.key)
+                << std::setw(10) << "Value: ";
+      pmt::pmt_print(tag.value);
+    }
+  }
+
+  if(d_display)
+    std::cout << rule << std::endl;
+  return noutput_items;
+}
diff --git a/gnuradio-core/src/lib/general/gr_tag_debug.h b/gnuradio-core/src/lib/general/gr_tag_debug.h
new file mode 100644
index 000000000..57578884a
--- /dev/null
+++ b/gnuradio-core/src/lib/general/gr_tag_debug.h
@@ -0,0 +1,85 @@
+/* -*- c++ -*- */
+/*
+ * Copyright 2012 Free Software Foundation, Inc.
+ *
+ * This file is part of GNU Radio
+ *
+ * GNU Radio is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 3, or (at your option)
+ * any later version.
+ *
+ * GNU Radio is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with GNU Radio; see the file COPYING.  If not, write to
+ * the Free Software Foundation, Inc., 51 Franklin Street,
+ * Boston, MA 02110-1301, USA.
+ */
+
+#ifndef INCLUDED_GR_TAG_DEBUG_H
+#define INCLUDED_GR_TAG_DEBUG_H
+
+#include <gr_core_api.h>
+#include <gr_sync_block.h>
+#include <gruel/thread.h>
+#include <stddef.h>
+
+class gr_tag_debug;
+typedef boost::shared_ptr<gr_tag_debug> gr_tag_debug_sptr;
+//! Factory for gr_tag_debug; \p name labels the output printed by this instance.
+GR_CORE_API gr_tag_debug_sptr
+gr_make_tag_debug(size_t sizeof_stream_item, const std::string &name);
+
+/*!
+ * \brief Bit bucket that prints out any tag received.
+ * \ingroup sink_blk
+ *
+ * This block collects all tags sent to it on all input ports and
+ * displays them to stdout in a formatted way. The \p name parameter
+ * is used to identify which debug sink generated the tag, so when
+ * connecting a block to this debug sink, an appropriate name is
+ * something that identifies the input block.
+ *
+ * This block otherwise acts as a NULL sink in that items from the
+ * input stream are ignored. It is designed to be able to attach to
+ * any block and watch all tags streaming out of that block for
+ * debugging purposes.
+ *
+ * The tags from the last call to this work function are stored and
+ * can be retrieved using the function 'current_tags'.
+ */
+class GR_CORE_API gr_tag_debug : public gr_sync_block
+{
+ private:
+  friend GR_CORE_API gr_tag_debug_sptr  // the factory is the only path to the private ctor
+    gr_make_tag_debug(size_t sizeof_stream_item, const std::string &name);
+  gr_tag_debug(size_t sizeof_stream_item, const std::string &name);
+
+  std::string d_name;                          // label printed after "Tag Debug: "
+  std::vector<gr_tag_t> d_tags;                // tags stored by the most recent work()
+  std::vector<gr_tag_t>::iterator d_tags_itr;  // scratch iterator over d_tags
+  bool d_display;                              // print tags to stdout when true
+  gruel::mutex d_mutex;                        // guards d_tags and d_display
+
+ public:
+  /*!
+   * \brief Returns a copy of the tags stored by the most recent call
+   * to work(); the copy is taken while holding the block's mutex.
+   */
+  std::vector<gr_tag_t> current_tags();
+
+  /*!
+   * \brief Turn printing of tags to stdout on (true) or off (false).
+   */
+  void set_display(bool d);
+  //! Stores the tags in range for this call and prints them if display is on.
+  int work(int noutput_items,
+	   gr_vector_const_void_star &input_items,
+	   gr_vector_void_star &output_items);
+};
+
+#endif /* INCLUDED_GR_TAG_DEBUG_H */
diff --git a/gnuradio-core/src/lib/general/gr_tag_debug.i b/gnuradio-core/src/lib/general/gr_tag_debug.i
new file mode 100644
index 000000000..3af1bdcfe
--- /dev/null
+++ b/gnuradio-core/src/lib/general/gr_tag_debug.i
@@ -0,0 +1,35 @@
+/* -*- c++ -*- */
+/*
+ * Copyright 2012 Free Software Foundation, Inc.
+ *
+ * This file is part of GNU Radio
+ *
+ * GNU Radio is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU General Public License as published by
+ * the Free Software Foundation; either version 3, or (at your option)
+ * any later version.
+ *
+ * GNU Radio is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public License
+ * along with GNU Radio; see the file COPYING.  If not, write to
+ * the Free Software Foundation, Inc., 51 Franklin Street,
+ * Boston, MA 02110-1301, USA.
+ */
+
+GR_SWIG_BLOCK_MAGIC(gr,tag_debug)
+// NOTE(review): gr_tags.i presumably supplies the gr_tag_t wrapping used below - confirm.
+%include <gr_tags.i>
+
+gr_tag_debug_sptr
+gr_make_tag_debug(size_t sizeof_stream_item, const std::string &name);
+// Only the methods exposed through SWIG are declared here; work() is left out.
+class gr_tag_debug : public gr_sync_block
+{
+public:
+  std::vector<gr_tag_t> current_tags();
+  void set_display(bool d);
+};
diff --git a/gnuradio-core/src/python/gnuradio/gr/qa_tag_debug.py b/gnuradio-core/src/python/gnuradio/gr/qa_tag_debug.py
new file mode 100755
index 000000000..81babca04
--- /dev/null
+++ b/gnuradio-core/src/python/gnuradio/gr/qa_tag_debug.py
@@ -0,0 +1,43 @@
+#!/usr/bin/env python
+#
+# Copyright 2012 Free Software Foundation, Inc.
+#
+# This file is part of GNU Radio
+#
+# GNU Radio is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 3, or (at your option)
+# any later version.
+#
+# GNU Radio is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with GNU Radio; see the file COPYING.  If not, write to
+# the Free Software Foundation, Inc., 51 Franklin Street,
+# Boston, MA 02110-1301, USA.
+#
+
+from gnuradio import gr, gr_unittest
+
+class test_tag_debug(gr_unittest.TestCase):
+    """Smoke test for gr.tag_debug: the flowgraph only has to run cleanly."""
+    def setUp(self):
+        self.tb = gr.top_block()
+
+    def tearDown(self):
+        self.tb = None
+
+    def test_001(self):
+        # Smoke test: run ten ints into the sink; passing means nothing raised.
+        samples = tuple(range(1, 11))
+        source = gr.vector_source_i(samples)
+        sink = gr.tag_debug(gr.sizeof_int, "tag QA")
+        self.tb.connect(source, sink)
+        self.tb.run()
+        sink.current_tags()
+
+if __name__ == '__main__':  # only when executed as a script, not on import
+    gr_unittest.run(test_tag_debug, "test_tag_debug.xml")
diff --git a/gr-filter/include/filter/fir_filter_with_buffer.h b/gr-filter/include/filter/fir_filter_with_buffer.h
index 8b5d9e064..007eae3fa 100644
--- a/gr-filter/include/filter/fir_filter_with_buffer.h
+++ b/gr-filter/include/filter/fir_filter_with_buffer.h
@@ -40,6 +40,7 @@ namespace gr {
       private:
 	std::vector<float> d_taps;
 	unsigned int  d_ntaps;
+	float        *d_buffer_ptr;
 	float        *d_buffer;
 	unsigned int  d_idx;
 	float       **d_aligned_taps;
@@ -136,6 +137,7 @@ namespace gr {
       private:
 	std::vector<gr_complex> d_taps;
 	unsigned int  d_ntaps;
+	gr_complex   *d_buffer_ptr;
 	gr_complex   *d_buffer;
 	unsigned int  d_idx;
 	gr_complex  **d_aligned_taps;
@@ -232,6 +234,7 @@ namespace gr {
       private:
 	std::vector<float> d_taps;
 	unsigned int  d_ntaps;
+	gr_complex   *d_buffer_ptr;
 	gr_complex   *d_buffer;
 	unsigned int  d_idx;
 	float       **d_aligned_taps;
diff --git a/gr-filter/lib/fir_filter_with_buffer.cc b/gr-filter/lib/fir_filter_with_buffer.cc
index 105214087..7a35a9225 100644
--- a/gr-filter/lib/fir_filter_with_buffer.cc
+++ b/gr-filter/lib/fir_filter_with_buffer.cc
@@ -40,7 +40,7 @@ namespace gr {
 	d_align = volk_get_alignment();
 	d_naligned = d_align / sizeof(float);
 
-	d_buffer = NULL;
+	d_buffer_ptr = NULL;
 	d_aligned_taps = NULL;
 	set_taps(taps);
 
@@ -50,9 +50,9 @@ namespace gr {
 
       fir_filter_with_buffer_fff::~fir_filter_with_buffer_fff()
       {
-	if(d_buffer != NULL) {
-	  fft::free(d_buffer);
-	  d_buffer = NULL;
+	if(d_buffer_ptr != NULL) {
+	  fft::free(d_buffer_ptr);
+	  d_buffer_ptr = NULL;
 	}
 	
 	// Free aligned taps
@@ -71,9 +71,9 @@ namespace gr {
       void
       fir_filter_with_buffer_fff::set_taps(const std::vector<float> &taps)
       {
-	if(d_buffer != NULL) {
-	  fft::free(d_buffer);
-	  d_buffer = NULL;
+	if(d_buffer_ptr != NULL) {
+	  fft::free(d_buffer_ptr);
+	  d_buffer_ptr = NULL;
 	}
 
 	// Free the taps if already allocated
@@ -89,8 +89,15 @@ namespace gr {
 	d_taps = taps;
 	std::reverse(d_taps.begin(), d_taps.end());
 
-	d_buffer = fft::malloc_float(2*d_ntaps);
-	memset(d_buffer, 0, 2*d_ntaps*sizeof(float));
+	// We allocate enough to be able to look back and forth
+	// d_naligned beyond the buffer boundaries and make sure these
+	// are zeroed out (or they may be nan, which will cause
+	// problems). We then set d_buffer to the position in the
+	// d_buffer_ptr such that we only touch the internally
+	// allocated space.
+	d_buffer_ptr = fft::malloc_float(2*(d_ntaps + d_naligned));
+	memset(d_buffer_ptr, 0, 2*(d_ntaps + d_naligned)*sizeof(float));
+	d_buffer = d_buffer_ptr + d_naligned;
 
 	// Allocate aligned taps
 	d_aligned_taps = (float**)malloc(d_naligned*sizeof(float**));
@@ -186,7 +193,7 @@ namespace gr {
 	d_align = volk_get_alignment();
 	d_naligned = d_align / sizeof(gr_complex);
 
-	d_buffer = NULL;
+	d_buffer_ptr = NULL;
 	d_aligned_taps = NULL;
 	set_taps(taps);
 
@@ -196,9 +203,9 @@ namespace gr {
 
       fir_filter_with_buffer_ccc::~fir_filter_with_buffer_ccc()
       {
-	if(d_buffer != NULL) {
-	  fft::free(d_buffer);
-	  d_buffer = NULL;
+	if(d_buffer_ptr != NULL) {
+	  fft::free(d_buffer_ptr);
+	  d_buffer_ptr = NULL;
 	}
 	
 	// Free aligned taps
@@ -217,9 +224,9 @@ namespace gr {
       void
       fir_filter_with_buffer_ccc::set_taps(const std::vector<gr_complex> &taps)
       {
-	if(d_buffer != NULL) {
-	  fft::free(d_buffer);
-	  d_buffer = NULL;
+	if(d_buffer_ptr != NULL) {
+	  fft::free(d_buffer_ptr);
+	  d_buffer_ptr = NULL;
 	}
 
 	// Free the taps if already allocated
@@ -235,8 +242,15 @@ namespace gr {
 	d_taps = taps;
 	std::reverse(d_taps.begin(), d_taps.end());
 
-	d_buffer = fft::malloc_complex(2*d_ntaps);
-	memset(d_buffer, 0, 2*d_ntaps*sizeof(gr_complex));
+	// We allocate enough to be able to look back and forth
+	// d_naligned beyond the buffer boundaries and make sure these
+	// are zeroed out (or they may be nan, which will cause
+	// problems). We then set d_buffer to the position in the
+	// d_buffer_ptr such that we only touch the internally
+	// allocated space.
+	d_buffer_ptr = fft::malloc_complex(2*(d_ntaps + d_naligned));
+	memset(d_buffer_ptr, 0, 2*(d_ntaps + d_naligned)*sizeof(gr_complex));
+	d_buffer = d_buffer_ptr + d_naligned;
 
 	// Allocate aligned taps
 	d_aligned_taps = (gr_complex**)malloc(d_naligned*sizeof(gr_complex**));
@@ -332,7 +346,7 @@ namespace gr {
 	d_align = volk_get_alignment();
 	d_naligned = d_align / sizeof(gr_complex);
 
-	d_buffer = NULL;
+	d_buffer_ptr = NULL;
 	d_aligned_taps = NULL;
 	set_taps(taps);
 
@@ -342,9 +356,9 @@ namespace gr {
 
       fir_filter_with_buffer_ccf::~fir_filter_with_buffer_ccf()
       {
-	if(d_buffer != NULL) {
-	  fft::free(d_buffer);
-	  d_buffer = NULL;
+	if(d_buffer_ptr != NULL) {
+	  fft::free(d_buffer_ptr);
+	  d_buffer_ptr = NULL;
 	}
 	
 	// Free aligned taps
@@ -363,9 +377,9 @@ namespace gr {
       void
       fir_filter_with_buffer_ccf::set_taps(const std::vector<float> &taps)
       {
-	if(d_buffer != NULL) {
-	  fft::free(d_buffer);
-	  d_buffer = NULL;
+	if(d_buffer_ptr != NULL) {
+	  fft::free(d_buffer_ptr);
+	  d_buffer_ptr = NULL;
 	}
 
 	// Free the taps if already allocated
@@ -381,8 +395,15 @@ namespace gr {
 	d_taps = taps;
 	std::reverse(d_taps.begin(), d_taps.end());
 
-	d_buffer = fft::malloc_complex(2*d_ntaps);
-	memset(d_buffer, 0, 2*d_ntaps*sizeof(gr_complex));
+	// We allocate enough to be able to look back and forth
+	// d_naligned beyond the buffer boundaries and make sure these
+	// are zeroed out (or they may be nan, which will cause
+	// problems). We then set d_buffer to the position in the
+	// d_buffer_ptr such that we only touch the internally
+	// allocated space.
+	d_buffer_ptr = fft::malloc_complex(2*(d_ntaps + d_naligned));
+	memset(d_buffer_ptr, 0, 2*(d_ntaps + d_naligned)*sizeof(gr_complex));
+	d_buffer = d_buffer_ptr + d_naligned;
 
 	// Allocate aligned taps
 	d_aligned_taps = (float**)malloc(d_naligned*sizeof(float**));
diff --git a/gr-filter/lib/qa_fir_filter_with_buffer.cc b/gr-filter/lib/qa_fir_filter_with_buffer.cc
index f8af9ea0b..6a1744b0a 100644
--- a/gr-filter/lib/qa_fir_filter_with_buffer.cc
+++ b/gr-filter/lib/qa_fir_filter_with_buffer.cc
@@ -39,8 +39,6 @@ namespace gr {
 #define MAX_DATA        (16383)
 #define	ERR_DELTA	(1e-5)
 
-#define	NELEM(x) (sizeof(x) / sizeof(x[0]))
-
     static float
     uniform() 
     {
@@ -58,8 +56,8 @@ namespace gr {
     random_complex(gr_complex *buf, unsigned n)
     {
       for(unsigned i = 0; i < n; i++) {
-	float re = rint(uniform () * MAX_DATA);
-	float im = rint(uniform () * MAX_DATA);
+	float re = rint(uniform() * MAX_DATA);
+	float im = rint(uniform() * MAX_DATA);
 	buf[i] = gr_complex(re, im);
       }
     }
@@ -148,7 +146,7 @@ namespace gr {
 	      new kernel::fir_filter_with_buffer_fff(f1_taps);
 
 	    // zero the output, then do the filtering
-	    memset(actual_output, 0, sizeof(actual_output));
+	    memset(actual_output, 0, OUTPUT_LEN*sizeof(o_type));
 	    f1->filterNdec(actual_output, input, ol/decimate, decimate);
 
 	    // check results
@@ -263,7 +261,7 @@ namespace gr {
 	      new kernel::fir_filter_with_buffer_ccc(f1_taps);
 
 	    // zero the output, then do the filtering
-	    memset(actual_output, 0, sizeof(actual_output));
+	    memset(actual_output, 0, OUTPUT_LEN*sizeof(o_type));
 	    f1->filterNdec(actual_output, input, ol/decimate, decimate);
 
 	    // check results
diff --git a/gr-filter/lib/qa_mmse_fir_interpolator_cc.cc b/gr-filter/lib/qa_mmse_fir_interpolator_cc.cc
index 02e0b32fe..268b8801c 100644
--- a/gr-filter/lib/qa_mmse_fir_interpolator_cc.cc
+++ b/gr-filter/lib/qa_mmse_fir_interpolator_cc.cc
@@ -27,6 +27,7 @@
 #include <cppunit/TestAssert.h>
 #include <qa_mmse_fir_interpolator_cc.h>
 #include <filter/mmse_fir_interpolator_cc.h>
+#include <fft/fft.h>
 #include <cstdio>
 #include <cmath>
 #include <stdexcept>
@@ -35,8 +36,6 @@
 namespace gr {
   namespace filter {
     
-#define	NELEM(x) (sizeof(x) / sizeof(x[0]))
-
     static float
     test_fcn_sin(double index)
     {
@@ -62,9 +61,9 @@ namespace gr {
     qa_mmse_fir_interpolator_cc::t1()
     {
       static const unsigned N = 100;
-      __GR_ATTR_ALIGNED(8) gr_complex input[N + 10];
+      gr_complex *input = fft::malloc_complex(N + 10);
 
-      for(unsigned i = 0; i < NELEM(input); i++)
+      for(unsigned i = 0; i < N+10; i++)
 	input[i] = test_fcn((double) i);
 
       mmse_fir_interpolator_cc intr;
@@ -79,6 +78,7 @@ namespace gr {
 	  // printf ("%9.6f  %9.6f  %9.6f\n", expected, actual, expected - actual);
 	}
       }
+      fft::free(input);
     }
 
     /*
diff --git a/gr-filter/lib/qa_mmse_fir_interpolator_ff.cc b/gr-filter/lib/qa_mmse_fir_interpolator_ff.cc
index 128b638b9..54387fd9b 100644
--- a/gr-filter/lib/qa_mmse_fir_interpolator_ff.cc
+++ b/gr-filter/lib/qa_mmse_fir_interpolator_ff.cc
@@ -27,14 +27,13 @@
 #include <cppunit/TestAssert.h>
 #include <qa_mmse_fir_interpolator_ff.h>
 #include <filter/mmse_fir_interpolator_ff.h>
+#include <fft/fft.h>
 #include <cstdio>
 #include <cmath>
 
 namespace gr {
   namespace filter {
     
-#define	NELEM(x) (sizeof(x) / sizeof(x[0]))
-
     static float
     test_fcn(double index)
     {
@@ -45,10 +44,12 @@ namespace gr {
     void
     qa_mmse_fir_interpolator_ff::t1()
     {
+      // use aligned malloc and make sure that everything in this
+      // buffer is properly initialized.
       static const unsigned N = 100;
-      float input[N + 10];
+      float *input = fft::malloc_float(N + 10);
 
-      for(unsigned i = 0; i < NELEM(input); i++)
+      for(unsigned i = 0; i < N+10; i++)
 	input[i] = test_fcn((double) i);
 
       mmse_fir_interpolator_ff intr;
@@ -63,6 +64,7 @@ namespace gr {
 	  // printf ("%9.6f  %9.6f  %9.6f\n", expected, actual, expected - actual);
 	}
       }
+      fft::free(input);
     }
 
   } /* namespace filter */
diff --git a/gr-filter/python/qa_pfb_channelizer.py b/gr-filter/python/qa_pfb_channelizer.py
index 3d35c46e4..c0ed8327d 100755
--- a/gr-filter/python/qa_pfb_channelizer.py
+++ b/gr-filter/python/qa_pfb_channelizer.py
@@ -70,10 +70,10 @@ class test_pfb_channelizer(gr_unittest.TestCase):
 
         # Adjusted phase rotations for data
         p0 = 0
-        p1 = 1.6335486
-        p2 = -3.01609
-        p3 = 3.01609
-        p4 = -1.6335486
+        p1 =  math.pi*0.51998885
+        p2 = -math.pi*0.96002233
+        p3 =  math.pi*0.96002233
+        p4 = -math.pi*0.51998885
 
         # Create known data as complex sinusoids at the different baseband freqs
         # the different channel numbering is due to channelizer output order.
diff --git a/grc/blocks/block_tree.xml b/grc/blocks/block_tree.xml
index 0b0b6854e..f94bd30bd 100644
--- a/grc/blocks/block_tree.xml
+++ b/grc/blocks/block_tree.xml
@@ -34,6 +34,7 @@
 		<block>gr_message_sink</block>
 		<block>pad_sink</block>
 		<block>virtual_sink</block>
+		<block>gr_tag_debug</block>
 	</cat>
 	<cat>
 		<name>Operators</name>
diff --git a/grc/blocks/gr_tag_debug.xml b/grc/blocks/gr_tag_debug.xml
new file mode 100644
index 000000000..4af7729be
--- /dev/null
+++ b/grc/blocks/gr_tag_debug.xml
@@ -0,0 +1,82 @@
+<?xml version="1.0"?>
+<!--
+###################################################
+## Tag Debug
+###################################################
+ -->
+<block>
+	<name>Tag Debug</name>
+	<key>gr_tag_debug</key>
+	<import>from gnuradio import gr</import>
+	<make>gr.tag_debug($type.size*$vlen, $name); self.$(id).set_display($display)</make> <!-- apply Display at construction; the callback below only covers later changes -->
+	<callback>set_display($display)</callback>
+	<param>
+		<name>Input Type</name>
+		<key>type</key>
+		<type>enum</type>
+		<option>
+			<name>Complex</name>
+			<key>complex</key>
+			<opt>size:gr.sizeof_gr_complex</opt>
+		</option>
+		<option>
+			<name>Float</name>
+			<key>float</key>
+			<opt>size:gr.sizeof_float</opt>
+		</option>
+		<option>
+			<name>Int</name>
+			<key>int</key>
+			<opt>size:gr.sizeof_int</opt>
+		</option>
+		<option>
+			<name>Short</name>
+			<key>short</key>
+			<opt>size:gr.sizeof_short</opt>
+		</option>
+		<option>
+			<name>Byte</name>
+			<key>byte</key>
+			<opt>size:gr.sizeof_char</opt>
+		</option>
+	</param>
+	<param>
+		<name>Name</name>
+		<key>name</key>
+		<type>string</type>
+	</param>
+	<param>
+		<name>Num Inputs</name>
+		<key>num_inputs</key>
+		<value>1</value>
+		<type>int</type>
+	</param>
+	<param>
+		<name>Vec Length</name>
+		<key>vlen</key>
+		<value>1</value>
+		<type>int</type>
+	</param>
+	<param>
+		<name>Display</name>
+		<key>display</key>
+		<value>True</value>
+		<type>bool</type>
+		<option>
+			<name>On</name>
+			<key>True</key>
+		</option>
+		<option>
+			<name>Off</name>
+			<key>False</key>
+		</option>
+	</param>
+	<check>$num_inputs &gt;= 1</check>
+	<check>$vlen &gt; 0</check>
+	<sink>
+		<name>in</name>
+		<type>$type</type>
+		<vlen>$vlen</vlen>
+		<nports>$num_inputs</nports>
+	</sink>
+</block>
diff --git a/volk/include/volk/volk_32fc_s32fc_x2_rotator_32fc_a.h b/volk/include/volk/volk_32fc_s32fc_x2_rotator_32fc_a.h
index 80c55e75f..05732b1ea 100644
--- a/volk/include/volk/volk_32fc_s32fc_x2_rotator_32fc_a.h
+++ b/volk/include/volk/volk_32fc_s32fc_x2_rotator_32fc_a.h
@@ -174,12 +174,10 @@ static inline void volk_32fc_s32fc_x2_rotator_32fc_a_avx(lv_32fc_t* outVector, c
     printf("%f, %f\n", lv_creal(phase_Ptr[2]), lv_cimag(phase_Ptr[2]));
     printf("%f, %f\n", lv_creal(phase_Ptr[3]), lv_cimag(phase_Ptr[3]));
     printf("incr: %f, %f\n", lv_creal(incr), lv_cimag(incr));*/
-    __m256 aVal, phase_Val, inc_Val, yl, yh, tmp1, tmp2, z, ylp, yhp, tmp1p, tmp2p, negated, zeros;
+    __m256 aVal, phase_Val, inc_Val, yl, yh, tmp1, tmp2, z, ylp, yhp, tmp1p, tmp2p;
     
     phase_Val = _mm256_loadu_ps((float*)phase_Ptr);
     inc_Val = _mm256_set_ps(lv_cimag(incr), lv_creal(incr),lv_cimag(incr), lv_creal(incr),lv_cimag(incr), lv_creal(incr),lv_cimag(incr), lv_creal(incr));
-    zeros = _mm256_set1_ps(0.0);
-    negated = _mm256_set1_ps(-1.0);
     const unsigned int fourthPoints = num_points / 4;
 
     
diff --git a/volk/include/volk/volk_32fc_x2_dot_prod_32fc_a.h b/volk/include/volk/volk_32fc_x2_dot_prod_32fc_a.h
index cb2ac4c67..166a883a7 100644
--- a/volk/include/volk/volk_32fc_x2_dot_prod_32fc_a.h
+++ b/volk/include/volk/volk_32fc_x2_dot_prod_32fc_a.h
@@ -18,40 +18,26 @@ static inline void volk_32fc_x2_dot_prod_32fc_a_generic(lv_32fc_t* result, const
   unsigned int n_2_ccomplex_blocks = num_bytes >> 4;
   unsigned int isodd = (num_bytes >> 3) &1;
 
-
-
   float sum0[2] = {0,0};
   float sum1[2] = {0,0};
   unsigned int i = 0;
 
-
   for(i = 0; i < n_2_ccomplex_blocks; ++i) {
-
-
     sum0[0] += in[0] * tp[0] - in[1] * tp[1];
     sum0[1] += in[0] * tp[1] + in[1] * tp[0];
     sum1[0] += in[2] * tp[2] - in[3] * tp[3];
     sum1[1] += in[2] * tp[3] + in[3] * tp[2];
 
-
     in += 4;
     tp += 4;
-
   }
 
-
   res[0] = sum0[0] + sum1[0];
   res[1] = sum0[1] + sum1[1];
 
-
-
   for(i = 0; i < isodd; ++i) {
-
-
     *result += input[(num_bytes >> 3) - 1] * taps[(num_bytes >> 3) - 1];
-
   }
-
 }
 
 #endif /*LV_HAVE_GENERIC*/
@@ -177,14 +163,8 @@ static inline void volk_32fc_x2_dot_prod_32fc_a_sse_64(lv_32fc_t* result, const
      );
 
 
-  int getem = num_bytes % 16;
-
-
-  for(; getem > 0; getem -= 8) {
-
-
+  if(((num_bytes >> 3) & 1)) {
     *result += (input[(num_bytes >> 3) - 1] * taps[(num_bytes >> 3) - 1]);
-
   }
 
   return;
@@ -363,7 +343,7 @@ static inline void volk_32fc_x2_dot_prod_32fc_a_sse3(lv_32fc_t* result, const lv
 
   dotProduct += ( dotProductVector[0] + dotProductVector[1] );
 
-  if((num_bytes >> 2) != 0) {
+  if(((num_bytes >> 3) & 1) != 0) {
     dotProduct += (*a) * (*b);
   }
 
@@ -377,9 +357,7 @@ static inline void volk_32fc_x2_dot_prod_32fc_a_sse3(lv_32fc_t* result, const lv
 #include <smmintrin.h>
 
 static inline void volk_32fc_x2_dot_prod_32fc_a_sse4_1(lv_32fc_t* result, const lv_32fc_t* input, const lv_32fc_t* taps, unsigned int num_bytes) {
-  volk_32fc_x2_dot_prod_32fc_a_sse3(result, input, taps, num_bytes);
-  // SSE3 version runs twice as fast as the SSE4.1 version, so turning off SSE4 version for now
-   /*
+
     __m128 xmm0, xmm1, xmm2, xmm3, xmm4, xmm5, xmm6, xmm7, real0, real1, im0, im1;
     float *p_input, *p_taps;
     __m64 *p_result;
@@ -442,12 +420,8 @@ static inline void volk_32fc_x2_dot_prod_32fc_a_sse4_1(lv_32fc_t* result, const
 
     }
 
-
-
-
     real1 = _mm_xor_ps(real1, (__m128)neg);
 
-
     im0 = _mm_add_ps(im0, im1);
     real0 = _mm_add_ps(real0, real1);
 
@@ -459,7 +433,6 @@ static inline void volk_32fc_x2_dot_prod_32fc_a_sse4_1(lv_32fc_t* result, const
 
     *result += input[i] * taps[i];
     }
-  */
 }
 
 #endif /*LV_HAVE_SSE4_1*/
diff --git a/volk/lib/testqa.cc b/volk/lib/testqa.cc
index 813e62217..d1eb1cacb 100644
--- a/volk/lib/testqa.cc
+++ b/volk/lib/testqa.cc
@@ -35,8 +35,8 @@ VOLK_RUN_TESTS(volk_32fc_deinterleave_64f_x2_a, 1e-4, 0, 20460, 1);
 VOLK_RUN_TESTS(volk_32fc_s32f_deinterleave_real_16i_a, 0, 32768, 20460, 1);
 VOLK_RUN_TESTS(volk_32fc_deinterleave_real_32f_a, 1e-4, 0, 20460, 1);
 VOLK_RUN_TESTS(volk_32fc_deinterleave_real_64f_a, 1e-4, 0, 20460, 1);
-VOLK_RUN_TESTS(volk_32fc_x2_dot_prod_32fc_a, 1e-4, 0, 204600, 1);
-VOLK_RUN_TESTS(volk_32fc_32f_dot_prod_32fc_a, 1e-4, 0, 204600, 1);
+VOLK_RUN_TESTS(volk_32fc_x2_dot_prod_32fc_a, 1e-4, 0, 2046000, 1);
+VOLK_RUN_TESTS(volk_32fc_32f_dot_prod_32fc_a, 1e-4, 0, 2046000, 1);
 VOLK_RUN_TESTS(volk_32fc_index_max_16u_a, 3, 0, 20460, 1);
 VOLK_RUN_TESTS(volk_32fc_s32f_magnitude_16i_a, 1, 32768, 20460, 1);
 VOLK_RUN_TESTS(volk_32fc_magnitude_32f_a, 1e-4, 0, 20460, 1);