From 620797ac18193905ad0d1ac3f82c3d7570c28eae Mon Sep 17 00:00:00 2001
From: Isaac Connor <iconnor@connortechnology.com>
Date: Mon, 10 Apr 2017 21:54:23 -0400
Subject: [PATCH] replace swresample with libavresample

---
 CMakeLists.txt          |  30 +-
 src/CMakeLists.txt      |   2 +-
 src/zm_videostore.cpp   | 659 +++++++++++++++++++++++-----------------
 src/zm_videostore.h     |  10 +-
 zoneminder-config.cmake |   4 +-
 5 files changed, 406 insertions(+), 299 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 559ad2bdc..1971c268f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -564,21 +564,21 @@ if(NOT ZM_NO_FFMPEG)
 	endif(SWSCALE_LIBRARIES)
 
 	# rescale (using find_library and find_path)
-	find_library(SWRESAMPLE_LIBRARIES swresample)
-	if(SWRESAMPLE_LIBRARIES)
-		set(HAVE_LIBSWRESAMPLE 1)
-		list(APPEND ZM_BIN_LIBS "${SWRESAMPLE_LIBRARIES}")
-		find_path(SWRESAMPLE_INCLUDE_DIR "libswresample/swresample.h" /usr/include/ffmpeg)
-		if(SWRESAMPLE_INCLUDE_DIR)
-			include_directories("${SWRESAMPLE_INCLUDE_DIR}")
-			set(CMAKE_REQUIRED_INCLUDES "${SWRESAMPLE_INCLUDE_DIR}")
-		endif(SWRESAMPLE_INCLUDE_DIR)
-		mark_as_advanced(FORCE SWRESAMPLE_LIBRARIES SWRESAMPLE_INCLUDE_DIR)
-		check_include_file("libswresample/swresample.h" HAVE_LIBSWRESAMPLE_SWRESAMPLE_H)
-		set(optlibsfound "${optlibsfound} SWResample")
-	else(SWRESAMPLE_LIBRARIES)
-		set(optlibsnotfound "${optlibsnotfound} SWResample")
-	endif(SWRESAMPLE_LIBRARIES)
+	find_library(AVRESAMPLE_LIBRARIES avresample)
+	if(AVRESAMPLE_LIBRARIES)
+		set(HAVE_LIBAVRESAMPLE 1)
+		list(APPEND ZM_BIN_LIBS "${AVRESAMPLE_LIBRARIES}")
+		find_path(AVRESAMPLE_INCLUDE_DIR "libavresample/avresample.h" /usr/include/ffmpeg)
+		if(AVRESAMPLE_INCLUDE_DIR)
+			include_directories("${AVRESAMPLE_INCLUDE_DIR}")
+			set(CMAKE_REQUIRED_INCLUDES "${AVRESAMPLE_INCLUDE_DIR}")
+		endif(AVRESAMPLE_INCLUDE_DIR)
+		mark_as_advanced(FORCE AVRESAMPLE_LIBRARIES AVRESAMPLE_INCLUDE_DIR)
+		check_include_file("libavresample/avresample.h" HAVE_LIBAVRESAMPLE_AVRESAMPLE_H)
+		set(optlibsfound "${optlibsfound} AVResample")
+	else(AVRESAMPLE_LIBRARIES)
+		set(optlibsnotfound "${optlibsnotfound} AVResample")
+	endif(AVRESAMPLE_LIBRARIES)
 
 	# Find the path to the ffmpeg executable
 	find_program(FFMPEG_EXECUTABLE 
diff --git a/src/CMakeLists.txt b/src/CMakeLists.txt
index e33f0f0bb..6a68a8acd 100644
--- a/src/CMakeLists.txt
+++ b/src/CMakeLists.txt
@@ -4,7 +4,7 @@
 configure_file(zm_config.h.in "${CMAKE_CURRENT_BINARY_DIR}/zm_config.h" @ONLY)
 
 # Group together all the source files that are used by all the binaries (zmc, zma, zmu, zms etc)
-set(ZM_BIN_SRC_FILES zm_box.cpp zm_buffer.cpp zm_camera.cpp zm_comms.cpp zm_config.cpp zm_coord.cpp zm_curl_camera.cpp zm.cpp zm_db.cpp zm_logger.cpp zm_event.cpp zm_exception.cpp zm_file_camera.cpp zm_ffmpeg_camera.cpp zm_image.cpp zm_jpeg.cpp zm_libvlc_camera.cpp zm_local_camera.cpp zm_monitor.cpp zm_ffmpeg.cpp zm_mpeg.cpp zm_packetqueue.cpp zm_poly.cpp zm_regexp.cpp zm_remote_camera.cpp zm_remote_camera_http.cpp zm_remote_camera_rtsp.cpp zm_rtp.cpp zm_rtp_ctrl.cpp zm_rtp_data.cpp zm_rtp_source.cpp zm_rtsp.cpp zm_rtsp_auth.cpp zm_sdp.cpp zm_signal.cpp zm_stream.cpp zm_thread.cpp zm_time.cpp zm_timer.cpp zm_user.cpp zm_utils.cpp zm_video.cpp zm_videostore.cpp zm_zone.cpp zm_storage.cpp)
+set(ZM_BIN_SRC_FILES zm_box.cpp zm_buffer.cpp zm_camera.cpp zm_comms.cpp zm_config.cpp zm_coord.cpp zm_curl_camera.cpp zm.cpp zm_db.cpp zm_logger.cpp zm_event.cpp zm_exception.cpp zm_file_camera.cpp zm_ffmpeg_camera.cpp zm_image.cpp zm_jpeg.cpp zm_libvlc_camera.cpp zm_local_camera.cpp zm_monitor.cpp zm_monitorstream.cpp zm_ffmpeg.cpp zm_mpeg.cpp zm_packetqueue.cpp zm_poly.cpp zm_regexp.cpp zm_remote_camera.cpp zm_remote_camera_http.cpp zm_remote_camera_rtsp.cpp zm_rtp.cpp zm_rtp_ctrl.cpp zm_rtp_data.cpp zm_rtp_source.cpp zm_rtsp.cpp zm_rtsp_auth.cpp zm_sdp.cpp zm_signal.cpp zm_stream.cpp zm_thread.cpp zm_time.cpp zm_timer.cpp zm_user.cpp zm_utils.cpp zm_video.cpp zm_videostore.cpp zm_zone.cpp zm_storage.cpp)
 
 # A fix for cmake recompiling the source files for every target.
 add_library(zm STATIC ${ZM_BIN_SRC_FILES})
diff --git a/src/zm_videostore.cpp b/src/zm_videostore.cpp
index b4d2ef741..7048746d9 100644
--- a/src/zm_videostore.cpp
+++ b/src/zm_videostore.cpp
@@ -1,4 +1,3 @@
-//
 // ZoneMinder Video Storage Implementation
 // Written by Chris Wiggins
 // http://chriswiggins.co.nz
@@ -214,175 +213,14 @@ VideoStore::VideoStore(const char *filename_in, const char *format_in,
     audio_input_context = audio_input_stream->codec;
 
     if ( audio_input_context->codec_id != AV_CODEC_ID_AAC ) {
-#ifdef HAVE_LIBSWRESAMPLE
       resample_context = NULL;
-			char error_buffer[256];
+			static char error_buffer[256];
       avcodec_string(error_buffer, sizeof(error_buffer), audio_input_context, 0 );
       Debug(3, "Got something other than AAC (%s)", error_buffer );
       audio_output_stream = NULL;
-
-      audio_output_codec = avcodec_find_encoder(AV_CODEC_ID_AAC);
-      if ( audio_output_codec ) {
-Debug(2, "Have audio output codec");
-        audio_output_stream = avformat_new_stream( oc, audio_output_codec );
-
-        audio_output_context = audio_output_stream->codec;
-
-        if ( audio_output_context ) {
-
-Debug(2, "Have audio_output_context");
-          AVDictionary *opts = NULL;
-          av_dict_set(&opts, "strict", "experimental", 0);
-
-          /* put sample parameters */
-          audio_output_context->bit_rate = audio_input_context->bit_rate;
-          audio_output_context->sample_rate = audio_input_context->sample_rate;
-          audio_output_context->channels = audio_input_context->channels;
-          audio_output_context->channel_layout = audio_input_context->channel_layout;
-          audio_output_context->sample_fmt = audio_input_context->sample_fmt;
-          //audio_output_context->refcounted_frames = 1;
-
-          if (audio_output_codec->supported_samplerates) {
-            int found = 0;
-            for ( unsigned int i = 0; audio_output_codec->supported_samplerates[i]; i++) {
-              if ( audio_output_context->sample_rate == audio_output_codec->supported_samplerates[i] ) {
-                found = 1;
-                break;
-              }
-            }
-            if ( found ) {
-              Debug(3, "Sample rate is good");
-            } else {
-              audio_output_context->sample_rate = audio_output_codec->supported_samplerates[0];
-              Debug(1, "Sampel rate is no good, setting to (%d)", audio_output_codec->supported_samplerates[0] );
-            }
-          }
-
-        /* check that the encoder supports s16 pcm input */
-        if (!check_sample_fmt( audio_output_codec, audio_output_context->sample_fmt)) {
-          Debug( 3, "Encoder does not support sample format %s, setting to FLTP",
-              av_get_sample_fmt_name( audio_output_context->sample_fmt));
-          audio_output_context->sample_fmt = AV_SAMPLE_FMT_FLTP;
-        }
-
-        //audio_output_stream->time_base = audio_input_stream->time_base;
-        audio_output_context->time_base = (AVRational){ 1, audio_output_context->sample_rate };
-
-        Debug(3, "Audio Time bases input stream (%d/%d) input codec: (%d/%d) output_stream (%d/%d) output codec (%d/%d)", 
-            audio_input_stream->time_base.num,
-            audio_input_stream->time_base.den,
-            audio_input_context->time_base.num,
-            audio_input_context->time_base.den,
-            audio_output_stream->time_base.num,
-            audio_output_stream->time_base.den,
-            audio_output_context->time_base.num,
-            audio_output_context->time_base.den
-            );
-
-        ret = avcodec_open2(audio_output_context, audio_output_codec, &opts );
-        if ( ret < 0 ) {
-          av_strerror(ret, error_buffer, sizeof(error_buffer));
-          Fatal( "could not open codec (%d) (%s)\n", ret, error_buffer );
-        } else {
-
-          Debug(1, "Audio output bit_rate (%d) sample_rate(%d) channels(%d) fmt(%d) layout(%d) frame_size(%d), refcounted_frames(%d)", 
-              audio_output_context->bit_rate,
-              audio_output_context->sample_rate,
-              audio_output_context->channels,
-              audio_output_context->sample_fmt,
-              audio_output_context->channel_layout,
-              audio_output_context->frame_size,
-              audio_output_context->refcounted_frames
-              );
-#if 1
-          /** Create the FIFO buffer based on the specified output sample format. */
-          if (!(fifo = av_audio_fifo_alloc(audio_output_context->sample_fmt,
-                  audio_output_context->channels, 1))) {
-            Error("Could not allocate FIFO\n");
-            return;
-          }
-#endif
-          output_frame_size = audio_output_context->frame_size;
-          /** Create a new frame to store the audio samples. */
-          if (!(input_frame = zm_av_frame_alloc())) {
-            Error("Could not allocate input frame");
-            return;
-          }
-
-          /** Create a new frame to store the audio samples. */
-          if (!(output_frame = zm_av_frame_alloc())) {
-            Error("Could not allocate output frame");
-            av_frame_free(&input_frame);
-            return;
-          }
-          /**
-         * Create a resampler context for the conversion.
-         * Set the conversion parameters.
-         * Default channel layouts based on the number of channels
-         * are assumed for simplicity (they are sometimes not detected
-         * properly by the demuxer and/or decoder).
-         */
-        resample_context = swr_alloc_set_opts(NULL,
-                                              av_get_default_channel_layout(audio_output_context->channels),
-                                              audio_output_context->sample_fmt,
-                                              audio_output_context->sample_rate,
-                                              av_get_default_channel_layout( audio_input_context->channels),
-                                              audio_input_context->sample_fmt,
-                                              audio_input_context->sample_rate,
-                                              0, NULL);
-        if (!resample_context) {
-            Error( "Could not allocate resample context\n");
-            return;
-        }
-        /**
-        * Perform a sanity check so that the number of converted samples is
-        * not greater than the number of samples to be converted.
-        * If the sample rates differ, this case has to be handled differently
-        */
-        av_assert0(audio_output_context->sample_rate == audio_input_context->sample_rate);
-        /** Open the resampler with the specified parameters. */
-        if ((ret = swr_init(resample_context)) < 0) {
-            Error( "Could not open resample context\n");
-            swr_free(&resample_context);
-            return;
-        }
-        /**
-         * Allocate as many pointers as there are audio channels.
-         * Each pointer will later point to the audio samples of the corresponding
-         * channels (although it may be NULL for interleaved formats).
-         */
-        if (!( converted_input_samples = (uint8_t *)calloc( audio_output_context->channels, sizeof(*converted_input_samples))) ) {
-          Error( "Could not allocate converted input sample pointers\n");
-          return;
-        }
-        /**
-         * Allocate memory for the samples of all channels in one consecutive
-         * block for convenience.
-         */
-        if ((ret = av_samples_alloc( &converted_input_samples, NULL,
-                audio_output_context->channels,
-                audio_output_context->frame_size,
-                audio_output_context->sample_fmt, 0)) < 0) {
-          Error( "Could not allocate converted input samples (error '%s')\n",
-              av_make_error_string(ret).c_str() );
-
-          av_freep(converted_input_samples);
-          free(converted_input_samples);
-          return;
-        }
-        Debug(2, "Success opening AAC codec");
-        } 
-        av_dict_free(&opts);
-        } else {
-          Error( "could not allocate codec context for AAC\n");
-        }
-      } else {
-        Error( "could not find codec for AAC\n");
+      if ( ! setup_resampler() ) {
+        return;
       }
-#else
-      Error("Not built with libswresample library. Cannot do audio conversion to AAC");
-      audio_output_stream = NULL;
-#endif
     } else {
       Debug(3, "Got AAC" );
 
@@ -390,32 +228,32 @@ Debug(2, "Have audio_output_context");
       if ( ! audio_output_stream ) {
         Error("Unable to create audio out stream\n");
         audio_output_stream = NULL;
-      }
-      audio_output_context = audio_output_stream->codec;
-
-      ret = avcodec_copy_context(audio_output_context, audio_input_context);
-      if (ret < 0) {
-        Fatal("Unable to copy audio context %s\n", av_make_error_string(ret).c_str());
-      }   
-      audio_output_context->codec_tag = 0;
-      if ( audio_output_context->channels > 1 ) {
-        Warning("Audio isn't mono, changing it.");
-        audio_output_context->channels = 1;
       } else {
-        Debug(3, "Audio is mono");
-      }
+        audio_output_context = audio_output_stream->codec;
+
+        ret = avcodec_copy_context(audio_output_context, audio_input_context);
+        if (ret < 0) {
+          Error("Unable to copy audio context %s\n", av_make_error_string(ret).c_str());
+          audio_output_stream = NULL;
+        } else {
+          audio_output_context->codec_tag = 0;
+          if ( audio_output_context->channels > 1 ) {
+            Warning("Audio isn't mono, changing it.");
+            audio_output_context->channels = 1;
+          } else {
+            Debug(3, "Audio is mono");
+          }
+        }   
+      } // end if audio_output_stream
     } // end if is AAC
 
-if ( audio_output_stream ) {
-    if (oc->oformat->flags & AVFMT_GLOBALHEADER) {
-      audio_output_context->flags |= CODEC_FLAG_GLOBAL_HEADER;
-    }
+    if ( audio_output_stream ) {
+      if (oc->oformat->flags & AVFMT_GLOBALHEADER) {
+        audio_output_context->flags |= CODEC_FLAG_GLOBAL_HEADER;
+      }
     }
 
-  } else {
-    Debug(3, "No Audio output stream");
-    audio_output_stream = NULL;
-  }    
+  } // end if audio_input_stream
 
   /* open the output file, if needed */
   if (!(output_format->flags & AVFMT_NOFILE)) {
@@ -529,8 +367,242 @@ Debug(2, "writing flushed packet pts(%d) dts(%d) duration(%d)", pkt.pts, pkt.dts
   avformat_free_context(oc);
 
 #ifdef HAVE_LIBSWRESAMPLE
-  if ( resample_context )
-    swr_free( &resample_context );
+  //if ( resample_context )
+    //swr_free( &resample_context );
+#endif
+}
+
+bool VideoStore::setup_resampler() {
+#ifdef HAVE_LIBSWRESAMPLE
+			static char error_buffer[256];
+
+    audio_output_codec = avcodec_find_encoder(AV_CODEC_ID_AAC);
+    if ( ! audio_output_codec ) {
+        Error("Could not find codec for AAC");
+      return false;
+    }
+    Debug(2, "Have audio output codec");
+
+    audio_output_stream = avformat_new_stream( oc, audio_output_codec );
+    audio_output_context = audio_output_stream->codec;
+
+    if ( ! audio_output_context ) {
+      Error( "could not allocate codec context for AAC\n");
+      audio_output_stream = NULL;
+      return false;
+    }
+
+    Debug(2, "Have audio_output_context");
+
+    AVDictionary *opts = NULL;
+    av_dict_set(&opts, "strict", "experimental", 0);
+
+    /* put sample parameters */
+    audio_output_context->bit_rate = audio_input_context->bit_rate;
+    audio_output_context->sample_rate = audio_input_context->sample_rate;
+    audio_output_context->channels = audio_input_context->channels;
+    audio_output_context->channel_layout = audio_input_context->channel_layout;
+    audio_output_context->sample_fmt = audio_input_context->sample_fmt;
+    //audio_output_context->refcounted_frames = 1;
+
+    if (audio_output_codec->supported_samplerates) {
+      int found = 0;
+      for ( unsigned int i = 0; audio_output_codec->supported_samplerates[i]; i++) {
+        if ( audio_output_context->sample_rate == audio_output_codec->supported_samplerates[i] ) {
+          found = 1;
+          break;
+        }
+      }
+      if ( found ) {
+        Debug(3, "Sample rate is good");
+      } else {
+        audio_output_context->sample_rate = audio_output_codec->supported_samplerates[0];
+        Debug(1, "Sampel rate is no good, setting to (%d)", audio_output_codec->supported_samplerates[0] );
+      }
+    }
+
+    /* check that the encoder supports s16 pcm input */
+    if (!check_sample_fmt( audio_output_codec, audio_output_context->sample_fmt)) {
+      Debug( 3, "Encoder does not support sample format %s, setting to FLTP",
+          av_get_sample_fmt_name( audio_output_context->sample_fmt));
+      audio_output_context->sample_fmt = AV_SAMPLE_FMT_FLTP;
+    }
+
+    //audio_output_stream->time_base = audio_input_stream->time_base;
+    audio_output_context->time_base = (AVRational){ 1, audio_output_context->sample_rate };
+
+    Debug(3, "Audio Time bases input stream (%d/%d) input codec: (%d/%d) output_stream (%d/%d) output codec (%d/%d)", 
+        audio_input_stream->time_base.num,
+        audio_input_stream->time_base.den,
+        audio_input_context->time_base.num,
+        audio_input_context->time_base.den,
+        audio_output_stream->time_base.num,
+        audio_output_stream->time_base.den,
+        audio_output_context->time_base.num,
+        audio_output_context->time_base.den
+        );
+
+    ret = avcodec_open2(audio_output_context, audio_output_codec, &opts );
+    av_dict_free(&opts);
+    if ( ret < 0 ) {
+      av_strerror(ret, error_buffer, sizeof(error_buffer));
+      Fatal( "could not open codec (%d) (%s)\n", ret, error_buffer );
+      audio_output_codec = NULL;
+      audio_output_context = NULL;
+      audio_output_stream = NULL;
+      return false;
+    } 
+
+    Debug(1, "Audio output bit_rate (%d) sample_rate(%d) channels(%d) fmt(%d) layout(%d) frame_size(%d), refcounted_frames(%d)", 
+        audio_output_context->bit_rate,
+        audio_output_context->sample_rate,
+        audio_output_context->channels,
+        audio_output_context->sample_fmt,
+        audio_output_context->channel_layout,
+        audio_output_context->frame_size,
+        audio_output_context->refcounted_frames
+        );
+#if 1
+    /** Create the FIFO buffer based on the specified output sample format. */
+    if (!(fifo = av_audio_fifo_alloc(audio_output_context->sample_fmt,
+            audio_output_context->channels, 1))) {
+      Error("Could not allocate FIFO\n");
+      return false;
+    }
+#endif
+    output_frame_size = audio_output_context->frame_size;
+    /** Create a new frame to store the audio samples. */
+    if (!(input_frame = zm_av_frame_alloc())) {
+      Error("Could not allocate input frame");
+      return false;
+    }
+
+    /** Create a new frame to store the audio samples. */
+    if (!(output_frame = zm_av_frame_alloc())) {
+      Error("Could not allocate output frame");
+      av_frame_free(&input_frame);
+      return false;
+    }
+
+#if 0
+    /**
+     * Create a resampler context for the conversion.
+     * Set the conversion parameters.
+     * Default channel layouts based on the number of channels
+     * are assumed for simplicity (they are sometimes not detected
+     * properly by the demuxer and/or decoder).
+     */
+    resample_context = swr_alloc_set_opts(NULL,
+        av_get_default_channel_layout(audio_output_context->channels),
+        audio_output_context->sample_fmt,
+        audio_output_context->sample_rate,
+        av_get_default_channel_layout( audio_input_context->channels),
+        audio_input_context->sample_fmt,
+        audio_input_context->sample_rate,
+        0, NULL);
+
+    if (!resample_context) {
+      Error( "Could not allocate resample context\n");
+      return;
+    }
+    /**
+     * Perform a sanity check so that the number of converted samples is
+     * not greater than the number of samples to be converted.
+     * If the sample rates differ, this case has to be handled differently
+     */
+    av_assert0(audio_output_context->sample_rate == audio_input_context->sample_rate);
+    /** Open the resampler with the specified parameters. */
+    if ((ret = swr_init(resample_context)) < 0) {
+      Error( "Could not open resample context\n");
+      swr_free(&resample_context);
+      return;
+    }
+#else 
+    // Setup the audio resampler
+    resample_context = avresample_alloc_context();
+    if (!resample_context) {
+      Error( "Could not allocate resample context\n");
+      return false;
+    }
+
+    // Some formats (i.e. WAV) do not produce the proper channel layout
+    if ( audio_input_context->channel_layout == 0 ) {
+      Error( "Could not allocate resample context channgel_layout\n");
+    //av_opt_set_int( resample_context, "in_channel_layout",  av_get_channel_layout( m_profile->channels == 1 ? "mono" : "stereo" ), 0 );
+    } else {
+      av_opt_set_int( resample_context, "in_channel_layout",  audio_input_context->channel_layout, 0 );
+    }
+
+    av_opt_set_int( resample_context, "in_sample_fmt",     audio_input_context->sample_fmt, 0);
+    av_opt_set_int( resample_context, "in_sample_rate",    audio_input_context->sample_rate, 0);
+    av_opt_set_int( resample_context, "in_channels",       audio_input_context->channels,0);
+    av_opt_set_int( resample_context, "out_channel_layout", audio_output_context->channel_layout, 0);
+    av_opt_set_int( resample_context, "out_sample_fmt",     audio_output_context->sample_fmt, 0);
+    av_opt_set_int( resample_context, "out_sample_rate",    audio_output_context->sample_rate, 0);
+    av_opt_set_int( resample_context, "out_channels",       audio_output_context->channels, 0);
+
+    ret = avresample_open( resample_context );
+    if ( ret < 0 ) {
+      Error( "Could not open resample context\n");
+      return false;
+    }
+
+#if 0
+    /**
+     * Allocate as many pointers as there are audio channels.
+     * Each pointer will later point to the audio samples of the corresponding
+     * channels (although it may be NULL for interleaved formats).
+     */
+    if (!( converted_input_samples = (uint8_t *)calloc( audio_output_context->channels, sizeof(*converted_input_samples))) ) {
+      Error( "Could not allocate converted input sample pointers\n");
+      return;
+    }
+    /**
+     * Allocate memory for the samples of all channels in one consecutive
+     * block for convenience.
+     */
+    if ((ret = av_samples_alloc( &converted_input_samples, NULL,
+            audio_output_context->channels,
+            audio_output_context->frame_size,
+            audio_output_context->sample_fmt, 0)) < 0) {
+      Error( "Could not allocate converted input samples (error '%s')\n",
+          av_make_error_string(ret).c_str() );
+
+      av_freep(converted_input_samples);
+      free(converted_input_samples);
+      return;
+    }
+#endif
+
+    output_frame->nb_samples = audio_output_context->frame_size;
+    output_frame->format = audio_output_context->sample_fmt;
+    output_frame->channel_layout = audio_output_context->channel_layout;
+
+    // The codec gives us the frame size, in samples, we calculate the size of the samples buffer in bytes
+    unsigned int audioSampleBuffer_size = av_samples_get_buffer_size( NULL, audio_output_context->channels, audio_output_context->frame_size, audio_output_context->sample_fmt, 0 );
+    converted_input_samples = (uint8_t*) av_malloc( audioSampleBuffer_size );
+
+    if ( !converted_input_samples ) { 
+      Error( "Could not allocate converted input sample pointers\n");
+      return false;
+    }
+
+    // Setup the data pointers in the AVFrame
+    if ( avcodec_fill_audio_frame( 
+          output_frame, 
+          audio_output_context->channels, 
+          audio_output_context->sample_fmt, 
+          (const uint8_t*) converted_input_samples, 
+          audioSampleBuffer_size, 0 ) < 0 ) {
+      Error( "Could not allocate converted input sample pointers\n");
+      return false;
+    }
+
+#endif
+return true;
+#else
+Error("Not built with libswresample library. Cannot do audio conversion to AAC");
+return false;
 #endif
 }
 
@@ -634,47 +706,47 @@ int VideoStore::writeVideoFramePacket( AVPacket *ipkt ) {
 
 #if 0
   if (video_output_context->codec_type == AVMEDIA_TYPE_VIDEO && (output_format->flags & AVFMT_RAWPICTURE)) {
-  AVPicture pict;
-Debug(3, "video and RAWPICTURE");
+    AVPicture pict;
+    Debug(3, "video and RAWPICTURE");
     /* store AVPicture in AVPacket, as expected by the output format */
     avpicture_fill(&pict, opkt.data, video_output_context->pix_fmt, video_output_context->width, video_output_context->height, 0);
-  av_image_fill_arrays( 
-    opkt.data = (uint8_t *)&pict;
-    opkt.size = sizeof(AVPicture);
-    opkt.flags |= AV_PKT_FLAG_KEY;
-   } else {
-Debug(4, "Not video and RAWPICTURE");
-  }
+    av_image_fill_arrays( 
+        opkt.data = (uint8_t *)&pict;
+        opkt.size = sizeof(AVPicture);
+        opkt.flags |= AV_PKT_FLAG_KEY;
+        } else {
+        Debug(4, "Not video and RAWPICTURE");
+        }
 #endif
 
-  AVPacket safepkt;
-  memcpy(&safepkt, &opkt, sizeof(AVPacket));
+        AVPacket safepkt;
+        memcpy(&safepkt, &opkt, sizeof(AVPacket));
 
-  if ((opkt.data == NULL)||(opkt.size < 1)) {
-    Warning("%s:%d: Mangled AVPacket: discarding frame", __FILE__, __LINE__ ); 
-    dumpPacket( ipkt);
-    dumpPacket(&opkt);
+        if ((opkt.data == NULL)||(opkt.size < 1)) {
+        Warning("%s:%d: Mangled AVPacket: discarding frame", __FILE__, __LINE__ ); 
+        dumpPacket( ipkt);
+        dumpPacket(&opkt);
 
-  } else if ((previous_dts > 0) && (previous_dts > opkt.dts)) {
-    Warning("%s:%d: DTS out of order: %lld \u226E %lld; discarding frame", __FILE__, __LINE__, previous_dts, opkt.dts); 
-    previous_dts = opkt.dts; 
-    dumpPacket(&opkt);
+        } else if ((previous_dts > 0) && (previous_dts > opkt.dts)) {
+        Warning("%s:%d: DTS out of order: %lld \u226E %lld; discarding frame", __FILE__, __LINE__, previous_dts, opkt.dts); 
+        previous_dts = opkt.dts; 
+        dumpPacket(&opkt);
 
-  } else {
+        } else {
 
-    previous_dts = opkt.dts; // Unsure if av_interleaved_write_frame() clobbers opkt.dts when out of order, so storing in advance
-    previous_pts = opkt.pts;
-    ret = av_interleaved_write_frame(oc, &opkt);
-    if(ret<0){
-      // There's nothing we can really do if the frame is rejected, just drop it and get on with the next
-      Warning("%s:%d: Writing frame [av_interleaved_write_frame()] failed: %s(%d)  ", __FILE__, __LINE__,  av_make_error_string(ret).c_str(), (ret));
-      dumpPacket(&safepkt);
-    }
-  }
+          previous_dts = opkt.dts; // Unsure if av_interleaved_write_frame() clobbers opkt.dts when out of order, so storing in advance
+          previous_pts = opkt.pts;
+          ret = av_interleaved_write_frame(oc, &opkt);
+          if(ret<0){
+            // There's nothing we can really do if the frame is rejected, just drop it and get on with the next
+            Warning("%s:%d: Writing frame [av_interleaved_write_frame()] failed: %s(%d)  ", __FILE__, __LINE__,  av_make_error_string(ret).c_str(), (ret));
+            dumpPacket(&safepkt);
+          }
+        }
 
-  zm_av_packet_unref(&opkt); 
+        zm_av_packet_unref(&opkt); 
 
-  return 0;
+        return 0;
 
 }
 
@@ -693,7 +765,7 @@ int VideoStore::writeAudioFramePacket( AVPacket *ipkt ) {
   Debug(5, "after init packet" );
 
 #if 1
- //Scale the PTS of the outgoing packet to be the correct time base
+  //Scale the PTS of the outgoing packet to be the correct time base
   if ( ipkt->pts != AV_NOPTS_VALUE ) {
     if ( !audio_last_pts ) {
       opkt.pts = 0;
@@ -739,10 +811,10 @@ int VideoStore::writeAudioFramePacket( AVPacket *ipkt ) {
     Debug(1,"opkt.dts(%d) must be <= opkt.pts(%d). Decompression must happen before presentation.", opkt.dts, opkt.pts );
     opkt.dts = opkt.pts;
   }
-    //opkt.pts = AV_NOPTS_VALUE;
-    //opkt.dts = AV_NOPTS_VALUE;
+  //opkt.pts = AV_NOPTS_VALUE;
+  //opkt.dts = AV_NOPTS_VALUE;
 
-    // I wonder if we could just use duration instead of all the hoop jumping above?
+  // I wonder if we could just use duration instead of all the hoop jumping above?
   opkt.duration = av_rescale_q(ipkt->duration, audio_input_stream->time_base, audio_output_stream->time_base);
 #else
 #endif
@@ -751,48 +823,48 @@ int VideoStore::writeAudioFramePacket( AVPacket *ipkt ) {
   opkt.pos = -1;
   opkt.flags = ipkt->flags;
   opkt.stream_index = ipkt->stream_index;
-Debug(2, "Stream index is %d", opkt.stream_index );
+  Debug(2, "Stream index is %d", opkt.stream_index );
 
   if ( audio_output_codec ) {
 
 #ifdef HAVE_LIBSWRESAMPLE
-  // Need to re-encode
+    // Need to re-encode
 #if 0
-  ret = avcodec_send_packet( audio_input_context, ipkt );
-  if ( ret < 0 ) {
-    Error("avcodec_send_packet fail %s", av_make_error_string(ret).c_str());
-    return 0;
-  }
+    ret = avcodec_send_packet( audio_input_context, ipkt );
+    if ( ret < 0 ) {
+      Error("avcodec_send_packet fail %s", av_make_error_string(ret).c_str());
+      return 0;
+    }
 
-  ret = avcodec_receive_frame( audio_input_context, input_frame );
-  if ( ret < 0 ) {
-    Error("avcodec_receive_frame fail %s", av_make_error_string(ret).c_str());
-    return 0;
-  }
-Debug(2, "Frame: samples(%d), format(%d), sample_rate(%d), channel layout(%d) refd(%d)", 
-input_frame->nb_samples,
-input_frame->format,
-input_frame->sample_rate,
-input_frame->channel_layout,
-audio_output_context->refcounted_frames
-);
+    ret = avcodec_receive_frame( audio_input_context, input_frame );
+    if ( ret < 0 ) {
+      Error("avcodec_receive_frame fail %s", av_make_error_string(ret).c_str());
+      return 0;
+    }
+    Debug(2, "Frame: samples(%d), format(%d), sample_rate(%d), channel layout(%d) refd(%d)", 
+        input_frame->nb_samples,
+        input_frame->format,
+        input_frame->sample_rate,
+        input_frame->channel_layout,
+        audio_output_context->refcounted_frames
+        );
 
-  ret = avcodec_send_frame( audio_output_context, input_frame );
-  if ( ret < 0 ) {
+    ret = avcodec_send_frame( audio_output_context, input_frame );
+    if ( ret < 0 ) {
+      av_frame_unref( input_frame );
+      Error("avcodec_send_frame fail(%d),  %s codec is open(%d) is_encoder(%d)", ret, av_make_error_string(ret).c_str(),
+          avcodec_is_open( audio_output_context ),
+          av_codec_is_encoder( audio_output_context->codec)
+          );
+      return 0;
+    }
+    ret = avcodec_receive_packet( audio_output_context, &opkt );
+    if ( ret < 0 ) {
+      av_frame_unref( input_frame );
+      Error("avcodec_receive_packet fail %s", av_make_error_string(ret).c_str());
+      return 0;
+    }
     av_frame_unref( input_frame );
-    Error("avcodec_send_frame fail(%d),  %s codec is open(%d) is_encoder(%d)", ret, av_make_error_string(ret).c_str(),
-avcodec_is_open( audio_output_context ),
-av_codec_is_encoder( audio_output_context->codec)
-);
-    return 0;
-  }
-  ret = avcodec_receive_packet( audio_output_context, &opkt );
-  if ( ret < 0 ) {
-    av_frame_unref( input_frame );
-    Error("avcodec_receive_packet fail %s", av_make_error_string(ret).c_str());
-    return 0;
-  }
-  av_frame_unref( input_frame );
 #else
 
 
@@ -803,13 +875,13 @@ av_codec_is_encoder( audio_output_context->codec)
      * to flush it.
      */
     if ((ret = avcodec_decode_audio4(audio_input_context, input_frame,
-                                       &data_present, ipkt)) < 0) {
-        Error( "Could not decode frame (error '%s')\n",
-                av_make_error_string(ret).c_str());
-        dumpPacket( ipkt );
-        av_frame_free(&input_frame);
-        zm_av_packet_unref(&opkt);
-        return 0;
+            &data_present, ipkt)) < 0) {
+      Error( "Could not decode frame (error '%s')\n",
+          av_make_error_string(ret).c_str());
+      dumpPacket( ipkt );
+      av_frame_free(&input_frame);
+      zm_av_packet_unref(&opkt);
+      return 0;
     }
     if ( ! data_present ) {
       Debug(2, "Not ready to transcode a frame yet.");
@@ -820,7 +892,33 @@ av_codec_is_encoder( audio_output_context->codec)
     int frame_size = input_frame->nb_samples;
     Debug(4, "Frame size: %d", frame_size );
 
+#if 1 
+// Resample the input into the audioSampleBuffer until we proceed the whole decoded data
+      if ( (ret = avresample_convert( resample_context,
+                      NULL,
+                      0,
+                      0,
+                      input_frame->data,
+                      0,
+                      input_frame->nb_samples )) < 0 )
+      {
+      Error( "Could not resample frame (error '%s')\n",
+          av_make_error_string(ret).c_str());
+      return 0;
+      }
 
+      if ( avresample_available( resample_context ) < output_frame->nb_samples ) {
+        Debug(1, "No enough samples yet");
+        return 0;
+      }
+// Read a frame audio data from the resample fifo
+        if ( avresample_read( resample_context, output_frame->data, output_frame->nb_samples ) != output_frame->nb_samples )
+        {
+          Warning( "Error reading resampled audio: " );
+          return 0;
+        }
+
+#else
     Debug(4, "About to convert");
 
     /** Convert the samples using the resampler. */
@@ -877,14 +975,15 @@ av_codec_is_encoder( audio_output_context->codec)
       Error( "Could not read data from FIFO\n");
       return 0;
     }
+#endif
 
     /** Set a timestamp based on the sample rate for the container. */
     output_frame->pts = av_rescale_q( opkt.pts, audio_output_context->time_base, audio_output_stream->time_base );
 
-  // convert the packet to the codec timebase from the stream timebase
-Debug(3, "output_frame->pts(%d) best effort(%d)", output_frame->pts, 
-av_frame_get_best_effort_timestamp(output_frame)
- );
+    // convert the packet to the codec timebase from the stream timebase
+    Debug(3, "output_frame->pts(%d) best effort(%d)", output_frame->pts, 
+        av_frame_get_best_effort_timestamp(output_frame)
+        );
     /**
      * Encode the audio frame and store it in the temporary packet.
      * The output audio stream encoder is used to do this.
@@ -901,24 +1000,24 @@ av_frame_get_best_effort_timestamp(output_frame)
       zm_av_packet_unref(&opkt);
       return 0;
     }
-  
 
-Debug(2, "opkt dts (%d) pts(%d) duration:(%d)", opkt.dts, opkt.pts, opkt.duration );
+
+    Debug(2, "opkt dts (%d) pts(%d) duration:(%d)", opkt.dts, opkt.pts, opkt.duration );
 
     // Convert tb from code back to stream
     //av_packet_rescale_ts(&opkt, audio_output_context->time_base, audio_output_stream->time_base);
-if (opkt.pts != AV_NOPTS_VALUE)  {
-             opkt.pts      = av_rescale_q( opkt.pts,      audio_output_context->time_base, audio_output_stream->time_base);
-}
-         if ( opkt.dts != AV_NOPTS_VALUE)
-             opkt.dts      = av_rescale_q( opkt.dts,      audio_output_context->time_base, audio_output_stream->time_base);
-         if ( opkt.duration > 0)
-             opkt.duration = av_rescale_q( opkt.duration, audio_output_context->time_base, audio_output_stream->time_base);
-Debug(2, "opkt dts (%d) pts(%d) duration:(%d) pos(%d) ", opkt.dts, opkt.pts, opkt.duration, opkt.pos );
+    if (opkt.pts != AV_NOPTS_VALUE)  {
+      opkt.pts      = av_rescale_q( opkt.pts,      audio_output_context->time_base, audio_output_stream->time_base);
+    }
+    if ( opkt.dts != AV_NOPTS_VALUE)
+      opkt.dts      = av_rescale_q( opkt.dts,      audio_output_context->time_base, audio_output_stream->time_base);
+    if ( opkt.duration > 0)
+      opkt.duration = av_rescale_q( opkt.duration, audio_output_context->time_base, audio_output_stream->time_base);
+    Debug(2, "opkt dts (%d) pts(%d) duration:(%d) pos(%d) ", opkt.dts, opkt.pts, opkt.duration, opkt.pos );
 
 
-//opkt.dts = AV_NOPTS_VALUE;
- 
+    //opkt.dts = AV_NOPTS_VALUE;
+
 
 #endif
 #endif
diff --git a/src/zm_videostore.h b/src/zm_videostore.h
index b9c68bd4e..43f508a6b 100644
--- a/src/zm_videostore.h
+++ b/src/zm_videostore.h
@@ -8,6 +8,9 @@ extern "C"  {
 #ifdef HAVE_LIBSWRESAMPLE
 #include "libswresample/swresample.h"
 #endif
+#ifdef HAVE_LIBAVRESAMPLE
+#include "libavresample/avresample.h"
+#endif
 }
 
 #if HAVE_LIBAVCODEC
@@ -44,7 +47,10 @@ private:
   AVAudioFifo *fifo;
   int output_frame_size;
 #ifdef HAVE_LIBSWRESAMPLE
-  SwrContext *resample_context = NULL;
+  //SwrContext *resample_context = NULL;
+#endif
+#ifdef HAVE_LIBAVRESAMPLE
+AVAudioResampleContext* resample_context;
 #endif
   uint8_t *converted_input_samples = NULL;
     
@@ -66,6 +72,8 @@ private:
 
   int64_t filter_in_rescale_delta_last;
 
+  bool setup_resampler();
+
 public:
 	VideoStore(const char *filename_in, const char *format_in, AVStream *video_input_stream, AVStream *audio_input_stream, int64_t nStartTime, Monitor * p_monitor );
 	~VideoStore();
diff --git a/zoneminder-config.cmake b/zoneminder-config.cmake
index 05da91ff0..3b35684b5 100644
--- a/zoneminder-config.cmake
+++ b/zoneminder-config.cmake
@@ -53,8 +53,8 @@
 #cmakedefine HAVE_LIBAVUTIL_MATHEMATICS_H 1
 #cmakedefine HAVE_LIBSWSCALE 1
 #cmakedefine HAVE_LIBSWSCALE_SWSCALE_H 1
-#cmakedefine HAVE_LIBSWRESAMPLE 1
-#cmakedefine HAVE_LIBSWRESAMPLE_SWRESAMPLE_H 1
+#cmakedefine HAVE_LIBAVRESAMPLE 1
+#cmakedefine HAVE_LIBAVRESAMPLE_AVRESAMPLE_H 1
 #cmakedefine HAVE_LIBVLC 1
 #cmakedefine HAVE_VLC_VLC_H 1
 #cmakedefine HAVE_LIBX264 1