Commit 1f083c5a authored by Stefan Westerfeld

Move HLSOutputStream implementation to its own cc/hh file.

Signed-off-by: Stefan Westerfeld <stefan@space.twc.de>
parent 16500f19
@@ -5,7 +5,7 @@ COMMON_SRC = utils.hh utils.cc convcode.hh convcode.cc random.hh random.cc wavda
audiostream.cc audiostream.hh sfinputstream.cc sfinputstream.hh stdoutwavoutputstream.cc stdoutwavoutputstream.hh \
sfoutputstream.cc sfoutputstream.hh rawinputstream.cc rawinputstream.hh rawoutputstream.cc rawoutputstream.hh \
rawconverter.cc rawconverter.hh mp3inputstream.cc mp3inputstream.hh wmcommon.cc wmcommon.hh fft.cc fft.hh \
limiter.cc limiter.hh shortcode.cc shortcode.hh mpegts.cc mpegts.hh
limiter.cc limiter.hh shortcode.cc shortcode.hh mpegts.cc mpegts.hh hlsoutputstream.cc hlsoutputstream.hh
COMMON_LIBS = $(SNDFILE_LIBS) $(FFTW_LIBS) $(LIBGCRYPT_LIBS) $(LIBMPG123_LIBS) $(FFMPEG_LIBS)
audiowmark_SOURCES = audiowmark.cc wmget.cc wmadd.cc $(COMMON_SRC)
......
/*
* Copyright (C) 2018-2020 Stefan Westerfeld
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
#include "hlsoutputstream.hh"
/* HLSOutputStream is based on code from ffmpeg: doc/examples/muxing.c */
/*
* Copyright (c) 2003 Fabrice Bellard
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
* THE SOFTWARE.
*/
using std::vector;
using std::string;
using std::min;
HLSOutputStream::HLSOutputStream (int n_channels, int sample_rate, int bit_depth) :
m_bit_depth (bit_depth),
m_sample_rate (sample_rate),
m_n_channels (n_channels),
m_audio_buffer (n_channels)
{
}
/* Add an output stream. */
void
HLSOutputStream::add_stream (AVCodec **codec, enum AVCodecID codec_id)
{
AVCodecContext *c;
int i;
/* find the encoder */
*codec = avcodec_find_encoder(codec_id);
if (!(*codec)) {
fprintf(stderr, "Could not find encoder for '%s'\n",
avcodec_get_name(codec_id));
exit(1);
}
m_st = avformat_new_stream (m_fmt_ctx, NULL);
if (!m_st) {
fprintf(stderr, "Could not allocate stream\n");
exit(1);
}
m_st->id = m_fmt_ctx->nb_streams - 1;
c = avcodec_alloc_context3(*codec);
if (!c) {
fprintf(stderr, "Could not alloc an encoding context\n");
exit(1);
}
m_enc = c;
switch ((*codec)->type) {
case AVMEDIA_TYPE_AUDIO:
c->sample_fmt = (*codec)->sample_fmts ?
(*codec)->sample_fmts[0] : AV_SAMPLE_FMT_FLTP;
c->bit_rate = 128000;
c->sample_rate = 44100;
if ((*codec)->supported_samplerates) {
c->sample_rate = (*codec)->supported_samplerates[0];
for (i = 0; (*codec)->supported_samplerates[i]; i++) {
if ((*codec)->supported_samplerates[i] == 44100)
c->sample_rate = 44100;
}
}
c->channels = av_get_channel_layout_nb_channels(c->channel_layout);
c->channel_layout = AV_CH_LAYOUT_STEREO;
if ((*codec)->channel_layouts) {
c->channel_layout = (*codec)->channel_layouts[0];
for (i = 0; (*codec)->channel_layouts[i]; i++) {
if ((*codec)->channel_layouts[i] == AV_CH_LAYOUT_STEREO)
c->channel_layout = AV_CH_LAYOUT_STEREO;
}
}
c->channels = av_get_channel_layout_nb_channels(c->channel_layout);
m_st->time_base = (AVRational){ 1, c->sample_rate };
break;
default:
break;
}
/* Some formats want stream headers to be separate. */
if (m_fmt_ctx->oformat->flags & AVFMT_GLOBALHEADER)
c->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
}
AVFrame *
HLSOutputStream::alloc_audio_frame(enum AVSampleFormat sample_fmt, uint64_t channel_layout, int sample_rate, int nb_samples)
{
AVFrame *frame = av_frame_alloc();
int ret;
if (!frame) {
fprintf(stderr, "Error allocating an audio frame\n");
exit(1);
}
frame->format = sample_fmt;
frame->channel_layout = channel_layout;
frame->sample_rate = sample_rate;
frame->nb_samples = nb_samples;
if (nb_samples) {
ret = av_frame_get_buffer(frame, 0);
if (ret < 0) {
fprintf(stderr, "Error allocating an audio buffer\n");
exit(1);
}
}
return frame;
}
void
HLSOutputStream::open_audio (AVCodec *codec, AVDictionary *opt_arg)
{
AVCodecContext *c;
int nb_samples;
int ret;
AVDictionary *opt = NULL;
c = m_enc;
/* open it */
av_dict_copy(&opt, opt_arg, 0);
ret = avcodec_open2(c, codec, &opt);
av_dict_free(&opt);
if (ret < 0) {
fprintf(stderr, "Could not open audio codec: %s\n", av_err2str(ret));
exit(1);
}
if (c->codec->capabilities & AV_CODEC_CAP_VARIABLE_FRAME_SIZE)
nb_samples = 10000;
else
nb_samples = c->frame_size;
m_frame = alloc_audio_frame(c->sample_fmt, c->channel_layout,
c->sample_rate, nb_samples);
m_tmp_frame = alloc_audio_frame(AV_SAMPLE_FMT_S16, c->channel_layout,
c->sample_rate, nb_samples);
/* copy the stream parameters to the muxer */
ret = avcodec_parameters_from_context(m_st->codecpar, c);
if (ret < 0) {
fprintf(stderr, "Could not copy the stream parameters\n");
exit(1);
}
/* create resampler context */
m_swr_ctx = swr_alloc();
if (!m_swr_ctx) {
fprintf(stderr, "Could not allocate resampler context\n");
exit(1);
}
/* set options */
av_opt_set_int (m_swr_ctx, "in_channel_count", c->channels, 0);
av_opt_set_int (m_swr_ctx, "in_sample_rate", c->sample_rate, 0);
av_opt_set_sample_fmt(m_swr_ctx, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
av_opt_set_int (m_swr_ctx, "out_channel_count", c->channels, 0);
av_opt_set_int (m_swr_ctx, "out_sample_rate", c->sample_rate, 0);
av_opt_set_sample_fmt(m_swr_ctx, "out_sample_fmt", c->sample_fmt, 0);
/* initialize the resampling context */
if ((ret = swr_init(m_swr_ctx)) < 0) {
fprintf(stderr, "Failed to initialize the resampling context\n");
exit(1);
}
}
/* Prepare a 16 bit dummy audio frame of 'frame_size' samples and
* 'nb_channels' channels. */
AVFrame *
HLSOutputStream::get_audio_frame()
{
AVFrame *frame = m_tmp_frame;
int j, i;
int16_t *q = (int16_t*)frame->data[0];
if (m_audio_buffer.can_read_frames() < size_t (frame->nb_samples))
return NULL;
vector<float> samples = m_audio_buffer.read_frames (frame->nb_samples);
size_t t = 0;
for (j = 0; j < frame->nb_samples; j++)
{
for (i = 0; i < m_enc->channels; i++)
{
if (t < samples.size())
{
*q++ = (int)(samples[t] * 32768);
t++;
}
else
*q++ = 0;
}
}
frame->pts = m_next_pts;
m_next_pts += frame->nb_samples;
return frame;
}
int
HLSOutputStream::write_frame (const AVRational *time_base, AVStream *st, AVPacket *pkt)
{
/* rescale output packet timestamp values from codec to stream timebase */
av_packet_rescale_ts(pkt, *time_base, st->time_base);
pkt->stream_index = st->index;
/* Write the compressed frame to the media file. */
return av_interleaved_write_frame (m_fmt_ctx, pkt);
}
/*
* encode one audio frame and send it to the muxer
* return 1 when encoding is finished, 0 otherwise
*/
int
HLSOutputStream::write_audio_frame()
{
AVCodecContext *c;
AVPacket pkt = { 0 }; // data and size must be 0;
AVFrame *frame;
int ret;
int got_packet;
int dst_nb_samples;
av_init_packet(&pkt);
c = m_enc;
frame = get_audio_frame();
if (frame) {
/* convert samples from native format to destination codec format, using the resampler */
/* compute destination number of samples */
dst_nb_samples = av_rescale_rnd(swr_get_delay(m_swr_ctx, c->sample_rate) + frame->nb_samples,
c->sample_rate, c->sample_rate, AV_ROUND_UP);
av_assert0(dst_nb_samples == frame->nb_samples);
/* when we pass a frame to the encoder, it may keep a reference to it
* internally;
* make sure we do not overwrite it here
*/
ret = av_frame_make_writable(m_frame);
if (ret < 0)
exit(1);
/* convert to destination format */
ret = swr_convert(m_swr_ctx,
m_frame->data, dst_nb_samples,
(const uint8_t **)frame->data, frame->nb_samples);
if (ret < 0) {
fprintf(stderr, "Error while converting\n");
exit(1);
}
frame = m_frame;
frame->pts = av_rescale_q(m_samples_count + m_start_pos, (AVRational){1, c->sample_rate}, c->time_base);
m_samples_count += dst_nb_samples;
}
ret = avcodec_encode_audio2(c, &pkt, frame, &got_packet);
if (ret < 0) {
fprintf(stderr, "Error encoding audio frame: %s\n", av_err2str(ret));
exit(1);
}
if (got_packet)
{
if (m_cut_aac_frames)
{
m_cut_aac_frames--;
}
else if (m_keep_aac_frames)
{
ret = write_frame (&c->time_base, m_st, &pkt);
if (ret < 0)
{
fprintf(stderr, "Error while writing audio frame: %s\n",
av_err2str(ret));
exit(1);
}
m_keep_aac_frames--;
}
}
return (frame || got_packet) ? 0 : 1;
}
void
HLSOutputStream::close_stream()
{
avcodec_free_context(&m_enc);
av_frame_free(&m_frame);
av_frame_free(&m_tmp_frame);
swr_free(&m_swr_ctx);
}
Error
HLSOutputStream::open (const string& out_filename, size_t cut_aac_frames, size_t keep_aac_frames, double pts_start, size_t delete_input_start)
{
avformat_alloc_output_context2 (&m_fmt_ctx, NULL, "mpegts", NULL);
if (!m_fmt_ctx)
return Error ("failed to alloc avformat output context");
string filename = out_filename;
if (filename == "-")
filename = "pipe:1";
int ret = avio_open (&m_fmt_ctx->pb, filename.c_str(), AVIO_FLAG_WRITE);
if (ret < 0)
{
error ("Could not open output: %s\n", av_err2str (ret));
return Error ("open hls output failed");
}
AVDictionary *opt = nullptr;
AVCodec *audio_codec;
add_stream (&audio_codec, AV_CODEC_ID_AAC);
open_audio (audio_codec, opt);
/* Write the stream header, if any. */
ret = avformat_write_header (m_fmt_ctx, &opt);
if (ret < 0)
{
error ("Error occurred when writing output file: %s\n", av_err2str(ret));
return Error ("avformat_write_header failed\n");
}
av_dump_format (m_fmt_ctx, 0, filename.c_str(), 1);
m_delete_input_start = delete_input_start;
m_cut_aac_frames = cut_aac_frames;
m_keep_aac_frames = keep_aac_frames;
// FIXME: correct?
m_start_pos = pts_start * m_sample_rate - cut_aac_frames * 1024;
m_start_pos += 1024;
return Error::Code::NONE;
}
Error
HLSOutputStream::close()
{
write(); // drain
av_write_trailer (m_fmt_ctx);
close_stream();
/* Close the output file. */
if (!(m_fmt_ctx->oformat->flags & AVFMT_NOFILE))
avio_closep (&m_fmt_ctx->pb);
/* free the stream */
avformat_free_context (m_fmt_ctx);
return Error::Code::NONE;
}
void
HLSOutputStream::write()
{
while (write_audio_frame() == 0);
}
Error
HLSOutputStream::write_frames (const std::vector<float>& frames)
{
// if we don't need any more aac frames, just throw away samples (save cpu cycles)
if (m_keep_aac_frames == 0)
return Error::Code::NONE;
m_audio_buffer.write_frames (frames);
size_t delete_input = min (m_delete_input_start, m_audio_buffer.can_read_frames());
if (delete_input)
{
m_audio_buffer.read_frames (delete_input);
m_delete_input_start -= delete_input;
}
while (m_audio_buffer.can_read_frames() >= 1024)
{
write_audio_frame();
}
return Error::Code::NONE;
}
int
HLSOutputStream::bit_depth() const
{
return m_bit_depth;
}
int
HLSOutputStream::sample_rate() const
{
return m_sample_rate;
}
int
HLSOutputStream::n_channels() const
{
return m_n_channels;
}
/*
* Copyright (C) 2018-2020 Stefan Westerfeld
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
#ifndef AUDIOWMARK_HLS_OUTPUT_STREAM_HH
#define AUDIOWMARK_HLS_OUTPUT_STREAM_HH
#include "audiostream.hh"
#include <assert.h>
extern "C" {
#include <libavformat/avformat.h>
#include <libavutil/opt.h>
#include <libswresample/swresample.h>
#include <libavutil/avassert.h>
#include <libavutil/timestamp.h>
#undef av_err2str
#define av_err2str(errnum) av_make_error_string((char*)__builtin_alloca(AV_ERROR_MAX_STRING_SIZE), AV_ERROR_MAX_STRING_SIZE, errnum)
}
/* FIXME: fix duplication with wmadd.cc */
class AudioBuffer
{
const int n_channels = 0;
std::vector<float> buffer;
public:
AudioBuffer (int n_channels) :
n_channels (n_channels)
{
}
void
write_frames (const std::vector<float>& samples)
{
buffer.insert (buffer.end(), samples.begin(), samples.end());
}
std::vector<float>
read_frames (size_t frames)
{
assert (frames * n_channels <= buffer.size());
const auto begin = buffer.begin();
const auto end = begin + frames * n_channels;
std::vector<float> result (begin, end);
buffer.erase (begin, end);
return result;
}
size_t
can_read_frames() const
{
return buffer.size() / n_channels;
}
};
class HLSOutputStream : public AudioOutputStream {
AVStream *m_st = nullptr;
AVCodecContext *m_enc = nullptr;
AVFormatContext *m_fmt_ctx = nullptr;
/* pts of the next frame that will be generated */
int64_t m_next_pts = 0;
int m_samples_count = 0;
int m_start_pos = 0;
AVFrame *m_frame = nullptr;
AVFrame *m_tmp_frame = nullptr;
size_t m_cut_aac_frames = 0;
size_t m_keep_aac_frames = 0;
SwrContext *m_swr_ctx = nullptr;
int m_bit_depth = 0;
int m_sample_rate = 0;
int m_n_channels = 0;
AudioBuffer m_audio_buffer;
size_t m_delete_input_start = 0;
void add_stream (AVCodec **codec, enum AVCodecID codec_id);
void open_audio (AVCodec *codec, AVDictionary *opt_arg);
AVFrame *get_audio_frame();
int write_audio_frame();
void close_stream();
AVFrame *alloc_audio_frame(enum AVSampleFormat sample_fmt, uint64_t channel_layout, int sample_rate, int nb_samples);
int write_frame (const AVRational *time_base, AVStream *st, AVPacket *pkt);
public:
HLSOutputStream (int n_channels, int sample_rate, int bit_depth);
Error open (const std::string& output_filename, size_t cut_aac_frames, size_t keep_aac_frames, double pts_start, size_t delete_input_start);
int bit_depth() const override;
int sample_rate() const override;
int n_channels() const override;
Error write_frames (const std::vector<float>& frames) override;
void write();
Error close();
};
#endif /* AUDIOWMARK_HLS_OUTPUT_STREAM_HH */
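For orientation, a minimal, hypothetical sketch of how a caller might drive HLSOutputStream through this new header. The file name "segment.ts", the frame counts, the use of main(), and the assumption that Error converts to true on failure (as elsewhere in audiowmark) are illustrative only and not part of this commit:

#include "hlsoutputstream.hh"

#include <vector>

int
main()
{
  // 2 channels, 44100 Hz, 16 bit; add_stream() configures the AAC encoder
  // for stereo at 44100 Hz internally
  HLSOutputStream out_stream (2, 44100, 16);

  // encode one segment: drop the first 2 AAC frames, keep the next 100
  Error err = out_stream.open ("segment.ts",
                               /* cut_aac_frames */ 2,
                               /* keep_aac_frames */ 100,
                               /* pts_start */ 0.0,
                               /* delete_input_start */ 0);
  if (err)  /* assumes Error's bool conversion signals failure */
    return 1;

  // feed interleaved float frames; write_frames() encodes whenever 1024
  // samples per channel are buffered, close() drains the encoder and
  // writes the mpegts trailer
  std::vector<float> silence (2 * 1024, 0.f);
  for (int i = 0; i < 200; i++)
    out_stream.write_frames (silence);

  out_stream.close();
  return 0;
}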
/*
* Copyright (C) 2018-2020 Stefan Westerfeld
*
* This program is free software: you can redistribute it and/or modify
@@ -25,16 +25,7 @@
#include "wavdata.hh"
#include "wmcommon.hh"
#include "sfinputstream.hh"
extern "C" {
#include <libavformat/avformat.h>
#include <libavutil/opt.h>
#include <libswresample/swresample.h>
#include <libavutil/avassert.h>
#include <libavutil/timestamp.h>
#undef av_err2str
#define av_err2str(errnum) av_make_error_string((char*)__builtin_alloca(AV_ERROR_MAX_STRING_SIZE), AV_ERROR_MAX_STRING_SIZE, errnum)
}
#include "hlsoutputstream.hh"
using std::string;
using std::regex;
@@ -84,506 +75,6 @@ ff_decode (const string& filename, WavData& out_wav_data)
return err;
}
/*------------------------------- start code from ffmpeg...muxing.c -------------------------------*/
/*
* Copyright (c) 2003 Fabrice Bellard
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
* THE SOFTWARE.
*/
class AudioBuffer
{
const int n_channels = 0;
vector<float> buffer;
public:
AudioBuffer (int n_channels) :
n_channels (n_channels)
{
}
void
write_frames (const vector<float>& samples)
{
buffer.insert (buffer.end(), samples.begin(), samples.end());
}
vector<float>
read_frames (size_t frames)
{
assert (frames * n_channels <= buffer.size());
const auto begin = buffer.begin();
const auto end = begin + frames * n_channels;
vector<float> result (begin, end);
buffer.erase (begin, end);
return result;
}
size_t
can_read_frames() const
{
return buffer.size() / n_channels;
}
};
// a wrapper around a single output AVStream
class HLSOutputStream : public AudioOutputStream {
AVStream *m_st = nullptr;
AVCodecContext *m_enc = nullptr;
AVFormatContext *m_fmt_ctx = nullptr;
/* pts of the next frame that will be generated */
int64_t m_next_pts = 0;
int m_samples_count = 0;
int m_start_pos = 0;
AVFrame *m_frame = nullptr;
AVFrame *m_tmp_frame = nullptr;
size_t m_cut_aac_frames = 0;
size_t m_keep_aac_frames = 0;
SwrContext *m_swr_ctx = nullptr;
int m_bit_depth = 0;
int m_sample_rate = 0;
int m_n_channels = 0;
AudioBuffer m_audio_buffer;
size_t m_delete_input_start = 0;
void add_stream (AVCodec **codec, enum AVCodecID codec_id);
void open_audio (AVCodec *codec, AVDictionary *opt_arg);
AVFrame *get_audio_frame();
int write_audio_frame();
void close_stream();
AVFrame *alloc_audio_frame(enum AVSampleFormat sample_fmt, uint64_t channel_layout, int sample_rate, int nb_samples);
int write_frame (const AVRational *time_base, AVStream *st, AVPacket *pkt);
public:
HLSOutputStream (int n_channels, int sample_rate, int bit_depth);
Error open (const string& output_filename, size_t cut_aac_frames, size_t keep_aac_frames, double pts_start, size_t delete_input_start);
int bit_depth() const override;
int sample_rate() const override;
int n_channels() const override;
Error write_frames (const std::vector<float>& frames) override;
void write();
Error close();
};
HLSOutputStream::HLSOutputStream (int n_channels, int sample_rate, int bit_depth) :
m_bit_depth (bit_depth),
m_sample_rate (sample_rate),
m_n_channels (n_channels),
m_audio_buffer (n_channels)
{
}
/* Add an output stream. */
void
HLSOutputStream::add_stream (AVCodec **codec, enum AVCodecID codec_id)
{
AVCodecContext *c;
int i;
/* find the encoder */
*codec = avcodec_find_encoder(codec_id);
if (!(*codec)) {
fprintf(stderr, "Could not find encoder for '%s'\n",
avcodec_get_name(codec_id));
exit(1);
}
m_st = avformat_new_stream (m_fmt_ctx, NULL);
if (!m_st) {
fprintf(stderr, "Could not allocate stream\n");
exit(1);
}
m_st->id = m_fmt_ctx->nb_streams - 1;
c = avcodec_alloc_context3(*codec);
if (!c) {
fprintf(stderr, "Could not alloc an encoding context\n");
exit(1);
}
m_enc = c;
switch ((*codec)->type) {
case AVMEDIA_TYPE_AUDIO:
c->sample_fmt = (*codec)->sample_fmts ?
(*codec)->sample_fmts[0] : AV_SAMPLE_FMT_FLTP;
c->bit_rate = 128000;
c->sample_rate = 44100;
if ((*codec)->supported_samplerates) {
c->sample_rate = (*codec)->supported_samplerates[0];
for (i = 0; (*codec)->supported_samplerates[i]; i++) {
if ((*codec)->supported_samplerates[i] == 44100)
c->sample_rate = 44100;
}
}
c->channels = av_get_channel_layout_nb_channels(c->channel_layout);
c->channel_layout = AV_CH_LAYOUT_STEREO;
if ((*codec)->channel_layouts) {
c->channel_layout = (*codec)->channel_layouts[0];
for (i = 0; (*codec)->channel_layouts[i]; i++) {
if ((*codec)->channel_layouts[i] == AV_CH_LAYOUT_STEREO)
c->channel_layout = AV_CH_LAYOUT_STEREO;
}
}
c->channels = av_get_channel_layout_nb_channels(c->channel_layout);
m_st->time_base = (AVRational){ 1, c->sample_rate };
break;
default:
break;
}
/* Some formats want stream headers to be separate. */
if (m_fmt_ctx->oformat->flags & AVFMT_GLOBALHEADER)
c->flags |= AV_CODEC_FLAG_GLOBAL_HEADER;
}
AVFrame *
HLSOutputStream::alloc_audio_frame(enum AVSampleFormat sample_fmt, uint64_t channel_layout, int sample_rate, int nb_samples)
{
AVFrame *frame = av_frame_alloc();
int ret;
if (!frame) {
fprintf(stderr, "Error allocating an audio frame\n");
exit(1);
}
frame->format = sample_fmt;
frame->channel_layout = channel_layout;
frame->sample_rate = sample_rate;
frame->nb_samples = nb_samples;
if (nb_samples) {
ret = av_frame_get_buffer(frame, 0);
if (ret < 0) {
fprintf(stderr, "Error allocating an audio buffer\n");
exit(1);
}
}
return frame;
}
void
HLSOutputStream::open_audio (AVCodec *codec, AVDictionary *opt_arg)
{
AVCodecContext *c;
int nb_samples;
int ret;
AVDictionary *opt = NULL;
c = m_enc;
/* open it */
av_dict_copy(&opt, opt_arg, 0);
ret = avcodec_open2(c, codec, &opt);
av_dict_free(&opt);
if (ret < 0) {
fprintf(stderr, "Could not open audio codec: %s\n", av_err2str(ret));
exit(1);
}
if (c->codec->capabilities & AV_CODEC_CAP_VARIABLE_FRAME_SIZE)
nb_samples = 10000;
else
nb_samples = c->frame_size;
m_frame = alloc_audio_frame(c->sample_fmt, c->channel_layout,
c->sample_rate, nb_samples);
m_tmp_frame = alloc_audio_frame(AV_SAMPLE_FMT_S16, c->channel_layout,
c->sample_rate, nb_samples);
/* copy the stream parameters to the muxer */
ret = avcodec_parameters_from_context(m_st->codecpar, c);
if (ret < 0) {
fprintf(stderr, "Could not copy the stream parameters\n");
exit(1);
}
/* create resampler context */
m_swr_ctx = swr_alloc();
if (!m_swr_ctx) {
fprintf(stderr, "Could not allocate resampler context\n");
exit(1);
}
/* set options */
av_opt_set_int (m_swr_ctx, "in_channel_count", c->channels, 0);
av_opt_set_int (m_swr_ctx, "in_sample_rate", c->sample_rate, 0);
av_opt_set_sample_fmt(m_swr_ctx, "in_sample_fmt", AV_SAMPLE_FMT_S16, 0);
av_opt_set_int (m_swr_ctx, "out_channel_count", c->channels, 0);
av_opt_set_int (m_swr_ctx, "out_sample_rate", c->sample_rate, 0);
av_opt_set_sample_fmt(m_swr_ctx, "out_sample_fmt", c->sample_fmt, 0);
/* initialize the resampling context */
if ((ret = swr_init(m_swr_ctx)) < 0) {
fprintf(stderr, "Failed to initialize the resampling context\n");
exit(1);
}
}
/* Prepare a 16 bit dummy audio frame of 'frame_size' samples and
* 'nb_channels' channels. */
AVFrame *
HLSOutputStream::get_audio_frame()
{
AVFrame *frame = m_tmp_frame;
int j, i;
int16_t *q = (int16_t*)frame->data[0];
if (m_audio_buffer.can_read_frames() < size_t (frame->nb_samples))
return NULL;
vector<float> samples = m_audio_buffer.read_frames (frame->nb_samples);
size_t t = 0;
for (j = 0; j < frame->nb_samples; j++)
{
for (i = 0; i < m_enc->channels; i++)
{
if (t < samples.size())
{
*q++ = (int)(samples[t] * 32768);
t++;
}
else
*q++ = 0;
}
}
frame->pts = m_next_pts;
m_next_pts += frame->nb_samples;
return frame;
}
int
HLSOutputStream::write_frame (const AVRational *time_base, AVStream *st, AVPacket *pkt)
{
/* rescale output packet timestamp values from codec to stream timebase */
av_packet_rescale_ts(pkt, *time_base, st->time_base);
pkt->stream_index = st->index;
/* Write the compressed frame to the media file. */
return av_interleaved_write_frame (m_fmt_ctx, pkt);
}
/*
* encode one audio frame and send it to the muxer
* return 1 when encoding is finished, 0 otherwise
*/
int
HLSOutputStream::write_audio_frame()
{
AVCodecContext *c;
AVPacket pkt = { 0 }; // data and size must be 0;
AVFrame *frame;
int ret;
int got_packet;
int dst_nb_samples;
av_init_packet(&pkt);
c = m_enc;
frame = get_audio_frame();
if (frame) {
/* convert samples from native format to destination codec format, using the resampler */
/* compute destination number of samples */
dst_nb_samples = av_rescale_rnd(swr_get_delay(m_swr_ctx, c->sample_rate) + frame->nb_samples,
c->sample_rate, c->sample_rate, AV_ROUND_UP);
av_assert0(dst_nb_samples == frame->nb_samples);
/* when we pass a frame to the encoder, it may keep a reference to it
* internally;
* make sure we do not overwrite it here
*/
ret = av_frame_make_writable(m_frame);
if (ret < 0)
exit(1);
/* convert to destination format */
ret = swr_convert(m_swr_ctx,
m_frame->data, dst_nb_samples,
(const uint8_t **)frame->data, frame->nb_samples);
if (ret < 0) {
fprintf(stderr, "Error while converting\n");
exit(1);
}
frame = m_frame;
frame->pts = av_rescale_q(m_samples_count + m_start_pos, (AVRational){1, c->sample_rate}, c->time_base);
m_samples_count += dst_nb_samples;
}
ret = avcodec_encode_audio2(c, &pkt, frame, &got_packet);
if (ret < 0) {
fprintf(stderr, "Error encoding audio frame: %s\n", av_err2str(ret));
exit(1);
}
if (got_packet)
{
if (m_cut_aac_frames)
{
m_cut_aac_frames--;
}
else if (m_keep_aac_frames)
{
ret = write_frame (&c->time_base, m_st, &pkt);
if (ret < 0)
{
fprintf(stderr, "Error while writing audio frame: %s\n",
av_err2str(ret));
exit(1);
}
m_keep_aac_frames--;
}
}
return (frame || got_packet) ? 0 : 1;
}
void
HLSOutputStream::close_stream()
{
avcodec_free_context(&m_enc);
av_frame_free(&m_frame);
av_frame_free(&m_tmp_frame);
swr_free(&m_swr_ctx);
}
Error
HLSOutputStream::open (const string& out_filename, size_t cut_aac_frames, size_t keep_aac_frames, double pts_start, size_t delete_input_start)
{
avformat_alloc_output_context2 (&m_fmt_ctx, NULL, "mpegts", NULL);
if (!m_fmt_ctx)
return Error ("failed to alloc avformat output context");
string filename = out_filename;
if (filename == "-")
filename = "pipe:1";
int ret = avio_open (&m_fmt_ctx->pb, filename.c_str(), AVIO_FLAG_WRITE);
if (ret < 0)
{
error ("Could not open output: %s\n", av_err2str (ret));
return Error ("open hls output failed");
}
AVDictionary *opt = nullptr;
AVCodec *audio_codec;
add_stream (&audio_codec, AV_CODEC_ID_AAC);
open_audio (audio_codec, opt);
/* Write the stream header, if any. */
ret = avformat_write_header (m_fmt_ctx, &opt);
if (ret < 0)
{
error ("Error occurred when writing output file: %s\n", av_err2str(ret));
return Error ("avformat_write_header failed\n");
}
av_dump_format (m_fmt_ctx, 0, filename.c_str(), 1);
m_delete_input_start = delete_input_start;
m_cut_aac_frames = cut_aac_frames;
m_keep_aac_frames = keep_aac_frames;
// FIXME: correct?
m_start_pos = pts_start * m_sample_rate - cut_aac_frames * 1024;
m_start_pos += 1024;
return Error::Code::NONE;
}
Error
HLSOutputStream::close()
{
write(); // drain
av_write_trailer (m_fmt_ctx);
close_stream();
/* Close the output file. */
if (!(m_fmt_ctx->oformat->flags & AVFMT_NOFILE))
avio_closep (&m_fmt_ctx->pb);
/* free the stream */
avformat_free_context (m_fmt_ctx);
return Error::Code::NONE;
}
void
HLSOutputStream::write()
{
while (write_audio_frame() == 0);
}
Error
HLSOutputStream::write_frames (const std::vector<float>& frames)
{
// if we don't need any more aac frames, just throw away samples (save cpu cycles)
if (m_keep_aac_frames == 0)
return Error::Code::NONE;
m_audio_buffer.write_frames (frames);
size_t delete_input = min (m_delete_input_start, m_audio_buffer.can_read_frames());
if (delete_input)
{
m_audio_buffer.read_frames (delete_input);
m_delete_input_start -= delete_input;
}
while (m_audio_buffer.can_read_frames() >= 1024)
{
write_audio_frame();
}
return Error::Code::NONE;
}
int
HLSOutputStream::bit_depth() const
{
return m_bit_depth;
}
int
HLSOutputStream::sample_rate() const
{
return m_sample_rate;
}
int
HLSOutputStream::n_channels() const
{
return m_n_channels;
}
int
hls_embed_context (const string& in_dir, const string& out_dir, const string& filename, const string& audio_master)
{
......