Merge branch 'sample-rate'

a4525f59 · Stefan Westerfeld · af85c13c · af977c42 · a4525f59 · af85c13c
Commit a4525f59 authored Feb 04, 2019 by Stefan Westerfeld
9 changed files
--- a/Dockerfile
+++ b/Dockerfile
@@ -8,6 +8,7 @@ RUN apt-get install -y autoconf
 RUN apt-get install -y libtool
 RUN apt-get install -y autoconf-archive
 RUN apt-get install -y libgcrypt20-dev
+RUN apt-get install -y libzita-resampler-dev

 ADD . /audiowmark
 WORKDIR /audiowmark

--- a/README
+++ b/README
-Audio Watermarking
-
-(TODO)
-
-Building fftw
-
-audiowmark needs the single prevision variant of fftw3.
-
-If you are building fftw3 from source, use the `--enable-float`
-configure parameter to build it, e.g.::
-
-	cd ${FFTW3_SOURCE}
-	./configure --enable-float --enable-sse && \
-	make && \
-	sudo make install
-
-or, when building from git
-
-	cd ${FFTW3_GIT}
-	./bootstrap.sh --enable-shared --enable-sse --enable-float && \
-	make && \
-	sudo make install
-
-Docker Build
-
-You should be able to execute audiowmark via Docker.
-Example that outputs the usage message:
-
-  docker build -t audiowmark .
-  docker run -v <local-data-directory>:/data -it audiowmark -h
--- a/README.adoc
+++ b/README.adoc
+= audiowmark - Audio Watermarking
+
+== Description
+
+`audiowmark` is an Open Source solution for audio watermarking. A sound file
+(typically wav) is read by the software, and a 128-bit message is stored in a
+watermark in the output sound file. For human listeners, the files typically
+sound the same.
+
+However, the 128-bit message can be retrieved from the output sound file. Our
+tests show, that even if the file is converted to mp3 or ogg (with bitrates
+higher than 128 kbit/s), the watermark usually can be retrieved without
+problems. The process of retrieving the message does not need the original
+audio file (blind decoding).
+
+Internally, audiowmark is using the patchwork algorithm to hide the data in the
+spectrum of the audio file. Some pseoudo-randomly selected amplitudes of the
+frequency bands of a 1024-value FFTs are increased or decreased slightly, which
+can be detected later. The algorithm used here is inspired by
+
+  Martin Steinebach: Digitale Wasserzeichen für Audiodaten.
+  Darmstadt University of Technology 2004, ISBN 3-8322-2507-2
+
+== Adding/Retrieving a Watermark
+
+To add a watermark to the soundfile in.wav with a 128-bit message (which is
+specified as hex-string):
+
+  audiowmark add in.wav out.wav 0123456789abcdef0011223344556677
+
+To get the 128-bit message from the watermarked file, use:
+
+  audiowmark get out.wav
+
+== Watermark Key
+
+Since the software is Open Source, a watermarking key should be used to ensure
+that the message bits cannot be retrieved by somebody else (which would also
+allow removing the watermark without loss of quality). The watermark key
+controls all pseudo-random parameters of the algorithm. This means that
+it determines which frequency bands are increased or decreased to store a
+0 bit or a 1 bit. Without the key, it is impossible to decode the message
+bits from the audio file alone.
+
+Our watermarking key is a 128-bit AES key. A key can be generated using
+
+  audiowmark gen-key test.key
+
+and can be used for the add/get commands as follows:
+
+  audiowmark add --key test.key in.wav out.wav 0123456789abcdef0011223344556677
+  audiowmark get --key test.key out.wav
+
+== Dependencies
+
+If you compile from source, audiowmark needs the follwing libraries:
+
+* libfftw3
+* libsndfile
+* libgcrypt
+* libzita-resampler
+
+== Building fftw
+
+audiowmark needs the single prevision variant of fftw3.
+
+If you are building fftw3 from source, use the `--enable-float`
+configure parameter to build it, e.g.::
+
+	cd ${FFTW3_SOURCE}
+	./configure --enable-float --enable-sse && \
+	make && \
+	sudo make install
+
+or, when building from git
+
+	cd ${FFTW3_GIT}
+	./bootstrap.sh --enable-shared --enable-sse --enable-float && \
+	make && \
+	sudo make install
+
+== Docker Build
+
+You should be able to execute audiowmark via Docker.
+Example that outputs the usage message:
+
+  docker build -t audiowmark .
+  docker run -v <local-data-directory>:/data -it audiowmark -h
--- a/configure.ac
+++ b/configure.ac
@@ -17,6 +17,18 @@ AC_DEFUN([AC_SNDFILE_REQUIREMENTS],
    AC_SUBST(SNDFILE_LIBS)
 ])

+dnl
+dnl zita resampler
+dnl
+AC_DEFUN([AC_ZITA_REQUIREMENTS],
+[
+    AC_CHECK_LIB(zita-resampler, _Z28zita_resampler_major_versionv,[],
+      [
+        AC_MSG_ERROR([You need to install libzita-resampler to build this package.])
+      ]
+    )
+])
+
 dnl FFTW3
 AC_DEFUN([AC_FFTW_CHECK],
 [
@@ -45,6 +57,7 @@ AC_DEFUN([AC_FFTW_CHECK],
 ])

 AC_SNDFILE_REQUIREMENTS
+AC_ZITA_REQUIREMENTS
 AC_FFTW_CHECK
 AM_PATH_LIBGCRYPT


--- a/src/audiowmark.cc
+++ b/src/audiowmark.cc
--- a/src/ber-test.sh
+++ b/src/ber-test.sh
@@ -19,10 +19,8 @@ fi
    ls test/T*
  elif [ "x$AWM_SET" == "xbig" ]; then
    cat test_list
-  elif [ "x$AWM_SET" == "xhuge" ]; then
-    ls huge/T*
-  elif [ "x$AWM_SET" == "xhuge2" ]; then
-    ls huge2/T*
+  elif [ "x$AWM_SET" != "x" ] && [ -d "$AWM_SET" ] && [ -f "$AWM_SET/T001"*wav ]; then
+    ls $AWM_SET/T*
  else
    echo "bad AWM_SET $AWM_SET" >&2
    exit 1
@@ -62,12 +60,6 @@ do
      lame -b $2 ${AWM_FILE}.wav ${AWM_FILE}.mp3 --quiet
      rm ${AWM_FILE}.wav
      ffmpeg -i ${AWM_FILE}.mp3 ${AWM_FILE}.wav -v quiet -nostdin
-
-      # some (low) mpeg quality settings use a lower sample rate
-      if [ "x$(soxi -r ${AWM_FILE}.wav)" != "x44100" ]; then
-        sox ${AWM_FILE}.wav ${AWM_FILE}r.wav rate 44100
-        mv ${AWM_FILE}r.wav ${AWM_FILE}.wav
-      fi
    elif [ "x$TRANSFORM" == "xdouble-mp3" ]; then
      if [ "x$2" == "x" ]; then
        echo "need mp3 bitrate" >&2
@@ -82,12 +74,6 @@ do
      lame -b $2 ${AWM_FILE}.wav ${AWM_FILE}.mp3 --quiet
      rm ${AWM_FILE}.wav
      ffmpeg -i ${AWM_FILE}.mp3 ${AWM_FILE}.wav -v quiet -nostdin
-
-      # some (low) mpeg quality settings use a lower sample rate
-      if [ "x$(soxi -r ${AWM_FILE}.wav)" != "x44100" ]; then
-        sox ${AWM_FILE}.wav ${AWM_FILE}r.wav rate 44100
-        mv ${AWM_FILE}r.wav ${AWM_FILE}.wav
-      fi
    elif [ "x$TRANSFORM" == "xogg" ]; then
      if [ "x$2" == "x" ]; then
        echo "need ogg bitrate" >&2

--- a/src/random.cc
+++ b/src/random.cc
@@ -108,7 +108,7 @@ void
 Random::refill_buffer()
 {
  const size_t block_size = 256;
-  unsigned char zeros[block_size] = { 0, };
+  static unsigned char zeros[block_size] = { 0, };
  unsigned char cipher_text[block_size];

  gcry_error_t gcry_ret = gcry_cipher_encrypt (aes_ctr_cipher, cipher_text, block_size, zeros, block_size);

--- a/src/wavdata.cc
+++ b/src/wavdata.cc
@@ -17,11 +17,11 @@ WavData::WavData()
 {
 }

-WavData::WavData (const vector<float>& samples, int n_channels, float mix_freq, int bit_depth)
+WavData::WavData (const vector<float>& samples, int n_channels, int sample_rate, int bit_depth)
 {
  m_samples     = samples;
  m_n_channels  = n_channels;
-  m_mix_freq    = mix_freq;
+  m_sample_rate = sample_rate;
  m_bit_depth   = bit_depth;
 }

@@ -76,7 +76,7 @@ WavData::load (const string& filename)
  for (size_t i = 0; i < m_samples.size(); i++)
    m_samples[i] = isamples[i] * norm;

-  m_mix_freq    = sfinfo.samplerate;
+  m_sample_rate = sfinfo.samplerate;
  m_n_channels  = sfinfo.channels;

  switch (sfinfo.format & SF_FORMAT_SUBMASK)
@@ -121,7 +121,7 @@ WavData::save (const string& filename)
 {
  SF_INFO sfinfo = {0,};

-  sfinfo.samplerate = lrint (m_mix_freq);
+  sfinfo.samplerate = m_sample_rate;
  sfinfo.channels   = m_n_channels;

  if (m_bit_depth > 16)
@@ -179,10 +179,10 @@ WavData::save (const string& filename)
  return true;
 }

-float
-WavData::mix_freq() const
+int
+WavData::sample_rate() const
 {
-  return m_mix_freq;
+  return m_sample_rate;
 }

 int

--- a/src/wavdata.hh
+++ b/src/wavdata.hh
@@ -7,19 +7,19 @@
 class WavData
 {
  std::vector<float> m_samples;
-  float              m_mix_freq   = 0;
-  int                m_n_channels = 0;
-  int                m_bit_depth  = 0;
+  int                m_sample_rate = 0;
+  int                m_n_channels  = 0;
+  int                m_bit_depth   = 0;
  std::string        m_error_blurb;

 public:
  WavData();
-  WavData (const std::vector<float>& samples, int n_channels, float mix_freq, int bit_depth);
+  WavData (const std::vector<float>& samples, int n_channels, int sample_rate, int bit_depth);

  bool load (const std::string& filename);
  bool save (const std::string& filename);

-  float                       mix_freq() const;
+  int                         sample_rate() const;
  int                         bit_depth() const;
  const char                 *error_blurb() const;