summaryrefslogtreecommitdiffstats
path: root/remoting/codec/audio_decoder_speex.cc
blob: 7114844a72dda111f6602a82d0a443150e53bee3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "remoting/codec/audio_decoder_speex.h"

#include <string>

#include "base/basictypes.h"
#include "base/memory/scoped_ptr.h"
#include "base/logging.h"
#include "base/stl_util.h"
#include "remoting/proto/audio.pb.h"
#include "third_party/speex/include/speex/speex_callbacks.h"
#include "third_party/speex/include/speex/speex_stereo.h"

namespace remoting {

namespace {

// Upper bound on the number of data entries (one encoded frame each) that
// AudioDecoderSpeex::Decode() accepts in a single AudioPacket; packets with
// more entries are rejected with a warning.
// Hosts will never generate more than 100 frames in a single packet.
const int kMaxFramesPerPacket = 100;

}  // namespace

// Sets up a Speex decoder (using |speex_wb_mode|) together with the helper
// objects needed to turn its output into stereo. Every speex_decoder_ctl()
// request issued here must succeed; a non-zero result is fatal (CHECK).
AudioDecoderSpeex::AudioDecoderSpeex() {
  // Bit buffer that each encoded frame is loaded into before it is decoded.
  speex_bits_.reset(new SpeexBits());
  speex_bits_init(speex_bits_.get());

  // The decoder itself.
  speex_state_ = speex_decoder_init(&speex_wb_mode);

  // State used when expanding decoded frames to stereo.
  speex_stereo_state_ = speex_stereo_state_init();

  // Enable the perceptual enhancer. The audio sounds better with it, at the
  // price of further distorting the decoded samples.
  int enhancer = 1;
  int result = speex_decoder_ctl(speex_state_, SPEEX_SET_ENH, &enhancer);
  CHECK_EQ(result, 0);

  // Query the frame size so that the size of the output is known when
  // decoding frame by frame.
  result = speex_decoder_ctl(
      speex_state_, SPEEX_GET_FRAME_SIZE, &speex_frame_size_);
  CHECK_EQ(result, 0);

  // Describe the in-band stereo handler and register it with the decoder, so
  // that the decoder can get the intensity stereo information. The handler's
  // data pointer is the stereo state created above.
  speex_callback_.reset(new SpeexCallback());
  speex_callback_->callback_id = SPEEX_INBAND_STEREO;
  speex_callback_->func = speex_std_stereo_request_handler;
  speex_callback_->data = speex_stereo_state_;
  result = speex_decoder_ctl(
      speex_state_, SPEEX_SET_HANDLER, speex_callback_.get());
  CHECK_EQ(result, 0);
}

// Tears down the Speex objects that the constructor created: the stereo
// state, the decoder state, and the initialized bit buffer.
AudioDecoderSpeex::~AudioDecoderSpeex() {
  speex_stereo_state_destroy(speex_stereo_state_);
  speex_decoder_destroy(speex_state_);
  // Counterpart of the speex_bits_init() call in the constructor. The
  // SpeexBits object itself was allocated with new and handed to
  // |speex_bits_|.
  // NOTE(review): presumably |speex_bits_| is a scoped_ptr that deletes the
  // object after this body runs -- confirm against the header.
  speex_bits_destroy(speex_bits_.get());
}

// Decodes a Speex-encoded packet into a packet of raw samples.
//
// |packet| is accepted only if it is ENCODING_SPEEX, uses 2 bytes per sample,
// is stereo, has a sampling rate other than SAMPLING_RATE_INVALID, and holds
// at most kMaxFramesPerPacket data entries. Each data entry is decoded as one
// frame.
//
// Returns a new ENCODING_RAW packet that copies the sampling rate, sample
// width and channel count of |packet| and stores all decoded frames
// back-to-back in a single data entry. Returns a null scoped_ptr if |packet|
// is rejected or if decoding any frame fails.
scoped_ptr<AudioPacket> AudioDecoderSpeex::Decode(
    scoped_ptr<AudioPacket> packet) {
  const bool supported =
      (packet->encoding() == AudioPacket::ENCODING_SPEEX) &&
      (packet->bytes_per_sample() == AudioPacket::BYTES_PER_SAMPLE_2) &&
      (packet->sampling_rate() != AudioPacket::SAMPLING_RATE_INVALID) &&
      (packet->channels() == AudioPacket::CHANNELS_STEREO);
  if (!supported) {
    LOG(WARNING) << "Received an unsupported packet.";
    return scoped_ptr<AudioPacket>();
  }

  const int frame_count = packet->data_size();
  if (frame_count > kMaxFramesPerPacket) {
    LOG(WARNING) << "Received an packet with too many frames.";
    return scoped_ptr<AudioPacket>();
  }

  // The output packet mirrors the input format, but carries raw samples.
  scoped_ptr<AudioPacket> decoded_packet(new AudioPacket());
  decoded_packet->set_encoding(AudioPacket::ENCODING_RAW);
  decoded_packet->set_sampling_rate(packet->sampling_rate());
  decoded_packet->set_bytes_per_sample(packet->bytes_per_sample());
  decoded_packet->set_channels(packet->channels());

  // Number of int16 samples each frame occupies in the output once it has
  // been expanded to all channels.
  const int samples_per_frame = speex_frame_size_ * packet->channels();

  // One output buffer, sized up front to hold every decoded frame.
  std::string* decoded_data = decoded_packet->add_data();
  decoded_data->resize(
      frame_count * samples_per_frame * packet->bytes_per_sample());
  int16* const output =
      reinterpret_cast<int16*>(string_as_array(decoded_data));

  for (int frame = 0; frame < frame_count; ++frame) {
    int16* const frame_out = output + frame * samples_per_frame;

    // Load the encoded bytes of this frame into the bits structure.
    std::string* encoded_frame = packet->mutable_data(frame);
    speex_bits_read_from(speex_bits_.get(),
                         string_as_array(encoded_frame),
                         encoded_frame->size());

    // Decode the frame straight into its slot of the output buffer.
    if (speex_decode_int(speex_state_, speex_bits_.get(), frame_out) < 0) {
      LOG(ERROR) << "Error in decoding Speex data.";
      return scoped_ptr<AudioPacket>();
    }

    // Expand the decoded mono samples to stereo, in place.
    speex_decode_stereo_int(frame_out, speex_frame_size_, speex_stereo_state_);
  }

  return decoded_packet.Pass();
}

}  // namespace remoting