/*
 *  Copyright 2017 The WebRTC project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */

#include "sdk/android/src/jni/videoencoderwrapper.h"

#include <utility>

#include "common_video/h264/h264_common.h"
#include "modules/include/module_common_types.h"
#include "modules/video_coding/include/video_codec_interface.h"
#include "modules/video_coding/include/video_error_codes.h"
#include "modules/video_coding/utility/vp8_header_parser.h"
#include "modules/video_coding/utility/vp9_uncompressed_header_parser.h"
#include "rtc_base/logging.h"
#include "rtc_base/random.h"
#include "rtc_base/timeutils.h"
#include "sdk/android/generated_video_jni/jni/VideoCodecStatus_jni.h"
#include "sdk/android/generated_video_jni/jni/VideoEncoderWrapper_jni.h"
#include "sdk/android/generated_video_jni/jni/VideoEncoder_jni.h"
#include "sdk/android/src/jni/class_loader.h"

namespace webrtc {
namespace jni {

static const int kMaxJavaEncoderResets = 3;

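// Wraps a Java org.webrtc.VideoEncoder so it can be used through the native
// webrtc::VideoEncoder interface. The constructor caches the Java class
// references it needs and seeds picture_id_ and tl0_pic_idx_ with random
// starting values.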
VideoEncoderWrapper::VideoEncoderWrapper(JNIEnv* jni, jobject j_encoder)
    : encoder_(jni, j_encoder),
      frame_type_class_(jni,
                        GetClass(jni, "org/webrtc/EncodedImage$FrameType")),
      int_array_class_(jni, jni->FindClass("[I")),
      video_frame_factory_(jni) {
  implementation_name_ = GetImplementationName(jni);

  initialized_ = false;
  num_resets_ = 0;

  Random random(rtc::TimeMicros());
  picture_id_ = random.Rand<uint16_t>() & 0x7FFF;
  tl0_pic_idx_ = random.Rand<uint8_t>();
}

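// Stores the codec settings, remembers the task queue InitEncode() is called
// on (encoded frames are later delivered back on it), and delegates to
// InitEncodeInternal().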
int32_t VideoEncoderWrapper::InitEncode(const VideoCodec* codec_settings,
                                        int32_t number_of_cores,
                                        size_t max_payload_size) {
  JNIEnv* jni = AttachCurrentThreadIfNeeded();
  ScopedLocalRefFrame local_ref_frame(jni);

  number_of_cores_ = number_of_cores;
  codec_settings_ = *codec_settings;
  num_resets_ = 0;
  encoder_queue_ = rtc::TaskQueue::Current();

  return InitEncodeInternal(jni);
}

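// Builds the Java Settings and Callback objects and calls
// VideoEncoder.initEncode() on the wrapped encoder. Automatic resize is taken
// from the VP8/VP9-specific settings and defaults to true for other codecs.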
int32_t VideoEncoderWrapper::InitEncodeInternal(JNIEnv* jni) {
  bool automatic_resize_on;
  switch (codec_settings_.codecType) {
    case kVideoCodecVP8:
      automatic_resize_on = codec_settings_.VP8()->automaticResizeOn;
      break;
    case kVideoCodecVP9:
      automatic_resize_on = codec_settings_.VP9()->automaticResizeOn;
      break;
    default:
      automatic_resize_on = true;
  }

  jobject settings = Java_VideoEncoderWrapper_createSettings(
      jni, number_of_cores_, codec_settings_.width, codec_settings_.height,
      codec_settings_.startBitrate, codec_settings_.maxFramerate,
      automatic_resize_on);

  jobject callback = Java_VideoEncoderWrapper_createEncoderCallback(
      jni, jlongFromPointer(this));

  jobject ret =
      Java_VideoEncoder_initEncode(jni, *encoder_, settings, callback);

  if (Java_VideoCodecStatus_getNumber(jni, ret) == WEBRTC_VIDEO_CODEC_OK) {
    initialized_ = true;
  }

  return HandleReturnCode(jni, ret);
}

int32_t VideoEncoderWrapper::RegisterEncodeCompleteCallback(
    EncodedImageCallback* callback) {
  callback_ = callback;
  return WEBRTC_VIDEO_CODEC_OK;
}

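// Releases the Java encoder and drops the bookkeeping for in-flight frames.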
int32_t VideoEncoderWrapper::Release() {
  JNIEnv* jni = AttachCurrentThreadIfNeeded();
  ScopedLocalRefFrame local_ref_frame(jni);
  jobject ret = Java_VideoEncoder_release(jni, *encoder_);
  frame_extra_infos_.clear();
  initialized_ = false;
  encoder_queue_ = nullptr;
  return HandleReturnCode(jni, ret);
}

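// Converts the frame and the requested frame types to their Java counterparts
// and calls VideoEncoder.encode(). Capture timestamps are queued in
// frame_extra_infos_ so OnEncodedFrame() can match output frames to inputs.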
int32_t VideoEncoderWrapper::Encode(
    const VideoFrame& frame,
    const CodecSpecificInfo* /* codec_specific_info */,
    const std::vector<FrameType>* frame_types) {
  if (!initialized_) {
    // Most likely initializing the codec failed.
    return WEBRTC_VIDEO_CODEC_FALLBACK_SOFTWARE;
  }

  JNIEnv* jni = AttachCurrentThreadIfNeeded();
  ScopedLocalRefFrame local_ref_frame(jni);

  // Construct encode info.
  jobjectArray j_frame_types =
      jni->NewObjectArray(frame_types->size(), *frame_type_class_, nullptr);
  for (size_t i = 0; i < frame_types->size(); ++i) {
    jobject j_frame_type = Java_VideoEncoderWrapper_createFrameType(
        jni, static_cast<jint>((*frame_types)[i]));
    jni->SetObjectArrayElement(j_frame_types, i, j_frame_type);
  }
  jobject encode_info =
      Java_VideoEncoderWrapper_createEncodeInfo(jni, j_frame_types);

  FrameExtraInfo info;
  info.capture_time_ns = frame.timestamp_us() * rtc::kNumNanosecsPerMicrosec;
  info.timestamp_rtp = frame.timestamp();
  frame_extra_infos_.push_back(info);

  jobject ret = Java_VideoEncoder_encode(
      jni, *encoder_, video_frame_factory_.ToJavaFrame(jni, frame),
      encode_info);
  return HandleReturnCode(jni, ret);
}

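// Forwards the packet loss estimate and round-trip time to the Java encoder.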
int32_t VideoEncoderWrapper::SetChannelParameters(uint32_t packet_loss,
                                                  int64_t rtt) {
  JNIEnv* jni = AttachCurrentThreadIfNeeded();
  ScopedLocalRefFrame local_ref_frame(jni);
  jobject ret = Java_VideoEncoder_setChannelParameters(
      jni, *encoder_, (jshort)packet_loss, (jlong)rtt);
  return HandleReturnCode(jni, ret);
}

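// Converts the bitrate allocation to a Java int[spatial][temporal] array and
// forwards it together with the target framerate.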
int32_t VideoEncoderWrapper::SetRateAllocation(
    const BitrateAllocation& allocation,
    uint32_t framerate) {
  JNIEnv* jni = AttachCurrentThreadIfNeeded();
  ScopedLocalRefFrame local_ref_frame(jni);

  jobject j_bitrate_allocation = ToJavaBitrateAllocation(jni, allocation);
  jobject ret = Java_VideoEncoder_setRateAllocation(
      jni, *encoder_, j_bitrate_allocation, (jint)framerate);
  return HandleReturnCode(jni, ret);
}

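// Queries the Java encoder for its quality-scaling settings. The low/high QP
// thresholds are optional, but must either both be present or both be absent.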
VideoEncoderWrapper::ScalingSettings VideoEncoderWrapper::GetScalingSettings()
    const {
  JNIEnv* jni = AttachCurrentThreadIfNeeded();
  ScopedLocalRefFrame local_ref_frame(jni);
  jobject j_scaling_settings =
      Java_VideoEncoder_getScalingSettings(jni, *encoder_);
  bool on =
      Java_VideoEncoderWrapper_getScalingSettingsOn(jni, j_scaling_settings);
  jobject j_low =
      Java_VideoEncoderWrapper_getScalingSettingsLow(jni, j_scaling_settings);
  jobject j_high =
      Java_VideoEncoderWrapper_getScalingSettingsHigh(jni, j_scaling_settings);

  if (j_low != nullptr || j_high != nullptr) {
    RTC_DCHECK(j_low != nullptr);
    RTC_DCHECK(j_high != nullptr);
    int low = Java_VideoEncoderWrapper_getIntValue(jni, j_low);
    int high = Java_VideoEncoderWrapper_getIntValue(jni, j_high);
    return ScalingSettings(on, low, high);
  } else {
    return ScalingSettings(on);
  }
}

const char* VideoEncoderWrapper::ImplementationName() const {
  return implementation_name_.c_str();
}

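// Called by the Java encoder (via the JNI trampoline below) for every encoded
// frame. The payload is copied out of the direct ByteBuffer and the remaining
// work is posted to the task queue captured in InitEncode().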
void VideoEncoderWrapper::OnEncodedFrame(JNIEnv* jni,
                                         jobject j_buffer,
                                         jint encoded_width,
                                         jint encoded_height,
                                         jlong capture_time_ns,
                                         jint frame_type,
                                         jint rotation,
                                         jboolean complete_frame,
                                         jobject j_qp) {
  const uint8_t* buffer =
      static_cast<uint8_t*>(jni->GetDirectBufferAddress(j_buffer));
  const size_t buffer_size = jni->GetDirectBufferCapacity(j_buffer);

  std::vector<uint8_t> buffer_copy(buffer_size);
  memcpy(buffer_copy.data(), buffer, buffer_size);
  int qp = -1;
  if (j_qp != nullptr) {
    qp = Java_VideoEncoderWrapper_getIntValue(jni, j_qp);
  }

  encoder_queue_->PostTask(
      [
        this, task_buffer = std::move(buffer_copy), qp, encoded_width,
        encoded_height, capture_time_ns, frame_type, rotation, complete_frame
      ]() {
        FrameExtraInfo frame_extra_info;
        do {
          if (frame_extra_infos_.empty()) {
            LOG(LS_WARNING)
                << "Java encoder produced an unexpected frame with timestamp: "
                << capture_time_ns;
            return;
          }

          frame_extra_info = frame_extra_infos_.front();
          frame_extra_infos_.pop_front();
          // The encoder might drop frames so iterate through the queue until
          // we find a matching timestamp.
        } while (frame_extra_info.capture_time_ns != capture_time_ns);

        RTPFragmentationHeader header = ParseFragmentationHeader(task_buffer);
        EncodedImage frame(const_cast<uint8_t*>(task_buffer.data()),
                           task_buffer.size(), task_buffer.size());
        frame._encodedWidth = encoded_width;
        frame._encodedHeight = encoded_height;
        frame._timeStamp = frame_extra_info.timestamp_rtp;
        frame.capture_time_ms_ = capture_time_ns / rtc::kNumNanosecsPerMillisec;
        frame._frameType = (FrameType)frame_type;
        frame.rotation_ = (VideoRotation)rotation;
        frame._completeFrame = complete_frame;
        if (qp == -1) {
          frame.qp_ = ParseQp(task_buffer);
        } else {
          frame.qp_ = qp;
        }

        CodecSpecificInfo info(ParseCodecSpecificInfo(frame));
        callback_->OnEncodedImage(frame, &info, &header);
      });
}

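// Maps a Java VideoCodecStatus to a WebRTC error code. On failure the Java
// encoder is reset up to kMaxJavaEncoderResets times before a software
// fallback is requested.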
int32_t VideoEncoderWrapper::HandleReturnCode(JNIEnv* jni, jobject code) {
  int32_t value = Java_VideoCodecStatus_getNumber(jni, code);
  if (value < 0) {  // Any errors are represented by negative values.
    // Try resetting the codec.
    if (++num_resets_ <= kMaxJavaEncoderResets &&
        Release() == WEBRTC_VIDEO_CODEC_OK) {
      LOG(LS_WARNING) << "Reset Java encoder: " << num_resets_;
      return InitEncodeInternal(jni);
    }

    LOG(LS_WARNING) << "Falling back to software encoder.";
    return WEBRTC_VIDEO_CODEC_FALLBACK_SOFTWARE;
  } else {
    return value;
  }
}

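// For H.264 the buffer is split into NAL units so that each fragment covers
// one NALU; for other codecs the whole buffer is described as one fragment.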
RTPFragmentationHeader VideoEncoderWrapper::ParseFragmentationHeader(
    const std::vector<uint8_t>& buffer) {
  RTPFragmentationHeader header;
  if (codec_settings_.codecType == kVideoCodecH264) {
    h264_bitstream_parser_.ParseBitstream(buffer.data(), buffer.size());

    // For H.264 search for start codes.
    const std::vector<H264::NaluIndex> nalu_idxs =
        H264::FindNaluIndices(buffer.data(), buffer.size());
    if (nalu_idxs.empty()) {
      LOG(LS_ERROR) << "Start code is not found!";
      LOG(LS_ERROR) << "Data:" << buffer[0] << " " << buffer[1] << " "
                    << buffer[2] << " " << buffer[3] << " " << buffer[4] << " "
                    << buffer[5];
    }
    header.VerifyAndAllocateFragmentationHeader(nalu_idxs.size());
    for (size_t i = 0; i < nalu_idxs.size(); i++) {
      header.fragmentationOffset[i] = nalu_idxs[i].payload_start_offset;
      header.fragmentationLength[i] = nalu_idxs[i].payload_size;
      header.fragmentationPlType[i] = 0;
      header.fragmentationTimeDiff[i] = 0;
    }
  } else {
    // Generate a header describing a single fragment.
    header.VerifyAndAllocateFragmentationHeader(1);
    header.fragmentationOffset[0] = 0;
    header.fragmentationLength[0] = buffer.size();
    header.fragmentationPlType[0] = 0;
    header.fragmentationTimeDiff[0] = 0;
  }
  return header;
}

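// Parses the QP from the bitstream when the Java encoder did not report it.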
int VideoEncoderWrapper::ParseQp(const std::vector<uint8_t>& buffer) {
  int qp;
  bool success;
  switch (codec_settings_.codecType) {
    case kVideoCodecVP8:
      success = vp8::GetQp(buffer.data(), buffer.size(), &qp);
      break;
    case kVideoCodecVP9:
      success = vp9::GetQp(buffer.data(), buffer.size(), &qp);
      break;
    case kVideoCodecH264:
      success = h264_bitstream_parser_.GetLastSliceQp(&qp);
      break;
    default:  // Default is to not provide QP.
      success = false;
      break;
  }
  return success ? qp : -1;  // -1 means unknown QP.
}

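// Fills in the codec-specific metadata (VP8/VP9 picture ids and layer info)
// that is delivered alongside each encoded image.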
CodecSpecificInfo VideoEncoderWrapper::ParseCodecSpecificInfo(
    const EncodedImage& frame) {
  const bool key_frame = frame._frameType == kVideoFrameKey;

  CodecSpecificInfo info;
  memset(&info, 0, sizeof(info));
  info.codecType = codec_settings_.codecType;
  info.codec_name = implementation_name_.c_str();

  switch (codec_settings_.codecType) {
    case kVideoCodecVP8:
      info.codecSpecific.VP8.pictureId = picture_id_;
      info.codecSpecific.VP8.nonReference = false;
      info.codecSpecific.VP8.simulcastIdx = 0;
      info.codecSpecific.VP8.temporalIdx = kNoTemporalIdx;
      info.codecSpecific.VP8.layerSync = false;
      info.codecSpecific.VP8.tl0PicIdx = kNoTl0PicIdx;
      info.codecSpecific.VP8.keyIdx = kNoKeyIdx;
      break;
    case kVideoCodecVP9:
      if (key_frame) {
        gof_idx_ = 0;
      }
      info.codecSpecific.VP9.picture_id = picture_id_;
      info.codecSpecific.VP9.inter_pic_predicted = key_frame ? false : true;
      info.codecSpecific.VP9.flexible_mode = false;
      info.codecSpecific.VP9.ss_data_available = key_frame ? true : false;
      info.codecSpecific.VP9.tl0_pic_idx = tl0_pic_idx_++;
      info.codecSpecific.VP9.temporal_idx = kNoTemporalIdx;
      info.codecSpecific.VP9.spatial_idx = kNoSpatialIdx;
      info.codecSpecific.VP9.temporal_up_switch = true;
      info.codecSpecific.VP9.inter_layer_predicted = false;
      info.codecSpecific.VP9.gof_idx =
          static_cast<uint8_t>(gof_idx_++ % gof_.num_frames_in_gof);
      info.codecSpecific.VP9.num_spatial_layers = 1;
      info.codecSpecific.VP9.spatial_layer_resolution_present = false;
      if (info.codecSpecific.VP9.ss_data_available) {
        info.codecSpecific.VP9.spatial_layer_resolution_present = true;
        info.codecSpecific.VP9.width[0] = frame._encodedWidth;
        info.codecSpecific.VP9.height[0] = frame._encodedHeight;
        info.codecSpecific.VP9.gof.CopyGofInfoVP9(gof_);
      }
      break;
    default:
      break;
  }

  picture_id_ = (picture_id_ + 1) & 0x7FFF;

  return info;
}

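// Lays the allocation out as a Java int[kMaxSpatialLayers][kMaxTemporalStreams]
// array of per-layer bitrates.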
jobject VideoEncoderWrapper::ToJavaBitrateAllocation(
    JNIEnv* jni,
    const BitrateAllocation& allocation) {
  jobjectArray j_allocation_array = jni->NewObjectArray(
      kMaxSpatialLayers, *int_array_class_, nullptr /* initial */);
  for (int spatial_i = 0; spatial_i < kMaxSpatialLayers; ++spatial_i) {
    jintArray j_array_spatial_layer = jni->NewIntArray(kMaxTemporalStreams);
    jint* array_spatial_layer =
        jni->GetIntArrayElements(j_array_spatial_layer, nullptr /* isCopy */);
    for (int temporal_i = 0; temporal_i < kMaxTemporalStreams; ++temporal_i) {
      array_spatial_layer[temporal_i] =
          allocation.GetBitrate(spatial_i, temporal_i);
    }
    jni->ReleaseIntArrayElements(j_array_spatial_layer, array_spatial_layer,
                                 JNI_COMMIT);

    jni->SetObjectArrayElement(j_allocation_array, spatial_i,
                               j_array_spatial_layer);
  }
  return Java_VideoEncoderWrapper_createBitrateAllocation(jni,
                                                          j_allocation_array);
}

std::string VideoEncoderWrapper::GetImplementationName(JNIEnv* jni) const {
  jstring jname = Java_VideoEncoder_getImplementationName(jni, *encoder_);
  return JavaToStdString(jni, jname);
}

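// JNI entry point for the Java callback; trampolines to the wrapper instance
// identified by the native pointer.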
JNI_FUNCTION_DECLARATION(void,
                         VideoEncoderWrapper_onEncodedFrame,
                         JNIEnv* jni,
                         jclass,
                         jlong j_native_encoder,
                         jobject buffer,
                         jint encoded_width,
                         jint encoded_height,
                         jlong capture_time_ns,
                         jint frame_type,
                         jint rotation,
                         jboolean complete_frame,
                         jobject qp) {
  VideoEncoderWrapper* native_encoder =
      reinterpret_cast<VideoEncoderWrapper*>(j_native_encoder);
  native_encoder->OnEncodedFrame(jni, buffer, encoded_width, encoded_height,
                                 capture_time_ns, frame_type, rotation,
                                 complete_frame, qp);
}

}  // namespace jni
}  // namespace webrtc