open-webrtc-toolkit
diff --git a/‎webrtc/api/video_codecs/video_encoder.h
Lines changed: 6 additions & 1 deletion b/‎webrtc/api/video_codecs/video_encoder.h
Lines changed: 6 additions & 1 deletion
diff --git a/‎webrtc/common_types.cc
Lines changed: 23 additions & 0 deletions b/‎webrtc/common_types.cc
Lines changed: 23 additions & 0 deletions
diff --git a/‎webrtc/common_types.h
Lines changed: 20 additions & 1 deletion b/‎webrtc/common_types.h
Lines changed: 20 additions & 1 deletion
diff --git a/‎webrtc/common_video/video_frame.cc
Lines changed: 4 additions & 0 deletions b/‎webrtc/common_video/video_frame.cc
Lines changed: 4 additions & 0 deletions
diff --git a/‎webrtc/media/base/mediaconstants.cc
Lines changed: 11 additions & 1 deletion b/‎webrtc/media/base/mediaconstants.cc
Lines changed: 11 additions & 1 deletion
diff --git a/‎webrtc/modules/include/module_common_types.h
Lines changed: 21 additions & 1 deletion b/‎webrtc/modules/include/module_common_types.h
Lines changed: 21 additions & 1 deletion
diff --git a/‎webrtc/modules/rtp_rtcp/BUILD.gn
Lines changed: 4 additions & 0 deletions b/‎webrtc/modules/rtp_rtcp/BUILD.gn
Lines changed: 4 additions & 0 deletions
diff --git a/‎webrtc/modules/rtp_rtcp/source/h265_sps_parser.cc
Lines changed: 189 additions & 0 deletions b/‎webrtc/modules/rtp_rtcp/source/h265_sps_parser.cc
Lines changed: 189 additions & 0 deletions
@@ -67,6 +67,9 @@ class EncodedImageCallback {
 class VideoEncoder {
  public:
   enum EncoderType {
+#ifndef DISABLE_H265
+    kH265,
+#endif
     kH264,
     kVp8,
     kVp9,
@@ -95,7 +98,9 @@ class VideoEncoder {
   static VideoCodecVP8 GetDefaultVp8Settings();
   static VideoCodecVP9 GetDefaultVp9Settings();
   static VideoCodecH264 GetDefaultH264Settings();
-
+#ifndef DISABLE_H265
+  static VideoCodecH265 GetDefaultH265Settings();
+#endif
   virtual ~VideoEncoder() {}
 
   // Initialize the encoder with the information from the codecSettings
 
@@ -95,9 +95,24 @@ const VideoCodecH264& VideoCodec::H264() const {
   return codec_specific_.H264;
 }
 
+#ifndef DISABLE_H265
+VideoCodecH265* VideoCodec::H265() {  // Mutable H.265-specific settings.
+  RTC_DCHECK_EQ(codecType, kVideoCodecH265);  // Only valid for H.265 codecs.
+  return &codec_specific_.H265;
+}
+
+const VideoCodecH265& VideoCodec::H265() const {  // Read-only H.265 settings.
+  RTC_DCHECK_EQ(codecType, kVideoCodecH265);  // Only valid for H.265 codecs.
+  return codec_specific_.H265;
+}
+#endif
+
 static const char* kPayloadNameVp8 = "VP8";
 static const char* kPayloadNameVp9 = "VP9";
 static const char* kPayloadNameH264 = "H264";
+#ifndef DISABLE_H265
+static const char* kPayloadNameH265 = "H265";
+#endif
 static const char* kPayloadNameI420 = "I420";
 static const char* kPayloadNameRED = "RED";
 static const char* kPayloadNameULPFEC = "ULPFEC";
@@ -115,6 +130,10 @@ rtc::Optional<const char*> CodecTypeToPayloadName(VideoCodecType type) {
       return rtc::Optional<const char*>(kPayloadNameVp9);
     case kVideoCodecH264:
       return rtc::Optional<const char*>(kPayloadNameH264);
+#ifndef DISABLE_H265
+    case kVideoCodecH265:
+      return rtc::Optional<const char*>(kPayloadNameH265);
+#endif
     case kVideoCodecI420:
       return rtc::Optional<const char*>(kPayloadNameI420);
     case kVideoCodecRED:
@@ -135,6 +154,10 @@ rtc::Optional<VideoCodecType> PayloadNameToCodecType(const std::string& name) {
     return rtc::Optional<VideoCodecType>(kVideoCodecVP9);
   if (CodecNamesEq(name.c_str(), kPayloadNameH264))
     return rtc::Optional<VideoCodecType>(kVideoCodecH264);
+#ifndef DISABLE_H265
+  if (CodecNamesEq(name.c_str(), kPayloadNameH265))
+    return rtc::Optional<VideoCodecType>(kVideoCodecH265);
+#endif
   if (CodecNamesEq(name.c_str(), kPayloadNameI420))
     return rtc::Optional<VideoCodecType>(kVideoCodecI420);
   if (CodecNamesEq(name.c_str(), kPayloadNameRED))
 
@@ -511,12 +511,25 @@ struct VideoCodecH264 {
   size_t ppsLen;
   H264::Profile profile;
 };
+#ifndef DISABLE_H265
+struct VideoCodecH265 {  // H.265-specific member of VideoCodecUnion.
+    bool           frameDroppingOn;
+    int            keyFrameInterval;
+    const uint8_t* spsData;  // NOTE(review): presumably not owned - confirm.
+    size_t         spsLen;   // presumably the size of spsData in bytes - confirm.
+    const uint8_t* ppsData;  // NOTE(review): presumably not owned - confirm.
+    size_t         ppsLen;   // presumably the size of ppsData in bytes - confirm.
+};
+#endif
 
 // Video codec types
 enum VideoCodecType {
   kVideoCodecVP8,
   kVideoCodecVP9,
   kVideoCodecH264,
+#ifndef DISABLE_H265
+  kVideoCodecH265,
+#endif
   kVideoCodecI420,
   kVideoCodecRED,
   kVideoCodecULPFEC,
@@ -533,6 +546,9 @@ union VideoCodecUnion {
   VideoCodecVP8 VP8;
   VideoCodecVP9 VP9;
   VideoCodecH264 H264;
+#ifndef DISABLE_H265
+  VideoCodecH265 H265;
+#endif
 };
 
 // Simulcast is when the same stream is encoded multiple times with different
@@ -597,7 +613,10 @@ class VideoCodec {
   const VideoCodecVP9& VP9() const;
   VideoCodecH264* H264();
   const VideoCodecH264& H264() const;
-
+#ifndef DISABLE_H265
+  VideoCodecH265* H265();
+  const VideoCodecH265& H265() const;
+#endif
  private:
   // TODO(hta): Consider replacing the union with a pointer type.
   // This will allow removing the VideoCodec* types from this file.
 
@@ -30,6 +30,10 @@ size_t EncodedImage::GetBufferPaddingBytes(VideoCodecType codec_type) {
       return 0;
     case kVideoCodecH264:
       return kBufferPaddingBytesH264;
+#ifndef DISABLE_H265
+    case kVideoCodecH265:
+      return 0;
+#endif
     case kVideoCodecI420:
     case kVideoCodecRED:
     case kVideoCodecULPFEC:
 
@@ -101,13 +101,23 @@ const char kComfortNoiseCodecName[] = "CN";
 const char kVp8CodecName[] = "VP8";
 const char kVp9CodecName[] = "VP9";
 const char kH264CodecName[] = "H264";
-
+#ifndef DISABLE_H265
+const char kH265CodecName[] = "H265";
+#endif
 // RFC 6184 RTP Payload Format for H.264 video
 const char kH264FmtpProfileLevelId[] = "profile-level-id";
 const char kH264FmtpLevelAsymmetryAllowed[] = "level-asymmetry-allowed";
 const char kH264FmtpPacketizationMode[] = "packetization-mode";
 const char kH264FmtpSpropParameterSets[] = "sprop-parameter-sets";
 const char kH264ProfileLevelConstrainedBaseline[] = "42e01f";
 
+#ifndef DISABLE_H265
+// RFC 7798 RTP Payload Format for H.265 video
+const char kH265FmtpProfileSpace[] = "profile-space";
+const char kH265FmtpProfileId[] = "profile-id";
+const char kH265FmtpTierFlag[] = "tier-flag";
+const char kH265FmtpLevelId[] = "level-id";
+#endif
+
 const int kDefaultVideoMaxFramerate = 60;
 }  // namespace cricket
@@ -29,6 +29,20 @@
 
 namespace webrtc {
 
+#ifndef DISABLE_H265
+// H265 packetization types we support: single, aggregated, and fragmented.
+enum H265PacketizationTypes {
+    kH265SingleNalu,  // Single NAL unit.
+    kH265AP,          // Aggregated ("AP").
+    kH265FU,          // Fragmented ("FU").
+};
+
+struct RTPVideoHeaderH265 {  // H.265 member of the RTPVideoTypeHeader union.
+    uint8_t nalu_type;  // presumably the HEVC nal_unit_type - TODO confirm.
+    H265PacketizationTypes packetization_type;  // One of the types above.
+};
+#endif
+
 struct RTPAudioHeader {
   uint8_t numEnergy;                  // number of valid entries in arrOfEnergy
   uint8_t arrOfEnergy[kRtpCsrcSize];  // one energy byte (0-9) per channel
@@ -40,14 +54,20 @@ union RTPVideoTypeHeader {
   RTPVideoHeaderVP8 VP8;
   RTPVideoHeaderVP9 VP9;
   RTPVideoHeaderH264 H264;
+#ifndef DISABLE_H265
+  RTPVideoHeaderH265 H265;
+#endif
 };
 
 enum RtpVideoCodecTypes {
   kRtpVideoNone,
   kRtpVideoGeneric,
   kRtpVideoVp8,
   kRtpVideoVp9,
-  kRtpVideoH264
+  kRtpVideoH264,
+#ifndef DISABLE_H265
+  kRtpVideoH265
+#endif
 };
 // Since RTPVideoHeader is used as a member of a union, it can't have a
 // non-trivial default constructor.
 
@@ -102,6 +102,10 @@ rtc_static_library("rtp_rtcp") {
     "source/rtp_format.h",
     "source/rtp_format_h264.cc",
     "source/rtp_format_h264.h",
+    "source/h265_sps_parser.cc",
+    "source/h265_sps_parser.h",
+    "source/rtp_format_h265.cc",
+    "source/rtp_format_h265.h",
     "source/rtp_format_video_generic.cc",
     "source/rtp_format_video_generic.h",
     "source/rtp_format_vp8.cc",
 
@@ -0,0 +1,189 @@
+/*
+ * Intel License
+ */
+
+#include "webrtc/modules/rtp_rtcp/source/h265_sps_parser.h"
+
+#include "webrtc/base/bitbuffer.h"
+#include "webrtc/base/bytebuffer.h"
+#include "webrtc/base/logging.h"
+
+#include <vector>
+
+#define RETURN_FALSE_ON_FAIL(x) \
+  do {                          \
+    if (!(x)) return false;     \
+  } while (0)  // do/while(0): expands to one statement, safe in if/else.
+
+namespace webrtc {
+
+// Stores the |sps| pointer without copying; sizes are 0 until Parse() succeeds.
+H265SpsParser::H265SpsParser(const uint8_t* sps, size_t byte_length)
+    : sps_(sps), byte_length_(byte_length), width_(0), height_(0) {}
+
+// Extracts the picture resolution from the SPS handed to the constructor and
+// stores it in width_/height_. The first field read is
+// sps_video_parameter_set_id, so the buffer must start at the SPS payload,
+// not at the NAL unit header.
+//
+// Returns false, leaving width_/height_ untouched, if the buffer is missing
+// or truncated, or describes an invalid picture: chroma_format_idc above 3,
+// a conformance window that leaves no samples, or a size that overflows int.
+bool H265SpsParser::Parse() {
+  // General note: this is based off the 04/2015 version of the H.265 standard.
+  // You can find it on this page:
+  // http://www.itu.int/rec/T-REC-H.265
+  RETURN_FALSE_ON_FAIL(sps_ && byte_length_ > 0);
+
+  const char* sps_bytes = reinterpret_cast<const char*>(sps_);
+  // First, parse out rbsp, which is basically the source buffer minus emulation
+  // bytes (the last byte of a 0x00 0x00 0x03 sequence). RBSP is defined in
+  // section 7.3.1.1 of the H.265 standard, similar to H264.
+  rtc::ByteBufferWriter rbsp_buffer;
+  for (size_t i = 0; i < byte_length_;) {
+    // Be careful about over/underflow here. byte_length_ - 3 can underflow, and
+    // i + 3 can overflow, but byte_length_ - i can't, because i < byte_length_
+    // above, and that expression will produce the number of bytes left in
+    // the stream including the byte at i.
+    if (byte_length_ - i >= 3 && sps_[i] == 0 && sps_[i + 1] == 0 &&
+        sps_[i + 2] == 3) {
+      // Two rbsp bytes + the emulation byte.
+      rbsp_buffer.WriteBytes(sps_bytes + i, 2);
+      i += 3;
+    } else {
+      // Single rbsp byte.
+      rbsp_buffer.WriteBytes(sps_bytes + i, 1);
+      i++;
+    }
+  }
+
+  // Now, we need to use a bit buffer to parse through the actual HEVC SPS
+  // format. See Section 7.3.2.2.1 ("General sequence parameter set RBSP
+  // syntax") of the H.265 standard for a complete description.
+  // Since we only care about resolution, we ignore the majority of fields, but
+  // we still have to actively parse through a lot of the data, since many of
+  // the fields have variable size.
+  // Unlike H264, the picture size is given directly by
+  // pic_width_in_luma_samples and pic_height_in_luma_samples; when
+  // conformance_window_flag is 1 it is reduced by the conf_win_*_offset values.
+  rtc::BitBuffer parser(reinterpret_cast<const uint8_t*>(rbsp_buffer.Data()),
+                        rbsp_buffer.Length());
+
+  // sps_video_parameter_set_id: u(4)
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBits(4));
+  // sps_max_sub_layers_minus1: u(3)
+  uint32_t sps_max_sub_layers_minus1 = 0;
+  RETURN_FALSE_ON_FAIL(parser.ReadBits(&sps_max_sub_layers_minus1, 3));
+  // sps_temporal_id_nesting_flag: u(1)
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBits(1));
+
+  // profile_tier_level(1, sps_max_sub_layers_minus1). We are actually not
+  // using any of it, so just skip over it.
+  // general_profile_space + general_tier_flag + general_profile_idc: u(8)
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBytes(1));
+  // general_profile_compatibility_flag[32]: u(32)
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBytes(4));
+  // u(4): general_progressive_source_flag, general_interlaced_source_flag,
+  // general_non_packed_constraint_flag, general_frame_only_constraint_flag
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBits(4));
+  // Flags that depend on general_profile_idc, or reserved bits: u(43)
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBits(43));
+  // general_inbld_flag or reserved bit: u(1)
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBits(1));
+  // general_level_idc: u(8)
+  RETURN_FALSE_ON_FAIL(parser.ConsumeBytes(1));
+
+  // Presence flags for each sub-layer. sps_max_sub_layers_minus1 was read
+  // from 3 bits, so it is at most 7 and these arrays cannot be overrun.
+  uint32_t sub_layer_profile_present[8] = {0};
+  uint32_t sub_layer_level_present[8] = {0};
+  for (uint32_t i = 0; i < sps_max_sub_layers_minus1; i++) {
+    // sub_layer_profile_present_flag[i]: u(1)
+    RETURN_FALSE_ON_FAIL(parser.ReadBits(&sub_layer_profile_present[i], 1));
+    // sub_layer_level_present_flag[i]: u(1)
+    RETURN_FALSE_ON_FAIL(parser.ReadBits(&sub_layer_level_present[i], 1));
+  }
+  if (sps_max_sub_layers_minus1 > 0) {
+    for (uint32_t j = sps_max_sub_layers_minus1; j < 8; j++) {
+      // reserved_zero_2bits[j]: u(2)
+      RETURN_FALSE_ON_FAIL(parser.ConsumeBits(2));
+    }
+  }
+  for (uint32_t k = 0; k < sps_max_sub_layers_minus1; k++) {
+    if (sub_layer_profile_present[k]) {
+      // sub_layer_profile_space + tier_flag + profile_idc: u(8)
+      RETURN_FALSE_ON_FAIL(parser.ConsumeBytes(1));
+      // sub_layer_profile_compatibility_flag[32]: u(32)
+      RETURN_FALSE_ON_FAIL(parser.ConsumeBytes(4));
+      // sub_layer source and constraint flags, as for the general ones: u(4)
+      RETURN_FALSE_ON_FAIL(parser.ConsumeBits(4));
+      // Flags that depend on sub_layer_profile_idc, or reserved bits: u(43)
+      RETURN_FALSE_ON_FAIL(parser.ConsumeBits(43));
+      // sub_layer_inbld_flag or reserved bit: u(1)
+      RETURN_FALSE_ON_FAIL(parser.ConsumeBits(1));
+    }
+    if (sub_layer_level_present[k]) {
+      // sub_layer_level_idc: u(8)
+      RETURN_FALSE_ON_FAIL(parser.ConsumeBytes(1));
+    }
+  }
+
+  // sps_seq_parameter_set_id: ue(v). Has to be decoded to get past it.
+  uint32_t golomb_ignored = 0;
+  RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&golomb_ignored));
+  // chroma_format_idc: ue(v). Only the values 0..3 are defined.
+  uint32_t chroma_format_idc = 1;
+  RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&chroma_format_idc));
+  RETURN_FALSE_ON_FAIL(chroma_format_idc <= 3);
+  if (chroma_format_idc == 3) {
+    // separate_colour_plane_flag: u(1). It only exists for 4:4:4, where the
+    // crop units below are 1 either way, so the value itself is not needed.
+    RETURN_FALSE_ON_FAIL(parser.ConsumeBits(1));
+  }
+  // pic_width_in_luma_samples: ue(v)
+  uint32_t pic_width = 0;
+  RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&pic_width));
+  // pic_height_in_luma_samples: ue(v)
+  uint32_t pic_height = 0;
+  RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&pic_height));
+  // conformance_window_flag: u(1)
+  uint32_t conformance_window_flag = 0;
+  RETURN_FALSE_ON_FAIL(parser.ReadBits(&conformance_window_flag, 1));
+
+  // The offsets stay 0 (no cropping) when there is no conformance window.
+  uint32_t conf_win_left_offset = 0;
+  uint32_t conf_win_right_offset = 0;
+  uint32_t conf_win_top_offset = 0;
+  uint32_t conf_win_bottom_offset = 0;
+  if (conformance_window_flag) {
+    // conf_win_left_offset, conf_win_right_offset, conf_win_top_offset and
+    // conf_win_bottom_offset, in that order: ue(v) each.
+    RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&conf_win_left_offset));
+    RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&conf_win_right_offset));
+    RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&conf_win_top_offset));
+    RETURN_FALSE_ON_FAIL(parser.ReadExponentialGolomb(&conf_win_bottom_offset));
+  }
+
+  // That is enough to get the resolution (semantics: section 7.4.3.2.1). The
+  // offsets are in units of SubWidthC x SubHeightC luma samples: 2x2 for
+  // 4:2:0, 2x1 for 4:2:2, 1x1 otherwise. Every value here comes from the
+  // bitstream, so compute in 64 bits (the 32-bit sum or product could wrap)
+  // and reject a crop that does not leave at least one sample per dimension.
+  const uint64_t sub_width_c =
+      (chroma_format_idc == 1 || chroma_format_idc == 2) ? 2 : 1;
+  const uint64_t sub_height_c = (chroma_format_idc == 1) ? 2 : 1;
+  const uint64_t crop_width =
+      sub_width_c * (uint64_t{conf_win_left_offset} + conf_win_right_offset);
+  const uint64_t crop_height =
+      sub_height_c * (uint64_t{conf_win_top_offset} + conf_win_bottom_offset);
+  RETURN_FALSE_ON_FAIL(crop_width < pic_width);
+  RETURN_FALSE_ON_FAIL(crop_height < pic_height);
+  const uint64_t width = pic_width - crop_width;
+  const uint64_t height = pic_height - crop_height;
+  RETURN_FALSE_ON_FAIL(width <= 0x7fffffffu && height <= 0x7fffffffu);
+  width_ = static_cast<int>(width);
+  height_ = static_cast<int>(height);
+  return true;
+}
+
+}  // namespace webrtc