H264.h 12.7 KB
Newer Older
xiongziliang committed
1
/*
 * MIT License
 *
 * Copyright (c) 2016-2019 xiongziliang <771730766@qq.com>
 *
 * This file is part of ZLMediaKit(https://github.com/xiongziliang/ZLMediaKit).
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */
xiongziliang committed
26

27 28
#ifndef ZLMEDIAKIT_H264_H
#define ZLMEDIAKIT_H264_H
xiongziliang committed
29 30

#include "Frame.h"
31
#include "Track.h"
xiongziliang committed
32 33
#include "Util/base64.h"
using namespace toolkit;
xiongziliang committed
34 35
// Extracts the low 5 bits of a byte. Used throughout this header on the first
// byte after the start-code prefix and compared against H264Frame::NalType values.
#define H264_TYPE(v) ((uint8_t)(v) & 0x1F)

xiongziliang committed
36
namespace mediakit{
xiongziliang committed
37

38
/**
 * Parses an SPS and reports the video geometry through the output parameters.
 * Declared here, defined elsewhere. H264Track::onReady() calls it with the SPS
 * stored without its start-code prefix.
 * @param strSps SPS bytes
 * @param iVideoWidth receives the video width
 * @param iVideoHeight receives the video height
 * @param iVideoFps receives the frame rate
 * @return presumably true when parsing succeeded -- NOTE(review): confirm against the definition
 */
bool getAVCInfo(const string &strSps,int &iVideoWidth, int &iVideoHeight, float  &iVideoFps);
39
/**
 * Splits a buffer that may contain several H.264 NAL units and invokes cb once
 * per piece. Declared here, defined elsewhere.
 * @param ptr start of the buffer
 * @param len buffer length in bytes
 * @param cb callback receiving the pointer and length of each piece
 * NOTE(review): whether each piece includes its start code is not visible from
 * this header; H264Track::inputFrame treats later pieces as carrying a 3-byte prefix.
 */
void splitH264(const char *ptr, int len, const std::function<void(const char *, int)> &cb);
xiongziliang committed
40

xiongziliang committed
41
/**
42
 * 264帧类
xiongziliang committed
43
 */
44
class H264Frame : public Frame {
xiongziliang committed
45
public:
46
    typedef std::shared_ptr<H264Frame> Ptr;
xiongziliang committed
47

xiongziliang committed
48 49 50 51 52 53
    typedef enum {
        NAL_SPS = 7,
        NAL_PPS = 8,
        NAL_IDR = 5,
    } NalType;

54 55 56 57 58 59
    char *data() const override{
        return (char *)buffer.data();
    }
    uint32_t size() const override {
        return buffer.size();
    }
xiongziliang committed
60
    uint32_t dts() const override {
61 62
        return timeStamp;
    }
xiongziliang committed
63 64 65 66 67

    uint32_t pts() const override {
        return ptsStamp ? ptsStamp : timeStamp;
    }

68 69 70
    uint32_t prefixSize() const override{
        return iPrefixSize;
    }
71

72 73 74
    TrackType getTrackType() const override{
        return TrackVideo;
    }
75

76 77 78
    CodecId getCodecId() const override{
        return CodecH264;
    }
79

80
    bool keyFrame() const override {
81
        return H264_TYPE(buffer[iPrefixSize]) == H264Frame::NAL_IDR;
82
    }
xiongziliang committed
83 84 85 86 87 88 89 90 91 92

    bool configFrame() const override{
        switch(H264_TYPE(buffer[iPrefixSize]) ){
            case H264Frame::NAL_SPS:
            case H264Frame::NAL_PPS:
                return true;
            default:
                return false;
        }
    }
93 94
public:
    uint32_t timeStamp;
xiongziliang committed
95
    uint32_t ptsStamp = 0;
96 97
    string buffer;
    uint32_t iPrefixSize = 4;
xiongziliang committed
98 99
};

100

101 102 103 104 105
/**
 * 防止内存拷贝的H264类
 * 用户可以通过该类型快速把一个指针无拷贝的包装成Frame类
 * 该类型在DevChannel中有使用
 */
106
class H264FrameNoCacheAble : public FrameNoCacheAble {
xiongziliang committed
107
public:
108
    typedef std::shared_ptr<H264FrameNoCacheAble> Ptr;
xiongziliang committed
109

110
    H264FrameNoCacheAble(char *ptr,uint32_t size,uint32_t dts , uint32_t pts ,int prefixeSize = 4){
xiongziliang committed
111 112 113 114 115
        _ptr = ptr;
        _size = size;
        _dts = dts;
        _pts = pts;
        _prefixSize = prefixeSize;
116
    }
117

118 119 120
    TrackType getTrackType() const override{
        return TrackVideo;
    }
121

122 123 124
    CodecId getCodecId() const override{
        return CodecH264;
    }
125

126
    bool keyFrame() const override {
xiongziliang committed
127
        return H264_TYPE(_ptr[_prefixSize]) == H264Frame::NAL_IDR;
128
    }
xiongziliang committed
129 130 131 132 133 134 135 136 137 138

    bool configFrame() const override{
        switch(H264_TYPE(_ptr[_prefixSize])){
            case H264Frame::NAL_SPS:
            case H264Frame::NAL_PPS:
                return true;
            default:
                return false;
        }
    }
xiongziliang committed
139 140
};

141 142 143 144 145 146
/**
 * 一个H264Frame类中可以有多个帧,他们通过 0x 00 00 01 分隔
 * ZLMediaKit会先把这种复合帧split成单个帧然后再处理
 * 一个复合帧可以通过无内存拷贝的方式切割成多个H264FrameSubFrame
 * 提供该类的目的是切换复合帧时防止内存拷贝,提高性能
 */
147 148
template<typename Parent>
class FrameInternal : public Parent{
149
public:
150 151 152 153 154
    typedef std::shared_ptr<FrameInternal> Ptr;
    FrameInternal(const Frame::Ptr &parent_frame,
                  char *ptr,
                  uint32_t size,
                  int prefixeSize) : Parent(ptr,size,parent_frame->dts(),parent_frame->pts(),prefixeSize){
155 156 157 158
        _parent_frame = parent_frame;
    }
    bool cacheAble() const override {
        return _parent_frame->cacheAble();
159 160
    }
private:
161
    Frame::Ptr _parent_frame;
162
};
163

164 165
// Zero-copy H.264 sub-frame; H264Track::inputFrame creates these when it splits a composite frame.
typedef FrameInternal<H264FrameNoCacheAble> H264FrameInternal;

xiongziliang committed
166 167 168
/**
 * 264视频通道
 */
xiongziliang committed
169
class H264Track : public VideoTrack{
xiongziliang committed
170
public:
xiongziliang committed
171
    typedef std::shared_ptr<H264Track> Ptr;
172 173

    /**
xiongziliang committed
174 175 176 177 178
     * 不指定sps pps构造h264类型的媒体
     * 在随后的inputFrame中获取sps pps
     */
    H264Track(){}
    /**
179 180 181 182 183 184 185 186 187
     * 构造h264类型的媒体
     * @param sps sps帧数据
     * @param pps pps帧数据
     * @param sps_prefix_len 264头长度,可以为3个或4个字节,一般为0x00 00 00 01
     * @param pps_prefix_len 264头长度,可以为3个或4个字节,一般为0x00 00 00 01
     */
    H264Track(const string &sps,const string &pps,int sps_prefix_len = 4,int pps_prefix_len = 4){
        _sps = sps.substr(sps_prefix_len);
        _pps = pps.substr(pps_prefix_len);
xiongziliang committed
188
        onReady();
189 190 191 192 193 194 195 196 197 198 199 200 201
    }

    /**
     * 构造h264类型的媒体
     * @param sps sps帧
     * @param pps pps帧
     */
    H264Track(const Frame::Ptr &sps,const Frame::Ptr &pps){
        if(sps->getCodecId() != CodecH264 || pps->getCodecId() != CodecH264 ){
            throw std::invalid_argument("必须输入H264类型的帧");
        }
        _sps = string(sps->data() + sps->prefixSize(),sps->size() - sps->prefixSize());
        _pps = string(pps->data() + pps->prefixSize(),pps->size() - pps->prefixSize());
xiongziliang committed
202
        onReady();
xiongziliang committed
203
    }
204 205 206 207 208

    /**
     * 返回不带0x00 00 00 01头的sps
     * @return
     */
xiongziliang committed
209 210 211
    const string &getSps() const{
        return _sps;
    }
212 213 214 215 216

    /**
     * 返回不带0x00 00 00 01头的pps
     * @return
     */
xiongziliang committed
217 218 219
    const string &getPps() const{
        return _pps;
    }
220 221

    CodecId getCodecId() const override {
222
        return CodecH264;
xiongziliang committed
223
    }
224 225 226 227 228 229

    /**
     * 返回视频高度
     * @return
     */
    int getVideoHeight() const override{
230
        return _height ;
231 232 233 234 235 236 237
    }

    /**
     * 返回视频宽度
     * @return
     */
    int getVideoWidth() const override{
238
        return _width;
239 240 241 242 243 244 245 246 247
    }

    /**
     * 返回视频fps
     * @return
     */
    float getVideoFps() const override{
        return _fps;
    }
xiongziliang committed
248

249 250
    bool ready() override {
        return !_sps.empty() && !_pps.empty();
xiongziliang committed
251 252
    }

253 254 255 256 257 258 259 260 261 262 263 264
    /**
    * 输入数据帧,并获取sps pps
    * @param frame 数据帧
    */
    void inputFrame(const Frame::Ptr &frame) override{
        int type = H264_TYPE(*((uint8_t *)frame->data() + frame->prefixSize()));
        if(type == H264Frame::NAL_SPS){
            //有些设备会把SPS PPS IDR帧当做一个帧打包,所以我们要split一下
            bool  first_frame = true;
            splitH264(frame->data() + frame->prefixSize(),
                      frame->size() - frame->prefixSize(),
                      [&](const char *ptr, int len){
265 266 267 268 269 270 271 272 273 274 275 276 277 278 279
                          if(first_frame){
                              H264FrameInternal::Ptr sub_frame = std::make_shared<H264FrameInternal>(frame,
                                                                                                     frame->data(),
                                                                                                     len + frame->prefixSize(),
                                                                                                     frame->prefixSize());
                              inputFrame_l(sub_frame);
                              first_frame = false;
                          }else{
                              H264FrameInternal::Ptr sub_frame = std::make_shared<H264FrameInternal>(frame,
                                                                                                     (char *)ptr,
                                                                                                     len ,
                                                                                                     3);
                              inputFrame_l(sub_frame);
                          }
                      });
280 281 282 283 284 285 286 287 288 289 290 291 292 293
        } else{
            inputFrame_l(frame);
        }
    }
private:
    /**
     * 解析sps获取宽高fps
     */
    void onReady(){
        getAVCInfo(_sps,_width,_height,_fps);
    }
    Track::Ptr clone() override {
        return std::make_shared<std::remove_reference<decltype(*this)>::type >(*this);
    }
xiongziliang committed
294 295 296 297 298

    /**
     * 输入数据帧,并获取sps pps
     * @param frame 数据帧
     */
299
    void inputFrame_l(const Frame::Ptr &frame){
xiongziliang committed
300
        int type = H264_TYPE(*((uint8_t *)frame->data() + frame->prefixSize()));
xiongziliang committed
301
        switch (type){
xiongziliang committed
302
            case H264Frame::NAL_SPS:{
xiongziliang committed
303 304 305 306
                //sps
                _sps = string(frame->data() + frame->prefixSize(),frame->size() - frame->prefixSize());
            }
                break;
xiongziliang committed
307
            case H264Frame::NAL_PPS:{
xiongziliang committed
308 309 310 311 312
                //pps
                _pps = string(frame->data() + frame->prefixSize(),frame->size() - frame->prefixSize());
            }
                break;

xiongziliang committed
313
            case H264Frame::NAL_IDR:{
xiongziliang committed
314
                //I
xiongziliang committed
315
                insertConfigFrame(frame);
316
                VideoTrack::inputFrame(frame);
xiongziliang committed
317 318 319
            }
                break;

320
            default:
321
                VideoTrack::inputFrame(frame);
xiongziliang committed
322 323
                break;
        }
xiongziliang committed
324

325
        _last_frame_is_idr = type == H264Frame::NAL_IDR;
xiongziliang committed
326 327 328
        if(_width == 0 && ready()){
            onReady();
        }
xiongziliang committed
329
    }
xiongziliang committed
330

xiongziliang committed
331 332
    //生成sdp
    Sdp::Ptr getSdp() override ;
xiongziliang committed
333 334 335 336 337 338 339 340
private:
    //在idr帧前插入sps pps帧
    void insertConfigFrame(const Frame::Ptr &frame){
        if(_last_frame_is_idr){
            return;
        }

        if(!_sps.empty()){
xiongziliang committed
341 342 343 344 345 346
            auto spsFrame = std::make_shared<H264Frame>();
            spsFrame->iPrefixSize = 4;
            spsFrame->buffer.assign("\x0\x0\x0\x1",4);
            spsFrame->buffer.append(_sps);
            spsFrame->timeStamp = frame->stamp();
            VideoTrack::inputFrame(spsFrame);
xiongziliang committed
347 348 349
        }

        if(!_pps.empty()){
xiongziliang committed
350 351 352 353 354 355
            auto ppsFrame = std::make_shared<H264Frame>();
            ppsFrame->iPrefixSize = 4;
            ppsFrame->buffer.assign("\x0\x0\x0\x1",4);
            ppsFrame->buffer.append(_pps);
            ppsFrame->timeStamp = frame->stamp();
            VideoTrack::inputFrame(ppsFrame);
xiongziliang committed
356 357
        }
    }
358
private:
xiongziliang committed
359 360
    string _sps;
    string _pps;
361 362 363
    int _width = 0;
    int _height = 0;
    float _fps = 0;
xiongziliang committed
364
    bool _last_frame_is_idr = false;
xiongziliang committed
365 366 367
};


368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388
/**
* h264类型sdp
*/
class H264Sdp : public Sdp {
public:

    /**
     *
     * @param sps 264 sps,不带0x00000001头
     * @param pps 264 pps,不带0x00000001头
     * @param playload_type  rtp playload type 默认96
     * @param bitrate 比特率
     */
    H264Sdp(const string &strSPS,
            const string &strPPS,
            int playload_type = 96,
            int bitrate = 4000) : Sdp(90000,playload_type) {
        //视频通道
        _printer << "m=video 0 RTP/AVP " << playload_type << "\r\n";
        _printer << "b=AS:" << bitrate << "\r\n";
        _printer << "a=rtpmap:" << playload_type << " H264/" << 90000 << "\r\n";
xiongziliang committed
389
        _printer << "a=fmtp:" << playload_type << " packetization-mode=1; profile-level-id=";
390 391 392 393 394 395 396 397 398 399 400

        char strTemp[100];
        uint32_t profile_level_id = 0;
        if (strSPS.length() >= 4) { // sanity check
            profile_level_id = (uint8_t(strSPS[1]) << 16) |
                               (uint8_t(strSPS[2]) << 8)  |
                               (uint8_t(strSPS[3])); // profile_idc|constraint_setN_flag|level_idc
        }
        memset(strTemp, 0, 100);
        sprintf(strTemp, "%06X", profile_level_id);
        _printer << strTemp;
xiongziliang committed
401
        _printer << "; sprop-parameter-sets=";
402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426
        memset(strTemp, 0, 100);
        av_base64_encode(strTemp, 100, (uint8_t *) strSPS.data(), strSPS.size());
        _printer << strTemp << ",";
        memset(strTemp, 0, 100);
        av_base64_encode(strTemp, 100, (uint8_t *) strPPS.data(), strPPS.size());
        _printer << strTemp << "\r\n";
        _printer << "a=control:trackID=" << getTrackType() << "\r\n";
    }

    string getSdp() const override {
        return _printer;
    }

    TrackType getTrackType() const override {
        return TrackVideo;
    }

    CodecId getCodecId() const override {
        return CodecH264;
    }
private:
    _StrPrinter _printer;
};


xiongziliang committed
427
}//namespace mediakit
xiongziliang committed
428

429 430

#endif //ZLMEDIAKIT_H264_H