SRS之SrsHls::on_audio详解

1. SrsHls::on_audio

将音频数据封装到 ts 文件中。

/*
 * Mux one audio packet into ts.
 * @param shared_audio the incoming message, used through a private copy()
 *        that is wrapped in SrsAutoFree. Copy it if you need to keep it.
 * @return ERROR_SUCCESS, or the error code of the first step that failed.
 */
int SrsHls::on_audio(SrsSharedPtrMessage* shared_audio)
{
    int ret = ERROR_SUCCESS;

    /* hls is not enabled: accept the packet and do nothing. */
    if (!hls_enabled) {
        return ret;
    }

    /* update the hls time, for hls_dispose.
     * hls_dispose is the expiry (in seconds) of the HLS cleanup: on restart,
     * or once that time is exceeded, all HLS files (m3u8 and ts) are removed.
     * Per the original note it defaults to 0, which means never clean up. */
    last_update_time = srs_get_system_time_ms();

    /* work on a private copy of the incoming message. */
    SrsSharedPtrMessage* msg = shared_audio->copy();
    SrsAutoFree(SrsSharedPtrMessage, msg);

    /* the sample units never copy the bytes, they use the packet ptr directly,
     * so the sample must be cleared before every demux.
     * @remark demux sample use SrsAvcAacCodec.audio_aac_demux or video_avc_demux. */
    sample->clear();

    /* demux as aac first:
     *   - aac sequence header: the payload is copied to aac_extra_data and parsed;
     *   - aac raw: the payload address is stored in the sample units as is.
     * any failure other than ERROR_HLS_TRY_MP3 is fatal. */
    ret = codec->audio_aac_demux(msg->payload, msg->size, sample);
    if (ret != ERROR_SUCCESS && ret != ERROR_HLS_TRY_MP3) {
        srs_error("hls aac demux audio failed. ret=%d", ret);
        return ret;
    }

    /* the aac demuxer asked for the mp3 demuxer. */
    if (ret != ERROR_SUCCESS) {
        ret = codec->audio_mp3_demux(msg->payload, msg->size, sample);
        if (ret != ERROR_SUCCESS) {
            srs_error("hls mp3 demux audio failed. ret=%d", ret);
            return ret;
        }
    }

    /* ts support audio codec: aac/mp3, ignore everything else. */
    SrsCodecAudio acodec = (SrsCodecAudio)codec->audio_codec_id;
    bool ts_audio = (acodec == SrsCodecAudioAAC || acodec == SrsCodecAudioMP3);
    if (!ts_audio) {
        return ret;
    }

    /* update_acodec:
     * the header (PSI) is not written when the ts is opened, because the
     * acodec may still change to mp3 or others; it is written lazily with
     * the first audio or video. When the codec changed, write a new header.
     * @remark for audio aac codec, for example, SRS1,
     *     it's ok to write PSI when open ts.
     * @see https://github.com/ossrs/srs/issues/301
     */
    ret = muxer->update_acodec(acodec);
    if (ret != ERROR_SUCCESS) {
        srs_error("http: ts audio write header failed. ret=%d", ret);
        return ret;
    }

    /* an aac sequence header is not written to ts, it is only reported. */
    bool is_sequence_header = (acodec == SrsCodecAudioAAC)
        && (sample->aac_packet_type == SrsCodecAudioTypeSequenceHeader);
    if (is_sequence_header) {
        return hls_cache->on_sequence_header(muxer);
    }

    /* the second argument turns the jitter correction off. */
    /* TODO: FIXME: config the jitter of HLS. */
    ret = jitter->correct(msg, SrsRtmpJitterAlgorithmOFF);
    if (ret != ERROR_SUCCESS) {
        srs_error("rtmp jitter correct audio failed. ret=%d", ret);
        return ret;
    }

    /* the dts calc from rtmp/flv header:
     * flv stores milliseconds, ts uses a 90000 ticks per second clock,
     * that is 90 ticks per millisecond. */
    int64_t dts = msg->timestamp * 90;

    /* for pure audio, we need to update the stream dts also. */
    stream_dts = dts;

    /* write audio to cache, if need to flush, flush to muxer. */
    ret = hls_cache->write_audio(codec, muxer, dts, sample);
    if (ret != ERROR_SUCCESS) {
        srs_error("hls cache write audio failed. ret=%d", ret);
    }

    return ret;
}

1.1 SrsAvcAacCodec::audio_aac_demux

/*
 * demux the audio packet in aac codec.
 * the packet mux in FLV/RTMP format defined in flv specification.
 * demux the audio specified data(sound_format, sound_size, ...) to sample.
 * demux the aac specified data(aac_profile, ...) to codec from sequence header
 * demux the aac raw to sample units.
 */
int SrsAvcAacCodec::audio_aac_demux(char* data, int size, 
    SrsCodecSample* sample)
{
    int ret = ERROR_SUCCESS;
    
    sample->is_video = false;
    
    if (!data || size <= 0) {
        srs_trace("no audio present, ignore it.");
        return ret;
    }
    
    if ((ret = stream->initialize(data, size)) != ERROR_SUCCESS) {
        return ret;
    }
    
    /* audio decode */
    if (!stream->require(1)) {
        ret = ERROR_HLS_DECODE_ERROR;
        srs_error("aac decode sound_format failed. ret=%d", ret);
        return ret;
    }
    
    /* @see: E.4.2 Audio Tags, video_file_format_spec_v10_1.pdf, page 76 */
    int8_t sound_format = stream->read_1bytes();
    
    /* 声道：单声道 or 双声道，对于 AAC 永远是双声道 */
    int8_t sound_type = sound_format & 0x01;
    /* 采样精度: 8bit/16bit, 压缩过的音频都是 16bit */
    int8_t sound_size = (sound_format >> 1) & 0x01;
    /* 采样率: AAC 为 44KHz */
    int8_t sound_rate = (sound_format >> 2) & 0x03;
    /* 音频格式: 为 10，即 AAC */
    sound_format = (sound_format >> 4) & 0x0f;
    
    audio_codec_id = sound_format;
    sample->acodec = (SrsCodecAudio)audio_codec_id;

    sample->sound_type = (SrsCodecAudioSoundType)sound_type;
    sample->sound_rate = (SrsCodecAudioSampleRate)sound_rate;
    sample->sound_size = (SrsCodecAudioSampleSize)sound_size;
    
    /* we support h.264+mp3 for hls. */
    if (audio_codec_id == SrsCodecAudioMP3) {
        return ERROR_HLS_TRY_MP3;
    }
    
    /* only support aac */
    if (audio_codec_id != SrsCodecAudioAAC) {
        ret = ERROR_HLS_DECODE_ERROR;
        srs_error("aac only support mp3/aac codec. actual=%d, ret=%d", 
                  audio_codec_id, ret);
        return ret;
    }
    
    if (!stream->require(1)) {
        ret = ERROR_HLS_DECODE_ERROR;
        srs_error("aac decode aac_packet_type failed. ret=%d", ret);
        return ret;
    }
    
    /* 0: AAC sequence header, 1: AAC raw */
    int8_t aac_packet_type = stream->read_1bytes();
    sample->aac_packet_type = (SrsCodecAudioType)aac_packet_type;
    
    if (aac_packet_type == SrsCodecAudioTypeSequenceHeader) {
        /* AudioSpecificConfig
         * 1.6.2.1 AudioSpecificConfig, 
         * in aac-mp4a-format-ISO_IEC_14496-3+2001.pdf, page 33. */
        aac_extra_size = stream->size() - stream->pos();
        if (aac_extra_size > 0) {
            srs_freepa(aac_extra_data);
            aac_extra_data = new char[aac_extra_size];
            memcpy(aac_extra_data, stream->data() + stream->pos(), 
                   aac_extra_size);

            /* demux the sequence header. */
            if ((ret = audio_aac_sequence_header_demux(aac_extra_data, aac_extra_size)) 
                != ERROR_SUCCESS) {
                return ret;
            }
        }
    } else if (aac_packet_type == SrsCodecAudioTypeRawData) {
        if (!is_aac_codec_ok()) {
            srs_warn("aac ignore type=%d for no sequence header. ret=%d", 
                     aac_packet_type, ret);
            return ret;
        }
        
        if ((ret = sample->add_sample_unit(stream->data() + stream->pos(), 
                   stream->size() - stream->pos())) != ERROR_SUCCESS) {
            srs_error("aac add sample failed. ret=%d", ret);
            return ret;
        }
    } else {
        /* ignored */
    }
    
    /* reset the sample rate by sequence header */
    if (aac_sample_rate != SRS_AAC_SAMPLE_RATE_UNSET) {
        static int aac_sample_rates[] = {
            96000, 88200, 64000, 48000,
            44100, 32000, 24000, 22050,
            16000, 12000, 11025,  8000,
            7350,     0,     0,    0
        };
        /* 根据采样率索引值在采样率表中找到对应的采样率 */
        switch (aac_sample_rates[aac_sample_rate]) {
            case 11025:
                sample->sound_rate = SrsCodecAudioSampleRate11025;
                break;
            case 22050:
                sample->sound_rate = SrsCodecAudioSampleRate22050;
                break;
            case 44100:
                sample->sound_rate = SrsCodecAudioSampleRate44100;
                break;
            default:
                break;
        };
    }
    
    return ret;
}

1.1.1 SrsAvcAacCodec::audio_aac_sequence_header_demux

/*
 * Parse the aac sequence header (AudioSpecificConfig) into the codec.
 * only the first 2 bytes are decoded, from high to low bits:
 *     audioObjectType, 5bits, stored to aac_object.
 *     samplingFrequencyIndex, 4bits, stored to aac_sample_rate.
 *     channelConfiguration, 4bits, stored to aac_channels.
 * @return ERROR_HLS_DECODE_ERROR when less than 2 bytes are available or
 *         the object type is SrsAacObjectTypeReserved.
 */
int SrsAvcAacCodec::audio_aac_sequence_header_demux(char* data, int size)
{
    int ret = ERROR_SUCCESS;
    
    ret = stream->initialize(data, size);
    if (ret != ERROR_SUCCESS) {
        return ret;
    }
    
    if (!stream->require(2)) {
        ret = ERROR_HLS_DECODE_ERROR;
        srs_error("audio codec decode aac sequence header failed. ret=%d", ret);
        return ret;
    }
    u_int8_t first = stream->read_1bytes();
    u_int8_t second = stream->read_1bytes();
    
    /* the object type is the high 5 bits of the first byte. */
    u_int8_t object_type = (first >> 3) & 0x1f;
    /* the sample rate index spans both bytes:
     * the low 3 bits of the first one, then the top bit of the second one. */
    u_int8_t rate_index = ((first << 1) & 0x0e) | ((second >> 7) & 0x01);
    /* the channel configuration is the next 4 bits of the second byte. */
    aac_channels = (second >> 3) & 0x0f;
    
    /* set the aac sample rate, an index into the sample rate table. */
    aac_sample_rate = rate_index;
    
    /* convert the object type in sequence header to aac profile of ADTS. */
    aac_object = (SrsAacObjectType)object_type;
    if (aac_object != SrsAacObjectTypeReserved) {
        return ret;
    }
    
    ret = ERROR_HLS_DECODE_ERROR;
    srs_error("audio codec decode aac sequence header failed, "
        "adts object=%d invalid. ret=%d", object_type, ret);
    return ret;
}

1.1.2 SrsCodecSample::add_sample_unit

若该音频包为 raw data，则调用该函数进行处理.

/*
 * add the a sample unit, it's a h.264 NALU or aac raw data.
 * the sample unit directly use the ptr of packet bytes,
 * so user must never use sample unit when packet is destroyed.
 * in a word, user must clear sample before demux it.
 */
int SrsCodecSample::add_sample_unit(char* bytes, int size)
{
    int ret = ERROR_SUCCESS;
    
    /*
     * nb_sample_units:
     * each audio/video raw data packet will dumps to one or multiple buffers,
     * the buffers will write to hls and clear to reset.
     * generally, aac audio packet corresponding to one buffer,
     * where avc/h264 video packet may contains multiple buffer.
     */
    if (nb_sample_units >= SRS_SRS_MAX_CODEC_SAMPLE) {
        ret = ERROR_HLS_DECODE_ERROR;
        srs_error("hls decode samples error, "
            "exceed the max count: %d, ret=%d", SRS_SRS_MAX_CODEC_SAMPLE, ret);
        return ret;
    }
    
    SrsCodecSampleUnit* sample_unit = &sample_units[nb_sample_units++];
    sample_unit->bytes = bytes;
    sample_unit->size = size;
    
    /* for video, parse the nalu type, set the IDR flag. */
    if (is_video) {
        SrsAvcNaluType nal_unit_type = (SrsAvcNaluType)(bytes[0] & 0x1f);
        
        if (nal_unit_type == SrsAvcNaluTypeIDR) {
            /* whether sample_units contains IDR frame. */
            has_idr = true;
        } else if (nal_unit_type == SrsAvcNaluTypeSPS || 
                   nal_unit_type == SrsAvcNaluTypePPS) {
            has_sps_pps = true;
        } else if (nal_unit_type == SrsAvcNaluTypeAccessUnitDelimiter) {
            has_aud = true;
        }
    
        if (first_nalu_type == SrsAvcNaluTypeReserved) {
            /* The first nalu type. */
            first_nalu_type = nal_unit_type;
        }
    }
    
    return ret;
}

1.2 SrsHlsCache::on_sequence_header

/*
 * Called for every sequence header: a #EXT-X-DISCONTINUITY
 * must be written to the m3u8, the work is delegated to the muxer.
 * @see: hls-m3u8-draft-pantos-http-live-streaming-12.txt
 * @see: 3.4.11.  EXT-X-DISCONTINUITY
 */
int SrsHlsCache::on_sequence_header(SrsHlsMuxer* muxer)
{
    /* TODO: support discontinuity for the same stream
     * currently we reap and insert discontinuity when the encoder republishes,
     * but the sequence header may change even when the stream is not
     * republished, for example, when ffmpeg ingests an external rtmp stream
     * and pushes it to srs.
     */
    int ret = muxer->on_sequence_header();
    return ret;
}

1.2.1 SrsHlsMuxer::on_sequence_header

/*
 * Flag the current segment as carrying a sequence header.
 * @return always ERROR_SUCCESS.
 */
int SrsHlsMuxer::on_sequence_header()
{
    /* a segment must be open. */
    srs_assert(current);
    
    /* per the original note, a discontinuity is written to the m3u8 file
     * when a segment flagged this way is closed. */
    current->is_sequence_header = true;
    
    return ERROR_SUCCESS;
}

1.3 SrsHlsCache::write_audio

将 audio data 写入到缓存中，并将其 flush 到 ts 封装中。

/*
 * Write audio to cache, if need to flush, flush to muxer.
 * @param pts the timestamp of the audio, in the 90khz ts clock.
 * @return ERROR_SUCCESS, or the error code of the first step that failed.
 */
int SrsHlsCache::write_audio(SrsAvcAacCodec* codec, SrsHlsMuxer* muxer, 
    int64_t pts, SrsCodecSample* sample)
{
    int ret = ERROR_SUCCESS;
    
    /* step 1: put the audio into the cache. */
    ret = cache->cache_audio(codec, pts, sample);
    if (ret != ERROR_SUCCESS) {
        return ret;
    }
    
    /* 
     * step 2: reap when the current source is pure audio.
     * the stream info may change while publishing, for example pure audio
     * at start, then audio/video, then pure audio again when video is
     * disabled, so the segment is reaped whenever audio arrives and the
     * segment absolutely overflows.
     * @see https://github.com/ossrs/srs/issues/151
     * we use absolutely overflow of segment to make jwplayer/ffplay happy
     * @see https://github.com/ossrs/srs/issues/151#issuecomment-71155184 */
    bool need_reap = cache->audio && muxer->is_segment_absolutely_overflow();
    if (need_reap) {
        srs_info("hls: absolute audio reap segment.");
        /* for pure audio the ts is cut once its duration exceeds
         * hls_fragment * hls_aof_ratio, e.g. 10s * 2.0 = 20s. */
        ret = reap_segment("audio", muxer, cache->audio->pts);
        if (ret != ERROR_SUCCESS) {
            return ret;
        }
    }
    
    /* step 3: for pure audio, aggregate some frame to one,
     * so keep caching until enough audio is collected. */
    if (muxer->pure_audio() && cache->audio 
        && pts - cache->audio->start_pts < SRS_CONSTS_HLS_PURE_AUDIO_AGGREGATE) {
        return ret;
    }
    
    /* 
     * step 4: directly write the audio frame by frame to ts,
     * it's ok for the hls overload; aggregating the audios to a big one
     * may cause the audio to corrupt.
     * @see https://github.com/ossrs/srs/issues/512
     */
    return muxer->flush_audio(cache);
}

1.3.1 SrsTsCache::cache_audio

/*
 * Write audio to cache.
 * @param dts the timestamp in 90khz, only used when a new message is created.
 * @return the result of do_cache_aac or do_cache_mp3.
 */
int SrsTsCache::cache_audio(SrsAvcAacCodec* codec, int64_t dts, SrsCodecSample* sample)
{
    /* create the SrsTsMessage for audio on demand,
     * it stands for the ts message currently being built. */
    if (!audio) {
        audio = new SrsTsMessage();
        /* the timestamp in 90khz */
        audio->start_pts = dts;
        audio->pts = dts;
        audio->dts = dts;
        /* 
         * whether this message carries pcr info,
         * generally the video IDR(I frame, the keyframe of h.264) carries it. */
        audio->write_pcr = false;
    }
    
    /* the id of pes stream to indicate the payload codec,
     * for audio it is SrsTsPESStreamIdAudioCommon, usually 0xc0.
     * @remark use is_audio() and is_video() to check it, 
     * and stream_number() to finger it out. */
    audio->sid = SrsTsPESStreamIdAudioCommon;
    
    /* must be aac or mp3 */
    SrsCodecAudio acodec = (SrsCodecAudio)codec->audio_codec_id;
    srs_assert(acodec == SrsCodecAudioAAC || acodec == SrsCodecAudioMP3);
    
    /* append the audio data to the cached message. */
    int ret = ERROR_SUCCESS;
    if (codec->audio_codec_id == SrsCodecAudioAAC) {
        ret = do_cache_aac(codec, sample);
    } else {
        ret = do_cache_mp3(codec, sample);
    }
    
    return ret;
}

1.3.2 SrsTsMessage 构造

/*
 * the media audio/video message parsed from PES packet.
 * @param c, @param p the channel and packet, for the decoder only.
 */
SrsTsMessage::SrsTsMessage(SrsTsChannel* c, SrsTsPacket* p)
{
    /* decoder only, the ts message does not use them,
     * they are kept for the user to get the channel and packet. */
    packet = p;
    channel = c;

    /* all timestamps are in 90khz. */
    pts = 0;
    dts = 0;
    /* the audio cache buffer start pts, to flush audio if full.
     * @remark, the pts is not the adjusted one, it's the original pts. */
    start_pts = 0;

    /* whether this message carries pcr info, generally the 
     * video IDR(I frame, the keyframe of h.264) carries it. */
    write_pcr = false;
    /* whether got discontinuity ts, for example, sequence header changed. */
    is_discontinuity = false;

    /* the id of pes stream to indicate the payload codec.
     * @remark, use is_audio() and is_video() to check it, 
     * and stream_number() to finger it out. */
    sid = (SrsTsPESStreamId)0x00;
    continuity_counter = 0;

    /* the size of payload, 0 indicates the length() of payload. */
    PES_packet_length = 0;
    /* the payload bytes */
    payload = new SrsSimpleBuffer();
}

1.3.3 SrsTsCache::do_cache_aac

/*
 * Append every aac raw sample unit to the payload of the cached audio
 * message, each one prefixed with a 7 bytes ADTS header built from the codec.
 * @param codec provides aac_object, aac_sample_rate and aac_channels.
 * @param sample the demuxed sample whose units are appended.
 * @return ERROR_HLS_AAC_FRAME_LENGTH when a unit is empty or when the unit
 *         plus the ADTS header does not fit the 13bits frame_length field.
 */
int SrsTsCache::do_cache_aac(SrsAvcAacCodec* codec, SrsCodecSample* sample)
{
    int ret = ERROR_SUCCESS;
    
    /* the size of the fixed ADTS header written below. */
    const int32_t adts_header_size = 7;
    /* frame_length is a 13bits field which counts the header too. */
    const int32_t max_frame_length = 0x1fff;
    
    /*
     * nb_sample_units:
     * each audio/video raw data packet will dumps to one or multiple buffers,
     * the buffers will write to hls and clear to reset.
     * generally, aac audio packet corresponding to one buffer,
     * where avc/h264 video packet may contains multiple buffer.
     */
    for (int i = 0; i < sample->nb_sample_units; i++) {
        SrsCodecSampleUnit* sample_unit = &sample->sample_units[i];
        int32_t size = sample_unit->size;
        
        /* the raw data and the header together must fit frame_length,
         * otherwise the high bits are cut off and the header is corrupt. */
        if (!sample_unit->bytes || size <= 0 
            || size > max_frame_length - adts_header_size) {
            ret = ERROR_HLS_AAC_FRAME_LENGTH;
            srs_error("invalid aac frame length=%d, ret=%d", size, ret);
            return ret;
        }
        
        /* the frame length is the AAC raw data plus the adts header size. */
        int32_t frame_length = size + adts_header_size;
        
        /*
         * AAC-ADTS
         * 6.2 Audio Data Transport Stream, ADTS
         * in aac-iso-13818-7.pdf, page 26.
         * fixed 7bytes header
         */
        u_int8_t adts_header[7] = {0xff, 0xf9, 0x00, 0x00, 0x00, 0x0f, 0xfc};
        
        /*
         * adts_fixed_header
         * 2B, 16bits
         * int16_t syncword; // 12bits, '1111 1111 1111'
         * int8_t ID; // 1bit, '1'
         * int8_t layer; // 2bits, '00'
         * int8_t protection_absent; // 1bit, can be '1'
         *
         * 12bits
         * int8_t profile; // 2bit, 7.1 Profiles, page 40
         * TSAacSampleFrequency sampling_frequency_index; // 4bits, Table 35, page 46
         * int8_t private_bit; // 1bit, can be '0'
         * int8_t channel_configuration; // 3bits, Table 8
         * int8_t original_or_copy; // 1bit, can be '0'
         * int8_t home; // 1bit, can be '0'
         *
         * adts_variable_header
         * 28bits
         * int8_t copyright_identification_bit; // 1bit, can be '0'
         * int8_t copyright_identification_start; // 1bit, can be '0'
         * int16_t frame_length; // 13bits
         * int16_t adts_buffer_fullness; // 11bits, 7FF signals that the bitstream 
         *                                  is a variable rate bitstream.
         * int8_t number_of_raw_data_blocks_in_frame; // 2bits, 
         *        // 0 indicating 1 raw_data_block()
         */
        /* profile, 2bits */
        SrsAacProfile aac_profile = srs_codec_aac_rtmp2ts(codec->aac_object);
        adts_header[2] = (aac_profile << 6) & 0xc0;
        /* sampling_frequency_index 4bits */
        adts_header[2] |= (codec->aac_sample_rate << 2) & 0x3c;
        /* channel_configuration 3bits, split over byte 2 and byte 3 */
        adts_header[2] |= (codec->aac_channels >> 2) & 0x01;
        adts_header[3] = (codec->aac_channels << 6) & 0xc0;
        /* frame_length 13bits, split over byte 3, 4 and 5 */
        adts_header[3] |= (frame_length >> 11) & 0x03;
        adts_header[4] = (frame_length >> 3) & 0xff;
        adts_header[5] = ((frame_length << 5) & 0xe0);
        /* adts_buffer_fullness; 11bits, all ones together with byte 6 */
        adts_header[5] |= 0x1f;
        
        /* copy the header, then the raw data, to the audio buffer */
        audio->payload->append((const char*)adts_header, sizeof(adts_header));
        audio->payload->append(sample_unit->bytes, sample_unit->size);
    }
    
    return ret;
}

该函数在每一个音频包前都加上一个 7 字节的 adts_header。

1.3.4 SrsSimpleBuffer::append

/*
 * Append the specified bytes to the end of the buffer.
 * @param bytes the first byte to copy.
 * @param size the number of bytes to copy.
 * @remark size is asserted to be positive.
 */
void SrsSimpleBuffer::append(const char* bytes, int size)
{
    srs_assert(size > 0);
    
    const char* bytes_end = bytes + size;
    data.insert(data.end(), bytes, bytes_end);
}

1.3.5 SrsHlsMuxer::is_segment_absolutely_overflow

/* drop the segment when duration of ts too small. */
#define SRS_AUTO_HLS_SEGMENT_MIN_DURATION_MS 100

/*
 * Whether the segment absolutely overflows; used for pure audio to reap
 * the segment, that is whether the current segment duration reached
 * hls_aof_ratio times the configured fragment (plus the floor deviation).
 * @see https://github.com/ossrs/srs/issues/151#issuecomment-71155184
 */
bool SrsHlsMuxer::is_segment_absolutely_overflow()
{
    /* @see https://github.com/ossrs/srs/issues/151#issuecomment-83553950 */
    srs_assert(current);
    
    /* to prevent very small segment: duration is in seconds,
     * the minimum is in milliseconds. */
    bool too_small = 
        current->duration * 1000 < 2 * SRS_AUTO_HLS_SEGMENT_MIN_DURATION_MS;
    if (too_small) {
        return false;
    }
    
    /* use N% deviation, to smoother; it only applies with hls_ts_floor. */
    double deviation = 0.0;
    if (hls_ts_floor) {
        deviation = SRS_HLS_FLOOR_REAP_PERCENT * deviation_ts * hls_fragment;
    }
    srs_info("hls: dur=%.2f, tar=%.2f, dev=%.2fms/%dp, frag=%.2f",
             current->duration, hls_fragment + deviation, 
             deviation, deviation_ts, hls_fragment);
    
    /* hls_aof_ratio is a multiplier: for pure audio the ts is cut once its
     * duration exceeds hls_fragment times this ratio. For example with a
     * hls_fragment of 10 seconds and a hls_aof_ratio of 2.0,
     * a pure audio ts is cut at 10s * 2.0 = 20 seconds. */
    bool overflow = 
        current->duration >= hls_aof_ratio * hls_fragment + deviation;
    return overflow;
}

1.3.6 SrsHlsCache::reap_segment

/*
 * Reopen the muxer for a new hls segment:
 * close the current segment, open a new one, 
 * then flush the cached video and audio to the new segment.
 * so, user must reap_segment then flush_video to hls muxer.
 * @param log_desc a description passed to segment_close.
 * @param muxer the hls muxer to reopen.
 * @param segment_start_dts the start dts passed to segment_open.
 * @return ERROR_SUCCESS, or the error code of the first step that failed.
 */
int SrsHlsCache::reap_segment(string log_desc, SrsHlsMuxer* muxer, 
    int64_t segment_start_dts)
{
    int ret = ERROR_SUCCESS;
    
    /* TODO: flush audio before or after segment?
     * TODO: fresh segment begin with audio or video? */
    
    /* close current ts. */
    if ((ret = muxer->segment_close(log_desc)) != ERROR_SUCCESS) {
        srs_error("m3u8 muxer close segment failed. ret=%d", ret);
        return ret;
    }
    
    /* open new ts. */
    if ((ret = muxer->segment_open(segment_start_dts)) != ERROR_SUCCESS) {
        srs_error("m3u8 muxer open segment failed. ret=%d", ret);
        return ret;
    }
    
    /* segment open, flush video first. */
    if ((ret = muxer->flush_video(cache)) != ERROR_SUCCESS) {
        srs_error("m3u8 muxer flush video failed. ret=%d", ret);
        return ret;
    }
    
    /* segment open, flush the audio.
     * @see: ngx_rtmp_hls_open_fragment
     * start fragment with audio to make iPhone happy */
    if ((ret = muxer->flush_audio(cache)) != ERROR_SUCCESS) {
        srs_error("m3u8 muxer flush audio failed. ret=%d", ret);
        return ret;
    }
    
    return ret;
}

1.3.7 SrsHlsMuxer::pure_audio

/*
 * Whether the current hls muxer is in pure audio mode, that is a segment
 * with a ts muxer is open and its video codec is SrsCodecVideoDisabled.
 */
bool SrsHlsMuxer::pure_audio()
{
    /* no segment or no ts muxer: not pure audio. */
    if (!current || !current->muxer) {
        return false;
    }
    
    return current->muxer->video_codec() == SrsCodecVideoDisabled;
}

检测当前 hls muxer 是否是纯音频。

1.3.8 SrsHlsMuxer::flush_audio

直接将音频帧逐帧写入到 ts 文件中。

/*
 * Write the cached audio message to the current ts segment
 * and free it on success.
 * @return ERROR_SUCCESS when nothing had to be written or the write
 *         succeeded, otherwise the error code of the ts muxer.
 */
int SrsHlsMuxer::flush_audio(SrsTsCache* cache)
{
    int ret = ERROR_SUCCESS;
    
    /* if current is NULL, segment is not open, ignore the flush event. */
    if (!current) {
        srs_warn("flush audio ignored, for segment is not open.");
        return ret;
    }
    
    /* the cache must hold some audio data. */
    bool has_audio = cache->audio && cache->audio->payload->length() > 0;
    if (!has_audio) {
        return ret;
    }
    
    /* update the duration of the current segment. */
    current->update_duration(cache->audio->pts);
    
    /* write the audio message to the ts file. */
    ret = current->muxer->write_audio(cache->audio);
    if (ret != ERROR_SUCCESS) {
        return ret;
    }
    
    /* write success, clear and free the msg */
    srs_freep(cache->audio);
    
    return ret;
}

1.3.9 SrsHlsSegment::update_duration

该函数用于更新切片的时长。

/*
 * update the segment duration.
 * @current_frame_dts, the dts of frame, in tbn of ts.
 */
void SrsHlsSegment::update_duration(int64_t current_frame_dts)
{
    /* we use video/audio to update segment duration,
     * so when reap segment, some previous audio frame will
     * update the segment duration, which is nagetive, 
     * just ignore it. */
    if (current_frame_dts < segment_start_dts) {
        /* for atc and timestamp jump, reset the start dts. */
        if (current_frame_dts < 
            segment_start_dts - SRS_AUTO_HLS_SEGMENT_TIMESTAMP_JUMP_MS * 90) 
            
                     segment_start_dts, current_frame_dts);
            segment_start_dts = current_frame_dts;
        }
        return ;
    }
    
    /* duration: duration in seconds in m3u8. */
    duration = (current_frame_dts - segment_start_dts) / 90000.0;
    srs_assert(duration >= 0);
    
    return;
}

1.3.10 SrsTSMuxer::write_audio

/*
 * Write an audio frame to ts.
 * @return the result of the ts context encode.
 */
int SrsTSMuxer::write_audio(SrsTsMessage* audio)
{
    /* a ts file has three layers:
     * 1. ts: adds to the pes layer what is needed to identify and
     *    transport the data stream.
     * 2. pes: adds to the audio/video data the description of the frame,
     *    such as the timestamps.
     * 3. es: the audio/video data itself. */
    /* encode the audio frame to PES packets. */
    int ret = context->encode(writer, audio, vcodec, acodec);
    if (ret != ERROR_SUCCESS) {
        srs_error("hls encode audio failed. ret=%d", ret);
    }
    
    return ret;
}

1.3.11 SrsTsContext::encode

/*
 * Write the PES packet, the video/audio stream.
 * @param writer the file writer passed on to the PAT/PMT and PES encoders.
 * @param msg, the video/audio msg to write to ts.
 * @param vc, the video codec, write the PAT/PMT table when changed.
 * @param ac, the audio codec, write the PAT/PMT table when changed.
 * @return ERROR_HLS_NO_STREAM when neither codec maps to a ts stream,
 *         otherwise the result of encode_pat_pmt or encode_pes.
 */
int SrsTsContext::encode(SrsFileWriter* writer, SrsTsMessage* msg, 
    SrsCodecVideo vc, SrsCodecAudio ac)
{
    int ret = ERROR_SUCCESS;
    
    /* start from "no stream", so a codec value which is not listed in the
     * switches below never leaves the stream type indeterminate. */
    SrsTsStream vs = SrsTsStreamReserved;
    SrsTsStream as = SrsTsStreamReserved;
    int16_t video_pid = 0, audio_pid = 0;
    
    /* map the video codec to the ts stream type and pid, only avc is carried. */
    switch (vc) {
        case SrsCodecVideoAVC:
            vs = SrsTsStreamVideoH264; 
            video_pid = TS_VIDEO_AVC_PID;
            break;
        case SrsCodecVideoDisabled:
            vs = SrsTsStreamReserved;
            break;
        case SrsCodecVideoReserved:
        case SrsCodecVideoReserved1:
        case SrsCodecVideoReserved2:
        case SrsCodecVideoSorensonH263:
        case SrsCodecVideoScreenVideo:
        case SrsCodecVideoOn2VP6:
        case SrsCodecVideoOn2VP6WithAlphaChannel:
        case SrsCodecVideoScreenVideoVersion2:
            vs = SrsTsStreamReserved;
            break;
    }
    
    /* map the audio codec to the ts stream type and pid, only aac/mp3. */
    switch (ac) {
        case SrsCodecAudioAAC:
            as = SrsTsStreamAudioAAC; 
            audio_pid = TS_AUDIO_AAC_PID;
            break;
        case SrsCodecAudioMP3:
            as = SrsTsStreamAudioMp3; 
            audio_pid = TS_AUDIO_MP3_PID;
            break;
        case SrsCodecAudioDisabled:
            as = SrsTsStreamReserved;
            break;
        case SrsCodecAudioReserved1:
        case SrsCodecAudioLinearPCMPlatformEndian:
        case SrsCodecAudioADPCM:
        case SrsCodecAudioLinearPCMLittleEndian:
        case SrsCodecAudioNellymoser16kHzMono:
        case SrsCodecAudioNellymoser8kHzMono:
        case SrsCodecAudioNellymoser:
        case SrsCodecAudioReservedG711AlawLogarithmicPCM:
        case SrsCodecAudioReservedG711MuLawLogarithmicPCM:
        case SrsCodecAudioReserved:
        case SrsCodecAudioSpeex:
        case SrsCodecAudioReservedMP3_8kHz:
        case SrsCodecAudioReservedDeviceSpecificSound:
            as = SrsTsStreamReserved;
            break;
    }
    
    /* at least one of audio and video must be carried. */
    if (as == SrsTsStreamReserved && vs == SrsTsStreamReserved) {
        ret = ERROR_HLS_NO_STREAM;
        srs_error("hls: no video or audio stream, vcodec=%d, acodec=%d. ret=%d", 
                  vc, ac, ret);
        return ret;
    }
    
    /* when any codec changed, write PAT/PMT table. */
    if (vcodec != vc || acodec != ac) {
        vcodec = vc;
        acodec = ac;
        if ((ret = encode_pat_pmt(writer, video_pid, vs, audio_pid, as)) 
            != ERROR_SUCCESS) {
            return ret;
        }
    }
    
    /* encode the media frame to PES packets over TS;
     * the last argument tells the encoder whether there is no video stream. */
    if (msg->is_audio()) {
        /* wrap the audio data into pes packets. */
        return encode_pes(writer, msg, audio_pid, as, vs == SrsTsStreamReserved);
    } else {
        return encode_pes(writer, msg, video_pid, vs, vs == SrsTsStreamReserved);
    }
}

1.3.12 SrsTsContext::encode_pes

该函数的具体分析可参考： SRS之SrsTsContext::encode_pes详解