demux aac from ts and write to file.aac

2025-03-09 15:49:59 +00:00 · 2013-11-22 00:04:37 +08:00 · 2013-11-22 00:04:37 +08:00 · f70894d2c3
commit f70894d2c3
parent a0ecc5a305
1 changed files with 276 additions and 8 deletions
--- a/trunk/research/ts_info.cpp
+++ b/trunk/research/ts_info.cpp
@ -557,6 +557,9 @@ public:
 	// 2.4.3.7 Semantic definition of fields in PES packet. page 49.
 	int32_t packet_start_code_prefix;
 	int64_t pts; // 33bits
 	int64_t dts; // 33bits
    // header size.
    int packet_header_size;
@ -681,6 +684,7 @@ TSMessage::TSMessage()
 	stream_type = TSStreamTypeReserved;
 	stream_id = 0;
 	packet_start_code_prefix = 0;
 	pts = dts = 0;
 	PES_packet_length = 0;
 	packet_header_size = 0;
 	parsed_packet_size = 0;
@ -1439,6 +1443,8 @@ int TSPayloadPES::demux(TSContext* ctx, TSPacket* pkt, u_int8_t* start, u_int8_t
 		msg->continuity_counter = pid->continuity_counter;
 		msg->stream_id = stream_id;
 		msg->packet_start_code_prefix = packet_start_code_prefix;
 		msg->dts = dts;
 		msg->pts = pts;
 		// PES_packet_data_byte, page58.
 		// the packet size contains the header size.
@ -1789,7 +1795,31 @@ public:
 };
 /**
-* 6.2 Audio Data Transport Stream, ADTS
+* Table 35 – Sampling frequency dependent on
 * sampling_frequency_index. in page 46.
 */
 enum TSAacSampleFrequency
 {
 	TSAacSampleFrequency96000 		= 0x00,
 	TSAacSampleFrequency88200 		= 0x01,
 	TSAacSampleFrequency64000 		= 0x02,
 	TSAacSampleFrequency48000 		= 0x03,
 	TSAacSampleFrequency44100 		= 0x04,
 	TSAacSampleFrequency32000 		= 0x05,
 	TSAacSampleFrequency24000 		= 0x06,
 	TSAacSampleFrequency22050 		= 0x07,
 	TSAacSampleFrequency16000 		= 0x08,
 	TSAacSampleFrequency12000 		= 0x09,
 	TSAacSampleFrequency11025 		= 0x0a,
 	TSAacSampleFrequency8000  		= 0x0b,
 	TSAacSampleFrequencyReserved0 	= 0x0c,
 	TSAacSampleFrequencyReserved1 	= 0x0d,
 	TSAacSampleFrequencyReserved2 	= 0x0e,
 	TSAacSampleFrequencyReserved3 	= 0x0f,
 };
 /**
 * 6.2 Audio Data Transport Stream, ADTS, in page 26.
 */
 class TSAacAdts
 {
@ -1802,7 +1832,7 @@ public:
 	int8_t protection_absent; //1bit
 	// 12bits
 	int8_t profile; //2bit
-	int8_t sampling_frequency_index; //4bits
+	TSAacSampleFrequency sampling_frequency_index; //4bits
 	int8_t private_bit; //1bit
 	int8_t channel_configuration; //3bits
 	int8_t original_or_copy; //1bit
@ -1826,7 +1856,7 @@ public:
 		layer = 0;
 		protection_absent = 0;
 		profile = 0;
-		sampling_frequency_index = 0;
+		sampling_frequency_index = TSAacSampleFrequencyReserved0;
 		private_bit = 0;
 		channel_configuration = 0;
 		original_or_copy = 0;
@ -1904,7 +1934,7 @@ public:
 		private_bit = temp & 0x01;
 		temp = temp >> 1;
-		sampling_frequency_index = temp & 0x0F;
+		sampling_frequency_index = (TSAacSampleFrequency)(temp & 0x0F);
 		temp = temp >> 4;
 		profile = temp & 0x03;
@ -1928,7 +1958,199 @@ public:
 	}
 };
-int consume(TSMessage* msg)
+class FlvMuxer
 {
 public:
 	int fd;
 	const char* file;
 	bool audio_sequence_header_writen;
 	FlvMuxer()
 	{
 		file = NULL;
 		fd = 0;
 		audio_sequence_header_writen = false;
 	}
 	virtual ~FlvMuxer()
 	{
 		if (fd > 0) {
 			close(fd);
 		}
 	}
 	int open(const char* _file)
 	{
 		file = _file;
 		if ((fd = ::open(file, O_CREAT|O_WRONLY|O_TRUNC, 
 			S_IRUSR|S_IWUSR|S_IRGRP|S_IWGRP|S_IROTH)) < 0 
 		) {
 			return -1;
 		}
 		char header[] = {
 			0x46, 0x4c, 0x56, // FLV
 			0x01,  // version: 01
 			0x04, // 0x05:audio+video, 0x01:video, 0x04:audio
 			0x00, 0x00, 0x00, 0x09, // offset: always 0x09
 			0x00, 0x00, 0x00, 0x00 // previous tag 0: always 0
 		};
 		if (write(fd, header, sizeof(header)) != sizeof(header)) {
 			return -1;
 		}
 		return 0;
 	}
 	/**
 	* @param size, if 0 for sequence header.
 	* @param sound_rate, Sampling rate. The following values are defined:
 	* 		0 = 5.5 kHz
 	* 		1 = 11 kHz
 	* 		2 = 22 kHz
 	* 		3 = 44 kHz
 	* @param sound_type, Mono or stereo sound
 	* 		0 = Mono sound
 	* 		1 = Stereo sound
 	*/
 	int write_audio(char* data, int size, u_int32_t timestamp, int sound_rate, int sound_type)
 	{
 		if (size > 0 && !audio_sequence_header_writen) {
 			audio_sequence_header_writen = true;
 			if (write_audio(NULL, 0, 0, sound_rate, sound_type) != 0) {
 				return -1;
 			}
 		}
 		char tag_header[11];
 		char sequence_header[2]; // aac only
 		int data_size = size + sizeof(sequence_header);
 		int tag_size = data_size + sizeof(tag_header);
 		////////////////////////////////////
 		// 11bytes tag header.
 		////////////////////////////////////
 		// TagType
 		char* p = tag_header;
 		*p++ = 0x08; // audio
 		// DataSize
 		char* pp = (char*)&data_size;
 		*p++ = pp[2];
 		*p++ = pp[1];
 		*p++ = pp[0];
 		// Timestamp
 		pp = (char*)&timestamp;
 		*p++ = pp[2];
 		*p++ = pp[1];
 		*p++ = pp[0];
 		// TimestampExtended
 		*p++ = pp[3]; 
 		//StreamID
 		*p++ = 0;
 		*p++ = 0;
 		*p++ = 0;
 		////////////////////////////////////
 		// 2bytes codec header for aac
 		////////////////////////////////////
 		// SoundFormat
 		sequence_header[0] = 0xa0; // aac
 		sequence_header[0] |= (sound_rate << 2) & 0x0c;
 		sequence_header[0] |= 0x02; // Compressed formats always decode to 16 bits internally.
 		sequence_header[0] |= sound_type & 0x01;
 		// AACPacketType
 		if (size == 0) {
 			sequence_header[1] = 0x00;
 		} else {
 			sequence_header[1] = 0x01;
 		}
 		////////////////////////////////////
 		// 4bytes tag size
 		////////////////////////////////////
 		char tag_size_bytes[4];
 		p = tag_size_bytes;
 		pp = (char*)&tag_size;
 		*p++ = pp[4];
 		*p++ = pp[2];
 		*p++ = pp[1];
 		*p++ = pp[0];
 		// write
 		if (write(fd, tag_header, sizeof(tag_header)) != sizeof(tag_header)) {
 			return -1;
 		}
 		if (write(fd, sequence_header, sizeof(sequence_header)) != sizeof(sequence_header)) {
 			return -1;
 		}
 		if (size > 0 && write(fd, data, size) != size) {
 			return -1;
 		}
 		if (write(fd, tag_size_bytes, sizeof(tag_size_bytes)) != sizeof(tag_size_bytes)) {
 			return -1;
 		}
 		return 0;
 	}
 	int write_video(char* data, int size)
 	{
 		return 0;
 	}
 };
 class AacMuxer
 {
 public:
 	int fd;
 	const char* file;
 	AacMuxer()
 	{
 		file = NULL;
 		fd = 0;
 	}
 	virtual ~AacMuxer()
 	{
 		if (fd > 0) {
 			close(fd);
 		}
 	}
 	int open(const char* _file)
 	{
 		file = _file;
 		if ((fd = ::open(file, O_CREAT|O_WRONLY|O_TRUNC, 
 			S_IRUSR|S_IWUSR|S_IRGRP|S_IWGRP|S_IROTH)) < 0 
 		) {
 			return -1;
 		}
 		return 0;
 	}
 	int write_audio(char* data, int size)
 	{
 		if (size > 0 && write(fd, data, size) != size) {
 			return -1;
 		}
 		return 0;
 	}
 	int write_video(char* data, int size)
 	{
 		return 0;
 	}
 };
 int consume(TSMessage* msg, FlvMuxer* flv, AacMuxer* aac_muxer)
 {
 	int ret = 0;
@ -1941,6 +2163,11 @@ int consume(TSMessage* msg)
 	char* last = msg->packet_data + msg->packet_data_size;
    if (!msg->is_video()) {
 	    // write AAC raw audio.
 	    if (aac_muxer && (ret = aac_muxer->write_audio((char*)msg->packet_data, msg->packet_data_size)) != 0) {
 	        return ret;
 	    }
 	    // parse AAC audio.
 		while (p < last) {
 		    TSAacAdts aac;
@ -1949,7 +2176,35 @@ int consume(TSMessage* msg)
 		    }
 		    trace("ts+aac audio raw data parsed, size: %d, 0x%02x 0x%02x 0x%02x 0x%02x",
 		    	aac.size, aac.at(0), aac.at(1), aac.at(2), aac.at(3));
-		    // TODO: process audio.
+		    
 		    int sound_rate = 0;
 		    if (aac.sampling_frequency_index == TSAacSampleFrequency22050) {
 		        sound_rate = 0x02;
 		    } else if(aac.sampling_frequency_index == TSAacSampleFrequency44100) {
 		        sound_rate = 0x03;
 		    } else {
 		         // 0 = 5.5 kHz
 		         // 1 = 11 kHz
 		         // others.
 		         trace("ts+aac flv donot support sample-rate: %d", aac.sampling_frequency_index);
 		         return -1;
 		    }
 		    int sound_type = 0;
 		    if (aac.channel_configuration == 1) {
 		        // 0 = Mono sound
 		        sound_type = 0;
 		    } else if (aac.channel_configuration == 2) {
 		        // 1 = Stereo sound
 		        sound_type = 1;
 		    } else {
 		         trace("ts+aac flv donot support channel: %d", aac.channel_configuration);
 		         return -1;
 		    }
 		    if (flv && (ret = flv->write_audio((char*)aac.raw_data, aac.size, msg->pts, sound_rate, sound_type)) != 0) {
 		        return ret;
 		    }
 		}
    } else {
        // parse H264 video.
@ -1970,10 +2225,23 @@ int consume(TSMessage* msg)
 int main(int /*argc*/, char** /*argv*/)
 {
    const char* file = "livestream-1347.ts";
-    //file = "nginx-rtmp-hls/livestream-1347-currupt.ts";
+    const char* output_flv_file = "livestream.flv";
    const char* output_aac_file = "livestream.aac";
    int fd = open(file, O_RDONLY);
    FlvMuxer flv;
    AacMuxer aac_muxer;
    int ret = 0;
    if ((ret = flv.open(output_flv_file)) != 0) {
        trace("flv+open open flv file failed.");
        return ret;
    }
    if ((ret = aac_muxer.open(output_aac_file)) != 0) {
        trace("aac_muxer+open open flv file failed.");
        return ret;
    }
    trace("demuxer+read packet count offset T+0  T+1  T+2  T+3  T+x T+L2 T+L1 T+L0");
    TSContext ctx;
@ -2012,7 +2280,7 @@ int main(int /*argc*/, char** /*argv*/)
 	            continue;
 	        }
-	        if ((ret = consume(msg)) != 0) {
+	        if ((ret = consume(msg, &flv, &aac_muxer)) != 0) {
 	            trace("demuxer+consume parse and consume message failed. ret=%d", ret);
 	            break;
 	        }