Context Navigation

← Previous Revision
Latest Revision
Next Revision →
Annotate
Revision Log

mpeginfo.py @ 4

Revision 4, 28.8 KB checked in by ajaworski, 13 years ago (diff)
Added modified SAGE sources

Line
1	#if 0
2	# $Id: mpeginfo.py,v 1.33 2005/02/15 18:52:51 dischi Exp $
3	# $Log: mpeginfo.py,v $
4	# Revision 1.33 2005/02/15 18:52:51 dischi
5	# some strange bugfix (what is this doing?)
6	#
7	# Revision 1.32 2005/01/21 16:37:02 dischi
8	# try to find bad timestamps
9	#
10	# Revision 1.31 2005/01/08 12:06:45 dischi
11	# make sure the buffer is big enough
12	#
13	# Revision 1.30 2005/01/02 14:57:27 dischi
14	# detect ac3 in normal mpeg2
15	#
16	# Revision 1.29 2004/11/27 14:42:12 dischi
17	# remove future warning
18	#
19	# Revision 1.28 2004/11/15 21:43:36 dischi
20	# remove bad debugging stuff
21	#
22	# Revision 1.27 2004/11/12 18:10:45 dischi
23	# add ac3 support in mpeg streams
24	#
25	# Revision 1.26 2004/10/04 18:06:54 dischi
26	# test length of remaining buffer
27	#
28	# Revision 1.25 2004/07/11 19:37:25 dischi
29	# o read more bytes on ts scan
30	# o support for AC3 in private streams
31	#
32	# Revision 1.24 2004/07/03 09:01:32 dischi
33	# o fix PES start detection inside TS
34	# o try to find out if the stream is progressive or interlaced
35	#
36	# Revision 1.23 2004/06/23 19:44:10 dischi
37	# better length detection, big cleanup
38	#
39	# Revision 1.22 2004/06/22 21:37:34 dischi
40	# o PES support
41	# o basic length detection for TS and PES
42	#
43	# Revision 1.21 2004/06/21 20:37:34 dischi
44	# basic support for mpeg-ts
45	#
46	# Revision 1.20 2004/03/13 23:41:59 dischi
47	# add AudioInfo to mpeg for all streams
48	#
49	# Revision 1.19 2004/02/11 20:11:54 dischi
50	# Updated length calculation for mpeg files. This may not work for all files.
51	#
52	#
53	# MMPython - Media Metadata for Python
54	# Copyright (C) 2003 Thomas Schueppel
55	#
56	# This program is free software; you can redistribute it and/or modify
57	# it under the terms of the GNU General Public License as published by
58	# the Free Software Foundation; either version 2 of the License, or
59	# (at your option) any later version.
60	#
61	# This program is distributed in the hope that it will be useful, but
62	# WITHOUT ANY WARRANTY; without even the implied warranty of MER-
63	# CHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
64	# Public License for more details.
65	#
66	# You should have received a copy of the GNU General Public License along
67	# with this program; if not, write to the Free Software Foundation, Inc.,
68	# 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
69	#
70	# -----------------------------------------------------------------------
71	#endif
72
73	import re
74	import os
75	import struct
76	import string
77	import fourcc
78
79	from mmpython import mediainfo
80	import mmpython
81	import stat
82
83	##------------------------------------------------------------------------
84	## START_CODE
85	##
86	## Start Codes, with 'slice' occupying 0x01..0xAF
87	##------------------------------------------------------------------------
# Maps the byte that follows a 00 00 01 prefix in the video stream to a
# descriptive name of the start code.
START_CODE = {
    0x00: 'picture_start_code',
    0xB0: 'reserved',
    0xB1: 'reserved',
    0xB2: 'user_data_start_code',
    0xB3: 'sequence_header_code',
    0xB4: 'sequence_error_code',
    0xB5: 'extension_start_code',
    0xB6: 'reserved',
    0xB7: 'sequence end',
    0xB8: 'group of pictures',
}
# Slice start codes occupy 0x01..0xAF inclusive.  range() excludes its
# stop value, so the stop has to be 0xB0 for 0xAF to be registered too.
for i in range(0x01, 0xB0):
    START_CODE[i] = 'slice_start_code'
102
103	##------------------------------------------------------------------------
104	## START CODES
105	##------------------------------------------------------------------------
# Video start codes: the value of the byte following a 00 00 01 prefix.
PICTURE, USERDATA, SEQ_HEAD, SEQ_ERR = 0x00, 0xB2, 0xB3, 0xB4
EXT_START, SEQ_END, GOP = 0xB5, 0xB7, 0xB8

# Second name for the sequence header start code (same value as SEQ_HEAD).
SEQ_START_CODE = SEQ_HEAD

# Packet ids that ReadHeader compares against the byte after 00 00 01.
PACK_PKT = 0xBA
SYS_PKT = 0xBB
PADDING_PKT = 0xBE
AUDIO_PKT = 0xC0          # first id of the 0xC0..0xDF audio range
VIDEO_PKT = 0xE0          # first id of the 0xE0..0xEF video range
PRIVATE_STREAM1 = 0xBD
PRIVATE_STREAM2 = 0xBF

# Transport stream packets are 188 bytes long and begin with the sync byte.
TS_PACKET_LENGTH = 188
TS_SYNC = 0x47
125
126	##------------------------------------------------------------------------
127	## FRAME_RATE
128	##
129	## A lookup table of all the standard frame rates. Some rates adhere to
130	## a particular profile that ensures compatibility with VLSI capabilities
131	## of the early to mid 1990s.
132	##
133	## CPB
134	## Constrained Parameters Bitstreams, an MPEG-1 set of sampling and
135	## bitstream parameters designed to normalize decoder computational
136	## complexity, buffer size, and memory bandwidth while still addressing
137	## the widest possible range of applications.
138	##
139	## Main Level
140	## MPEG-2 Video Main Profile and Main Level is analogous to MPEG-1's
141	## CPB, with sampling limits at CCIR 601 parameters (720x480x30 Hz or
142	## 720x576x25 Hz).
143	##
144	##------------------------------------------------------------------------
# Frame rates in frames per second, indexed by the low four bits of the
# sequence header byte read in framerate_aspect().  The NTSC-derived rates
# (N * 1000 / 1001) are stored rounded to two decimals.
FRAME_RATE = [
    0,       # index 0: no rate
    23.98,   # 24000/1001, 3-2 pulldown NTSC (CPB/Main Level)
    24,      # film (CPB/Main Level)
    25,      # PAL/SECAM
    29.97,   # 30000/1001, NTSC (CPB/Main Level)
    30,      # (CPB/Main Level)
    50,      # double-rate PAL
    59.94,   # 60000/1001, double-rate NTSC
    60,      # double-rate 30
]
156
157	##------------------------------------------------------------------------
158	## ASPECT_RATIO -- INCOMPLETE?
159	##
160	## This lookup table maps the header aspect ratio index to a common name.
161	## These are just the defined ratios for CPB I believe. As I understand
162	## it, a stream that doesn't adhere to one of these aspect ratios is
163	## technically considered non-compliant.
164	##------------------------------------------------------------------------
# Human-readable aspect ratio names, indexed by the high four bits of the
# sequence header byte read in framerate_aspect().  Indexes past the end
# of the list are reported as None by that method.
ASPECT_RATIO = [
    'Forbidden',         # 0
    '1/1 (VGA)',         # 1
    '4/3 (TV)',          # 2
    '16/9 (Large TV)',   # 3
    '2.21/1 (Cinema)',   # 4
]
171
172
173	class MpegInfo(mediainfo.AVInfo):
def __init__(self, file):
    """
    Probe `file` and fill in the stream information.

    The detectors are tried in the order transport stream, system
    ("normal") MPEG, PES; the first one returning a true value wins and
    its result is stored in self.valid.  When a sequence header was
    located during detection, size, frame rate, aspect and bitrate are
    read from it for every video stream.
    """
    mediainfo.AVInfo.__init__(self)
    self.context = 'video'
    self.sequence_header_offset = 0

    # TS is a fast scan, system mpeg yields the most information, PES is
    # the last resort.
    for detect in (self.isTS, self.isMPEG, self.isPES):
        self.valid = detect(file)
        if self.valid:
            break

    if not self.valid:
        # NOTE(review): the scraped source lost its indentation; the
        # trailing DEBUG scan is assumed to belong to the "valid" branch.
        # __scan__ needs self.filename, which only a successful detector
        # sets, so skipping it here has no visible effect.
        return

    self.mime = 'video/mpeg'
    if not self.video:
        self.video.append(mediainfo.VideoInfo())

    if self.sequence_header_offset <= 0:
        # no sequence header found, nothing more can be read
        return

    self.progressive(file)

    for stream in self.video:
        stream.width, stream.height = self.dxy(file)
        stream.fps, stream.aspect = self.framerate_aspect(file)
        stream.bitrate = self.bitrate(file)
        if self.length:
            stream.length = self.length

    if not self.type:
        # guess the flavour from the picture width
        width = self.video[0].width
        if width == 480:
            self.type = 'MPEG2 video' # SVCD spec
        elif width == 352:
            self.type = 'MPEG1 video' # VCD spec
        else:
            self.type = 'MPEG video'

    if mediainfo.DEBUG > 2:
        self.__scan__()
217
218
def dxy(self, file):
    """
    Return (width, height) of the video.

    Both values are 12 bit wide and stored back to back in the three
    bytes that start 4 bytes after self.sequence_header_offset.
    """
    file.seek(self.sequence_header_offset + 4, 0)
    raw = file.read(4)
    first, middle, last = struct.unpack('>BBB', raw[:3])
    # width: all of the first byte plus the high nibble of the second
    width = (first << 4) | (middle >> 4)
    # height: low nibble of the second byte plus all of the third
    height = ((middle & 0x0F) << 8) | last
    return (width, height)
228
229
def framerate_aspect(self, file):
    """
    Return (fps, aspect) read from the byte 7 bytes after
    self.sequence_header_offset.

    The low nibble indexes FRAME_RATE, the high nibble ASPECT_RATIO.
    A value without a table entry yields None for that element.
    """
    file.seek(self.sequence_header_offset + 7, 0)
    (packed,) = struct.unpack('>B', file.read(1))
    rate_index = packed & 0xf
    aspect_index = packed >> 4

    fps = None
    if rate_index < len(FRAME_RATE):
        fps = FRAME_RATE[rate_index]

    aspect = None
    if aspect_index < len(ASPECT_RATIO):
        aspect = ASPECT_RATIO[aspect_index]
    elif mediainfo.DEBUG:
        print('Index error: %s' % aspect_index)

    return (fps, aspect)
247
248
def progressive(self, file):
    """
    Try to find out with brute force if the mpeg is interlaced or not.
    Search for the Sequence_Extension in the extension header (01B5).

    On success 'progressive' or 'interlaced' is appended to self.keys,
    the attribute of the same name is set to 1 and True is returned.
    False is returned when no sequence extension is found within the
    scanned data (at most 1000 reads of 1024 bytes).

    NOTE: setting self.progressive replaces this method on the instance,
    so it can only be called once per object (kept because the attribute
    name is what self.keys advertises).
    """
    marker = '\x00\x00\x01\xb5'
    file.seek(0)
    buffer = ''
    count = 0
    while 1:
        if len(buffer) < 1000:
            count += 1
            if count > 1000:
                break
            buffer += file.read(1024)
        if len(buffer) < 1000:
            # end of file reached
            break
        pos = buffer.find(marker)
        # Both buffer[pos+4] and buffer[pos+5] are read below, so six
        # bytes must be available from pos on.  Otherwise keep the tail
        # (which still contains a partial match) and read more data.
        if pos == -1 or len(buffer) - pos < 6:
            buffer = buffer[-10:]
            continue
        ext = ord(buffer[pos + 4]) >> 4
        if ext == 1:
            # extension id 1: bit 3 of the next byte is the progressive flag
            if (ord(buffer[pos + 5]) >> 3) & 1:
                self.keys.append('progressive')
                self.progressive = 1
            else:
                self.keys.append('interlaced')
                self.interlaced = 1
            return True
        if ext != 8 and mediainfo.DEBUG:
            # extension id 8 is skipped silently; anything else is only
            # reported in debug mode, like the other diagnostics here
            print('ext %s' % ext)
        buffer = buffer[pos + 4:]
    return False
284
285
286	##------------------------------------------------------------------------
287	## bitrate()
288	##
289	## From the MPEG-2.2 spec:
290	##
291	## bit_rate -- This is a 30-bit integer. The lower 18 bits of the
292	## integer are in bit_rate_value and the upper 12 bits are in
293	## bit_rate_extension. The 30-bit integer specifies the bitrate of the
294	## bitstream measured in units of 400 bits/second, rounded upwards.
295	## The value zero is forbidden.
296	##
297	## So ignoring all the variable bitrate stuff for now, this 30 bit integer
298	## multiplied times 400 bits/sec should give the rate in bits/sec.
299	##
300	## TODO: Variable bitrates? I need one that implements this.
301	##
302	## Continued from the MPEG-2.2 spec:
303	##
304	## If the bitstream is a constant bitrate stream, the bitrate specified
305	## is the actual rate of operation of the VBV specified in annex C. If
306	## the bitstream is a variable bitrate stream, the STD specifications in
307	## ISO/IEC 13818-1 supersede the VBV, and the bitrate specified here is
308	## used to dimension the transport stream STD (2.4.2 in ITU-T Rec. xxx |
309	## ISO/IEC 13818-1), or the program stream STD (2.4.5 in ITU-T Rec. xxx |
310	## ISO/IEC 13818-1).
311	##
312	## If the bitstream is not a constant rate bitstream the vbv_delay
313	## field shall have the value FFFF in hexadecimal.
314	##
315	## Given the value encoded in the bitrate field, the bitstream shall be
316	## generated so that the video encoding and the worst case multiplex
317	## jitter do not cause STD buffer overflow or underflow.
318	##
319	##
320	##------------------------------------------------------------------------
321
322
323	## Some parts in the code are based on mpgtx (mpgtx.sf.net)
324
def bitrate(self, file):
    """
    read the bitrate (most of the time broken)

    The value is the 18 bit number that starts 8 bytes after
    self.sequence_header_offset, multiplied by 400.
    """
    file.seek(self.sequence_header_offset + 8, 0)
    first, second, third = struct.unpack('>BBB', file.read(3))
    # two full bytes plus the top two bits of the third byte
    units = (first << 10) | (second << 2) | (third >> 6)
    return 400 * units
333
334
def ReadSCRMpeg2(self, buffer):
    """
    read SCR (timestamp) for MPEG2 at the buffer beginning

    Returns the 33 bit clock value divided by 90000, i.e. whole seconds.
    Only the first five bytes are needed: the sixth byte holds nothing but
    the clock extension, which was computed and thrown away before and made
    a five byte buffer fail with IndexError.
    """
    b0 = ord(buffer[0])
    b1 = ord(buffer[1])
    b2 = ord(buffer[2])
    b3 = ord(buffer[3])
    b4 = ord(buffer[4])

    # The clock bits are interleaved with marker bits:
    #   b0: 0 1 c32 c31 c30 M c29 c28
    #   b2: c19..c15 M c14 c13
    #   b4: c4..c0 M + two extension bits
    # Plain ints grow as needed (shifts promote since Python 2.4), so no
    # long() is required.
    scr = ((b0 & 0x38) >> 3) << 30
    scr |= (b0 & 0x03) << 28
    scr |= b1 << 20
    scr |= (b2 & 0xF8) << 12
    scr |= (b2 & 0x03) << 13
    scr |= b3 << 5
    scr |= b4 >> 3

    # explicit floor division: same result as the old "/" on integers
    return scr // 90000
353
354
def ReadSCRMpeg1(self, buffer):
    """
    read SCR (timestamp) for MPEG1 at the buffer beginning (5 Bytes)

    Returns the 33 bit clock value divided by 90000, i.e. whole seconds.
    """
    b0 = ord(buffer[0])
    b1 = ord(buffer[1])
    b2 = ord(buffer[2])
    b3 = ord(buffer[3])
    b4 = ord(buffer[4])

    # Layout: b0 = x x x x c32 c31 c30 M, then 8 bits, 7 bits + M,
    # 8 bits, 7 bits + M.
    scr = ((b0 >> 1) & 0x07) << 30
    scr |= b1 << 22
    scr |= (b2 >> 1) << 15
    scr |= b3 << 7
    scr |= b4 >> 1

    # explicit floor division: same result as the old "/" on integers
    return scr // 90000
368
369
def ReadPTS(self, buffer):
    """
    read PTS (PES timestamp) at the buffer beginning (5 Bytes)

    Returns the 33 bit timestamp divided by 90000, i.e. whole seconds.
    """
    # 3 bits from the first byte, then two groups of 15 bits; the lowest
    # bit of bytes 0, 2 and 4 is not part of the value.
    high = (ord(buffer[0]) & 0xF) >> 1
    med = (ord(buffer[1]) << 7) + (ord(buffer[2]) >> 1)
    low = (ord(buffer[3]) << 7) + (ord(buffer[4]) >> 1)
    # explicit floor division: same result as the old "/" on integers
    return ((high << 30) + (med << 15) + low) // 90000
378
379
def ReadHeader(self, buffer, offset):
    """
    Handle MPEG header in buffer on position offset
    Return -1 on error, new offset or 0 if the new offset can't be scanned

    Side effects: a pack header selects self.type and self.get_time,
    audio/video/AC3 ids not seen before are appended to self.audio or
    self.video, and a sequence header stores its position in
    self.sequence_header_offset.
    """
    if buffer[offset:offset + 3] != '\x00\x00\x01':
        return -1

    code = ord(buffer[offset + 3])

    if code == PADDING_PKT:
        # 16 bit length field follows, skip the whole packet
        length = (ord(buffer[offset + 4]) << 8) + ord(buffer[offset + 5])
        return offset + length + 6

    if code == PACK_PKT:
        if ord(buffer[offset + 4]) & 0xF0 == 0x20:
            self.type = 'MPEG1 video'
            self.get_time = self.ReadSCRMpeg1
            return offset + 12
        if (ord(buffer[offset + 4]) & 0xC0) == 0x40:
            self.type = 'MPEG2 video'
            self.get_time = self.ReadSCRMpeg2
            # low three bits of byte 13 give the number of extra bytes
            extra = ord(buffer[offset + 13]) & 0x07
            return offset + extra + 14
        # WTF? Very strange
        return -1

    if 0xC0 <= code <= 0xDF:
        # code for audio stream, register it once
        seen = False
        for stream in self.audio:
            if stream.id == code:
                seen = True
                break
        if not seen:
            info = mediainfo.AudioInfo()
            self.audio.append(info)
            info.id = code
            info.keys.append('id')
        return 0

    if 0xE0 <= code <= 0xEF:
        # code for video stream, register it once
        seen = False
        for stream in self.video:
            if stream.id == code:
                seen = True
                break
        if not seen:
            info = mediainfo.VideoInfo()
            self.video.append(info)
            info.id = code
            info.keys.append('id')
        return 0

    if code == SEQ_HEAD:
        # sequence header, remember that position for later use
        self.sequence_header_offset = offset
        return 0

    if code in (PRIVATE_STREAM1, PRIVATE_STREAM2):
        # private stream. we don't know, but maybe we can guess later
        add = ord(buffer[offset + 8])
        window = buffer[offset + 11 + add:offset + 15 + add]
        if '\x0b\x77' in window:
            # AC3 stream
            seen = False
            for stream in self.audio:
                if stream.id == code:
                    seen = True
                    break
            if not seen:
                info = mediainfo.AudioInfo()
                self.audio.append(info)
                info.id = code
                info.codec = 'AC3'
                info.keys.append('id')
        return 0

    # SYS_PKT, EXT_START and every other code: nothing to parse, the
    # caller has to search for the next header itself
    return 0
457
458
459	# Normal MPEG (VCD, SVCD) ========================================
460
def isMPEG(self, file):
    """
    This MPEG starts with a sequence of 0x00 followed by a PACK Header
    http://dvd.sourceforge.net/dvdinfo/packhdr.html

    Returns 1 when the file is accepted (self.start, self.length and the
    helper attributes used by get_endpos/seek are set), 0 otherwise.
    Empty, all-zero or truncated input is rejected with 0 instead of
    raising IndexError/AttributeError.
    """
    file.seek(0, 0)
    buffer = file.read(10000)
    if not buffer:
        return 0

    # seek until the 0 byte stop (bounded by the buffer length)
    offset = 0
    while offset < len(buffer) and buffer[offset] == '\0':
        offset += 1
    # the start code 00 00 01 begins two zero bytes before that position
    offset -= 2
    if offset < 0 or offset + 4 > len(buffer):
        # fewer than two leading zeros, or no room left for a header
        return 0

    # test for mpeg header 0x00 0x00 0x01
    if buffer[offset:offset + 4] != '\x00\x00\x01' + chr(PACK_PKT):
        return 0

    # scan the 100000 bytes of data
    buffer += file.read(100000)

    # scan first header, to get basic info about how to read a timestamp.
    # ReadHeader reads up to byte 13 of the pack header and returns -1 when
    # it is neither MPEG1 nor MPEG2 (self.get_time would be unset then).
    if len(buffer) < offset + 14 or self.ReadHeader(buffer, offset) == -1:
        return 0

    # store first timestamp
    self.start = self.get_time(buffer[offset + 4:])

    while len(buffer) > offset + 1000 and \
              buffer[offset:offset + 3] == '\x00\x00\x01':
        # read the mpeg header
        new_offset = self.ReadHeader(buffer, offset)

        # header scanning detected error, this is no mpeg
        if new_offset == -1:
            return 0

        if new_offset:
            # we have a new offset
            offset = new_offset

            # skip padding 0 before a new header
            while len(buffer) > offset + 10 and \
                      not ord(buffer[offset + 2]):
                offset += 1

        else:
            # seek to new header by brute force; search in place instead
            # of copying the rest of the buffer on every step
            next_header = buffer.find('\x00\x00\x01', offset + 4)
            if next_header == -1:
                break
            offset = next_header

    # fill in values for support functions:
    self.__seek_size__ = 1000000
    self.__sample_size__ = 10000
    self.__search__ = self._find_timer_
    self.filename = file.name

    # get length of the file
    self.length = self.get_length()
    return 1
518
519
def _find_timer_(self, buffer):
    """
    Return position of timer in buffer or -1 if not found.
    This function is valid for 'normal' mpeg files

    The timer starts right behind the four byte pack start code.
    """
    pack_start = '\x00\x00\x01%s' % chr(PACK_PKT)
    index = buffer.find(pack_start)
    if index != -1:
        return index + 4
    return -1
529
530
531
532	# PES ============================================================
533
534
def ReadPESHeader(self, offset, buffer, id=0):
    """
    Parse a PES header.
    Since it starts with 0x00 0x00 0x01 like 'normal' mpegs, this
    function will return (0, -1) when it is no PES header or
    (packet length, timestamp position (maybe -1))

    `buffer` must start at the header, `offset` is its position in the
    file (only used to store self.sequence_header_offset) and `id`, when
    non-zero, overrides the stream id taken from the header.  A buffer
    too short to hold the fixed header fields is treated like "no PES
    header" instead of raising IndexError.

    http://dvd.sourceforge.net/dvdinfo/pes-hdr.html
    """
    if not buffer[0:3] == '\x00\x00\x01':
        return 0, -1
    if len(buffer) < 10:
        # bytes 3..9 are read unconditionally below
        return 0, -1

    stream = ord(buffer[3])
    packet_length = (ord(buffer[4]) << 8) + ord(buffer[5]) + 6
    align = ord(buffer[6]) & 4
    header_length = ord(buffer[8])
    # the payload starts behind the 9 fixed bytes and the optional fields
    payload = header_length + 9

    # PES ID (starting with 001)
    if stream & 0xE0 == 0xC0:
        id = id or stream & 0x1F
        for a in self.audio:
            if a.id == id:
                break
        else:
            self.audio.append(mediainfo.AudioInfo())
            self.audio[-1].id = id
            self.audio[-1].keys.append('id')

    elif stream & 0xF0 == 0xE0:
        id = id or stream & 0xF
        for v in self.video:
            if v.id == id:
                break
        else:
            self.video.append(mediainfo.VideoInfo())
            self.video[-1].id = id
            self.video[-1].keys.append('id')

        # new mpeg starting
        if buffer[payload:payload + 4] == '\x00\x00\x01\xB3' and \
               not self.sequence_header_offset:
            # yes, remember offset for later use
            self.sequence_header_offset = offset + payload

    elif stream in (0xBD, 0xBF):
        # private stream. we don't know, but maybe we can guess later
        id = id or stream & 0xF
        if align and buffer[payload:payload + 2] == '\x0b\x77':
            # AC3 stream
            for a in self.audio:
                if a.id == id:
                    break
            else:
                self.audio.append(mediainfo.AudioInfo())
                self.audio[-1].id = id
                self.audio[-1].codec = 'AC3'
                self.audio[-1].keys.append('id')

    # A timestamp is reported only when the two flag bits of byte 7 are
    # set and repeated in the high nibble of byte 9.  (The former "bad
    # PTS/DTS" warning sat behind this very test and could never run.)
    ptsdts = ord(buffer[7]) >> 6
    if ptsdts and ptsdts == ord(buffer[9]) >> 4:
        return packet_length, 9

    return packet_length, -1
609
610
611
def isPES(self, file):
    """
    Detect a PES file: it has to begin with 00 00 01 and consist of
    packets ReadPESHeader accepts.  Returns 1 on success (type, start,
    length and the helper attributes for get_endpos/seek are set) and 0
    otherwise.
    """
    if mediainfo.DEBUG:
        print('trying mpeg-pes scan')
    file.seek(0, 0)
    head = file.read(3)

    # header (also valid for all mpegs)
    if head != '\x00\x00\x01':
        return 0

    self.sequence_header_offset = 0
    data = head + file.read(10000)

    cursor = 0
    while cursor + 1000 < len(data):
        packet_length, ts_pos = self.ReadPESHeader(cursor, data[cursor:])
        if not packet_length:
            return 0
        if ts_pos != -1 and not hasattr(self, 'start'):
            self.get_time = self.ReadPTS
            begin = cursor + ts_pos
            self.start = self.get_time(data[begin:begin + 5])
        if self.sequence_header_offset and hasattr(self, 'start'):
            # we have all informations we need
            break

        cursor += packet_length
        # looks like a pes, read more
        # NOTE(review): the original condition here ended in "or 1" and
        # was therefore always true, so data is read without an upper
        # bound until the information is found or the file ends.
        data += file.read(10000)

    if not self.video and not self.audio:
        # no video and no audio?
        return 0

    self.type = 'MPEG-PES'

    # fill in values for support functions:
    self.__seek_size__ = 10000000   # 10 MB
    self.__sample_size__ = 500000   # 500 k scanning
    self.__search__ = self._find_timer_PES_
    self.filename = file.name

    # get length of the file
    self.length = self.get_length()
    return 1
657
658
def _find_timer_PES_(self, buffer):
    """
    Return position of timer in buffer or -1 if not found.
    This function is valid for PES files

    A timestamp position is only trusted after more than ten PES headers
    in a row could be parsed behind it.
    """
    start_code = '\x00\x00\x01'
    if buffer.find(start_code) == -1 or len(buffer) <= 1000:
        return -1

    offset = 0
    retpos = -1
    ackcount = 0
    while offset + 1000 < len(buffer):
        pos, timestamp = self.ReadPESHeader(offset, buffer[offset:])
        if timestamp != -1 and retpos == -1:
            retpos = offset + timestamp
        if pos == 0:
            # Oops, that was a mpeg header, no PES header.
            # Jump to the next start code.  Searching behind the current
            # position guarantees progress; without a further start code
            # the scan is over (adding find()'s -1 to the offset used to
            # walk backwards and could loop forever).
            next_code = buffer.find(start_code, offset + 1)
            if next_code == -1:
                return -1
            offset = next_code
            retpos = -1
            ackcount = 0
        else:
            offset += pos
            if retpos != -1:
                ackcount += 1
        if ackcount > 10:
            # looks ok to me
            return retpos
    return -1
688
689
690	# Transport Stream ===============================================
691
def isTS(self, file):
    """
    Detect a transport stream: two sync bytes TS_PACKET_LENGTH apart have
    to show up in the first two packets.  The packets that start a new
    payload are then handed to ReadPESHeader until a start timestamp, a
    sequence header, a video and an audio stream are known or the buffer
    is used up.  Returns 1 when a sequence header was found (start,
    length and the helper attributes for get_endpos/seek are set), else 0.
    """
    file.seek(0, 0)
    data = file.read(TS_PACKET_LENGTH * 2)

    # look for the first position with a sync byte here and one packet on
    pkt = 0
    synced = False
    while pkt + TS_PACKET_LENGTH < len(data):
        if ord(data[pkt]) == ord(data[pkt + TS_PACKET_LENGTH]) == TS_SYNC:
            synced = True
            break
        pkt += 1
    if not synced:
        return 0

    data += file.read(10000)
    self.type = 'MPEG-TS'

    while pkt + TS_PACKET_LENGTH < len(data):
        flags = ord(data[pkt + 1])

        # maybe load more into the buffer
        if pkt + 2 * TS_PACKET_LENGTH > len(data) and pkt < 500000:
            data += file.read(10000)

        # wait until the ts payload contains a payload header
        if not flags & 0x40:
            pkt += TS_PACKET_LENGTH
            continue

        tsid = ((flags & 0x3F) << 8) + ord(data[pkt + 2])
        adapt = (ord(data[pkt + 3]) & 0x30) >> 4

        offset = 4
        if adapt & 0x02:
            # meta info present, skip it for now
            offset += ord(data[pkt + offset]) + 1

        if adapt & 0x01:
            # PES
            payload = pkt + offset
            timestamp = self.ReadPESHeader(payload, data[payload:], tsid)[1]
            if timestamp != -1:
                ts_pos = payload + timestamp
                if not hasattr(self, 'start'):
                    self.get_time = self.ReadPTS
                    self.start = self.get_time(data[ts_pos:ts_pos + 5])
                elif not hasattr(self, 'audio_ok'):
                    # cross-check the start against the next timestamp
                    stamp = self.get_time(data[ts_pos:ts_pos + 5])
                    if abs(stamp - self.start) < 10:
                        # looks ok
                        self.audio_ok = True
                    else:
                        # timestamp broken
                        del self.start
                        if mediainfo.DEBUG:
                            print('Timestamp error, correcting')

        if hasattr(self, 'start') and self.start and \
               self.sequence_header_offset and self.video and self.audio:
            break

        pkt += TS_PACKET_LENGTH

    if not self.sequence_header_offset:
        return 0

    if hasattr(self, 'start') and self.start:
        self.keys.append('start')

    # fill in values for support functions:
    self.__seek_size__ = 10000000   # 10 MB
    self.__sample_size__ = 100000   # 100 k scanning
    self.__search__ = self._find_timer_TS_
    self.filename = file.name

    # get length of the file
    self.length = self.get_length()
    return 1
773
774
def _find_timer_TS_(self, buffer):
    """
    Return position of timer in buffer or -1 if not found.
    This function is valid for transport streams

    Only packets that start a new payload are inspected.  A packet whose
    payload has no timestamp is skipped; before, its position minus one
    was returned as if a timestamp had been found there.
    """
    c = 0

    # synchronise: a sync byte here and one packet length further on
    while c + TS_PACKET_LENGTH < len(buffer):
        if ord(buffer[c]) == ord(buffer[c + TS_PACKET_LENGTH]) == TS_SYNC:
            break
        c += 1
    else:
        return -1

    while c + TS_PACKET_LENGTH < len(buffer):
        start = ord(buffer[c + 1]) & 0x40
        if not start:
            c += TS_PACKET_LENGTH
            continue

        tsid = ((ord(buffer[c + 1]) & 0x3F) << 8) + ord(buffer[c + 2])
        adapt = (ord(buffer[c + 3]) & 0x30) >> 4

        offset = 4
        if adapt & 0x02:
            # meta info present, skip it for now
            offset += ord(buffer[c + offset]) + 1

        if adapt & 0x01:
            timestamp = self.ReadPESHeader(c + offset, buffer[c + offset:],
                                           tsid)[1]
            if timestamp != -1:
                return c + offset + timestamp
        c += TS_PACKET_LENGTH
    return -1
804
805
806
807	# Support functions ==============================================
808
def get_endpos(self):
    """
    get the last timestamp of the mpeg, return -1 if this is not possible

    The last self.__sample_size__ bytes of self.filename (or the whole
    file when it is smaller) are searched with self.__search__; the last
    timestamp found in that window is returned.
    """
    if not hasattr(self, 'filename') or not hasattr(self, 'start'):
        return -1

    size = os.stat(self.filename)[stat.ST_SIZE]
    # binary mode: the data must not be newline-translated
    file = open(self.filename, 'rb')
    try:
        # never seek before the beginning of a small file
        file.seek(max(0, size - self.__sample_size__))
        buffer = file.read(self.__sample_size__)
    finally:
        file.close()

    end = -1
    while 1:
        pos = self.__search__(buffer)
        # a timestamp cut off by the end of the sample cannot be decoded
        # (the readers index up to six bytes)
        if pos == -1 or len(buffer) - pos < 6:
            break
        end = self.get_time(buffer[pos:])
        buffer = buffer[pos + 100:]

    return end
830
831
def get_length(self):
    """
    get the length in seconds, return -1 if this is not possible

    When the end timestamp is smaller than self.start, the 33 bit clock
    is taken to have wrapped around once.
    """
    last = self.get_endpos()
    if last == -1:
        return -1
    if self.start <= last:
        return last - self.start
    # largest clock value expressed in seconds
    clock_span = int(((1 << 33) - 1) // 90000)
    return clock_span - self.start + last
842
843
def seek(self, end_time):
    """
    Return the byte position in the file where the time position
    is 'end_time' seconds. Return 0 if this is not possible

    The file is sampled every self.__seek_size__ bytes; the position
    behind the last sample whose timestamp is still below end_time is
    returned.
    NOTE(review): end_time is compared with the raw value of
    self.get_time(), self.start is not subtracted - confirm that callers
    pass a stream timestamp.
    """
    if not hasattr(self, 'filename') or not hasattr(self, 'start'):
        return 0

    # binary mode: the data must not be newline-translated
    file = open(self.filename, 'rb')
    seek_to = 0
    try:
        while 1:
            file.seek(self.__seek_size__, 1)
            buffer = file.read(self.__sample_size__)
            if len(buffer) < 10000:
                # (nearly) at the end of the file
                break
            pos = self.__search__(buffer)
            if pos != -1:
                # found something
                if self.get_time(buffer[pos:]) >= end_time:
                    # too much, break
                    break
            # that wasn't enough
            seek_to = file.tell()
    finally:
        # close the file even when a timestamp reader raises
        file.close()
    return seek_to
871
872
def __scan__(self):
    """
    scan file for timestamps (may take a long time)

    Debug helper: prints the timestamp found in every sample taken at
    steps of ten times self.__seek_size__.  Returns 0 right away when
    self.filename or self.start is not set.
    """
    if not hasattr(self, 'filename') or not hasattr(self, 'start'):
        return 0
    # binary mode: the data must not be newline-translated
    file = open(self.filename, 'rb')
    print('scanning file...')
    try:
        while 1:
            file.seek(self.__seek_size__ * 10, 1)
            buffer = file.read(self.__sample_size__)
            if len(buffer) < 10000:
                break
            pos = self.__search__(buffer)
            if pos == -1:
                continue
            print(self.get_time(buffer[pos:]))
    finally:
        # close the file even when a timestamp reader raises
        file.close()
    print('done')
    print('')
894
895
896
# Register the parser with mmpython for the mime type and the file
# extensions it should be tried on.
mmpython.registertype(
    'video/mpeg',
    ('mpeg', 'mpg', 'mp4', 'ts'),
    mediainfo.TYPE_AV,
    MpegInfo,
)

Note: See TracBrowser for help on using the repository browser.

Context Navigation

source: trunk/src/testing/bin/fileServer/misc/mmpython/video/mpeginfo.py @ 4

Download in other formats: