mirror of https://github.com/ekimekim/wubloader
fixts first attempt
parent
30d5ccc483
commit
eaf3ed2e54
@ -0,0 +1,245 @@
|
|||||||
|
|
||||||
|
|
||||||
|
import struct
|
||||||
|
|
||||||
|
class FixTS():
    """Does stream processing on an MPEG-TS stream, adjusting all timestamps in it.

    The stream will be adjusted such that the first packet starts at the given start_time,
    with all other packets adjusted to be the same time relative to that packet.
    In other words, a video that goes from 01:23:45 to 01:24:45 will be retimed to instead
    go from (for example) 00:10:00 to 00:11:00.

    The object maintains an internal buffer of data.
    Use feed() to add more data. Data will be removed from the buffer when a whole packet
    can be parsed, and any completed data will be returned from feed().
    Finally, when there is no more data, call end() to assert there is no left-over data
    and provide the final video end time.

    All timestamps are in seconds as a float.

    Example use:
        fixer = FixTS(0)
        for chunk in input:
            fixed_data = fixer.feed(chunk)
            output(fixed_data)
        end_time = fixer.end()
    """

    # Fixed size in bytes of an MPEG-TS packet.
    PACKET_SIZE = 188

    def __init__(self, start_time):
        """start_time: the time (in seconds) the retimed stream should begin at."""
        self.start_time = start_time
        # Latest adjusted timestamp seen so far; starts equal to start_time so an
        # empty stream still reports a sane (zero-duration) end time.
        self.end_time = start_time
        # Difference between output and input timebases; None until calibrated
        # from the first timestamp seen.
        self.offset = None
        # Buffer of input bytes not yet forming a whole packet.
        self.data = b""

    def feed(self, data):
        """Takes more data as a bytestring to add to buffer.
        Fixes any whole packets in the buffer and returns them as a single bytestring."""
        self.data += data
        output = []
        while len(self.data) >= self.PACKET_SIZE:
            packet = self.data[:self.PACKET_SIZE]
            self.data = self.data[self.PACKET_SIZE:]
            output.append(self._fix_packet(packet))
        return b''.join(output)

    def end(self):
        """Should be called when no more data will be added.
        Checks no data was left over, and returns the final end time (ie. start time + video duration).
        Raises ValueError if a partial packet remains in the buffer.
        """
        if len(self.data) > 0:
            # Fixed: previously the format argument was passed to ValueError as a
            # second arg instead of being interpolated into the message.
            raise ValueError("Stream has a partial packet remaining: {!r}".format(self.data))
        return self.end_time

    # TODO we should really be only using PCR to calibrate the offset (ie. we want the first PCR
    # to be = start_time, not the first PTS we see which might be the audio stream).
    # Also we need to pad the end_time to the time of the NEXT expected frame, or else
    # we'll overlap the last frame here with the first frame of the next segment.
    # How to determine expected frame? Easiest way is probably average or median difference
    # between PCRs, with a reasonable fallback.
    def _convert_time(self, old_time):
        """Map a timestamp from the input timebase to the output timebase,
        calibrating the offset from the first timestamp seen and tracking end_time."""
        # If this is the first timestamp we've seen, use it to calibrate offset.
        if self.offset is None:
            self.offset = self.start_time - old_time
        new_time = old_time + self.offset
        # It's rare but possible that when resetting times to start at 0, the second packet
        # might start slightly earlier than the first and thus have a negative time.
        # This isn't encodable in the data format, so just clamp to 0.
        new_time = max(0, new_time)
        # keep track of latest new_time as the end time
        self.end_time = max(self.end_time, new_time)
        return new_time

    def _fix_packet(self, packet):
        """
        - If an adaptation field is present and contains a PCR, fix the PCR
        - If packet is the start of a unit, and the unit begins with 0x0001
          (ie. it's an elementary stream and not a table):
            - If the packet header contains a PTS, fix the PTS
            - If the packet header cannot be decoded far enough (not enough data in first packet),
              bail - we don't care about this edge case.
        """
        assert len(packet) == self.PACKET_SIZE

        def check(expr, reason):
            # Raise on any structure we can't (or refuse to) parse.
            if not expr:
                raise ValueError("Packet cannot be parsed: {}\n{!r}".format(reason, packet))

        # Note this is a very simple, hacky parser that only parses as much as we need.
        # Useful links: https://en.wikipedia.org/wiki/MPEG_transport_stream

        # 4 byte header: "G" | TEI(1) PUSI(1) PRI(1) PID(5) | PID(8) | TSC(2) AFC(2) CONT(4)
        # Of interest to us:
        #  TEI: If set, data is known to be corrupt
        #  PUSI: If set, this packet contains a new payload unit
        #    This matters because payload unit headers contain a timestamp we need to edit
        #  TSC: If non-zero, indicates data is scrambled (we don't implement handling that)
        #  AFC: First bit indicates an adaptation field header is present, second bit indicates a payload
        check(packet[0:1] == b"G", "Sync byte is incorrect")
        check(packet[1] & 0x80 == 0, "Transport error indicator is set")
        pusi = bool(packet[1] & 0x40)
        check(packet[3] & 0xc0 == 0, "TSC indicates data is scrambled")
        has_adaptation_field = bool(packet[3] & 0x20)
        has_payload = bool(packet[3] & 0x10)

        has_pcr = False
        if has_adaptation_field:
            field_length = packet[4]
            payload_index = 5 + field_length
            # According to the spec, the adaptation field header is at least 1 byte.
            # But in the wild we see a header as "present" except 0 bytes long.
            # We should just treat this as "not present"
            if field_length > 0:
                # The adaptation field is a bit field of 8 flags indicating whether optional
                # sections are present. Thankfully, the only one we're interested in (the PCR)
                # is always the first field if present, so we don't even need to check the others.
                has_pcr = bool(packet[5] & 0x10)
                if has_pcr:
                    check(field_length >= 7, "Adaptation field indicates PCR but is too small")
                    old_time = decode_pcr(packet[6:12])
                    new_time = self._convert_time(old_time)
                    encoded = encode_pcr(new_time)
                    packet = packet[:6] + encoded + packet[12:]
                    assert len(packet) == self.PACKET_SIZE
        else:
            # No adapatation field, payload starts immediately after the packet header
            payload_index = 4

        if pusi:
            # Payload Unit Start Indicator indicates there is a new payload unit in this packet.
            # When set, there is an extra byte before the payload indicating where within the
            # payload the new payload unit starts.
            # A payload unit is a thing like a video frame, audio packet, etc. The payload unit header
            # contains a timestamp we need to edit.
            check(has_payload, "PUSI set but no payload is present")
            payload_pointer = packet[payload_index]
            # move index past payload pointer, then seek into payload to find start of payload unit.
            unit_index = payload_index + 1 + payload_pointer
            # The header we're after is only present in elementary streams, not in program tables.
            # We can tell the difference because streams start with a 0x0001 prefix,
            # whereas program tables start with a header where at least bits 0x0030 must be set.
            # Note wikipedia in https://en.wikipedia.org/wiki/Packetized_elementary_stream
            # claims the prefix is 0x000001, but that is including the payload pointer, which seems
            # to always be set to 0 for an elementary stream
            # (compare https://en.wikipedia.org/wiki/Program-specific_information which also includes
            # the payload pointer but says it can be any 8-bit value).
            if packet[unit_index : unit_index + 2] == b"\x00\x01":
                # unit header looks like: 00, 01, stream id, length(2 bytes), then PES header
                # The only thing we care about in the PES header is the top two bits of the second byte,
                # which indicates if timestamps are present.
                # It's possible that we didn't get enough of the payload in this one packet
                # to read the whole header, but exceedingly unlikely.
                check(unit_index + 6 < self.PACKET_SIZE, "Payload too small to read unit header")
                flags = packet[unit_index + 6]
                has_pts = bool(flags & 0x80)
                has_dts = bool(flags & 0x40)
                check(not has_dts, "DTS timestamp is present, we cannot handle fixing it")
                # Once again, PTS is the first optional field, so we don't need to worry
                # about other fields being present.
                if has_pts:
                    pts_index = unit_index + 8
                    check(pts_index + 5 <= self.PACKET_SIZE, "Payload too small to read PTS")
                    raw = packet[pts_index : pts_index + 5]
                    pts = decode_ts(raw, 2)
                    pts = self._convert_time(pts)
                    encoded = encode_ts(pts, 2)
                    packet = packet[:pts_index] + encoded + packet[pts_index + 5:]
                    assert len(packet) == self.PACKET_SIZE
        return packet
|
||||||
|
|
||||||
|
|
||||||
|
def bits(value, start, end):
    """Return the integer formed by bits [start, end) of value, bit 0 being the LSB."""
    width = end - start
    shifted = value >> start
    return shifted & ((1 << width) - 1)
|
||||||
|
|
||||||
|
|
||||||
|
def decode_padded(value, spec):
    """Unpack value according to struct format spec, left-padding it with zero
    bytes up to the full size the format expects.

    value must be no longer than that size (asserted).
    Returns the single unpacked field.
    """
    needed = struct.calcsize(spec)
    assert len(value) <= needed
    padded = value.rjust(needed, b"\0")
    return struct.unpack(spec, padded)[0]
|
||||||
|
|
||||||
|
|
||||||
|
def encode_pcr(seconds):
    """Encode a non-negative time in seconds as a 6-byte MPEG-TS PCR field.

    The PCR packs a 33-bit base (90kHz ticks) above a 15-bit tail whose low
    9 bits are the extension (remaining 27MHz ticks); the 6 bits between
    base and extension are left as zero here.
    """
    assert seconds >= 0
    ticks = int(seconds * 27000000)
    base = ticks // 300
    extension = ticks % 300
    # base must fit its 33-bit field
    assert base < 2**33
    combined = (base << 15) | extension
    # Pack as 8 bytes big-endian, then drop the two always-zero leading bytes.
    return struct.pack('!Q', combined)[2:]
|
||||||
|
|
||||||
|
|
||||||
|
def decode_pcr(value):
    """Decode a 6-byte MPEG-TS PCR field into a time in seconds (float).

    Inverse of encode_pcr: the 33-bit base counts 90kHz ticks, the low
    9-bit extension counts leftover 27MHz ticks.
    """
    combined = decode_padded(value, '!Q')
    base = bits(combined, 15, 48)
    extension = bits(combined, 0, 9)
    ticks = 300 * base + extension
    return float(ticks) / 27000000
|
||||||
|
|
||||||
|
|
||||||
|
def encode_ts(seconds, tag):
    """Encode a non-negative time in seconds as a 5-byte PTS/DTS field with the
    given 4-bit tag.

    Bit layout: TTTTxxx1 xxxxxxxx xxxxxxx1 xxxxxxxx xxxxxxx1
    where T is the tag and x are the bits of the 33-bit 90kHz tick count,
    split into 3/15/15-bit groups each followed by a marker bit of 1.
    """
    assert seconds >= 0
    ticks = int(seconds * 90000)
    high = bits(ticks, 30, 33)
    mid = bits(ticks, 15, 30)
    low = bits(ticks, 0, 15)
    packed = (tag << 36) | (high << 33) | (mid << 17) | (low << 1)
    # Set the three fixed marker bits.
    packed |= (1 << 32) | (1 << 16) | 1
    # Pack as 8 bytes big-endian and drop the three always-zero leading bytes.
    return struct.pack('!Q', packed)[3:]
|
||||||
|
|
||||||
|
|
||||||
|
def decode_ts(value, tag):
    """Decode a 5-byte PTS/DTS field into a time in seconds (float),
    asserting it carries the given 4-bit tag.

    Bit layout: TTTTxxx1 xxxxxxxx xxxxxxx1 xxxxxxxx xxxxxxx1
    where T is the tag and x are the bits of the 33-bit 90kHz tick count,
    split into 3/15/15-bit groups each followed by a marker bit of 1.
    """
    packed = decode_padded(value, '!Q')
    assert bits(packed, 36, 40) == tag
    # The three fixed marker bits must all be set.
    assert all(packed & (1 << marker) for marker in [0, 16, 32])
    high = bits(packed, 33, 36)
    mid = bits(packed, 17, 32)
    low = bits(packed, 1, 16)
    ticks = (high << 30) | (mid << 15) | low
    return float(ticks) / 90000
|
||||||
|
|
||||||
|
|
||||||
|
if __name__ == '__main__':
    # Simple test driver: read an MPEG-TS stream from stdin, retime it to start
    # at the time given as the first argument, and write the result to stdout.
    # The final end time is printed to stderr.
    import sys
    start_time = float(sys.argv[1])
    fixer = FixTS(start_time)
    # Read in fixed-size chunks until EOF (read() returns b"").
    for chunk in iter(lambda: sys.stdin.buffer.read(8192), b""):
        output = fixer.feed(chunk)
        # write() may not accept everything at once, so loop until fully written.
        while output:
            written = sys.stdout.buffer.write(output)
            output = output[written:]
    end_time = fixer.end()
    sys.stderr.write(str(end_time) + '\n')
|
Loading…
Reference in New Issue