-
-
Notifications
You must be signed in to change notification settings - Fork 192
/
Copy pathmp4.py
executable file
·134 lines (92 loc) · 3.03 KB
/
mp4.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
#!/usr/bin/env python3
# script to collide "MP4"-based files
# Ange Albertini 2018-2021
# the "atom/box" format used in MP4 is a derivate of Apple Quicktime, and is used by many other formats (JP2, HEIF)
# it may or may not work on other format or other player. They follow the same logic.
# see http://www.ftyps.com/ for a complete list
import struct
import sys
import hashlib
def dprint(s):
DEBUG = True
DEBUG = False
if DEBUG:
print("D " + s)
def relocate(d, delta):
# finds and relocates all Sample Tables Chunk Offset tables
# TODO: support 64 bits `co64` tables ()
offset = 0
tablecount = d.count(b"stco")
dprint("stco found: %i" % tablecount)
for i in range(tablecount):
offset = d.find(b"stco", offset)
dprint("current offset: %0X" % offset)
length = struct.unpack(">I", d[offset-4:offset])[0]
verflag = struct.unpack(">I", d[offset+4:offset+8])[0]
offcount = struct.unpack(">I", d[offset+8:offset+12])[0]
if verflag != 0:
dprint(" version/flag not 0 (found %X) at offset: %0X" % (verflag, offset+4))
continue
# length, type, verflag, count - all 32b
if (offcount + 4) * 4 != length:
dprint(" Atom length (%X) and offset count (%X) don't match" % (length, offcount))
continue
dprint(" offset count: %i" % offcount)
offset += 4 * 3
offsets = struct.unpack(">%iI" % offcount, d[offset:offset + offcount * 4])
dprint(" offsets (old): %s" % repr(list(offsets)))
offsets = [i + delta for i in offsets]
dprint(" (new) offsets: %s" % repr(offsets))
d = d[:offset] + struct.pack(">%iI" % offcount, *offsets) + d[offset+offcount*4:]
offset += 4 * offcount
dprint("")
return d
def freeAtom(l):
return struct.pack(">I", l) + b"free" + b"\0" * (l - 8)
def isValid(d):
# fragile check of validity
return d.startswith(b"\0\0\0") and d[:32].count(b"ftyp") > 0
fn1, fn2 = sys.argv[1:3]
with open(fn1, "rb") as f:
d1 = f.read()
with open(fn2, "rb") as f:
d2 = f.read()
assert isValid(d1)
assert isValid(d2)
l1 = len(d1)
l2 = len(d2)
suffix = b"".join([
struct.pack(">I", 0x100 + 8), b"free",
b"\0" * (0x100 - 8),
struct.pack(">I", 8 + l1), b"free",
relocate(d1, 0x1C0 + 8),
relocate(d2, 0x1C0 + 8 + l1),
])
# 32b length prefix
with open("mp4-1.bin", "rb") as f:
prefix1 = f.read()
with open("mp4-2.bin", "rb") as f:
prefix2 = f.read()
col1 = prefix1 + suffix
col2 = prefix2 + suffix
md5 = hashlib.md5(col1).hexdigest()
if md5 == hashlib.md5(col2).hexdigest():
print("common md5: %s" % md5)
with open("collision1.mp4", "wb") as f:
f.write(col1)
with open("collision2.mp4", "wb") as f:
f.write(col2)
# 64b length prefix
with open("mp4l-1.bin", "rb") as f:
prefix1 = f.read()
with open("mp4l-2.bin", "rb") as f:
prefix2 = f.read()
col1 = prefix1 + suffix
col2 = prefix2 + suffix
md5 = hashlib.md5(col1).hexdigest()
if md5 == hashlib.md5(col2).hexdigest():
print("common md5: %s" % md5)
with open("collisionl1.mp4", "wb") as f:
f.write(col1)
with open("collisionl2.mp4", "wb") as f:
f.write(col2)