-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathPerspective.moon
398 lines (315 loc) · 17.4 KB
/
Perspective.moon
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
haveDepCtrl, DependencyControl, depctrl = pcall require, 'l0.DependencyControl'
local amath
if haveDepCtrl
depctrl = DependencyControl {
name: "Perspective",
version: "1.2.0",
description: [[Math functions for dealing with perspective transformations.]],
author: "arch1t3cht",
url: "https://github.com/TypesettingTools/arch1t3cht-Aegisub-Scripts",
moduleName: 'arch.Perspective',
{
{"arch.Math", version: "0.1.8", url: "https://github.com/TypesettingTools/arch1t3cht-Aegisub-Scripts",
feed: "https://raw.githubusercontent.com/TypesettingTools/arch1t3cht-Aegisub-Scripts/main/DependencyControl.json"},
}
}
amath = depctrl\requireModules!
else
amath = require"arch.Math"
{:Point, :Matrix} = amath
-- compatibility with Lua >= 5.2
unpack = unpack or table.unpack
local Quad
-- Quadrilateral (usually in 2D space) described by its four corners, in clockwise or counter-clockwise direction.
-- Internally, we always use numbering that's counter-clockwise in the cartesian plane, which is clockwise on a 2D screen.
class Quad extends Matrix
new: (...) =>
super(...)
assert(@height == 4)
-- Computes the intersection point of the diagonals.
-- Doubles as a generic function to intersect to lines in 2D space.
midpoint: =>
la = Matrix(@[3] - @[1], @[4] - @[2])\transpose!\preim(@[4] - @[1])
return @[1] + la[1] * (@[3] - @[1])
--------------------
-- Collection of functions describing the perspective transformation between this quad and a 1x1 square.
-- These were originally computed from cross-ratios and run through Mathematica to combine all the fractions,
-- which makes it work in such "edge" cases as two sides of the quad being parallel.
-- They were then dumped from Mathematica in InputForm and inserted here without much postprocessing,
-- except for sometimes putting common denominators in an extra variable
--------------------
-- Helper functions to wrap code dumped from Mathematica
-- returns x1, x2, x3, x4, y1, y2, y3, y4
unwrap: => @[1][1], @[2][1], @[3][1], @[4][1], @[1][2], @[2][2], @[3][2], @[4][2]
-- translates x1, y1 to 0, 0 and returns x2, x3, x4, y2, y3, y4
unwrap_rel: =>
@ = @ - @[1]
return @[2][1], @[3][1], @[4][1], @[2][2], @[3][2], @[4][2]
-- Perspective transform mapping the quad to a unit square
xy_to_uv: (xy) =>
assert(@width == 2)
x2, x3, x4, y2, y3, y4 = @unwrap_rel!
x, y = unpack(xy - @[1])
u = -(((x3*y2 - x2*y3)*(x4*y - x*y4)*(x4*(-y2 + y3) + x3*(y2 - y4) + x2*(-y3 + y4)))/(x3^2*(x4*y2^2*(-y + y4) + y4*(x*y2*(y2 - y4) + x2*(y - y2)*y4)) + x3*(x4^2*y2^2*(y - y3) + 2*x4*(x2*y*y3*(y2 - y4) + x*y2*(-y2 + y3)*y4) + x2*y4*(x2*(-y + y3)*y4 + 2*x*y2*(-y3 + y4))) + y3*(x*x4^2*y2*(y2 - y3) + x2*x4^2*(y2*y3 + y*(-2*y2 + y3)) - x2^2*(x4*y*(y3 - 2*y4) + x4*y3*y4 + x*y4*(-y3 + y4)))))
v = ((x2*y - x*y2)*(x4*y3 - x3*y4)*(x4*(y2 - y3) + x2*(y3 - y4) + x3*(-y2 + y4)))/(x3*(x4^2*y2^2*(-y + y3) + x2*y4*(2*x*y2*(y3 - y4) + x2*(y - y3)*y4) - 2*x4*(x2*y*y3*(y2 - y4) + x*y2*(-y2 + y3)*y4)) + x3^2*(x4*y2^2*(y - y4) + y4*(x2*(-y + y2)*y4 + x*y2*(-y2 + y4))) + y3*(x*x4^2*y2*(-y2 + y3) + x2*x4^2*(2*y*y2 - y*y3 - y2*y3) + x2^2*(x4*y*(y3 - 2*y4) + x4*y3*y4 + x*y4*(-y3 + y4))))
return Point(u, v)
-- Perspective transform mapping a unit square to the quad
uv_to_xy: (uv) =>
assert(@width == 2)
x2, x3, x4, y2, y3, y4 = @unwrap_rel!
u, v = unpack(uv)
d = (x4*((-1 + u + v)*y2 + y3 - v*y3) + x3*(y2 - u*y2 + (-1 + v)*y4) + x2*((-1 + u)*y3 - (-1 + u + v)*y4))
x = (v*x4*(x3*y2 - x2*y3) + u*x2*(x4*y3 - x3*y4)) / d
y = (v*y4*(x3*y2 - x2*y3) + u*y2*(x4*y3 - x3*y4)) / d
return Point(x, y) + @[1]
-- Derivative (i.e. Jacobian) of uv_to_xy at the given point
d_uv_to_xy: (uv) =>
assert(@width == 2)
x2, x3, x4, y2, y3, y4 = @unwrap_rel!
u, v = unpack(uv)
d = (x4*((-1 + u + v)*y2 + y3 - v*y3) + x3*(y2 - u*y2 + (-1 + v)*y4) + x2*((-1 + u)*y3 - (-1 + u + v)*y4))^2
dxdu = (x2*(x4*y3 - x3*y4)*(x4*((-1 + u + v)*y2 + y3 - v*y3) + x3*(y2 - u*y2 + (-1 + v)*y4) + x2*((-1 + u)*y3 - (-1 + u + v)*y4)) + (x3*y2 - x4*y2 + x2*(-y3 + y4))*(v*x4*(x3*y2 - x2*y3) + u*x2*(x4*y3 - x3*y4))) / d
dxdv = (x4*(x3*y2 - x2*y3)*(x4*((-1 + u + v)*y2 + y3 - v*y3) + x3*(y2 - u*y2 + (-1 + v)*y4) + x2*((-1 + u)*y3 - (-1 + u + v)*y4)) - (x4*(y2 - y3) + (-x2 + x3)*y4)*(v*x4*(x3*y2 - x2*y3) + u*x2*(x4*y3 - x3*y4))) / d
dydu = ((-1 + v)*x3^2*y2*(y2 - y4)*y4 + y3*((-1 + v)*x4^2*y2*(y2 - y3) + v*x2^2*(y3 - y4)*y4 + x2*x4*y2*(-y3 + y4)) + x3*y2*(2*(-1 + v)*x4*y3*y4 - (-1 + 2*v)*x2*(y3 - y4)*y4 + x4*y2*(y3 + y4 - 2*v*y4))) / d
dydv = ((x3*y2 - x2*y3)*y4*(-(x4*y2) - x2*y3 + x4*y3 + x3*(y2 - y4) + x2*y4) + u*(x4^2*y2*y3*(-y2 + y3) + 2*x3*x4*y2*(y2 - y3)*y4 + y4*(2*x2*x3*y2*(y3 - y4) + x3^2*y2*(-y2 + y4) + x2^2*y3*(-y3 + y4)))) / d
return Matrix({{dxdu, dxdv}, {dydu, dydv}})
-- Derivative (i.e. Jacobian) of xy_to_uv at the given point
d_xy_to_uv: (xy) =>
assert(@width == 2)
x2, x3, x4, y2, y3, y4 = @unwrap_rel!
x, y = unpack(xy)
d = (x3*(x4^2*y2^2*(-y + y3) + x2*y4*(2*x*y2*(y3 - y4) + x2*(y - y3)*y4) - 2*x4*(x2*y*y3*(y2 - y4) + x*y2*(-y2 + y3)*y4)) + x3^2*(x4*y2^2*(y - y4) + y4*(x2*(-y + y2)*y4 + x*y2*(-y2 + y4))) + y3*(x*x4^2*y2*(-y2 + y3) + x2*x4^2*(2*y*y2 - y*y3 - y2*y3) + x2^2*(x4*y*(y3 - 2*y4) + x4*y3*y4 + x*y4*(-y3 + y4))))^2
dudx = ((x3*y2 - x2*y3)*(x4*y2 - x2*y4)*(x4*y3 - x3*y4)*(x4*y*(y2 - y3) + x3*(y - y2)*y4 + x2*(-y + y3)*y4)*(x4*(-y2 + y3) + x3*(y2 - y4) + x2*(-y3 + y4))) / d
dvdx = -((x3*y2 - x2*y3)*(x4*y2 - x2*y4)*(x4*y3 - x3*y4)*(-(x3*x4*y2) + x*x4*(y2 - y3) + x2*x4*y3 + x*(-x2 + x3)*y4)*(x4*(-y2 + y3) + x3*(y2 - y4) + x2*(-y3 + y4))) / d
dudy = ((x3*y2 - x2*y3)*(x4*y2 - x2*y4)*(x4*y3 - x3*y4)*(x4*y2*(y - y3) + x2*y*(y3 - y4) + x3*y2*(-y + y4))*(x4*(y2 - y3) + x2*(y3 - y4) + x3*(-y2 + y4))) / d
dvdy = ((x3*y2 - x2*y3)*(x4*y2 - x2*y4)*(-(x4*y3) + x3*y4)*(x4*(-y2 + y3) + x3*(y2 - y4) + x2*(-y3 + y4))*(x*(x3*y2 - x4*y2 - x2*y3 + x2*y4) + x2*(x4*y3 - x3*y4))) / d
return Matrix({{dudx, dudy}, {dvdx, dvdy}})
rect: (width, height) ->
Quad {
{0, 0},
{width, 0},
{width, height},
{0, height},
}
screen_z = 312.5
an_xshift = { 0, 0.5, 1, 0, 0.5, 1, 0, 0.5, 1 }
an_yshift = { 1, 1, 1, 0.5, 0.5, 0.5, 0, 0, 0 }
-- List of tags that affect perspective
relevantTags = {"fontsize", "shear_x", "shear_y", "scale_x", "scale_y", "angle", "angle_x", "angle_y", "origin", "position", "outline", "outline_x", "outline_y", "shadow", "shadow_x", "shadow_y"}
-- List of tags that are used in perspective. This is the same list as relevant_tags except for outline and shadow, since the single-coordinate versions of those tags are used instead
usedTags = {"fontsize", "shear_x", "shear_y", "scale_x", "scale_y", "angle", "angle_x", "angle_y", "origin", "position", "outline_x", "outline_y", "shadow_x", "shadow_y"}
-- Takes an ASSFoundation LineContents object and returns its effective tags, but preprocessed
-- for perspective handling. This includes inforcing the relations between \org and \pos as
-- well as those between the various transform tags, as well as warning when the line has tags
-- that would break perspective calulations (\move, certain \t transformations, multiple tag sections, etc).
-- Also needs the ASSFoundation library to be given in its first parameter. This is to prevent this library
-- from depending on ASSFoundation.
-- Returns:
-- - the effective tags table
-- - the line's width (not scaled with \fscx)
-- - the line's height (not scaled with \fscy)
-- - a table of warnings about possibly problematic tags
-- -> each warning is of the form {warning, details} where details may be nil depending on the warning.
prepareForPerspective = (ASS, data) ->
tagvals = data\getEffectiveTags(-1, true, true, true).tags
width, height = 0, 0
has_text, has_drawing = false, false
data\callback (section) ->
if section.class == ASS.Section.Text
has_text = true
width, height = data\getTextExtents!
if section.class == ASS.Section.Drawing
has_drawing = true
ext = section\getExtremePoints!
width, height = ext.w, ext.h
warnings = {}
table.insert(warnings, {"text_and_drawings"}) if has_text and has_drawing
table.insert(warnings, {"zero_size"}) if has_text and (width == 0 or height == 0)
table.insert(warnings, {"move"}) if data\getPosition().class == ASS.Tag.Move
-- Width and height can be 0 for drawings
width = math.max(width, 0.01)
height = math.max(height, 0.01)
width /= (tagvals.scale_x.value / 100)
height /= (tagvals.scale_y.value / 100)
-- Do some checks for cases that break this script
-- These are a bit more aggressive than necessary (e.g. two tags of the same type in the same section will trigger this detection but not break resampling)
-- but I can't be bothered to be more exact. Users can run ASSWipe before resampling or something.
for tname in *relevantTags
table.insert(warnings, {"multiple_tags", ASS.tagMap[tname].overrideName}) if #data\getTags({tname}) >= 2
-- Assf doesn't support nested transforms so this code could be much simpler, but a) I only found that out after writing this and b) I guess I can
-- keep this code around in case it ever starts supporting them
checkTransformTags = (section, initial) ->
if not initial
for tname in *relevantTags
table.insert(warnings, {"transform", ASS.tagMap[tname].overrideName}) if #section\getTags({tname}) >= 1
section\modTags {"transform"}, (tag) ->
checkTransformTags tag.tags, false
tag
checkTransformTags data, true
-- Manually enforce the relations between tags
if #data\getTags({"origin"}) == 0
tagvals.origin.x = tagvals.position.x
tagvals.origin.y = tagvals.position.y
for name in *{"outline", "shadow"}
for coord in *{"x", "y"}
cname = "#{name}_#{coord}"
if #data\getTags({cname}) == 0
tagvals[cname].value = tagvals[name].value
return tagvals, width, height, warnings
-- Transforms the given list of points in a relative coordinate system according to the given .ass tags.
-- If no list of points is given, a rectangle with the given dimensions is used.
-- The width and height parameters should contain the raw dimensions of the line to be transformed. These are used for alignment.
-- Thus, when transforming a shape with \an7, width and height can be zero. When transforming text, they should be whatever aegisub.text_extents returned.
-- The table t is supposed to be a table of tags as returned by ASSFoundation, but any table with the same keys and .value or .x/.y
-- fields for the respective tags works.
-- The layoutScale parameter should be set to (script's PlayResY)/(script's LayoutResY), or (scipt's PlayResY)/(video height) if LayoutResY is not present
-- (though in that case you should add it to your script or yell at your user to do so)
transformPoints = (t, width, height, points=nil, layoutScale=1) ->
if points == nil
points = Quad.rect width, height
else
points = Matrix(points)
scaled_screen_z = screen_z * layoutScale
pos = Point(t.position.x, t.position.y)
org = Point(t.origin.x, t.origin.y)
-- Shearing
points *= Matrix({
{1, t.shear_x.value},
{t.shear_y.value, 1},
})\t!
-- Translate to alignment point
an = t.align.value
points -= Point(width * an_xshift[an], height * an_yshift[an])
-- Apply scaling
points *= (Matrix.diag(t.scale_x.value, t.scale_y.value) / 100)
-- Translate relative to origin
points += pos - org
-- Rotate ZXY
points ..= 0
points *= Matrix.rot2d(math.rad(-t.angle.value))\onSubspace(3)\t!
points *= Matrix.rot2d(math.rad(-t.angle_x.value))\onSubspace(1)\t!
points *= Matrix.rot2d(math.rad(t.angle_y.value))\onSubspace(2)\t!
-- Project
points = Matrix [ (scaled_screen_z / (p\z! + scaled_screen_z)) * p\project(2) for p in *points ]
-- Move to origin
points += org
return points
-- Given a quad on screen and the width and height of the text, returns in t (again an ASSFoundation tags table)
-- the tag values that will transform this text to the given quad.
-- The orgMode parameter controls how the value of \org is chosen:
-- orgMode = 1: \org is not changed, i.e. the origin tag passed in the t parameter is not modified
-- orgMode = 2: \org is set to the center of the quad
-- orgMode = 3: \org is chosen in a way that tries to ensure that \fax can be zero, or as close to zero as possible
-- The layoutScale parameter should be set to (script's PlayResY)/(script's LayoutResY), or (scipt's PlayResY)/(video height) if LayoutResY is not present
-- (though in that case you should add it to your script or yell at your user to do so)
-- For the sake of backwards compatibility, orgMode=false is synonymous with orgMode=1 and orgMode=true is synonymous with orgMode=2 .
tagsFromQuad = (t, quad, width, height, orgMode=0, layoutScale=1) ->
quad = Quad(quad) if quad.__class != Quad
scaled_screen_z = layoutScale * screen_z
-- Find a parallelogram projecting to the quad
z24 = Matrix({ quad[2] - quad[3], quad[4] - quad[3] })\t!\preim(quad[1] - quad[3])
if orgMode == 2 or orgMode == true
center = quad\midpoint!
t.origin.x = center\x!
t.origin.y = center\y!
else if orgMode == 3
v2 = quad[2] - quad[1]
v4 = quad[4] - quad[1]
-- Look for a translation after which the quad will unproject to a rectangle.
-- Specifically, look for a vector t such that this happens after moving q0 to t.
-- The set of such vectors is cut out by the equation a (x^2 + y^2) - b1 x - b2 y + c
-- with the following coefficients.
a = (1 - z24[1]) * (1 - z24[2])
b = z24[1] * v2 + z24[2] * v4 - z24[1] * z24[2] * (v2 + v4)
c = z24[1] * z24[2] * v2 * v4 + (z24[1] - 1) * (z24[2] - 1) * scaled_screen_z ^ 2
-- Our default value for o, which would put \org at the center of the quad.
-- We'll try to find a value for \org that's as close as possible to it.
o = quad[1] - quad\midpoint!
-- Handle all the edge cases. These can actually come up in practice, like when
-- starting from text without any perspective.
if a == 0
-- If b = 0 we get a trivial or impossible equation, so just keep the previous \org.
if b\length! != 0
-- The equation cuts out a line. Find the point closest to the previous o.
o = o + b * ((c - o\dot(b)) / b\dot(b))
else
-- The equation cuts out a circle.
-- Complete the square to find center and radius.
circleCenter = b / (2 * a)
sqradius = (b\dot(b) / (4 * a) - c) / a
if sqradius <= 0
-- This is actually very rare.
org = circleCenter
else
-- Find the point on the circle closest to the current \org.
radius = math.sqrt(sqradius)
center2t = o - circleCenter
if center2t\length! == 0
o = circleCenter + Point(radius, 0)
else
o = circleCenter + center2t / center2t\length! * radius
org = quad[1] - o
t.origin.x = org\x!
t.origin.y = org\y!
-- Normalize to center
org = Point(t.origin.x, t.origin.y)
quad -= org
-- Unproject the quad
zs = Point(1, z24[1], z24\sum! - 1, z24[2])
quad ..= scaled_screen_z
quad = Matrix.diag(zs) * quad
-- Normalize so the origin has z=scaled_screen_z
orgla = Matrix({Point(0, 0, scaled_screen_z), quad[1] - quad[2], quad[1] - quad[4]})\t!\preim(quad[1])
quad /= orgla[1]
quad -= Matrix[{0, 0, scaled_screen_z} for i=1,4]
-- Find the rotations
n = (quad[2] - quad[1])\cross(quad[4] - quad[1])
roty = math.atan(n\x! / n\z!)
roty += math.pi if n\z! < 0
ry = Matrix.rot2d(roty)\onSubspace(2)
n = Point(ry * n)
rotx = math.atan(n\y! / n\z!)
rx = Matrix.rot2d(rotx)\onSubspace(1)
quad *= ry\t!
quad *= rx\t!
ab = quad[2] - quad[1]
rotz = math.atan(ab\y! / ab\x!)
rotz += math.pi if ab\x! < 0
rz = Matrix.rot2d(-rotz)\onSubspace(3)
quad *= rz\t!
-- We now have a horizontal parallelogram in the 2D plane, so find the shear and the dimensions
ab = quad[2] - quad[1]
ad = quad[4] - quad[1]
rawfax = ad\x! / ad\y!
quadwidth = ab\length!
quadheight = math.abs(ad\y!)
scalex = quadwidth / width
scaley = quadheight / height
-- Find \pos
an = t.align.value
pos = org + (quad[1]\project(2) + Point(quadwidth * an_xshift[an], quadheight * an_yshift[an]))
-- Set all the new tags
t.position.x = pos\x!
t.position.y = pos\y!
t.angle.value = math.deg(-rotz)
t.angle_x.value = math.deg(rotx)
t.angle_y.value = math.deg(-roty)
t.scale_x.value = 100 * scalex
t.scale_y.value = 100 * scaley
t.shear_x.value = rawfax * scaley / scalex
t.shear_y.value = 0
lib = {
:Quad,
:an_xshift,
:an_yshift,
:relevantTags,
:usedTags,
:prepareForPerspective
:transformPoints,
:tagsFromQuad,
}
if haveDepCtrl
lib.version = depctrl
return depctrl\register lib
else
return lib