6
6
from typing import TYPE_CHECKING
7
7
8
8
import numpy as np
9
+ from numpy import concatenate as npconcat
10
+ from numpy import zeros as npzeros
9
11
10
12
from auto_editor import version
11
13
from auto_editor .lang .json import Lexer , Parser , dump
19
21
orc ,
20
22
)
21
23
from auto_editor .lib .data_structs import Sym
22
- from auto_editor .render .subtitle import SubtitleParser
23
24
from auto_editor .utils .cmdkw import (
24
25
Required ,
25
26
pAttr ,
@@ -190,7 +191,7 @@ def none(self) -> NDArray[np.bool_]:
190
191
return np .ones (self .media_length , dtype = np .bool_ )
191
192
192
193
def all (self ) -> NDArray [np .bool_ ]:
193
- return np . zeros (self .media_length , dtype = np .bool_ )
194
+ return npzeros (self .media_length , dtype = np .bool_ )
194
195
195
196
def read_cache (self , tag : str , obj : dict [str , Any ]) -> None | np .ndarray :
196
197
workfile = os .path .join (
@@ -278,7 +279,7 @@ def get_max_volume(s: np.ndarray) -> float:
278
279
)
279
280
self .bar .start (audio_ticks , "Analyzing audio volume" )
280
281
281
- threshold_list = np . zeros ((audio_ticks ), dtype = np .float64 )
282
+ threshold_list = npzeros ((audio_ticks ), dtype = np .float64 )
282
283
283
284
if max_volume == 0 : # Prevent dividing by zero
284
285
return threshold_list
@@ -313,31 +314,51 @@ def subtitle(
313
314
except re .error as e :
314
315
self .log .error (e )
315
316
316
- sub_file = self .ensure .subtitle (self .src , stream )
317
- parser = SubtitleParser (self .tb )
317
+ import av
318
+
319
+ result = npzeros ((30 ), dtype = np .bool_ )
320
+ count = 0
321
+ subtitle_length = 0
318
322
319
- with open (sub_file , encoding = "utf-8" ) as file :
320
- parser .parse (file .read (), "webvtt" )
323
+ with av .open (self .src .path , "r" ) as container :
324
+ for packet in container .demux (subtitles = stream ):
325
+ if packet is None or packet .pts is None :
326
+ continue
321
327
322
- # stackoverflow.com/questions/9662346/python-code-to-remove-html-tags-from-a-string
323
- def cleanhtml (raw_html : str ) -> str :
324
- cleanr = re .compile ("<.*?>" )
325
- return re .sub (cleanr , "" , raw_html )
328
+ line = ""
329
+ if sub := packet .decode ():
330
+ for val in sub [0 ].rects :
331
+ if isinstance (val , av .subtitles .subtitle .AssSubtitle ):
332
+ line += val .ass .decode ("utf-8" , "ignore" )
333
+ if isinstance (val , av .subtitles .subtitle .TextSubtitle ):
334
+ line += val .text .decode ("utf-8" , "ignore" )
326
335
327
- if not parser .contents :
328
- self .log .error ("subtitle has no valid entries" )
336
+ if packet .duration is not None and packet .time_base is not None :
337
+ end = round (
338
+ (packet .pts + packet .duration ) * packet .time_base * self .tb
339
+ )
340
+ subtitle_length = max (subtitle_length , end )
329
341
330
- result = np .zeros ((parser .contents [- 1 ].end ), dtype = np .bool_ )
342
+ if line and re .search (pattern , line ):
343
+ if packet .duration is None or packet .time_base is None :
344
+ self .log .warning ("Subtitle has unknown duration" )
345
+ continue
331
346
332
- count = 0
333
- for content in parser .contents :
334
- if max_count is not None and count >= max_count :
335
- break
347
+ count += 1
348
+ start = round (packet .pts * packet .time_base * self .tb )
349
+
350
+ if len (result ) < end :
351
+ new_length = max (end , len (result ) * 2 )
352
+ result = npconcat (
353
+ [result , npzeros (new_length , dtype = np .bool_ )], axis = 0
354
+ )
355
+
356
+ result [start :end ] = 1
357
+
358
+ if max_count is not None and count >= max_count :
359
+ break
336
360
337
- line = cleanhtml (content .after .strip ())
338
- if line and re .search (pattern , line ):
339
- result [content .start : content .end ] = 1
340
- count += 1
361
+ result = result [:subtitle_length ]
341
362
342
363
return result
343
364
@@ -377,7 +398,7 @@ def motion(self, s: int, blur: int, width: int) -> NDArray[np.float64]:
377
398
)
378
399
graph .configure ()
379
400
380
- threshold_list = np . zeros ((1024 ), dtype = np .float64 )
401
+ threshold_list = npzeros ((1024 ), dtype = np .float64 )
381
402
382
403
for unframe in container .decode (stream ):
383
404
graph .push (unframe )
@@ -392,8 +413,8 @@ def motion(self, s: int, blur: int, width: int) -> NDArray[np.float64]:
392
413
current_frame = frame .to_ndarray ()
393
414
394
415
if index > len (threshold_list ) - 1 :
395
- threshold_list = np . concatenate (
396
- (threshold_list , np . zeros ((len (threshold_list )), dtype = np .float64 )),
416
+ threshold_list = npconcat (
417
+ (threshold_list , npzeros ((len (threshold_list )), dtype = np .float64 )),
397
418
axis = 0 ,
398
419
)
399
420
0 commit comments