split up code into functions (finally)

2020-06-25 13:29:24 +02:00
parent cc0376fc37
commit 6030a2e58a
1 changed files with 52 additions and 46 deletions
--- a/gen-script.py
+++ b/gen-script.py
@ -3,9 +3,6 @@ import re
 import os
 from datetime import timedelta

-search = '(pesky bird)' # the searched phrase
-sides = timedelta(seconds=8) # time we cut on both sides
-
 # TODO:
 #reimplement overlapping
 #now sides can't be bigger than 29, because of the way I hardcoded it somewhere
@ -13,7 +10,7 @@ sides = timedelta(seconds=8) # time we cut on both sides
 # the fast version should be for testing only a
 # implement fast better quality version. will have to use

-# left clamps. used to make sure that 00:00:02 doesn't become 23:59:42
+# left clamps. used to make sure that e.g. 00:00:02 doesn't become 23:59:52
 def l_clamps(t, delta):
    if t < delta:
        return timedelta()
@ -32,46 +29,55 @@ def merge_overlap(data): # if two chunks overlap, they get merged
        prev = cur


+def get_subs_location():
+    """Return the sorted names of all entries in the subtitles directory.
+
+    Reads the module-level ``path``, so ``path`` must be assigned before
+    this function is called.
+    """
+    # sorted() orders the listing once, instead of re-sorting after every append
+    return sorted(os.listdir(path))
+
+
+def generate_splice_data(file_names):
+    """Collect one splice entry for every subtitle text line matching ``search``.
+
+    Each file is read in groups of four lines: the line at index 1 of a
+    group is kept as the timestamp line and the line at index 2 is the text
+    that gets matched. Relies on the module-level ``path``, ``search`` and
+    ``sides``.
+
+    Returns a list of dicts with the keys 'fname' (the file name), 'beg' and
+    'end' (timedeltas built from the minutes and seconds of the timestamp
+    line, each passed through ``l_clamps`` together with ``sides``) and
+    'desc' (the matched text line without its trailing newline).
+    """
+    data = []
+    for f in file_names:
+        # the context manager closes each subtitle file once it has been read
+        with open(path + f) as subs:
+            for n, line in enumerate(subs):
+                if n % 4 == 1:
+                    prev = line # a timestamp line
+                elif n % 4 == 2 and re.search(search, line): # only lines which contain text can match
+                    data.append({
+                        'fname': f,
+                        # only the minute and second fields are read; the hour field is ignored
+                        'beg': l_clamps(timedelta(minutes=int(prev[3:5]), seconds=int(prev[6:8])), sides),
+                        'end': l_clamps(timedelta(minutes=int(prev[20:22]), seconds=int(prev[23:25])), sides),
+                        # strip only the newline, so a last line without one keeps its final character
+                        'desc': line.rstrip('\n'),
+                    })
+    return data
+
+
+def write_list_rip_debug(data):
+    """Write 'list.txt', 'rip.sh' and 'debug.txt' for the given splice entries.
+
+    'rip.sh' gets one ffmpeg command per entry and 'list.txt' the matching
+    output file name; entries whose description ends with '@' are skipped
+    in both. 'debug.txt' gets one tab-separated line for every entry,
+    skipped or not. The length of each written entry is also printed.
+    """
+    # context managers make sure the output files are flushed and closed
+    with open('list.txt', 'w') as file_list, open('rip.sh', 'w') as file_rip:
+        file_rip.write('#!/bin/bash\n')
+        for (i, d) in enumerate(data):
+            if d['desc'].endswith('@'): # endswith() is also safe for an empty description
+                continue
+            name = d['fname'][:2] # first two characters, presumably the name without an extension
+            outname = "../out/{}-{:0>2}.mp4".format(name, i)
+
+            file_list.write("file '{}'\n".format(outname))
+            print(d['end']-d['beg'])
+            delta = d['end']-d['beg']+timedelta(seconds=6)
+            file_rip.write('ffmpeg -ss {} -i ../original/{}.mp4 -to 0{} -c copy {}\n'.format(d['beg'], name, delta, outname)) # fast but not accurate
+            # file_rip.write('ffmpeg -i ../original/{}.mp4 -ss 0{} -t 0{} -async 1 {}\n'.format(name, d['beg'], delta, outname)) # alternative command, kept for reference
+
+    with open('debug.txt', 'w') as file_debug:
+        for d in data:
+            file_debug.write('{}\t{}\t{}\t{}\n'.format(d['fname'][:2], d['beg'], d['end'], d['desc']))
+
+
 path = os.getcwd() + '/../subs/' # subtitles location
-file_names = []
-
-for file in os.listdir(path):
-    file_names.append(file)
-file_names.sort()
-
-data = []
-
-for i, f in enumerate(file_names):
-    file = open(path + f)
-    for i, line in enumerate(file):
-        if i%4 == 2 and re.search(search, line): # we only need to check lines which contain text, hence the first condition
-            data.append({
-            'fname':f,
-            'beg':l_clamps(timedelta(minutes = int(prev[3  :5]), seconds=int(prev[6:  8])), sides),
-            'end':l_clamps(timedelta(minutes = int(prev[20:22]), seconds=int(prev[23:25])), sides),
-            'desc':line[:-1]}) # get file name, time stamps and desciption
-        if i%4 == 1:
-            prev = line # a timestamp line
-
-
-#merge_overlap(data)
-
-
-file_list = open('list.txt', 'w')
-file_rip = open('rip.sh', 'w')
-file_rip.write('#!/bin/bash\n')
-for (i, d) in enumerate(data):
-      if d['desc'][-1]=='@':
-          continue
-      name = d['fname'][:2] # get a name without an extension
-      outname ="../out/{}-{:0>2}.mp4".format(name, i)
-
-      file_list.write("file '{}'\n".format(outname))
-      print(d['end']-d['beg'])
-      delta=d['end']-d['beg']+timedelta(seconds=6)
-      file_rip .write('ffmpeg -ss {} -i ../original/{}.mp4 -to 0{} -c copy {}\n'.format(d['beg'], name, d['end']-d['beg']+timedelta(seconds=6),outname)) # fast but not accurate
-      # file_rip .write('ffmpeg -i ../original/{}.mp4 -ss 0{} -t 0{} -async 1 {}\n'.format(name, d['beg'], delta ,outname)) # fast but not accurate
-
-file_debug = open('debug.txt', 'w')
-for d in data:
-    file_debug.write('{}\t{}\t{}\t{}\n'.format(d['fname'][:2], d['beg'], d['end'], d['desc']))
+search = '(pesky bird)' # the searched phrase
+sides = timedelta(seconds=8) # time we cut on both sides
+# get_subs_location and generate_splice_data read path, search and sides as
+# module-level globals, so they must be assigned before the calls below
+file_names = get_subs_location()
+data = generate_splice_data(file_names)
+# NOTE(review): the return value is discarded, presumably merge_overlap changes data in place; confirm
+merge_overlap(data)
+write_list_rip_debug(data)