openshot_video_generator.py 36 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976
  1. from os import listdir
  2. from os.path import isfile, isdir, join
  3. import openshot
  4. import threading
  5. import zhtts
  6. import os
  7. import urllib
  8. from typing import List
  9. import requests
  10. from pydantic import BaseModel
  11. from bs4 import BeautifulSoup
  12. from PIL import Image,ImageDraw,ImageFont
  13. import pyttsx3
  14. import rpyc
  15. import random
  16. import re
  17. import time
  18. import math
  19. import dataset
  20. from datetime import datetime
  21. from gtts import gTTS
  22. import ffmpy
  23. from difflib import SequenceMatcher
  24. import difflib
  25. from autosub import DEFAULT_CONCURRENCY
  26. from autosub import DEFAULT_SUBTITLE_FORMAT
  27. from pytranscriber.control.ctr_main import Ctr_Main
  28. from pytranscriber.control.ctr_autosub import Ctr_Autosub
  29. import multiprocessing
  30. from itertools import groupby
  31. from operator import itemgetter
  32. from util.parser import parser
  33. dir_sound = 'mp3_track/'
  34. dir_photo = 'photo/'
  35. dir_text = 'text_file/'
  36. dir_video = 'video_material/'
  37. dir_title = 'title/'
  38. dir_subtitle = 'subtitle/'
  39. dir_anchor = 'anchor_raw/'
  40. tmp_video_dir = 'tmp_video/'
  41. video_sub_folder = 'ai_anchor_video/'
  42. dir_list = [dir_sound,dir_photo,dir_text,dir_video,dir_title,dir_subtitle,dir_anchor,tmp_video_dir]
  43. def notify_group(msg):
  44. glist=['7vilzohcyQMPLfAMRloUawiTV4vtusZhxv8Czo7AJX8','WekCRfnAirSiSxALiD6gcm0B56EejsoK89zFbIaiZQD','1dbtJHbWVbrooXmQqc4r8OyRWDryjD4TMJ6DiDsdgsX','HOB1kVNgIb81tTB4Ort1BfhVp9GFo6NlToMQg88vEhh']
  45. for gid in glist:
  46. headers = {
  47. "Authorization": "Bearer " + gid,
  48. "Content-Type": "application/x-www-form-urlencoded"
  49. }
  50. params = {"message": msg}
  51. r = requests.post("https://notify-api.line.me/api/notify",headers=headers, params=params)
  52. def cKey(r,g,b,fuzz):
  53. col=openshot.Color()
  54. col.red=openshot.Keyframe(r)
  55. col.green=openshot.Keyframe(g)
  56. col.blue=openshot.Keyframe(b)
  57. return openshot.ChromaKey(col, openshot.Keyframe(fuzz))
  58. def video_photo_clip(vid=None,layer=None, position=None, end=None
  59. ,scale_x=1,scale_y=1,location_x=0,location_y=0,ck=None,audio=True):
  60. clip = openshot.Clip(vid)
  61. clip.Layer(layer)
  62. clip.Position(position)
  63. clip.End(end)
  64. clip.scale_x=openshot.Keyframe(scale_x)
  65. clip.scale_y=openshot.Keyframe(scale_y)
  66. clip.location_x=openshot.Keyframe(location_x)
  67. clip.location_y=openshot.Keyframe(location_y)
  68. if ck!=None:
  69. clip.AddEffect(ck)
  70. if audio==True:
  71. clip.has_audio=openshot.Keyframe(1)
  72. else:
  73. clip.has_audio=openshot.Keyframe(0)
  74. return clip
  75. def listener_progress(string, percent):
  76. True
  77. def myunichchar(unicode_char):
  78. mb_string = unicode_char.encode('big5')
  79. try:
  80. unicode_char = unichr(ord(mb_string[0]) << 8 | ord(mb_string[1]))
  81. except NameError:
  82. unicode_char = chr(mb_string[0] << 8 | mb_string[1])
  83. return unicode_char
  84. def get_url_type(url):
  85. req = urllib.request.Request(url, method='HEAD', headers={'User-Agent': 'Mozilla/5.0'})
  86. r = urllib.request.urlopen(req)
  87. contentType = r.getheader('Content-Type')
  88. return contentType
  89. def make_dir(name_hash):
  90. for direct in dir_list:
  91. if not os.path.isdir(direct):
  92. os.mkdir(direct)
  93. try:
  94. os.mkdir(dir_photo+name_hash)
  95. except FileExistsError:
  96. print("~~~~~~Warning~~~~~~~~~Directory " , dir_photo+name_hash , " already exists")
  97. try:
  98. os.mkdir(dir_text+name_hash)
  99. except FileExistsError:
  100. print("~~~~~~Warning~~~~~~~~~Directory " , dir_text+name_hash , " already exists")
  101. try:
  102. os.mkdir(dir_sound+name_hash)
  103. except FileExistsError:
  104. print("~~~~~~Warning~~~~~~~~~Directory " , dir_sound+name_hash , " already exists")
  105. try:
  106. os.mkdir(dir_anchor+name_hash)
  107. except FileExistsError:
  108. print("~~~~~~Warning~~~~~~~~~Directory " , dir_anchor+name_hash , " already exists")
  109. try:
  110. os.mkdir(dir_subtitle+name_hash)
  111. except FileExistsError:
  112. print("~~~~~~Warning~~~~~~~~~Directory " , dir_subtitle+name_hash , " already exists")
  113. def file_prepare(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  114. make_dir(name_hash)
  115. img_num = 1
  116. for imgu in image_urls:
  117. if get_url_type(imgu) =='video/mp4':
  118. r=requests.get(imgu)
  119. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  120. for chunk in r.iter_content(chunk_size=255):
  121. if chunk:
  122. f.write(chunk)
  123. f.close()
  124. else:
  125. im = Image.open(requests.get(imgu, stream=True).raw)
  126. im= im.convert("RGB")
  127. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  128. img_num+=1
  129. #save text
  130. txt_idx=0
  131. for txt in text_content:
  132. text_file = open(dir_text+name_hash+"/"+str(txt_idx)+".txt", "w")
  133. text_file.write(txt)
  134. text_file.close()
  135. txt_idx+=1
  136. print("text file made")
  137. #make mp3
  138. txt_idx = 0
  139. for txt in text_content:
  140. if lang!='zh' or multiLang==1:
  141. if lang!='zh':
  142. tts = gTTS(txt)
  143. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  144. else:
  145. tts = gTTS(txt,lang='zh-tw')
  146. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  147. #speed up
  148. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  149. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  150. ff.run()
  151. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  152. else:
  153. print('use zhtts')
  154. tts = zhtts.TTS()
  155. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  156. txt_idx+=1
  157. print("mp3 file made")
  158. #make title as image
  159. txt2image_title(name, dir_title+name_hash+".png",lang)
  160. def file_prepare_long(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  161. make_dir(name_hash)
  162. img_num = 1
  163. for imgu in image_urls:
  164. if get_url_type(imgu) =='video/mp4':
  165. r=requests.get(imgu)
  166. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  167. for chunk in r.iter_content(chunk_size=255):
  168. if chunk:
  169. f.write(chunk)
  170. f.close()
  171. else:
  172. im = Image.open(requests.get(imgu, stream=True).raw)
  173. im= im.convert("RGB")
  174. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  175. img_num+=1
  176. #make mp3
  177. text_parser = parser()
  178. txt_idx = 0
  179. for txt in text_content:
  180. rep_list = text_parser.replace_list(txt)
  181. for reptxt in rep_list:
  182. txt = txt.replace(reptxt,'')
  183. if lang!='zh' or multiLang==1:
  184. if lang!='zh':
  185. tts = gTTS(txt)
  186. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  187. else:
  188. tts = gTTS(txt,lang='zh-tw')
  189. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  190. #speed up
  191. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  192. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  193. ff.run()
  194. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  195. else:
  196. print('use zhtts')
  197. tts = zhtts.TTS()
  198. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  199. txt_idx+=1
  200. print("mp3 file made")
  201. #make title as image
  202. txt2image_title(name, dir_title+name_hash+".png",lang)
  203. def txt2image(content, save_target,lang='zh'):
  204. unicode_text = trim_punctuation(content)
  205. font = ''
  206. if lang=='zh':
  207. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=38)
  208. else :
  209. font = ImageFont.truetype(font="font/arial.ttf", size=38)
  210. text_width, text_height = font.getsize(unicode_text)
  211. canvas = Image.new('RGBA', (700, 500), (255, 0, 0, 0) )
  212. draw = ImageDraw.Draw(canvas)
  213. text= unicode_text
  214. draw.text((5,5), text, (255, 255, 0), font)
  215. canvas.save(save_target, "PNG")
  216. def txt2image_title(content, save_target, lang='zh'):
  217. unicode_text = trim_punctuation(content)
  218. font = ''
  219. if lang=='zh':
  220. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=22)
  221. else :
  222. font = ImageFont.truetype(font="font/arial.ttf", size=22)
  223. text_width, text_height = font.getsize(unicode_text)
  224. canvas = Image.new('RGBA', (510, 500), (255, 0, 0, 0) )
  225. draw = ImageDraw.Draw(canvas)
  226. text= unicode_text
  227. draw.text((5,5), text, (17, 41, 167), font)
  228. canvas.save(save_target, "PNG")
  229. def call_anchor(fileName,avatar):
  230. conn = rpyc.classic.connect("192.168.1.105",18812)
  231. ros = conn.modules.os
  232. rsys = conn.modules.sys
  233. fr=open(dir_sound+fileName+".mp3",'rb')# voice
  234. #warning!!! file my be replaced by other process
  235. fw=conn.builtins.open('/tmp/output.mp3','wb')
  236. while True:
  237. b=fr.read(1024)
  238. if b:
  239. fw.write(b)
  240. else:
  241. break
  242. fr.close()
  243. fw.close()
  244. val=random.randint(1000000,9999999)
  245. ros.chdir('/home/jared/to_video')
  246. ros.system('./p'+str(avatar)+'.sh '+str(val)+' &')
  247. while True:
  248. print('waiting...')
  249. if ros.path.exists('/tmp/results/'+str(val)):
  250. break
  251. time.sleep(5)
  252. print('waiting...')
  253. fr=conn.builtins.open('/tmp/results/'+str(val)+'.mp4','rb')
  254. fw=open(dir_anchor+fileName+".mp4",'wb')
  255. while True:
  256. b=fr.read(1024)
  257. if b:
  258. fw.write(b)
  259. else:
  260. break
  261. fr.close()
  262. fw.close()
  263. def syllable_count(word):
  264. word = word.lower()
  265. count = 0
  266. vowels = "aeiouy"
  267. if word[0] in vowels:
  268. count += 1
  269. for index in range(1, len(word)):
  270. if word[index] in vowels and word[index - 1] not in vowels:
  271. count += 1
  272. if word.endswith("e"):
  273. count -= 1
  274. if count == 0:
  275. count += 1
  276. return count
  277. def split_sentence(in_str, maxLen):
  278. re.findall(r'[\u4e00-\u9fff]+', in_str)
  279. zh_idx = []
  280. eng_idx= []
  281. for i in range(len(in_str)):
  282. if in_str[i] > u'\u4e00' and in_str[i] < u'\u9fff':
  283. zh_idx.append(i)
  284. else:
  285. eng_idx.append(i)
  286. space_index = [m.start() for m in re.finditer(' ', in_str)]
  287. for idx in space_index:
  288. eng_idx.remove(idx)
  289. eng_range_list = []
  290. for k, g in groupby(enumerate(eng_idx), lambda ix : ix[0] - ix[1]):
  291. eng_range = list(map(itemgetter(1), g))
  292. eng_range_list.append(eng_range)
  293. total_syllable = 0
  294. for i in range(len(eng_range_list)):
  295. total_syllable += (syllable_count(in_str[eng_range_list[i][0]:eng_range_list[i][-1]+1])+0.5)
  296. for i in range(len(zh_idx)):
  297. total_syllable+=1
  298. #final chchchchchc[en][en][en]
  299. #[en] is a vocabulary dict with occurence of image
  300. zh_eng_idx_list = []
  301. i = 0
  302. while i < len(in_str):
  303. if in_str[i]==' ':
  304. i+=1
  305. if i in zh_idx:
  306. zh_eng_idx_list.append(i)
  307. i+=1
  308. if i in eng_idx:
  309. for ls in eng_range_list:
  310. if i in ls:
  311. zh_eng_idx_list.append(ls)
  312. i = ls[-1]+1
  313. break
  314. zh_eng_dict_list = [{'content':'','time_ratio':0}]
  315. idx = 0
  316. current_len = 0
  317. sen_idx = 0
  318. while idx < len(zh_eng_idx_list):
  319. str_from_idx = ''
  320. sylla_cnt = 1
  321. if type(zh_eng_idx_list[idx])==type([]):
  322. str_from_idx = in_str[zh_eng_idx_list[idx][0]:zh_eng_idx_list[idx][-1]+1]+' '
  323. sylla_cnt = syllable_count(str_from_idx)
  324. else:
  325. str_from_idx = in_str[zh_eng_idx_list[idx]]
  326. if len(zh_eng_dict_list[sen_idx]['content'])+sylla_cnt>=maxLen:
  327. zh_eng_dict_list[sen_idx]['time_ratio'] = current_len/total_syllable
  328. zh_eng_dict_list.append({'content':'','time_ratio':0})
  329. sen_idx+=1
  330. current_len = 0
  331. else:
  332. current_len += sylla_cnt
  333. zh_eng_dict_list[sen_idx]['content'] += str_from_idx
  334. idx+=1
  335. total_ratio = 0
  336. for obj in zh_eng_dict_list:
  337. total_ratio+=obj['time_ratio']
  338. zh_eng_dict_list[-1]['time_ratio'] = 1-total_ratio
  339. return zh_eng_dict_list
  340. def parse_script(file_path,gt_list):
  341. with open(file_path, 'r',encoding="utf-8") as f:
  342. raw_lines = [line.strip() for line in f]
  343. lines = adjustSub_by_text_similarity(gt_list,raw_lines)
  344. text_parser = parser()
  345. #make dict
  346. dict_list = []
  347. for idx in range(len(lines)):
  348. script={}
  349. print(lines[idx])
  350. rep_ls = text_parser.replace_list(lines[idx])
  351. print(rep_ls)
  352. line_content = lines[idx]
  353. for reptxt in rep_ls:
  354. line_content = line_content.replace(reptxt,'')
  355. if len(rep_ls)!=0:
  356. script['image_idx'] = int(rep_ls[0].replace('{','').replace('}',''))
  357. script['content'] = line_content
  358. time_raw = raw_lines[idx * 4 +1 ].split(' --> ')
  359. start = time_raw[0].split(':')
  360. stop = time_raw[1].split(':')
  361. script['start'] = float(start[0])*3600 + float(start[1])*60 + float(start[2].replace(',','.'))
  362. script['stop'] = float(stop[0])*3600 + float(stop[1])*60 + float(stop[2].replace(',','.'))
  363. dict_list.append(script)
  364. #merge duplicated sentences
  365. script_not_dup_list = []
  366. for idx in range(len(dict_list)):
  367. dup_list = []
  368. for idx_inner in range(len(dict_list)):
  369. if dict_list[idx_inner]['content']==dict_list[idx]['content']:
  370. dup_list.append(idx_inner)
  371. for dup_idx in dup_list:
  372. if dup_idx == min(dup_list):
  373. dict_list[dup_idx]['type'] = 'lead_sentence'
  374. else:
  375. dict_list[dup_idx]['type'] = 'duplicated'
  376. dict_list[dup_list[0]]['stop'] = dict_list[dup_list[-1]]['stop']
  377. if dict_list[idx]['type'] == 'lead_sentence':
  378. script_not_dup_list.append(dict_list[idx])
  379. #avoid subtitle overlapping ? Timeline overlapping not found currently
  380. #cut by max length----> eng seperated problem {eng_idx}
  381. #ENG counts, zh counts, space counts
  382. new_idx = 0
  383. splitted_dict = []
  384. for dic in script_not_dup_list:
  385. dic_idx = 0
  386. accumulated_duration = 0
  387. duration = dic['stop']-dic['start']
  388. for sub_dic in split_sentence(dic['content'],13):
  389. new_dic = {}
  390. new_dic['index'] = new_idx
  391. if 'image_idx' in dic:
  392. new_dic['image_obj'] = {'start':dic['start'],'idx':dic['image_idx']}
  393. new_idx+=1
  394. ind_duration = duration * sub_dic['time_ratio']
  395. new_dic['start'] = dic['start'] + accumulated_duration
  396. accumulated_duration += ind_duration
  397. new_dic['content'] = sub_dic['content']
  398. new_dic['duration'] = ind_duration*0.7
  399. splitted_dict.append(new_dic)
  400. return splitted_dict
  401. def adjustSub_by_text_similarity(gts_in,gens_raw):
  402. #call by value only
  403. gts = gts_in[:]
  404. text_parser = parser()
  405. for i in range(len(gts)):
  406. rep_ls = text_parser.replace_list(gts[i])
  407. for reptxt in rep_ls:
  408. gts[i] = gts[i].replace(reptxt,'')
  409. print(gts)
  410. gens = []
  411. for idx in range(int((len(gens_raw)+1)/4)):
  412. gens.append(gens_raw[idx*4+2])
  413. combine2 = [''.join([i,j]) for i,j in zip(gts, gts[1:])]
  414. combine3 = [''.join([i,j,k]) for i,j,k in zip(gts, gts[1:], gts[2:])]
  415. alls = gts + combine2 + combine3
  416. adjusted = [None]*len(gens)
  417. duplicated_list = []
  418. for idx in range(len(gens)):
  419. match_text = difflib.get_close_matches(gens[idx], alls, cutoff=0.1)
  420. if match_text[0] in duplicated_list:
  421. for mt in match_text:
  422. if mt == adjusted[idx-1] or mt not in duplicated_list:
  423. adjusted[idx] = mt
  424. break
  425. else:
  426. adjusted[idx] = match_text[0]
  427. duplicated_list.append(match_text[0])
  428. combine2_tag = [''.join([i,j]) for i,j in zip(gts_in, gts_in[1:])]
  429. combine3_tag = [''.join([i,j,k]) for i,j,k in zip(gts_in, gts_in[1:], gts_in[2:])]
  430. alls_tag = gts_in + combine2_tag + combine3_tag
  431. for idx in range(len(adjusted)):
  432. match_text = difflib.get_close_matches(adjusted[idx], alls_tag, cutoff=0.1)
  433. adjusted[idx] = match_text[0]
  434. return adjusted
  435. def trim_punctuation(s):
  436. pat_block = u'[^\u4e00-\u9fff0-9a-zA-Z]+';
  437. pattern = u'([0-9]+{0}[0-9]+)|{0}'.format(pat_block)
  438. res = re.sub(pattern, lambda x: x.group(1) if x.group(1) else u" " ,s)
  439. return res
  440. def splitter(s):
  441. for sent in re.findall(u'[^!?,。\!\?]+[!? 。\!\?]?', s, flags=re.U):
  442. yield sent
  443. def split_by_pun(s):
  444. res = list(splitter(s))
  445. return res
  446. def generate_subtitle_image_from_dict(name_hash, sub_dict):
  447. for script in sub_dict:
  448. sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
  449. sub = script['content']
  450. txt2image(sub,sv_path)
  451. def generate_subtitle_image(name_hash,text_content):
  452. img_list = [None]*len(text_content)
  453. for idx in range(len(text_content)):
  454. img_list[idx]=[]
  455. senList = split_by_pun(text_content[idx])
  456. for inner_idx in range(len(senList)):
  457. sv_path = dir_subtitle + name_hash +'/'+str(idx)+ str(inner_idx) +'.png'
  458. sub = senList[inner_idx]
  459. txt2image(sub,sv_path)
  460. img_list[idx]+=[{"count":len(sub),"path":sv_path}]
  461. return img_list
  462. def generate_subtitle_image_ENG(name_hash,text_content):
  463. img_list = [None]*len(text_content)
  464. for idx in range(len(text_content)):
  465. sv_path = dir_subtitle + name_hash +'/'+str(idx)+'.png'
  466. sub = text_content[idx]
  467. txt2image(sub, sv_path,lang='eng')
  468. img_list[idx] = sv_path
  469. return img_list
  470. def video_writer_init(path):
  471. w = openshot.FFmpegWriter(path)
  472. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  473. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  474. openshot.Fraction(1, 1), False, False, 3000000)
  475. return w
  476. def video_gen(name_hash,name,text_content, image_urls,multiLang,avatar):
  477. file_prepare_long(name, name_hash, text_content,image_urls,multiLang)
  478. for fname in range(len(text_content)):
  479. call_anchor(name_hash+"/"+str(fname),avatar)
  480. print('called............................................')
  481. ck=cKey(0,254,0,270)
  482. ck_anchor=cKey(0,255,1,320)
  483. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  484. t.Open()
  485. main_timer = 0
  486. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  487. LOGO_OP.Open() # Open the reader
  488. head_duration = LOGO_OP.info.duration
  489. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=head_duration
  490. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  491. t.AddClip(LOGO_OP_clip)
  492. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  493. bg_head.Open()
  494. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  495. t.AddClip(bg_head_clip)
  496. main_timer += head_duration
  497. bg_head.Close()
  498. LOGO_OP.Close()
  499. anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
  500. anchor.Open()
  501. #anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
  502. # location_x=0.35,location_y=0.25,position=main_timer, end=anchor.info.duration,ck=ck_anchor,audio=False)
  503. #t.AddClip(anchor_clip)
  504. speech = openshot.FFmpegReader(dir_sound+name_hash+"/0.mp3")
  505. speech.Open()
  506. speech_clip = openshot.Clip(speech)
  507. speech_clip.Position(main_timer)
  508. speech_clip.End(anchor.info.duration)
  509. t.AddClip(speech_clip)
  510. main_timer += anchor.info.duration
  511. anchor.Close()
  512. speech.Close()
  513. LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
  514. LOGO_ED.Open()
  515. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration
  516. ,location_x=0.005,location_y=-0.031, scale_x=0.8,scale_y=0.6825)
  517. t.AddClip(LOGO_ED_clip)
  518. main_timer += LOGO_ED.info.duration
  519. LOGO_ED.Close()
  520. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  521. bg.Open()
  522. bg_times = math.floor(main_timer/bg.info.duration)
  523. left_time = (main_timer) % bg.info.duration
  524. bg_clip_list = [None] * bg_times
  525. bg_list = [None] * bg_times
  526. bg.Close()
  527. bg_timer = head_duration
  528. for idx in range(bg_times):
  529. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  530. bg_list[idx].Open()
  531. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer,end=bg_list[idx].info.duration,ck=ck)
  532. t.AddClip(bg_clip_list[idx])
  533. bg_timer += bg_list[idx].info.duration
  534. bg_list[idx].Close()
  535. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  536. bg_left.Open()
  537. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  538. t.AddClip(bg_left_clip)
  539. bg_left.Close()
  540. title = openshot.QtImageReader(dir_title+name_hash+".png")
  541. title.Open() # Open the reader
  542. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  543. t.AddClip(title_clip)
  544. w = video_writer_init(tmp_video_dir+name_hash+"raw.mp4")
  545. w.Open()
  546. frames = int(t.info.fps)*int(main_timer)
  547. for n in range(frames):
  548. f=t.GetFrame(n)
  549. w.WriteFrame(f)
  550. t.Close()
  551. w.Close()
  552. print(name+"RAW DONE : www.choozmo.com:8168/"+tmp_video_dir+name_hash+"raw.mp4")
  553. #start adding sub
  554. #add sub
  555. Ctr_Autosub.init()
  556. Ctr_Autosub.generate_subtitles(tmp_video_dir+name_hash+"raw.mp4",'zh',listener_progress,output=tmp_video_dir+name_hash+"script.txt",concurrency=DEFAULT_CONCURRENCY,subtitle_file_format=DEFAULT_SUBTITLE_FORMAT)
  557. sub_dict = parse_script(tmp_video_dir+name_hash+"script.txt",split_by_pun(text_content[0]))
  558. for subd in sub_dict:
  559. print(subd)
  560. generate_subtitle_image_from_dict(name_hash, sub_dict)
  561. #sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
  562. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  563. t.Open()
  564. raw = openshot.FFmpegReader(tmp_video_dir+name_hash+"raw.mp4")
  565. raw.Open()
  566. raw_clip = video_photo_clip(vid=raw,layer=2,position=0, end=raw.info.duration)
  567. t.AddClip(raw_clip)
  568. sub_img_list = [None] * len(sub_dict)
  569. sub_clip_list = [None] * len(sub_dict)
  570. for sub_obj in sub_dict:
  571. idx = int(sub_obj['index'])
  572. sub_img_list[idx] = openshot.QtImageReader(dir_subtitle + name_hash + '/' + str(idx)+'.png')
  573. sub_img_list[idx].Open()
  574. sub_clip_list[idx] = video_photo_clip(vid=sub_img_list[idx], layer=6,location_x=0.069, location_y=0.89,position=sub_obj['start'],end=math.ceil(sub_obj['duration']))
  575. t.AddClip(sub_clip_list[idx])
  576. sub_img_list[idx].Close()
  577. anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
  578. anchor.Open()
  579. anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
  580. location_x=0.35,location_y=0.25,position=head_duration, end=anchor.info.duration,ck=ck_anchor,audio=False)
  581. t.AddClip(anchor_clip)
  582. w = video_writer_init(tmp_video_dir+name_hash+".mp4")
  583. w.Open()
  584. frames = int(t.info.fps)*int(main_timer)
  585. for n in range(frames):
  586. f=t.GetFrame(n)
  587. w.WriteFrame(f)
  588. t.Close()
  589. w.Close()
  590. os.remove(tmp_video_dir+name_hash+"raw.mp4")
  591. os.remove(tmp_video_dir+name_hash+"script.txt")
  592. print(name+"ALL DONE : www.choozmo.com:8168/"+video_sub_folder+name_hash+"raw.mp4")
  593. def anchor_video_v2(name_hash,name,text_content, image_urls,multiLang,avatar):
  594. print(os.getcwd())
  595. print('sub image made')
  596. print(multiLang)
  597. file_prepare(name, name_hash, text_content,image_urls,multiLang)
  598. sub_list=generate_subtitle_image(name_hash,text_content)
  599. for fname in range(len(text_content)):
  600. call_anchor(name_hash+"/"+str(fname),avatar)
  601. print('step finish')
  602. print('called............................................')
  603. ck=cKey(0,254,0,270)
  604. ck_anchor=cKey(0,255,1,320)
  605. duration = 0
  606. #average layer level is 3
  607. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  608. t.Open()
  609. main_timer = 0
  610. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  611. LOGO_OP.Open() # Open the reader
  612. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=LOGO_OP.info.duration
  613. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  614. t.AddClip(LOGO_OP_clip)
  615. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  616. bg_head.Open()
  617. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  618. t.AddClip(bg_head_clip)
  619. main_timer += LOGO_OP.info.duration
  620. head_duration = LOGO_OP.info.duration
  621. bg_head.Close()
  622. LOGO_OP.Close()
  623. clip_duration=0
  624. photo_clip_list = [None]*len(text_content)
  625. img_list = [None]*len(text_content)
  626. anchor_clip_list = [None] * len(text_content)
  627. anchor_list = [None] * len(text_content)
  628. audio_clip_list = [None] * len(text_content)
  629. audio_list = [None] * len(text_content)
  630. sub_clip_list = [None] * len(text_content)
  631. sub_img_list = [None] * len(text_content)
  632. idx = 0
  633. for p in listdir(dir_photo+name_hash):
  634. anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
  635. clip_duration = anchor_list[idx].info.duration
  636. anchor_list[idx].Open()
  637. anchor_clip_list[idx] = video_photo_clip(vid=anchor_list[idx],layer=4,scale_x=0.65,scale_y=0.65,
  638. location_x=0.35,location_y=0.25,position=main_timer, end=clip_duration,ck=ck_anchor,audio=False)
  639. t.AddClip(anchor_clip_list[idx])
  640. img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
  641. img_list[idx].Open()
  642. photo_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
  643. ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=main_timer,end=clip_duration,audio=False)
  644. t.AddClip(photo_clip_list[idx])
  645. img_list[idx].Close()
  646. audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
  647. audio_list[idx].Open()
  648. audio_clip_list[idx] = openshot.Clip(audio_list[idx])
  649. audio_clip_list[idx].Position(main_timer)
  650. audio_clip_list[idx].End(clip_duration)
  651. t.AddClip(audio_clip_list[idx])
  652. img_list[idx].Close()
  653. anchor_list[idx].Close()
  654. audio_list[idx].Close()
  655. sub_img_list[idx] = [None] * len(sub_list[idx])
  656. sub_clip_list[idx] = [None] * len(sub_list[idx])
  657. sub_timer = 0
  658. for sub_idx in range(len(sub_list[idx])):
  659. sub_img_list[idx][sub_idx] = openshot.QtImageReader(sub_list[idx][sub_idx]['path'])
  660. sub_img_list[idx][sub_idx].Open()
  661. sub_duration = 0.205*sub_list[idx][sub_idx]['count']
  662. sub_clip_list[idx][sub_idx] = video_photo_clip(vid=sub_img_list[idx][sub_idx], layer=6,location_x=0.069, location_y=0.89,position=main_timer+sub_timer,end=sub_duration)
  663. t.AddClip(sub_clip_list[idx][sub_idx])
  664. sub_img_list[idx][sub_idx].Close()
  665. sub_timer += sub_duration
  666. print(sub_list[idx][sub_idx]['path'])
  667. main_timer += clip_duration
  668. idx+=1
  669. LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
  670. LOGO_ED.Open()
  671. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration+2
  672. ,location_x=0.005,location_y=-0.031
  673. ,scale_x=0.8,scale_y=0.6825)
  674. t.AddClip(LOGO_ED_clip)
  675. ED_duration = LOGO_ED.info.duration
  676. LOGO_ED.Close()
  677. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  678. bg.Open()
  679. bg_times = math.floor(main_timer+ED_duration/bg.info.duration)
  680. left_time = (main_timer+ED_duration) % bg.info.duration
  681. bg_clip_list = [None] * bg_times
  682. bg_list = [None] * bg_times
  683. bg.Close()
  684. bg_timer = head_duration
  685. for idx in range(bg_times):
  686. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  687. bg_list[idx].Open()
  688. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer
  689. ,end=bg_list[idx].info.duration,ck=ck)
  690. t.AddClip(bg_clip_list[idx])
  691. bg_timer += bg_list[idx].info.duration
  692. bg_list[idx].Close()
  693. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  694. bg_left.Open()
  695. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  696. t.AddClip(bg_left_clip)
  697. bg_left.Close()
  698. title = openshot.QtImageReader(dir_title+name_hash+".png")
  699. title.Open() # Open the reader
  700. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  701. t.AddClip(title_clip)
  702. ####start building
  703. w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
  704. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  705. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  706. openshot.Fraction(1, 1), False, False, 3000000)
  707. w.Open()
  708. #may change duration into t.info.duration
  709. frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
  710. for n in range(frames):
  711. f=t.GetFrame(n)
  712. w.WriteFrame(f)
  713. #notify_group(name+"的影片已經產生完成囉! www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  714. t.Close()
  715. w.Close()
  716. print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  717. def anchor_video_eng(name_hash,name,text_content, image_urls,sub_titles,avatar):
  718. file_prepare(name, name_hash, text_content,image_urls,'eng')
  719. sub_list=generate_subtitle_image_ENG(name_hash,sub_titles)
  720. for fname in range(len(text_content)):
  721. call_anchor(name_hash+"/"+str(fname),avatar)
  722. print('step finish')
  723. print('called............................................')
  724. ck=cKey(0,254,0,270)
  725. ck_anchor=cKey(0,255,1,320)
  726. duration = 0
  727. #average layer level is 3
  728. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  729. t.Open()
  730. main_timer = 0
  731. #add logo
  732. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  733. LOGO_OP.Open() # Open the reader
  734. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=LOGO_OP.info.duration
  735. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  736. t.AddClip(LOGO_OP_clip)
  737. #add background video (head is different)
  738. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  739. bg_head.Open()
  740. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  741. t.AddClip(bg_head_clip)
  742. main_timer += LOGO_OP.info.duration
  743. head_duration = LOGO_OP.info.duration
  744. bg_head.Close()
  745. LOGO_OP.Close()
  746. #prepare empty list
  747. clip_duration=0
  748. photo_clip_list = [None]*len(text_content)
  749. img_list = [None]*len(text_content)
  750. anchor_clip_list = [None] * len(text_content)
  751. anchor_list = [None] * len(text_content)
  752. audio_clip_list = [None] * len(text_content)
  753. audio_list = [None] * len(text_content)
  754. sub_clip_list = [None] * len(text_content)
  755. #openshot image holder
  756. sub_img_list = [None] * len(text_content)
  757. idx = 0
  758. for p in listdir(dir_photo+name_hash):
  759. anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
  760. clip_duration = anchor_list[idx].info.duration
  761. anchor_list[idx].Open()
  762. anchor_clip_list[idx] = video_photo_clip(vid=anchor_list[idx],layer=4,scale_x=0.65,scale_y=0.65,
  763. location_x=0.35,location_y=0.25,position=main_timer, end=clip_duration,ck=ck_anchor,audio=False)
  764. t.AddClip(anchor_clip_list[idx])
  765. #insert image
  766. img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
  767. img_list[idx].Open()
  768. photo_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
  769. ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=main_timer,end=clip_duration,audio=False)
  770. t.AddClip(photo_clip_list[idx])
  771. img_list[idx].Close()
  772. #insert audio (speech)
  773. audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
  774. audio_list[idx].Open()
  775. audio_clip_list[idx] = openshot.Clip(audio_list[idx])
  776. audio_clip_list[idx].Position(main_timer)
  777. audio_clip_list[idx].End(clip_duration)
  778. t.AddClip(audio_clip_list[idx])
  779. #insert subtitle
  780. sub_img_list[idx] = openshot.QtImageReader(sub_list[idx])
  781. sub_img_list[idx].Open()
  782. sub_clip_list[idx] = video_photo_clip(vid=sub_img_list[idx], layer=6,location_x=0.069, location_y=0.89,position=main_timer,end=clip_duration)
  783. t.AddClip(sub_clip_list[idx])
  784. img_list[idx].Close()
  785. anchor_list[idx].Close()
  786. audio_list[idx].Close()
  787. sub_img_list[idx].Close()
  788. main_timer += clip_duration
  789. idx+=1
  790. LOGO_ED = openshot.FFmpegReader(dir_video+"ED_ENG.mp4")
  791. LOGO_ED.Open()
  792. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration+2
  793. ,location_x=0.005,location_y=-0.031
  794. ,scale_x=0.8,scale_y=0.6825)
  795. t.AddClip(LOGO_ED_clip)
  796. ED_duration = LOGO_ED.info.duration
  797. LOGO_ED.Close()
  798. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  799. bg.Open()
  800. bg_times = math.floor(main_timer+ED_duration/bg.info.duration)
  801. left_time = (main_timer+ED_duration) % bg.info.duration
  802. bg_clip_list = [None] * bg_times
  803. bg_list = [None] * bg_times
  804. bg.Close()
  805. bg_timer = head_duration
  806. for idx in range(bg_times):
  807. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  808. bg_list[idx].Open()
  809. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer
  810. ,end=bg_list[idx].info.duration,ck=ck)
  811. t.AddClip(bg_clip_list[idx])
  812. bg_timer += bg_list[idx].info.duration
  813. bg_list[idx].Close()
  814. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  815. bg_left.Open()
  816. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  817. t.AddClip(bg_left_clip)
  818. bg_left.Close()
  819. title = openshot.QtImageReader(dir_title+name_hash+".png")
  820. title.Open() # Open the reader
  821. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  822. t.AddClip(title_clip)
  823. ####start building
  824. w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
  825. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  826. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  827. openshot.Fraction(1, 1), False, False, 3000000)
  828. w.Open()
  829. #may change duration into t.info.duration
  830. frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
  831. for n in range(frames):
  832. f=t.GetFrame(n)
  833. w.WriteFrame(f)
  834. #notify_group(name+"(ENG)的影片已經產生完成囉! www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  835. t.Close()
  836. w.Close()
  837. print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  838. #line notifs
  839. import pyttsx3
  840. def make_speech(text):
  841. engine = pyttsx3.init()
  842. #voices = engine.getProperty('voices')
  843. engine.setProperty('voice', 'Mandarin')
  844. engine.save_to_file(text, '/app/speech.mp3')
  845. engine.runAndWait()
  846. class video_service(rpyc.Service):
  847. def exposed_call_video(self,name_hash,name,text_content, image_urls,multiLang,avatar):
  848. print('ML:'+str(multiLang))
  849. anchor_video_v2(name_hash,name,text_content, image_urls,multiLang,avatar)
  850. def exposed_call_video_eng(self,name_hash,name,text_content, image_urls,sub_titles,avatar):
  851. anchor_video_eng(name_hash,name,text_content, image_urls,sub_titles,avatar)
  852. def exposed_call_video_gen(self,name_hash,name,text_content, image_urls,multiLang,avatar):
  853. print('ML:'+str(multiLang))#this is long video version,
  854. video_gen(name_hash,name,text_content, image_urls,multiLang,avatar)
  855. def exposed_make_speech(self,text):
  856. make_speech(text)
  857. from rpyc.utils.server import ThreadedServer
  858. t = ThreadedServer(video_service, port=8858)
  859. print('service started')
  860. t.start()