openshot_video_generator.py 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974
  1. from os import listdir
  2. from os.path import isfile, isdir, join
  3. import openshot
  4. import threading
  5. import zhtts
  6. import os
  7. import urllib
  8. from typing import List
  9. import requests
  10. from pydantic import BaseModel
  11. from bs4 import BeautifulSoup
  12. from PIL import Image,ImageDraw,ImageFont
  13. import pyttsx3
  14. import rpyc
  15. import random
  16. import re
  17. import time
  18. import math
  19. import dataset
  20. from datetime import datetime
  21. from gtts import gTTS
  22. import ffmpy
  23. from difflib import SequenceMatcher
  24. import difflib
  25. from autosub import DEFAULT_CONCURRENCY
  26. from autosub import DEFAULT_SUBTITLE_FORMAT
  27. from pytranscriber.control.ctr_main import Ctr_Main
  28. from pytranscriber.control.ctr_autosub import Ctr_Autosub
  29. import multiprocessing
  30. from itertools import groupby
  31. from operator import itemgetter
  32. from util.parser import parser
  33. dir_sound = 'mp3_track/'
  34. dir_photo = 'photo/'
  35. dir_text = 'text_file/'
  36. dir_video = 'video_material/'
  37. dir_title = 'title/'
  38. dir_subtitle = 'subtitle/'
  39. dir_anchor = 'anchor_raw/'
  40. tmp_video_dir = 'tmp_video/'
  41. video_sub_folder = 'ai_anchor_video/'
  42. dir_list = [dir_sound,dir_photo,dir_text,dir_video,dir_title,dir_subtitle,dir_anchor,tmp_video_dir]
  43. def notify_group(msg):
  44. glist=['7vilzohcyQMPLfAMRloUawiTV4vtusZhxv8Czo7AJX8','WekCRfnAirSiSxALiD6gcm0B56EejsoK89zFbIaiZQD','1dbtJHbWVbrooXmQqc4r8OyRWDryjD4TMJ6DiDsdgsX','HOB1kVNgIb81tTB4Ort1BfhVp9GFo6NlToMQg88vEhh']
  45. for gid in glist:
  46. headers = {
  47. "Authorization": "Bearer " + gid,
  48. "Content-Type": "application/x-www-form-urlencoded"
  49. }
  50. params = {"message": msg}
  51. r = requests.post("https://notify-api.line.me/api/notify",headers=headers, params=params)
  52. def cKey(r,g,b,fuzz):
  53. col=openshot.Color()
  54. col.red=openshot.Keyframe(r)
  55. col.green=openshot.Keyframe(g)
  56. col.blue=openshot.Keyframe(b)
  57. return openshot.ChromaKey(col, openshot.Keyframe(fuzz))
  58. def video_photo_clip(vid=None,layer=None, position=None, end=None
  59. ,scale_x=1,scale_y=1,location_x=0,location_y=0,ck=None,audio=True):
  60. clip = openshot.Clip(vid)
  61. clip.Layer(layer)
  62. clip.Position(position)
  63. clip.End(end)
  64. clip.scale_x=openshot.Keyframe(scale_x)
  65. clip.scale_y=openshot.Keyframe(scale_y)
  66. clip.location_x=openshot.Keyframe(location_x)
  67. clip.location_y=openshot.Keyframe(location_y)
  68. if ck!=None:
  69. clip.AddEffect(ck)
  70. if audio==True:
  71. clip.has_audio=openshot.Keyframe(1)
  72. else:
  73. clip.has_audio=openshot.Keyframe(0)
  74. return clip
  75. def listener_progress(string, percent):
  76. True
  77. def myunichchar(unicode_char):
  78. mb_string = unicode_char.encode('big5')
  79. try:
  80. unicode_char = unichr(ord(mb_string[0]) << 8 | ord(mb_string[1]))
  81. except NameError:
  82. unicode_char = chr(mb_string[0] << 8 | mb_string[1])
  83. return unicode_char
  84. def get_url_type(url):
  85. req = urllib.request.Request(url, method='HEAD', headers={'User-Agent': 'Mozilla/5.0'})
  86. r = urllib.request.urlopen(req)
  87. contentType = r.getheader('Content-Type')
  88. return contentType
  89. def make_dir(name_hash):
  90. for direct in dir_list:
  91. if not os.path.isdir(direct):
  92. os.mkdir(direct)
  93. try:
  94. os.mkdir(dir_photo+name_hash)
  95. except FileExistsError:
  96. print("~~~~~~Warning~~~~~~~~~Directory " , dir_photo+name_hash , " already exists")
  97. try:
  98. os.mkdir(dir_text+name_hash)
  99. except FileExistsError:
  100. print("~~~~~~Warning~~~~~~~~~Directory " , dir_text+name_hash , " already exists")
  101. try:
  102. os.mkdir(dir_sound+name_hash)
  103. except FileExistsError:
  104. print("~~~~~~Warning~~~~~~~~~Directory " , dir_sound+name_hash , " already exists")
  105. try:
  106. os.mkdir(dir_anchor+name_hash)
  107. except FileExistsError:
  108. print("~~~~~~Warning~~~~~~~~~Directory " , dir_anchor+name_hash , " already exists")
  109. try:
  110. os.mkdir(dir_subtitle+name_hash)
  111. except FileExistsError:
  112. print("~~~~~~Warning~~~~~~~~~Directory " , dir_subtitle+name_hash , " already exists")
  113. def file_prepare(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  114. make_dir(name_hash)
  115. img_num = 1
  116. for imgu in image_urls:
  117. if get_url_type(imgu) =='video/mp4':
  118. r=requests.get(imgu)
  119. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  120. for chunk in r.iter_content(chunk_size=255):
  121. if chunk:
  122. f.write(chunk)
  123. f.close()
  124. else:
  125. im = Image.open(requests.get(imgu, stream=True).raw)
  126. im= im.convert("RGB")
  127. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  128. img_num+=1
  129. #save text
  130. txt_idx=0
  131. for txt in text_content:
  132. text_file = open(dir_text+name_hash+"/"+str(txt_idx)+".txt", "w")
  133. text_file.write(txt)
  134. text_file.close()
  135. txt_idx+=1
  136. print("text file made")
  137. #make mp3
  138. txt_idx = 0
  139. for txt in text_content:
  140. if lang!='zh' or multiLang==1:
  141. if lang!='zh':
  142. tts = gTTS(txt)
  143. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  144. else:
  145. tts = gTTS(txt,lang='zh-tw')
  146. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  147. #speed up
  148. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  149. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  150. ff.run()
  151. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  152. else:
  153. print('use zhtts')
  154. tts = zhtts.TTS()
  155. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  156. txt_idx+=1
  157. print("mp3 file made")
  158. #make title as image
  159. txt2image_title(name, dir_title+name_hash+".png",lang)
  160. def file_prepare_long(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  161. make_dir(name_hash)
  162. img_num = 1
  163. for imgu in image_urls:
  164. if get_url_type(imgu) =='video/mp4':
  165. r=requests.get(imgu)
  166. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  167. for chunk in r.iter_content(chunk_size=255):
  168. if chunk:
  169. f.write(chunk)
  170. f.close()
  171. else:
  172. im = Image.open(requests.get(imgu, stream=True).raw)
  173. im= im.convert("RGB")
  174. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  175. img_num+=1
  176. #make mp3
  177. text_parser = parser()
  178. txt_idx = 0
  179. for txt in text_content:
  180. rep_list = text_parser.replace_list(k)
  181. for reptxt in rep_list:
  182. txt = txt.replace(reptxt,'')
  183. if lang!='zh' or multiLang==1:
  184. if lang!='zh':
  185. tts = gTTS(txt)
  186. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  187. else:
  188. tts = gTTS(txt,lang='zh-tw')
  189. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  190. #speed up
  191. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  192. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  193. ff.run()
  194. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  195. else:
  196. print('use zhtts')
  197. tts = zhtts.TTS()
  198. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  199. txt_idx+=1
  200. print("mp3 file made")
  201. #make title as image
  202. txt2image_title(name, dir_title+name_hash+".png",lang)
  203. def txt2image(content, save_target,lang='zh'):
  204. unicode_text = trim_punctuation(content)
  205. font = ''
  206. if lang=='zh':
  207. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=38)
  208. else :
  209. font = ImageFont.truetype(font="font/arial.ttf", size=38)
  210. text_width, text_height = font.getsize(unicode_text)
  211. canvas = Image.new('RGBA', (700, 500), (255, 0, 0, 0) )
  212. draw = ImageDraw.Draw(canvas)
  213. text= unicode_text
  214. draw.text((5,5), text, (255, 255, 0), font)
  215. canvas.save(save_target, "PNG")
  216. def txt2image_title(content, save_target, lang='zh'):
  217. unicode_text = trim_punctuation(content)
  218. font = ''
  219. if lang=='zh':
  220. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=22)
  221. else :
  222. font = ImageFont.truetype(font="font/arial.ttf", size=22)
  223. text_width, text_height = font.getsize(unicode_text)
  224. canvas = Image.new('RGBA', (510, 500), (255, 0, 0, 0) )
  225. draw = ImageDraw.Draw(canvas)
  226. text= unicode_text
  227. draw.text((5,5), text, (17, 41, 167), font)
  228. canvas.save(save_target, "PNG")
  229. def call_anchor(fileName,avatar):
  230. conn = rpyc.classic.connect("192.168.1.105",18812)
  231. ros = conn.modules.os
  232. rsys = conn.modules.sys
  233. fr=open(dir_sound+fileName+".mp3",'rb')# voice
  234. #warning!!! file my be replaced by other process
  235. fw=conn.builtins.open('/tmp/output.mp3','wb')
  236. while True:
  237. b=fr.read(1024)
  238. if b:
  239. fw.write(b)
  240. else:
  241. break
  242. fr.close()
  243. fw.close()
  244. val=random.randint(1000000,9999999)
  245. ros.chdir('/home/jared/to_video')
  246. ros.system('./p'+str(avatar)+'.sh '+str(val)+' &')
  247. while True:
  248. print('waiting...')
  249. if ros.path.exists('/tmp/results/'+str(val)):
  250. break
  251. time.sleep(5)
  252. print('waiting...')
  253. fr=conn.builtins.open('/tmp/results/'+str(val)+'.mp4','rb')
  254. fw=open(dir_anchor+fileName+".mp4",'wb')
  255. while True:
  256. b=fr.read(1024)
  257. if b:
  258. fw.write(b)
  259. else:
  260. break
  261. fr.close()
  262. fw.close()
  263. def syllable_count(word):
  264. word = word.lower()
  265. count = 0
  266. vowels = "aeiouy"
  267. if word[0] in vowels:
  268. count += 1
  269. for index in range(1, len(word)):
  270. if word[index] in vowels and word[index - 1] not in vowels:
  271. count += 1
  272. if word.endswith("e"):
  273. count -= 1
  274. if count == 0:
  275. count += 1
  276. return count
  277. def split_sentence(in_str, maxLen):
  278. re.findall(r'[\u4e00-\u9fff]+', in_str)
  279. zh_idx = []
  280. eng_idx= []
  281. for i in range(len(in_str)):
  282. if in_str[i] > u'\u4e00' and in_str[i] < u'\u9fff':
  283. zh_idx.append(i)
  284. else:
  285. eng_idx.append(i)
  286. space_index = [m.start() for m in re.finditer(' ', in_str)]
  287. for idx in space_index:
  288. eng_idx.remove(idx)
  289. eng_range_list = []
  290. for k, g in groupby(enumerate(eng_idx), lambda ix : ix[0] - ix[1]):
  291. eng_range = list(map(itemgetter(1), g))
  292. eng_range_list.append(eng_range)
  293. total_syllable = 0
  294. for i in range(len(eng_range_list)):
  295. total_syllable += (syllable_count(in_str[eng_range_list[i][0]:eng_range_list[i][-1]+1])+0.5)
  296. for i in range(len(zh_idx)):
  297. total_syllable+=1
  298. #final chchchchchc[en][en][en]
  299. #[en] is a vocabulary dict with occurence of image
  300. zh_eng_idx_list = []
  301. i = 0
  302. while i < len(in_str):
  303. if in_str[i]==' ':
  304. i+=1
  305. if i in zh_idx:
  306. zh_eng_idx_list.append(i)
  307. i+=1
  308. if i in eng_idx:
  309. for ls in eng_range_list:
  310. if i in ls:
  311. zh_eng_idx_list.append(ls)
  312. i = ls[-1]+1
  313. break
  314. zh_eng_dict_list = [{'content':'','time_ratio':0}]
  315. idx = 0
  316. current_len = 0
  317. sen_idx = 0
  318. while idx < len(zh_eng_idx_list):
  319. str_from_idx = ''
  320. sylla_cnt = 1
  321. if type(zh_eng_idx_list[idx])==type([]):
  322. str_from_idx = in_str[zh_eng_idx_list[idx][0]:zh_eng_idx_list[idx][-1]+1]+' '
  323. sylla_cnt = syllable_count(str_from_idx)
  324. else:
  325. str_from_idx = in_str[zh_eng_idx_list[idx]]
  326. if len(zh_eng_dict_list[sen_idx]['content'])+sylla_cnt>=maxLen:
  327. zh_eng_dict_list[sen_idx]['time_ratio'] = current_len/total_syllable
  328. zh_eng_dict_list.append({'content':'','time_ratio':0})
  329. sen_idx+=1
  330. current_len = 0
  331. else:
  332. current_len += sylla_cnt
  333. zh_eng_dict_list[sen_idx]['content'] += str_from_idx
  334. idx+=1
  335. total_ratio = 0
  336. for obj in zh_eng_dict_list:
  337. total_ratio+=obj['time_ratio']
  338. zh_eng_dict_list[-1]['time_ratio'] = 1-total_ratio
  339. return zh_eng_dict_list
  340. def parse_script(file_path,gt_list):
  341. with open(file_path, 'r',encoding="utf-8") as f:
  342. raw_lines = [line.strip() for line in f]
  343. lines = adjustSub_by_text_similarity(gt_list,raw_lines)
  344. text_parser = parser()
  345. #make dict
  346. dict_list = []
  347. for idx in range(len(lines)):
  348. script={}
  349. rep_ls = text_parser.replace_list(lines[idx])
  350. line_content = lines[idx]
  351. for reptxt in rep_ls:
  352. line_content = line_content.replace(reptxt,'')
  353. if len(rep_ls)!=0:
  354. script['image_idx'] = int(rep_ls[0].replace('{','').replace('}',''))
  355. script['content'] = line_content
  356. time_raw = raw_lines[idx * 4 +1 ].split(' --> ')
  357. start = time_raw[0].split(':')
  358. stop = time_raw[1].split(':')
  359. script['start'] = float(start[0])*3600 + float(start[1])*60 + float(start[2].replace(',','.'))
  360. script['stop'] = float(stop[0])*3600 + float(stop[1])*60 + float(stop[2].replace(',','.'))
  361. dict_list.append(script)
  362. #merge duplicated sentences
  363. script_not_dup_list = []
  364. for idx in range(len(dict_list)):
  365. dup_list = []
  366. for idx_inner in range(len(dict_list)):
  367. if dict_list[idx_inner]['content']==dict_list[idx]['content']:
  368. dup_list.append(idx_inner)
  369. for dup_idx in dup_list:
  370. if dup_idx == min(dup_list):
  371. dict_list[dup_idx]['type'] = 'lead_sentence'
  372. else:
  373. dict_list[dup_idx]['type'] = 'duplicated'
  374. dict_list[dup_list[0]]['stop'] = dict_list[dup_list[-1]]['stop']
  375. if dict_list[idx]['type'] == 'lead_sentence':
  376. script_not_dup_list.append(dict_list[idx])
  377. #avoid subtitle overlapping ? Timeline overlapping not found currently
  378. #cut by max length----> eng seperated problem {eng_idx}
  379. #ENG counts, zh counts, space counts
  380. new_idx = 0
  381. splitted_dict = []
  382. for dic in script_not_dup_list:
  383. dic_idx = 0
  384. accumulated_duration = 0
  385. duration = dic['stop']-dic['start']
  386. for sub_dic in split_sentence(dic['content'],13):
  387. new_dic = {}
  388. new_dic['index'] = new_idx
  389. if 'image_idx' in dic:
  390. new_dic['image_obj'] = {'start':dic['start'],'idx':dic['image_idx']}
  391. new_idx+=1
  392. ind_duration = duration * sub_dic['time_ratio']
  393. new_dic['start'] = dic['start'] + accumulated_duration
  394. accumulated_duration += ind_duration
  395. new_dic['content'] = sub_dic['content']
  396. new_dic['duration'] = ind_duration*0.7
  397. splitted_dict.append(new_dic)
  398. return splitted_dict
  399. def adjustSub_by_text_similarity(gts_in,gens_raw):
  400. #call by value only
  401. gts = gts_in[:]
  402. text_parser = parser()
  403. for i in range(len(gts)):
  404. rep_ls = text_parser.replace_list(gts[i])
  405. for reptxt in rep_ls:
  406. gts[i] = gts[i].replace(reptxt)
  407. print(gts)
  408. gens = []
  409. for idx in range(int((len(gens_raw)+1)/4)):
  410. gens.append(gens_raw[idx*4+2])
  411. combine2 = [''.join([i,j]) for i,j in zip(gts, gts[1:])]
  412. combine3 = [''.join([i,j,k]) for i,j,k in zip(gts, gts[1:], gts[2:])]
  413. alls = gts + combine2 + combine3
  414. adjusted = [None]*len(gens)
  415. duplicated_list = []
  416. for idx in range(len(gens)):
  417. match_text = difflib.get_close_matches(gens[idx], alls, cutoff=0.1)
  418. if match_text[0] in duplicated_list:
  419. for mt in match_text:
  420. if mt == adjusted[idx-1] or mt not in duplicated_list:
  421. adjusted[idx] = mt
  422. break
  423. else:
  424. adjusted[idx] = match_text[0]
  425. duplicated_list.append(match_text[0])
  426. combine2_tag = [''.join([i,j]) for i,j in zip(gts_in, gts_in[1:])]
  427. combine3_tag = [''.join([i,j,k]) for i,j,k in zip(gts_in, gts_in[1:], gts_in[2:])]
  428. alls_tag = gts_in + combine2_tag + combine3_tag
  429. for idx in range(len(adjusted)):
  430. match_text = difflib.get_close_matches(adjusted[idx], alls_tag, cutoff=0.1)
  431. adjusted[idx] = match_text
  432. return adjusted
  433. def trim_punctuation(s):
  434. pat_block = u'[^\u4e00-\u9fff0-9a-zA-Z]+';
  435. pattern = u'([0-9]+{0}[0-9]+)|{0}'.format(pat_block)
  436. res = re.sub(pattern, lambda x: x.group(1) if x.group(1) else u" " ,s)
  437. return res
  438. def splitter(s):
  439. for sent in re.findall(u'[^!?,。\!\?]+[!? 。\!\?]?', s, flags=re.U):
  440. yield sent
  441. def split_by_pun(s):
  442. res = list(splitter(s))
  443. return res
  444. def generate_subtitle_image_from_dict(name_hash, sub_dict):
  445. for script in sub_dict:
  446. sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
  447. sub = script['content']
  448. txt2image(sub,sv_path)
  449. def generate_subtitle_image(name_hash,text_content):
  450. img_list = [None]*len(text_content)
  451. for idx in range(len(text_content)):
  452. img_list[idx]=[]
  453. senList = split_by_pun(text_content[idx])
  454. for inner_idx in range(len(senList)):
  455. sv_path = dir_subtitle + name_hash +'/'+str(idx)+ str(inner_idx) +'.png'
  456. sub = senList[inner_idx]
  457. txt2image(sub,sv_path)
  458. img_list[idx]+=[{"count":len(sub),"path":sv_path}]
  459. return img_list
  460. def generate_subtitle_image_ENG(name_hash,text_content):
  461. img_list = [None]*len(text_content)
  462. for idx in range(len(text_content)):
  463. sv_path = dir_subtitle + name_hash +'/'+str(idx)+'.png'
  464. sub = text_content[idx]
  465. txt2image(sub, sv_path,lang='eng')
  466. img_list[idx] = sv_path
  467. return img_list
  468. def video_writer_init(path):
  469. w = openshot.FFmpegWriter(path)
  470. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  471. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  472. openshot.Fraction(1, 1), False, False, 3000000)
  473. return w
  474. def video_gen(name_hash,name,text_content, image_urls,multiLang,avatar):
  475. file_prepare_long(name, name_hash, text_content,image_urls,multiLang)
  476. for fname in range(len(text_content)):
  477. call_anchor(name_hash+"/"+str(fname),avatar)
  478. print('called............................................')
  479. ck=cKey(0,254,0,270)
  480. ck_anchor=cKey(0,255,1,320)
  481. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  482. t.Open()
  483. main_timer = 0
  484. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  485. LOGO_OP.Open() # Open the reader
  486. head_duration = LOGO_OP.info.duration
  487. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=head_duration
  488. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  489. t.AddClip(LOGO_OP_clip)
  490. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  491. bg_head.Open()
  492. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  493. t.AddClip(bg_head_clip)
  494. main_timer += head_duration
  495. bg_head.Close()
  496. LOGO_OP.Close()
  497. anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
  498. anchor.Open()
  499. #anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
  500. # location_x=0.35,location_y=0.25,position=main_timer, end=anchor.info.duration,ck=ck_anchor,audio=False)
  501. #t.AddClip(anchor_clip)
  502. speech = openshot.FFmpegReader(dir_sound+name_hash+"/0.mp3")
  503. speech.Open()
  504. speech_clip = openshot.Clip(speech)
  505. speech_clip.Position(main_timer)
  506. speech_clip.End(anchor.info.duration)
  507. t.AddClip(speech_clip)
  508. main_timer += anchor.info.duration
  509. anchor.Close()
  510. speech.Close()
  511. LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
  512. LOGO_ED.Open()
  513. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration
  514. ,location_x=0.005,location_y=-0.031, scale_x=0.8,scale_y=0.6825)
  515. t.AddClip(LOGO_ED_clip)
  516. main_timer += LOGO_ED.info.duration
  517. LOGO_ED.Close()
  518. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  519. bg.Open()
  520. bg_times = math.floor(main_timer/bg.info.duration)
  521. left_time = (main_timer) % bg.info.duration
  522. bg_clip_list = [None] * bg_times
  523. bg_list = [None] * bg_times
  524. bg.Close()
  525. bg_timer = head_duration
  526. for idx in range(bg_times):
  527. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  528. bg_list[idx].Open()
  529. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer,end=bg_list[idx].info.duration,ck=ck)
  530. t.AddClip(bg_clip_list[idx])
  531. bg_timer += bg_list[idx].info.duration
  532. bg_list[idx].Close()
  533. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  534. bg_left.Open()
  535. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  536. t.AddClip(bg_left_clip)
  537. bg_left.Close()
  538. title = openshot.QtImageReader(dir_title+name_hash+".png")
  539. title.Open() # Open the reader
  540. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  541. t.AddClip(title_clip)
  542. w = video_writer_init(tmp_video_dir+name_hash+"raw.mp4")
  543. w.Open()
  544. frames = int(t.info.fps)*int(main_timer)
  545. for n in range(frames):
  546. f=t.GetFrame(n)
  547. w.WriteFrame(f)
  548. t.Close()
  549. w.Close()
  550. print(name+"RAW DONE : www.choozmo.com:8168/"+tmp_video_dir+name_hash+"raw.mp4")
  551. #start adding sub
  552. #add sub
  553. Ctr_Autosub.init()
  554. Ctr_Autosub.generate_subtitles(tmp_video_dir+name_hash+"raw.mp4",'zh',listener_progress,output=tmp_video_dir+name_hash+"script.txt",concurrency=DEFAULT_CONCURRENCY,subtitle_file_format=DEFAULT_SUBTITLE_FORMAT)
  555. sub_dict = parse_script(tmp_video_dir+name_hash+"script.txt",split_by_pun(text_content[0]))
  556. for subd in sub_dict:
  557. print(subd)
  558. generate_subtitle_image_from_dict(name_hash, sub_dict)
  559. #sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
  560. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  561. t.Open()
  562. raw = openshot.FFmpegReader(tmp_video_dir+name_hash+"raw.mp4")
  563. raw.Open()
  564. raw_clip = video_photo_clip(vid=raw,layer=2,position=0, end=raw.info.duration)
  565. t.AddClip(raw_clip)
  566. sub_img_list = [None] * len(sub_dict)
  567. sub_clip_list = [None] * len(sub_dict)
  568. for sub_obj in sub_dict:
  569. idx = int(sub_obj['index'])
  570. sub_img_list[idx] = openshot.QtImageReader(dir_subtitle + name_hash + '/' + str(idx)+'.png')
  571. sub_img_list[idx].Open()
  572. sub_clip_list[idx] = video_photo_clip(vid=sub_img_list[idx], layer=6,location_x=0.069, location_y=0.89,position=sub_obj['start'],end=math.ceil(sub_obj['duration']))
  573. t.AddClip(sub_clip_list[idx])
  574. sub_img_list[idx].Close()
  575. anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
  576. anchor.Open()
  577. anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
  578. location_x=0.35,location_y=0.25,position=head_duration, end=anchor.info.duration,ck=ck_anchor,audio=False)
  579. t.AddClip(anchor_clip)
  580. w = video_writer_init(tmp_video_dir+name_hash+".mp4")
  581. w.Open()
  582. frames = int(t.info.fps)*int(main_timer)
  583. for n in range(frames):
  584. f=t.GetFrame(n)
  585. w.WriteFrame(f)
  586. t.Close()
  587. w.Close()
  588. os.remove(tmp_video_dir+name_hash+"raw.mp4")
  589. os.remove(tmp_video_dir+name_hash+"script.txt")
  590. print(name+"ALL DONE : www.choozmo.com:8168/"+video_sub_folder+name_hash+"raw.mp4")
  591. def anchor_video_v2(name_hash,name,text_content, image_urls,multiLang,avatar):
  592. print(os.getcwd())
  593. print('sub image made')
  594. print(multiLang)
  595. file_prepare(name, name_hash, text_content,image_urls,multiLang)
  596. sub_list=generate_subtitle_image(name_hash,text_content)
  597. for fname in range(len(text_content)):
  598. call_anchor(name_hash+"/"+str(fname),avatar)
  599. print('step finish')
  600. print('called............................................')
  601. ck=cKey(0,254,0,270)
  602. ck_anchor=cKey(0,255,1,320)
  603. duration = 0
  604. #average layer level is 3
  605. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  606. t.Open()
  607. main_timer = 0
  608. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  609. LOGO_OP.Open() # Open the reader
  610. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=LOGO_OP.info.duration
  611. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  612. t.AddClip(LOGO_OP_clip)
  613. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  614. bg_head.Open()
  615. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  616. t.AddClip(bg_head_clip)
  617. main_timer += LOGO_OP.info.duration
  618. head_duration = LOGO_OP.info.duration
  619. bg_head.Close()
  620. LOGO_OP.Close()
  621. clip_duration=0
  622. photo_clip_list = [None]*len(text_content)
  623. img_list = [None]*len(text_content)
  624. anchor_clip_list = [None] * len(text_content)
  625. anchor_list = [None] * len(text_content)
  626. audio_clip_list = [None] * len(text_content)
  627. audio_list = [None] * len(text_content)
  628. sub_clip_list = [None] * len(text_content)
  629. sub_img_list = [None] * len(text_content)
  630. idx = 0
  631. for p in listdir(dir_photo+name_hash):
  632. anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
  633. clip_duration = anchor_list[idx].info.duration
  634. anchor_list[idx].Open()
  635. anchor_clip_list[idx] = video_photo_clip(vid=anchor_list[idx],layer=4,scale_x=0.65,scale_y=0.65,
  636. location_x=0.35,location_y=0.25,position=main_timer, end=clip_duration,ck=ck_anchor,audio=False)
  637. t.AddClip(anchor_clip_list[idx])
  638. img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
  639. img_list[idx].Open()
  640. photo_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
  641. ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=main_timer,end=clip_duration,audio=False)
  642. t.AddClip(photo_clip_list[idx])
  643. img_list[idx].Close()
  644. audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
  645. audio_list[idx].Open()
  646. audio_clip_list[idx] = openshot.Clip(audio_list[idx])
  647. audio_clip_list[idx].Position(main_timer)
  648. audio_clip_list[idx].End(clip_duration)
  649. t.AddClip(audio_clip_list[idx])
  650. img_list[idx].Close()
  651. anchor_list[idx].Close()
  652. audio_list[idx].Close()
  653. sub_img_list[idx] = [None] * len(sub_list[idx])
  654. sub_clip_list[idx] = [None] * len(sub_list[idx])
  655. sub_timer = 0
  656. for sub_idx in range(len(sub_list[idx])):
  657. sub_img_list[idx][sub_idx] = openshot.QtImageReader(sub_list[idx][sub_idx]['path'])
  658. sub_img_list[idx][sub_idx].Open()
  659. sub_duration = 0.205*sub_list[idx][sub_idx]['count']
  660. sub_clip_list[idx][sub_idx] = video_photo_clip(vid=sub_img_list[idx][sub_idx], layer=6,location_x=0.069, location_y=0.89,position=main_timer+sub_timer,end=sub_duration)
  661. t.AddClip(sub_clip_list[idx][sub_idx])
  662. sub_img_list[idx][sub_idx].Close()
  663. sub_timer += sub_duration
  664. print(sub_list[idx][sub_idx]['path'])
  665. main_timer += clip_duration
  666. idx+=1
  667. LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
  668. LOGO_ED.Open()
  669. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration+2
  670. ,location_x=0.005,location_y=-0.031
  671. ,scale_x=0.8,scale_y=0.6825)
  672. t.AddClip(LOGO_ED_clip)
  673. ED_duration = LOGO_ED.info.duration
  674. LOGO_ED.Close()
  675. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  676. bg.Open()
  677. bg_times = math.floor(main_timer+ED_duration/bg.info.duration)
  678. left_time = (main_timer+ED_duration) % bg.info.duration
  679. bg_clip_list = [None] * bg_times
  680. bg_list = [None] * bg_times
  681. bg.Close()
  682. bg_timer = head_duration
  683. for idx in range(bg_times):
  684. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  685. bg_list[idx].Open()
  686. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer
  687. ,end=bg_list[idx].info.duration,ck=ck)
  688. t.AddClip(bg_clip_list[idx])
  689. bg_timer += bg_list[idx].info.duration
  690. bg_list[idx].Close()
  691. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  692. bg_left.Open()
  693. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  694. t.AddClip(bg_left_clip)
  695. bg_left.Close()
  696. title = openshot.QtImageReader(dir_title+name_hash+".png")
  697. title.Open() # Open the reader
  698. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  699. t.AddClip(title_clip)
  700. ####start building
  701. w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
  702. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  703. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  704. openshot.Fraction(1, 1), False, False, 3000000)
  705. w.Open()
  706. #may change duration into t.info.duration
  707. frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
  708. for n in range(frames):
  709. f=t.GetFrame(n)
  710. w.WriteFrame(f)
  711. #notify_group(name+"的影片已經產生完成囉! www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  712. t.Close()
  713. w.Close()
  714. print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  715. def anchor_video_eng(name_hash,name,text_content, image_urls,sub_titles,avatar):
  716. file_prepare(name, name_hash, text_content,image_urls,'eng')
  717. sub_list=generate_subtitle_image_ENG(name_hash,sub_titles)
  718. for fname in range(len(text_content)):
  719. call_anchor(name_hash+"/"+str(fname),avatar)
  720. print('step finish')
  721. print('called............................................')
  722. ck=cKey(0,254,0,270)
  723. ck_anchor=cKey(0,255,1,320)
  724. duration = 0
  725. #average layer level is 3
  726. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  727. t.Open()
  728. main_timer = 0
  729. #add logo
  730. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  731. LOGO_OP.Open() # Open the reader
  732. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=LOGO_OP.info.duration
  733. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  734. t.AddClip(LOGO_OP_clip)
  735. #add background video (head is different)
  736. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  737. bg_head.Open()
  738. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  739. t.AddClip(bg_head_clip)
  740. main_timer += LOGO_OP.info.duration
  741. head_duration = LOGO_OP.info.duration
  742. bg_head.Close()
  743. LOGO_OP.Close()
  744. #prepare empty list
  745. clip_duration=0
  746. photo_clip_list = [None]*len(text_content)
  747. img_list = [None]*len(text_content)
  748. anchor_clip_list = [None] * len(text_content)
  749. anchor_list = [None] * len(text_content)
  750. audio_clip_list = [None] * len(text_content)
  751. audio_list = [None] * len(text_content)
  752. sub_clip_list = [None] * len(text_content)
  753. #openshot image holder
  754. sub_img_list = [None] * len(text_content)
  755. idx = 0
  756. for p in listdir(dir_photo+name_hash):
  757. anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
  758. clip_duration = anchor_list[idx].info.duration
  759. anchor_list[idx].Open()
  760. anchor_clip_list[idx] = video_photo_clip(vid=anchor_list[idx],layer=4,scale_x=0.65,scale_y=0.65,
  761. location_x=0.35,location_y=0.25,position=main_timer, end=clip_duration,ck=ck_anchor,audio=False)
  762. t.AddClip(anchor_clip_list[idx])
  763. #insert image
  764. img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
  765. img_list[idx].Open()
  766. photo_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
  767. ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=main_timer,end=clip_duration,audio=False)
  768. t.AddClip(photo_clip_list[idx])
  769. img_list[idx].Close()
  770. #insert audio (speech)
  771. audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
  772. audio_list[idx].Open()
  773. audio_clip_list[idx] = openshot.Clip(audio_list[idx])
  774. audio_clip_list[idx].Position(main_timer)
  775. audio_clip_list[idx].End(clip_duration)
  776. t.AddClip(audio_clip_list[idx])
  777. #insert subtitle
  778. sub_img_list[idx] = openshot.QtImageReader(sub_list[idx])
  779. sub_img_list[idx].Open()
  780. sub_clip_list[idx] = video_photo_clip(vid=sub_img_list[idx], layer=6,location_x=0.069, location_y=0.89,position=main_timer,end=clip_duration)
  781. t.AddClip(sub_clip_list[idx])
  782. img_list[idx].Close()
  783. anchor_list[idx].Close()
  784. audio_list[idx].Close()
  785. sub_img_list[idx].Close()
  786. main_timer += clip_duration
  787. idx+=1
  788. LOGO_ED = openshot.FFmpegReader(dir_video+"ED_ENG.mp4")
  789. LOGO_ED.Open()
  790. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration+2
  791. ,location_x=0.005,location_y=-0.031
  792. ,scale_x=0.8,scale_y=0.6825)
  793. t.AddClip(LOGO_ED_clip)
  794. ED_duration = LOGO_ED.info.duration
  795. LOGO_ED.Close()
  796. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  797. bg.Open()
  798. bg_times = math.floor(main_timer+ED_duration/bg.info.duration)
  799. left_time = (main_timer+ED_duration) % bg.info.duration
  800. bg_clip_list = [None] * bg_times
  801. bg_list = [None] * bg_times
  802. bg.Close()
  803. bg_timer = head_duration
  804. for idx in range(bg_times):
  805. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  806. bg_list[idx].Open()
  807. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer
  808. ,end=bg_list[idx].info.duration,ck=ck)
  809. t.AddClip(bg_clip_list[idx])
  810. bg_timer += bg_list[idx].info.duration
  811. bg_list[idx].Close()
  812. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  813. bg_left.Open()
  814. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  815. t.AddClip(bg_left_clip)
  816. bg_left.Close()
  817. title = openshot.QtImageReader(dir_title+name_hash+".png")
  818. title.Open() # Open the reader
  819. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  820. t.AddClip(title_clip)
  821. ####start building
  822. w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
  823. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  824. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  825. openshot.Fraction(1, 1), False, False, 3000000)
  826. w.Open()
  827. #may change duration into t.info.duration
  828. frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
  829. for n in range(frames):
  830. f=t.GetFrame(n)
  831. w.WriteFrame(f)
  832. #notify_group(name+"(ENG)的影片已經產生完成囉! www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  833. t.Close()
  834. w.Close()
  835. print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  836. #line notifs
  837. import pyttsx3
  838. def make_speech(text):
  839. engine = pyttsx3.init()
  840. #voices = engine.getProperty('voices')
  841. engine.setProperty('voice', 'Mandarin')
  842. engine.save_to_file(text, '/app/speech.mp3')
  843. engine.runAndWait()
  844. class video_service(rpyc.Service):
  845. def exposed_call_video(self,name_hash,name,text_content, image_urls,multiLang,avatar):
  846. print('ML:'+str(multiLang))
  847. anchor_video_v2(name_hash,name,text_content, image_urls,multiLang,avatar)
  848. def exposed_call_video_eng(self,name_hash,name,text_content, image_urls,sub_titles,avatar):
  849. anchor_video_eng(name_hash,name,text_content, image_urls,sub_titles,avatar)
  850. def exposed_call_video_gen(self,name_hash,name,text_content, image_urls,multiLang,avatar):
  851. print('ML:'+str(multiLang))#this is long video version,
  852. video_gen(name_hash,name,text_content, image_urls,multiLang,avatar)
  853. def exposed_make_speech(self,text):
  854. make_speech(text)
  855. from rpyc.utils.server import ThreadedServer
# Module entry point: build a threaded RPyC server for video_service on
# port 8858 and start it. The 'service started' message is printed before
# start() is called, so it marks that the server object was created, not that
# a client has connected.
# NOTE(review): start() presumably blocks while serving; confirm against rpyc docs.
t = ThreadedServer(video_service, port=8858)
print('service started')
t.start()