openshot_video_generator.py 36 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975
  1. from os import listdir
  2. from os.path import isfile, isdir, join
  3. import openshot
  4. import threading
  5. import zhtts
  6. import os
  7. import urllib
  8. from typing import List
  9. import requests
  10. from pydantic import BaseModel
  11. from bs4 import BeautifulSoup
  12. from PIL import Image,ImageDraw,ImageFont
  13. import pyttsx3
  14. import rpyc
  15. import random
  16. import re
  17. import time
  18. import math
  19. import dataset
  20. from datetime import datetime
  21. from gtts import gTTS
  22. import ffmpy
  23. from difflib import SequenceMatcher
  24. import difflib
  25. from autosub import DEFAULT_CONCURRENCY
  26. from autosub import DEFAULT_SUBTITLE_FORMAT
  27. from pytranscriber.control.ctr_main import Ctr_Main
  28. from pytranscriber.control.ctr_autosub import Ctr_Autosub
  29. import multiprocessing
  30. from itertools import groupby
  31. from operator import itemgetter
  32. from util.parser import parser
  33. dir_sound = 'mp3_track/'
  34. dir_photo = 'photo/'
  35. dir_text = 'text_file/'
  36. dir_video = 'video_material/'
  37. dir_title = 'title/'
  38. dir_subtitle = 'subtitle/'
  39. dir_anchor = 'anchor_raw/'
  40. tmp_video_dir = 'tmp_video/'
  41. video_sub_folder = 'ai_anchor_video/'
  42. dir_list = [dir_sound,dir_photo,dir_text,dir_video,dir_title,dir_subtitle,dir_anchor,tmp_video_dir]
  43. def notify_group(msg):
  44. glist=['7vilzohcyQMPLfAMRloUawiTV4vtusZhxv8Czo7AJX8','WekCRfnAirSiSxALiD6gcm0B56EejsoK89zFbIaiZQD','1dbtJHbWVbrooXmQqc4r8OyRWDryjD4TMJ6DiDsdgsX','HOB1kVNgIb81tTB4Ort1BfhVp9GFo6NlToMQg88vEhh']
  45. for gid in glist:
  46. headers = {
  47. "Authorization": "Bearer " + gid,
  48. "Content-Type": "application/x-www-form-urlencoded"
  49. }
  50. params = {"message": msg}
  51. r = requests.post("https://notify-api.line.me/api/notify",headers=headers, params=params)
  52. def cKey(r,g,b,fuzz):
  53. col=openshot.Color()
  54. col.red=openshot.Keyframe(r)
  55. col.green=openshot.Keyframe(g)
  56. col.blue=openshot.Keyframe(b)
  57. return openshot.ChromaKey(col, openshot.Keyframe(fuzz))
  58. def video_photo_clip(vid=None,layer=None, position=None, end=None
  59. ,scale_x=1,scale_y=1,location_x=0,location_y=0,ck=None,audio=True):
  60. clip = openshot.Clip(vid)
  61. clip.Layer(layer)
  62. clip.Position(position)
  63. clip.End(end)
  64. clip.scale_x=openshot.Keyframe(scale_x)
  65. clip.scale_y=openshot.Keyframe(scale_y)
  66. clip.location_x=openshot.Keyframe(location_x)
  67. clip.location_y=openshot.Keyframe(location_y)
  68. if ck!=None:
  69. clip.AddEffect(ck)
  70. if audio==True:
  71. clip.has_audio=openshot.Keyframe(1)
  72. else:
  73. clip.has_audio=openshot.Keyframe(0)
  74. return clip
  75. def listener_progress(string, percent):
  76. True
  77. def myunichchar(unicode_char):
  78. mb_string = unicode_char.encode('big5')
  79. try:
  80. unicode_char = unichr(ord(mb_string[0]) << 8 | ord(mb_string[1]))
  81. except NameError:
  82. unicode_char = chr(mb_string[0] << 8 | mb_string[1])
  83. return unicode_char
  84. def get_url_type(url):
  85. req = urllib.request.Request(url, method='HEAD', headers={'User-Agent': 'Mozilla/5.0'})
  86. r = urllib.request.urlopen(req)
  87. contentType = r.getheader('Content-Type')
  88. return contentType
  89. def make_dir(name_hash):
  90. for direct in dir_list:
  91. if not os.path.isdir(direct):
  92. os.mkdir(direct)
  93. try:
  94. os.mkdir(dir_photo+name_hash)
  95. except FileExistsError:
  96. print("~~~~~~Warning~~~~~~~~~Directory " , dir_photo+name_hash , " already exists")
  97. try:
  98. os.mkdir(dir_text+name_hash)
  99. except FileExistsError:
  100. print("~~~~~~Warning~~~~~~~~~Directory " , dir_text+name_hash , " already exists")
  101. try:
  102. os.mkdir(dir_sound+name_hash)
  103. except FileExistsError:
  104. print("~~~~~~Warning~~~~~~~~~Directory " , dir_sound+name_hash , " already exists")
  105. try:
  106. os.mkdir(dir_anchor+name_hash)
  107. except FileExistsError:
  108. print("~~~~~~Warning~~~~~~~~~Directory " , dir_anchor+name_hash , " already exists")
  109. try:
  110. os.mkdir(dir_subtitle+name_hash)
  111. except FileExistsError:
  112. print("~~~~~~Warning~~~~~~~~~Directory " , dir_subtitle+name_hash , " already exists")
  113. def file_prepare(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  114. make_dir(name_hash)
  115. img_num = 1
  116. for imgu in image_urls:
  117. if get_url_type(imgu) =='video/mp4':
  118. r=requests.get(imgu)
  119. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  120. for chunk in r.iter_content(chunk_size=255):
  121. if chunk:
  122. f.write(chunk)
  123. f.close()
  124. else:
  125. im = Image.open(requests.get(imgu, stream=True).raw)
  126. im= im.convert("RGB")
  127. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  128. img_num+=1
  129. #save text
  130. txt_idx=0
  131. for txt in text_content:
  132. text_file = open(dir_text+name_hash+"/"+str(txt_idx)+".txt", "w")
  133. text_file.write(txt)
  134. text_file.close()
  135. txt_idx+=1
  136. print("text file made")
  137. #make mp3
  138. txt_idx = 0
  139. for txt in text_content:
  140. if lang!='zh' or multiLang==1:
  141. if lang!='zh':
  142. tts = gTTS(txt)
  143. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  144. else:
  145. tts = gTTS(txt,lang='zh-tw')
  146. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  147. #speed up
  148. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  149. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  150. ff.run()
  151. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  152. else:
  153. print('use zhtts')
  154. tts = zhtts.TTS()
  155. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  156. txt_idx+=1
  157. print("mp3 file made")
  158. #make title as image
  159. txt2image_title(name, dir_title+name_hash+".png",lang)
  160. def file_prepare_long(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  161. make_dir(name_hash)
  162. img_num = 1
  163. for imgu in image_urls:
  164. if get_url_type(imgu) =='video/mp4':
  165. r=requests.get(imgu)
  166. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  167. for chunk in r.iter_content(chunk_size=255):
  168. if chunk:
  169. f.write(chunk)
  170. f.close()
  171. else:
  172. im = Image.open(requests.get(imgu, stream=True).raw)
  173. im= im.convert("RGB")
  174. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  175. img_num+=1
  176. #make mp3
  177. text_parser = parser()
  178. txt_idx = 0
  179. for txt in text_content:
  180. rep_list = text_parser.replace_list(txt)
  181. for reptxt in rep_list:
  182. txt = txt.replace(reptxt,'')
  183. if lang!='zh' or multiLang==1:
  184. if lang!='zh':
  185. tts = gTTS(txt)
  186. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  187. else:
  188. tts = gTTS(txt,lang='zh-tw')
  189. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  190. #speed up
  191. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  192. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  193. ff.run()
  194. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  195. else:
  196. print('use zhtts')
  197. tts = zhtts.TTS()
  198. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  199. txt_idx+=1
  200. print("mp3 file made")
  201. #make title as image
  202. txt2image_title(name, dir_title+name_hash+".png",lang)
  203. def txt2image(content, save_target,lang='zh'):
  204. unicode_text = trim_punctuation(content)
  205. font = ''
  206. if lang=='zh':
  207. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=38)
  208. else :
  209. font = ImageFont.truetype(font="font/arial.ttf", size=38)
  210. text_width, text_height = font.getsize(unicode_text)
  211. canvas = Image.new('RGBA', (700, 500), (255, 0, 0, 0) )
  212. draw = ImageDraw.Draw(canvas)
  213. text= unicode_text
  214. draw.text((5,5), text, (255, 255, 0), font)
  215. canvas.save(save_target, "PNG")
  216. def txt2image_title(content, save_target, lang='zh'):
  217. unicode_text = trim_punctuation(content)
  218. font = ''
  219. if lang=='zh':
  220. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=22)
  221. else :
  222. font = ImageFont.truetype(font="font/arial.ttf", size=22)
  223. text_width, text_height = font.getsize(unicode_text)
  224. canvas = Image.new('RGBA', (510, 500), (255, 0, 0, 0) )
  225. draw = ImageDraw.Draw(canvas)
  226. text= unicode_text
  227. draw.text((5,5), text, (17, 41, 167), font)
  228. canvas.save(save_target, "PNG")
  229. def call_anchor(fileName,avatar):
  230. conn = rpyc.classic.connect("192.168.1.105",18812)
  231. ros = conn.modules.os
  232. rsys = conn.modules.sys
  233. fr=open(dir_sound+fileName+".mp3",'rb')# voice
  234. #warning!!! file my be replaced by other process
  235. fw=conn.builtins.open('/tmp/output.mp3','wb')
  236. while True:
  237. b=fr.read(1024)
  238. if b:
  239. fw.write(b)
  240. else:
  241. break
  242. fr.close()
  243. fw.close()
  244. val=random.randint(1000000,9999999)
  245. ros.chdir('/home/jared/to_video')
  246. ros.system('./p'+str(avatar)+'.sh '+str(val)+' &')
  247. while True:
  248. print('waiting...')
  249. if ros.path.exists('/tmp/results/'+str(val)):
  250. break
  251. time.sleep(5)
  252. print('waiting...')
  253. fr=conn.builtins.open('/tmp/results/'+str(val)+'.mp4','rb')
  254. fw=open(dir_anchor+fileName+".mp4",'wb')
  255. while True:
  256. b=fr.read(1024)
  257. if b:
  258. fw.write(b)
  259. else:
  260. break
  261. fr.close()
  262. fw.close()
  263. def syllable_count(word):
  264. word = word.lower()
  265. count = 0
  266. vowels = "aeiouy"
  267. if word[0] in vowels:
  268. count += 1
  269. for index in range(1, len(word)):
  270. if word[index] in vowels and word[index - 1] not in vowels:
  271. count += 1
  272. if word.endswith("e"):
  273. count -= 1
  274. if count == 0:
  275. count += 1
  276. return count
  277. def split_sentence(in_str, maxLen):
  278. re.findall(r'[\u4e00-\u9fff]+', in_str)
  279. zh_idx = []
  280. eng_idx= []
  281. for i in range(len(in_str)):
  282. if in_str[i] > u'\u4e00' and in_str[i] < u'\u9fff':
  283. zh_idx.append(i)
  284. else:
  285. eng_idx.append(i)
  286. space_index = [m.start() for m in re.finditer(' ', in_str)]
  287. for idx in space_index:
  288. eng_idx.remove(idx)
  289. eng_range_list = []
  290. for k, g in groupby(enumerate(eng_idx), lambda ix : ix[0] - ix[1]):
  291. eng_range = list(map(itemgetter(1), g))
  292. eng_range_list.append(eng_range)
  293. total_syllable = 0
  294. for i in range(len(eng_range_list)):
  295. total_syllable += (syllable_count(in_str[eng_range_list[i][0]:eng_range_list[i][-1]+1])+0.5)
  296. for i in range(len(zh_idx)):
  297. total_syllable+=1
  298. #final chchchchchc[en][en][en]
  299. #[en] is a vocabulary dict with occurence of image
  300. zh_eng_idx_list = []
  301. i = 0
  302. while i < len(in_str):
  303. if in_str[i]==' ':
  304. i+=1
  305. if i in zh_idx:
  306. zh_eng_idx_list.append(i)
  307. i+=1
  308. if i in eng_idx:
  309. for ls in eng_range_list:
  310. if i in ls:
  311. zh_eng_idx_list.append(ls)
  312. i = ls[-1]+1
  313. break
  314. zh_eng_dict_list = [{'content':'','time_ratio':0}]
  315. idx = 0
  316. current_len = 0
  317. sen_idx = 0
  318. while idx < len(zh_eng_idx_list):
  319. str_from_idx = ''
  320. sylla_cnt = 1
  321. if type(zh_eng_idx_list[idx])==type([]):
  322. str_from_idx = in_str[zh_eng_idx_list[idx][0]:zh_eng_idx_list[idx][-1]+1]+' '
  323. sylla_cnt = syllable_count(str_from_idx)
  324. else:
  325. str_from_idx = in_str[zh_eng_idx_list[idx]]
  326. if len(zh_eng_dict_list[sen_idx]['content'])+sylla_cnt>=maxLen:
  327. zh_eng_dict_list[sen_idx]['time_ratio'] = current_len/total_syllable
  328. zh_eng_dict_list.append({'content':'','time_ratio':0})
  329. sen_idx+=1
  330. current_len = 0
  331. else:
  332. current_len += sylla_cnt
  333. zh_eng_dict_list[sen_idx]['content'] += str_from_idx
  334. idx+=1
  335. total_ratio = 0
  336. for obj in zh_eng_dict_list:
  337. total_ratio+=obj['time_ratio']
  338. zh_eng_dict_list[-1]['time_ratio'] = 1-total_ratio
  339. return zh_eng_dict_list
  340. def parse_script(file_path,gt_list):
  341. with open(file_path, 'r',encoding="utf-8") as f:
  342. raw_lines = [line.strip() for line in f]
  343. lines = adjustSub_by_text_similarity(gt_list,raw_lines)
  344. text_parser = parser()
  345. #make dict
  346. dict_list = []
  347. for idx in range(len(lines)):
  348. script={}
  349. print(lines[idx])
  350. rep_ls = text_parser.replace_list(lines[idx])
  351. line_content = lines[idx]
  352. for reptxt in rep_ls:
  353. line_content = line_content.replace(reptxt,'')
  354. if len(rep_ls)!=0:
  355. script['image_idx'] = int(rep_ls[0].replace('{','').replace('}',''))
  356. script['content'] = line_content
  357. time_raw = raw_lines[idx * 4 +1 ].split(' --> ')
  358. start = time_raw[0].split(':')
  359. stop = time_raw[1].split(':')
  360. script['start'] = float(start[0])*3600 + float(start[1])*60 + float(start[2].replace(',','.'))
  361. script['stop'] = float(stop[0])*3600 + float(stop[1])*60 + float(stop[2].replace(',','.'))
  362. dict_list.append(script)
  363. #merge duplicated sentences
  364. script_not_dup_list = []
  365. for idx in range(len(dict_list)):
  366. dup_list = []
  367. for idx_inner in range(len(dict_list)):
  368. if dict_list[idx_inner]['content']==dict_list[idx]['content']:
  369. dup_list.append(idx_inner)
  370. for dup_idx in dup_list:
  371. if dup_idx == min(dup_list):
  372. dict_list[dup_idx]['type'] = 'lead_sentence'
  373. else:
  374. dict_list[dup_idx]['type'] = 'duplicated'
  375. dict_list[dup_list[0]]['stop'] = dict_list[dup_list[-1]]['stop']
  376. if dict_list[idx]['type'] == 'lead_sentence':
  377. script_not_dup_list.append(dict_list[idx])
  378. #avoid subtitle overlapping ? Timeline overlapping not found currently
  379. #cut by max length----> eng seperated problem {eng_idx}
  380. #ENG counts, zh counts, space counts
  381. new_idx = 0
  382. splitted_dict = []
  383. for dic in script_not_dup_list:
  384. dic_idx = 0
  385. accumulated_duration = 0
  386. duration = dic['stop']-dic['start']
  387. for sub_dic in split_sentence(dic['content'],13):
  388. new_dic = {}
  389. new_dic['index'] = new_idx
  390. if 'image_idx' in dic:
  391. new_dic['image_obj'] = {'start':dic['start'],'idx':dic['image_idx']}
  392. new_idx+=1
  393. ind_duration = duration * sub_dic['time_ratio']
  394. new_dic['start'] = dic['start'] + accumulated_duration
  395. accumulated_duration += ind_duration
  396. new_dic['content'] = sub_dic['content']
  397. new_dic['duration'] = ind_duration*0.7
  398. splitted_dict.append(new_dic)
  399. return splitted_dict
  400. def adjustSub_by_text_similarity(gts_in,gens_raw):
  401. #call by value only
  402. gts = gts_in[:]
  403. text_parser = parser()
  404. for i in range(len(gts)):
  405. rep_ls = text_parser.replace_list(gts[i])
  406. for reptxt in rep_ls:
  407. gts[i] = gts[i].replace(reptxt,'')
  408. print(gts)
  409. gens = []
  410. for idx in range(int((len(gens_raw)+1)/4)):
  411. gens.append(gens_raw[idx*4+2])
  412. combine2 = [''.join([i,j]) for i,j in zip(gts, gts[1:])]
  413. combine3 = [''.join([i,j,k]) for i,j,k in zip(gts, gts[1:], gts[2:])]
  414. alls = gts + combine2 + combine3
  415. adjusted = [None]*len(gens)
  416. duplicated_list = []
  417. for idx in range(len(gens)):
  418. match_text = difflib.get_close_matches(gens[idx], alls, cutoff=0.1)
  419. if match_text[0] in duplicated_list:
  420. for mt in match_text:
  421. if mt == adjusted[idx-1] or mt not in duplicated_list:
  422. adjusted[idx] = mt
  423. break
  424. else:
  425. adjusted[idx] = match_text[0]
  426. duplicated_list.append(match_text[0])
  427. combine2_tag = [''.join([i,j]) for i,j in zip(gts_in, gts_in[1:])]
  428. combine3_tag = [''.join([i,j,k]) for i,j,k in zip(gts_in, gts_in[1:], gts_in[2:])]
  429. alls_tag = gts_in + combine2_tag + combine3_tag
  430. for idx in range(len(adjusted)):
  431. match_text = difflib.get_close_matches(adjusted[idx], alls_tag, cutoff=0.1)
  432. adjusted[idx] = match_text
  433. return adjusted
  434. def trim_punctuation(s):
  435. pat_block = u'[^\u4e00-\u9fff0-9a-zA-Z]+';
  436. pattern = u'([0-9]+{0}[0-9]+)|{0}'.format(pat_block)
  437. res = re.sub(pattern, lambda x: x.group(1) if x.group(1) else u" " ,s)
  438. return res
  439. def splitter(s):
  440. for sent in re.findall(u'[^!?,。\!\?]+[!? 。\!\?]?', s, flags=re.U):
  441. yield sent
  442. def split_by_pun(s):
  443. res = list(splitter(s))
  444. return res
  445. def generate_subtitle_image_from_dict(name_hash, sub_dict):
  446. for script in sub_dict:
  447. sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
  448. sub = script['content']
  449. txt2image(sub,sv_path)
  450. def generate_subtitle_image(name_hash,text_content):
  451. img_list = [None]*len(text_content)
  452. for idx in range(len(text_content)):
  453. img_list[idx]=[]
  454. senList = split_by_pun(text_content[idx])
  455. for inner_idx in range(len(senList)):
  456. sv_path = dir_subtitle + name_hash +'/'+str(idx)+ str(inner_idx) +'.png'
  457. sub = senList[inner_idx]
  458. txt2image(sub,sv_path)
  459. img_list[idx]+=[{"count":len(sub),"path":sv_path}]
  460. return img_list
  461. def generate_subtitle_image_ENG(name_hash,text_content):
  462. img_list = [None]*len(text_content)
  463. for idx in range(len(text_content)):
  464. sv_path = dir_subtitle + name_hash +'/'+str(idx)+'.png'
  465. sub = text_content[idx]
  466. txt2image(sub, sv_path,lang='eng')
  467. img_list[idx] = sv_path
  468. return img_list
  469. def video_writer_init(path):
  470. w = openshot.FFmpegWriter(path)
  471. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  472. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  473. openshot.Fraction(1, 1), False, False, 3000000)
  474. return w
  475. def video_gen(name_hash,name,text_content, image_urls,multiLang,avatar):
  476. file_prepare_long(name, name_hash, text_content,image_urls,multiLang)
  477. for fname in range(len(text_content)):
  478. call_anchor(name_hash+"/"+str(fname),avatar)
  479. print('called............................................')
  480. ck=cKey(0,254,0,270)
  481. ck_anchor=cKey(0,255,1,320)
  482. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  483. t.Open()
  484. main_timer = 0
  485. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  486. LOGO_OP.Open() # Open the reader
  487. head_duration = LOGO_OP.info.duration
  488. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=head_duration
  489. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  490. t.AddClip(LOGO_OP_clip)
  491. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  492. bg_head.Open()
  493. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  494. t.AddClip(bg_head_clip)
  495. main_timer += head_duration
  496. bg_head.Close()
  497. LOGO_OP.Close()
  498. anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
  499. anchor.Open()
  500. #anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
  501. # location_x=0.35,location_y=0.25,position=main_timer, end=anchor.info.duration,ck=ck_anchor,audio=False)
  502. #t.AddClip(anchor_clip)
  503. speech = openshot.FFmpegReader(dir_sound+name_hash+"/0.mp3")
  504. speech.Open()
  505. speech_clip = openshot.Clip(speech)
  506. speech_clip.Position(main_timer)
  507. speech_clip.End(anchor.info.duration)
  508. t.AddClip(speech_clip)
  509. main_timer += anchor.info.duration
  510. anchor.Close()
  511. speech.Close()
  512. LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
  513. LOGO_ED.Open()
  514. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration
  515. ,location_x=0.005,location_y=-0.031, scale_x=0.8,scale_y=0.6825)
  516. t.AddClip(LOGO_ED_clip)
  517. main_timer += LOGO_ED.info.duration
  518. LOGO_ED.Close()
  519. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  520. bg.Open()
  521. bg_times = math.floor(main_timer/bg.info.duration)
  522. left_time = (main_timer) % bg.info.duration
  523. bg_clip_list = [None] * bg_times
  524. bg_list = [None] * bg_times
  525. bg.Close()
  526. bg_timer = head_duration
  527. for idx in range(bg_times):
  528. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  529. bg_list[idx].Open()
  530. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer,end=bg_list[idx].info.duration,ck=ck)
  531. t.AddClip(bg_clip_list[idx])
  532. bg_timer += bg_list[idx].info.duration
  533. bg_list[idx].Close()
  534. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  535. bg_left.Open()
  536. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  537. t.AddClip(bg_left_clip)
  538. bg_left.Close()
  539. title = openshot.QtImageReader(dir_title+name_hash+".png")
  540. title.Open() # Open the reader
  541. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  542. t.AddClip(title_clip)
  543. w = video_writer_init(tmp_video_dir+name_hash+"raw.mp4")
  544. w.Open()
  545. frames = int(t.info.fps)*int(main_timer)
  546. for n in range(frames):
  547. f=t.GetFrame(n)
  548. w.WriteFrame(f)
  549. t.Close()
  550. w.Close()
  551. print(name+"RAW DONE : www.choozmo.com:8168/"+tmp_video_dir+name_hash+"raw.mp4")
  552. #start adding sub
  553. #add sub
  554. Ctr_Autosub.init()
  555. Ctr_Autosub.generate_subtitles(tmp_video_dir+name_hash+"raw.mp4",'zh',listener_progress,output=tmp_video_dir+name_hash+"script.txt",concurrency=DEFAULT_CONCURRENCY,subtitle_file_format=DEFAULT_SUBTITLE_FORMAT)
  556. sub_dict = parse_script(tmp_video_dir+name_hash+"script.txt",split_by_pun(text_content[0]))
  557. for subd in sub_dict:
  558. print(subd)
  559. generate_subtitle_image_from_dict(name_hash, sub_dict)
  560. #sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
  561. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  562. t.Open()
  563. raw = openshot.FFmpegReader(tmp_video_dir+name_hash+"raw.mp4")
  564. raw.Open()
  565. raw_clip = video_photo_clip(vid=raw,layer=2,position=0, end=raw.info.duration)
  566. t.AddClip(raw_clip)
  567. sub_img_list = [None] * len(sub_dict)
  568. sub_clip_list = [None] * len(sub_dict)
  569. for sub_obj in sub_dict:
  570. idx = int(sub_obj['index'])
  571. sub_img_list[idx] = openshot.QtImageReader(dir_subtitle + name_hash + '/' + str(idx)+'.png')
  572. sub_img_list[idx].Open()
  573. sub_clip_list[idx] = video_photo_clip(vid=sub_img_list[idx], layer=6,location_x=0.069, location_y=0.89,position=sub_obj['start'],end=math.ceil(sub_obj['duration']))
  574. t.AddClip(sub_clip_list[idx])
  575. sub_img_list[idx].Close()
  576. anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
  577. anchor.Open()
  578. anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
  579. location_x=0.35,location_y=0.25,position=head_duration, end=anchor.info.duration,ck=ck_anchor,audio=False)
  580. t.AddClip(anchor_clip)
  581. w = video_writer_init(tmp_video_dir+name_hash+".mp4")
  582. w.Open()
  583. frames = int(t.info.fps)*int(main_timer)
  584. for n in range(frames):
  585. f=t.GetFrame(n)
  586. w.WriteFrame(f)
  587. t.Close()
  588. w.Close()
  589. os.remove(tmp_video_dir+name_hash+"raw.mp4")
  590. os.remove(tmp_video_dir+name_hash+"script.txt")
  591. print(name+"ALL DONE : www.choozmo.com:8168/"+video_sub_folder+name_hash+"raw.mp4")
  592. def anchor_video_v2(name_hash,name,text_content, image_urls,multiLang,avatar):
  593. print(os.getcwd())
  594. print('sub image made')
  595. print(multiLang)
  596. file_prepare(name, name_hash, text_content,image_urls,multiLang)
  597. sub_list=generate_subtitle_image(name_hash,text_content)
  598. for fname in range(len(text_content)):
  599. call_anchor(name_hash+"/"+str(fname),avatar)
  600. print('step finish')
  601. print('called............................................')
  602. ck=cKey(0,254,0,270)
  603. ck_anchor=cKey(0,255,1,320)
  604. duration = 0
  605. #average layer level is 3
  606. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  607. t.Open()
  608. main_timer = 0
  609. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  610. LOGO_OP.Open() # Open the reader
  611. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=LOGO_OP.info.duration
  612. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  613. t.AddClip(LOGO_OP_clip)
  614. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  615. bg_head.Open()
  616. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  617. t.AddClip(bg_head_clip)
  618. main_timer += LOGO_OP.info.duration
  619. head_duration = LOGO_OP.info.duration
  620. bg_head.Close()
  621. LOGO_OP.Close()
  622. clip_duration=0
  623. photo_clip_list = [None]*len(text_content)
  624. img_list = [None]*len(text_content)
  625. anchor_clip_list = [None] * len(text_content)
  626. anchor_list = [None] * len(text_content)
  627. audio_clip_list = [None] * len(text_content)
  628. audio_list = [None] * len(text_content)
  629. sub_clip_list = [None] * len(text_content)
  630. sub_img_list = [None] * len(text_content)
  631. idx = 0
  632. for p in listdir(dir_photo+name_hash):
  633. anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
  634. clip_duration = anchor_list[idx].info.duration
  635. anchor_list[idx].Open()
  636. anchor_clip_list[idx] = video_photo_clip(vid=anchor_list[idx],layer=4,scale_x=0.65,scale_y=0.65,
  637. location_x=0.35,location_y=0.25,position=main_timer, end=clip_duration,ck=ck_anchor,audio=False)
  638. t.AddClip(anchor_clip_list[idx])
  639. img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
  640. img_list[idx].Open()
  641. photo_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
  642. ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=main_timer,end=clip_duration,audio=False)
  643. t.AddClip(photo_clip_list[idx])
  644. img_list[idx].Close()
  645. audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
  646. audio_list[idx].Open()
  647. audio_clip_list[idx] = openshot.Clip(audio_list[idx])
  648. audio_clip_list[idx].Position(main_timer)
  649. audio_clip_list[idx].End(clip_duration)
  650. t.AddClip(audio_clip_list[idx])
  651. img_list[idx].Close()
  652. anchor_list[idx].Close()
  653. audio_list[idx].Close()
  654. sub_img_list[idx] = [None] * len(sub_list[idx])
  655. sub_clip_list[idx] = [None] * len(sub_list[idx])
  656. sub_timer = 0
  657. for sub_idx in range(len(sub_list[idx])):
  658. sub_img_list[idx][sub_idx] = openshot.QtImageReader(sub_list[idx][sub_idx]['path'])
  659. sub_img_list[idx][sub_idx].Open()
  660. sub_duration = 0.205*sub_list[idx][sub_idx]['count']
  661. sub_clip_list[idx][sub_idx] = video_photo_clip(vid=sub_img_list[idx][sub_idx], layer=6,location_x=0.069, location_y=0.89,position=main_timer+sub_timer,end=sub_duration)
  662. t.AddClip(sub_clip_list[idx][sub_idx])
  663. sub_img_list[idx][sub_idx].Close()
  664. sub_timer += sub_duration
  665. print(sub_list[idx][sub_idx]['path'])
  666. main_timer += clip_duration
  667. idx+=1
  668. LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
  669. LOGO_ED.Open()
  670. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration+2
  671. ,location_x=0.005,location_y=-0.031
  672. ,scale_x=0.8,scale_y=0.6825)
  673. t.AddClip(LOGO_ED_clip)
  674. ED_duration = LOGO_ED.info.duration
  675. LOGO_ED.Close()
  676. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  677. bg.Open()
  678. bg_times = math.floor(main_timer+ED_duration/bg.info.duration)
  679. left_time = (main_timer+ED_duration) % bg.info.duration
  680. bg_clip_list = [None] * bg_times
  681. bg_list = [None] * bg_times
  682. bg.Close()
  683. bg_timer = head_duration
  684. for idx in range(bg_times):
  685. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  686. bg_list[idx].Open()
  687. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer
  688. ,end=bg_list[idx].info.duration,ck=ck)
  689. t.AddClip(bg_clip_list[idx])
  690. bg_timer += bg_list[idx].info.duration
  691. bg_list[idx].Close()
  692. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  693. bg_left.Open()
  694. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  695. t.AddClip(bg_left_clip)
  696. bg_left.Close()
  697. title = openshot.QtImageReader(dir_title+name_hash+".png")
  698. title.Open() # Open the reader
  699. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  700. t.AddClip(title_clip)
  701. ####start building
  702. w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
  703. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  704. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  705. openshot.Fraction(1, 1), False, False, 3000000)
  706. w.Open()
  707. #may change duration into t.info.duration
  708. frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
  709. for n in range(frames):
  710. f=t.GetFrame(n)
  711. w.WriteFrame(f)
  712. #notify_group(name+"的影片已經產生完成囉! www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  713. t.Close()
  714. w.Close()
  715. print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  def anchor_video_eng(name_hash, name, text_content, image_urls, sub_titles, avatar):
      """Build the English anchor video for one job and encode it to MP4.

      Steps, in order: prepare the job's assets (``file_prepare`` with
      ``'eng'``), render subtitle images, request one anchor clip per entry
      of ``text_content``, assemble everything on a 1280x720 / 30 fps
      OpenShot timeline, and write ``tmp_video_dir + name_hash + ".mp4"``.

      Args:
          name_hash: Job identifier; used to build every per-job path
              (photos, anchor clips, sound, title image, output file).
          name: Passed through to ``file_prepare``.
          text_content: Sequence with one entry per segment; its length sizes
              the per-segment lists and the number of ``call_anchor`` requests.
          image_urls: Passed through to ``file_prepare``.
          sub_titles: Passed to ``generate_subtitle_image_ENG``; the result is
              indexed per segment and handed to ``QtImageReader`` (presumably
              image paths -- confirm against that helper).
          avatar: Passed through to ``call_anchor``.

      Returns:
          None. The encoded file is written to disk and its URL is printed.
      """
      file_prepare(name, name_hash, text_content, image_urls, 'eng')
      sub_list = generate_subtitle_image_ENG(name_hash, sub_titles)

      segment_count = len(text_content)
      # One call_anchor request per segment, keyed "<name_hash>/<index>".
      for fname in range(segment_count):
          call_anchor(name_hash+"/"+str(fname), avatar)
          print('step finish')
      print('called............................................')

      ck = cKey(0, 254, 0, 270)
      ck_anchor = cKey(0, 255, 1, 320)

      # average layer level is 3
      t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
      t.Open()
      main_timer = 0

      # Opening logo.
      LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
      LOGO_OP.Open()
      LOGO_OP_clip = video_photo_clip(vid=LOGO_OP, layer=4, position=0, end=LOGO_OP.info.duration,
                                      location_y=-0.03, scale_x=0.8, scale_y=0.704)
      t.AddClip(LOGO_OP_clip)

      # Background video for the opening (the head uses a different file
      # from the looping background added further down).
      bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
      bg_head.Open()
      bg_head_clip = video_photo_clip(vid=bg_head, layer=2, position=0, end=LOGO_OP.info.duration, ck=ck)
      t.AddClip(bg_head_clip)
      main_timer += LOGO_OP.info.duration
      head_duration = LOGO_OP.info.duration
      bg_head.Close()
      LOGO_OP.Close()

      # Per-segment holders. Every reader and clip stays referenced until the
      # render finishes (presumably the timeline does not keep the Python
      # wrappers alive on its own -- TODO confirm).
      photo_clip_list = [None] * segment_count
      img_list = [None] * segment_count
      anchor_clip_list = [None] * segment_count
      anchor_list = [None] * segment_count
      audio_clip_list = [None] * segment_count
      audio_list = [None] * segment_count
      sub_clip_list = [None] * segment_count
      sub_img_list = [None] * segment_count

      # NOTE(review): segments are driven by the photo directory listing, so
      # the idx <-> photo pairing follows listdir() order -- confirm that this
      # is the intended pairing.
      for idx, p in enumerate(listdir(dir_photo+name_hash)):
          # Anchor clip; its duration drives every other clip of the segment.
          anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
          clip_duration = anchor_list[idx].info.duration
          anchor_list[idx].Open()
          anchor_clip_list[idx] = video_photo_clip(
              vid=anchor_list[idx], layer=4, scale_x=0.65, scale_y=0.65,
              location_x=0.35, location_y=0.25, position=main_timer,
              end=clip_duration, ck=ck_anchor, audio=False)
          t.AddClip(anchor_clip_list[idx])

          # Segment image.
          img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
          img_list[idx].Open()
          photo_clip_list[idx] = video_photo_clip(
              vid=img_list[idx], layer=3, scale_x=0.81, scale_y=0.68,
              location_y=-0.03, position=main_timer, end=clip_duration, audio=False)
          t.AddClip(photo_clip_list[idx])

          # Segment audio (speech).
          audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
          audio_list[idx].Open()
          audio_clip_list[idx] = openshot.Clip(audio_list[idx])
          audio_clip_list[idx].Position(main_timer)
          audio_clip_list[idx].End(clip_duration)
          t.AddClip(audio_clip_list[idx])

          # Segment subtitle image.
          sub_img_list[idx] = openshot.QtImageReader(sub_list[idx])
          sub_img_list[idx].Open()
          sub_clip_list[idx] = video_photo_clip(
              vid=sub_img_list[idx], layer=6, location_x=0.069, location_y=0.89,
              position=main_timer, end=clip_duration)
          t.AddClip(sub_clip_list[idx])

          # Each reader is closed exactly once per segment.
          img_list[idx].Close()
          anchor_list[idx].Close()
          audio_list[idx].Close()
          sub_img_list[idx].Close()

          main_timer += clip_duration

      # Ending logo.
      LOGO_ED = openshot.FFmpegReader(dir_video+"ED_ENG.mp4")
      LOGO_ED.Open()
      LOGO_ED_clip = video_photo_clip(vid=LOGO_ED, layer=4, position=main_timer, end=LOGO_ED.info.duration+2,
                                      location_x=0.005, location_y=-0.031,
                                      scale_x=0.8, scale_y=0.6825)
      t.AddClip(LOGO_ED_clip)
      ED_duration = LOGO_ED.info.duration
      LOGO_ED.Close()

      # Looping background: bg_times whole plays plus one partial play.
      bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
      bg.Open()
      # The whole span must be divided by the background length. Without the
      # parentheses only ED_duration was divided, which scheduled roughly one
      # full background clip per second of video.
      bg_times = math.floor((main_timer+ED_duration) / bg.info.duration)
      left_time = (main_timer+ED_duration) % bg.info.duration
      bg_clip_list = [None] * bg_times
      bg_list = [None] * bg_times
      bg.Close()
      bg_timer = head_duration
      for idx in range(bg_times):
          bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
          bg_list[idx].Open()
          bg_clip_list[idx] = video_photo_clip(bg_list[idx], layer=2, position=bg_timer,
                                               end=bg_list[idx].info.duration, ck=ck)
          t.AddClip(bg_clip_list[idx])
          bg_timer += bg_list[idx].info.duration
          bg_list[idx].Close()
      bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
      bg_left.Open()
      bg_left_clip = video_photo_clip(bg_left, layer=2, position=bg_timer, end=left_time, ck=ck)
      t.AddClip(bg_left_clip)
      bg_left.Close()

      # Title image, shown from the start until head_duration + main_timer.
      title = openshot.QtImageReader(dir_title+name_hash+".png")
      title.Open()
      title_clip = video_photo_clip(vid=title, layer=4, location_x=-0.047, location_y=0.801,
                                    position=0, end=head_duration+main_timer)
      t.AddClip(title_clip)

      #### start building
      w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
      w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
      w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
                        openshot.Fraction(1, 1), False, False, 3000000)
      w.Open()
      # may change duration into t.info.duration
      frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
      try:
          for n in range(frames):
              w.WriteFrame(t.GetFrame(n))
      finally:
          # Release the timeline and the writer even if rendering fails.
          t.Close()
          w.Close()
      # Group notification is currently disabled:
      # notify_group(name + "(ENG) video has been generated! www.choozmo.com:8168/" + video_sub_folder + name_hash + ".mp4")
      print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  837. #line notifs
  838. import pyttsx3
  def make_speech(text):
      """Synthesize ``text`` with pyttsx3 and save it to '/app/speech.mp3'.

      The engine's 'voice' property is set to 'Mandarin' before the text is
      queued. Nothing is returned; the only result is the file on disk.
      """
      output_path = '/app/speech.mp3'
      tts = pyttsx3.init()
      tts.setProperty('voice', 'Mandarin')
      # save_to_file only queues the job; runAndWait processes the queue.
      tts.save_to_file(text, output_path)
      tts.runAndWait()
  class video_service(rpyc.Service):
      """rpyc service that forwards remote calls to the module's generators.

      Each ``exposed_*`` method hands its arguments, unchanged and in the
      same order, to the matching module-level function. Nothing is returned
      to the caller.
      """

      def exposed_call_video(self, name_hash, name, text_content, image_urls, multiLang, avatar):
          """Print the multiLang value, then run ``anchor_video_v2``."""
          ml_banner = 'ML:' + str(multiLang)
          print(ml_banner)
          job_args = (name_hash, name, text_content, image_urls, multiLang, avatar)
          anchor_video_v2(*job_args)

      def exposed_call_video_eng(self, name_hash, name, text_content, image_urls, sub_titles, avatar):
          """Run ``anchor_video_eng`` with the given job arguments."""
          job_args = (name_hash, name, text_content, image_urls, sub_titles, avatar)
          anchor_video_eng(*job_args)

      def exposed_call_video_gen(self, name_hash, name, text_content, image_urls, multiLang, avatar):
          """Print the multiLang value, then run ``video_gen`` (long video version)."""
          ml_banner = 'ML:' + str(multiLang)
          print(ml_banner)
          job_args = (name_hash, name, text_content, image_urls, multiLang, avatar)
          video_gen(*job_args)

      def exposed_make_speech(self, text):
          """Run ``make_speech`` on ``text``."""
          make_speech(text)
  856. from rpyc.utils.server import ThreadedServer
  # Serve video_service over rpyc on TCP port 8858. The banner is printed
  # before start() because start() runs the server's accept loop.
  t = ThreadedServer(service=video_service, port=8858)
  print('service started')
  t.start()