openshot_video_generator.py 37 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994
  1. from os import listdir
  2. from os.path import isfile, isdir, join
  3. import openshot
  4. import threading
  5. import zhtts
  6. import os
  7. import urllib
  8. from typing import List
  9. import requests
  10. from pydantic import BaseModel
  11. from bs4 import BeautifulSoup
  12. from PIL import Image,ImageDraw,ImageFont
  13. import pyttsx3
  14. import rpyc
  15. import random
  16. import re
  17. import time
  18. import math
  19. import dataset
  20. from datetime import datetime
  21. from gtts import gTTS
  22. import ffmpy
  23. from difflib import SequenceMatcher
  24. import difflib
  25. from autosub import DEFAULT_CONCURRENCY
  26. from autosub import DEFAULT_SUBTITLE_FORMAT
  27. from pytranscriber.control.ctr_main import Ctr_Main
  28. from pytranscriber.control.ctr_autosub import Ctr_Autosub
  29. import multiprocessing
  30. from itertools import groupby
  31. from operator import itemgetter
  32. from util.parser import parser
# Working directories (relative paths). Most hold one sub-folder per name_hash.
dir_sound = 'mp3_track/'  # synthesized speech tracks (<idx>.mp3)
dir_photo = 'photo/'  # downloaded images (.jpg) and video clips (.mp4)
dir_text = 'text_file/'  # text paragraphs saved by file_prepare
dir_video = 'video_material/'  # logo / background footage read by the generators
dir_title = 'title/'  # rendered title images (<name_hash>.png)
dir_subtitle = 'subtitle/'  # rendered subtitle images
dir_anchor = 'anchor_raw/'  # anchor videos downloaded by call_anchor
tmp_video_dir = 'tmp_video/'  # rendered videos and intermediate files
video_sub_folder = 'ai_anchor_video/'  # only used when printing result URLs
# Directories that make_dir() creates when they are missing.
dir_list = [dir_sound,dir_photo,dir_text,dir_video,dir_title,dir_subtitle,dir_anchor,tmp_video_dir]
  43. def notify_group(msg):
  44. glist=['7vilzohcyQMPLfAMRloUawiTV4vtusZhxv8Czo7AJX8','WekCRfnAirSiSxALiD6gcm0B56EejsoK89zFbIaiZQD','1dbtJHbWVbrooXmQqc4r8OyRWDryjD4TMJ6DiDsdgsX','HOB1kVNgIb81tTB4Ort1BfhVp9GFo6NlToMQg88vEhh']
  45. for gid in glist:
  46. headers = {
  47. "Authorization": "Bearer " + gid,
  48. "Content-Type": "application/x-www-form-urlencoded"
  49. }
  50. params = {"message": msg}
  51. r = requests.post("https://notify-api.line.me/api/notify",headers=headers, params=params)
  52. def cKey(r,g,b,fuzz):
  53. col=openshot.Color()
  54. col.red=openshot.Keyframe(r)
  55. col.green=openshot.Keyframe(g)
  56. col.blue=openshot.Keyframe(b)
  57. return openshot.ChromaKey(col, openshot.Keyframe(fuzz))
  58. def video_photo_clip(vid=None,layer=None, position=None, end=None
  59. ,scale_x=1,scale_y=1,location_x=0,location_y=0,ck=None,audio=True):
  60. clip = openshot.Clip(vid)
  61. clip.Layer(layer)
  62. clip.Position(position)
  63. clip.End(end)
  64. clip.scale_x=openshot.Keyframe(scale_x)
  65. clip.scale_y=openshot.Keyframe(scale_y)
  66. clip.location_x=openshot.Keyframe(location_x)
  67. clip.location_y=openshot.Keyframe(location_y)
  68. if ck!=None:
  69. clip.AddEffect(ck)
  70. if audio==True:
  71. clip.has_audio=openshot.Keyframe(1)
  72. else:
  73. clip.has_audio=openshot.Keyframe(0)
  74. return clip
  75. def listener_progress(string, percent):
  76. True
  77. def myunichchar(unicode_char):
  78. mb_string = unicode_char.encode('big5')
  79. try:
  80. unicode_char = unichr(ord(mb_string[0]) << 8 | ord(mb_string[1]))
  81. except NameError:
  82. unicode_char = chr(mb_string[0] << 8 | mb_string[1])
  83. return unicode_char
  84. def get_url_type(url):
  85. req = urllib.request.Request(url, method='HEAD', headers={'User-Agent': 'Mozilla/5.0'})
  86. r = urllib.request.urlopen(req)
  87. contentType = r.getheader('Content-Type')
  88. return contentType
  89. def make_dir(name_hash):
  90. for direct in dir_list:
  91. if not os.path.isdir(direct):
  92. os.mkdir(direct)
  93. try:
  94. os.mkdir(dir_photo+name_hash)
  95. except FileExistsError:
  96. print("~~~~~~Warning~~~~~~~~~Directory " , dir_photo+name_hash , " already exists")
  97. try:
  98. os.mkdir(dir_text+name_hash)
  99. except FileExistsError:
  100. print("~~~~~~Warning~~~~~~~~~Directory " , dir_text+name_hash , " already exists")
  101. try:
  102. os.mkdir(dir_sound+name_hash)
  103. except FileExistsError:
  104. print("~~~~~~Warning~~~~~~~~~Directory " , dir_sound+name_hash , " already exists")
  105. try:
  106. os.mkdir(dir_anchor+name_hash)
  107. except FileExistsError:
  108. print("~~~~~~Warning~~~~~~~~~Directory " , dir_anchor+name_hash , " already exists")
  109. try:
  110. os.mkdir(dir_subtitle+name_hash)
  111. except FileExistsError:
  112. print("~~~~~~Warning~~~~~~~~~Directory " , dir_subtitle+name_hash , " already exists")
  113. def file_prepare(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  114. make_dir(name_hash)
  115. img_num = 1
  116. for imgu in image_urls:
  117. if get_url_type(imgu) =='video/mp4':
  118. r=requests.get(imgu)
  119. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  120. for chunk in r.iter_content(chunk_size=255):
  121. if chunk:
  122. f.write(chunk)
  123. f.close()
  124. else:
  125. im = Image.open(requests.get(imgu, stream=True).raw)
  126. im= im.convert("RGB")
  127. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  128. img_num+=1
  129. #save text
  130. txt_idx=0
  131. for txt in text_content:
  132. text_file = open(dir_text+name_hash+"/"+str(txt_idx)+".txt", "w")
  133. text_file.write(txt)
  134. text_file.close()
  135. txt_idx+=1
  136. print("text file made")
  137. #make mp3
  138. txt_idx = 0
  139. for txt in text_content:
  140. if lang!='zh' or multiLang==1:
  141. if lang!='zh':
  142. tts = gTTS(txt)
  143. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  144. else:
  145. tts = gTTS(txt,lang='zh-tw')
  146. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  147. #speed up
  148. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  149. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  150. ff.run()
  151. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  152. else:
  153. print('use zhtts')
  154. tts = zhtts.TTS()
  155. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  156. txt_idx+=1
  157. print("mp3 file made")
  158. #make title as image
  159. txt2image_title(name, dir_title+name_hash+".png",lang)
  160. def file_prepare_long(name, name_hash,text_content,image_urls,multiLang,lang='zh'):
  161. make_dir(name_hash)
  162. img_num = 1
  163. for imgu in image_urls:
  164. if get_url_type(imgu) =='video/mp4':
  165. r=requests.get(imgu)
  166. f=open(dir_photo+name_hash+"/"+str(img_num)+".mp4",'wb')
  167. for chunk in r.iter_content(chunk_size=255):
  168. if chunk:
  169. f.write(chunk)
  170. f.close()
  171. else:
  172. im = Image.open(requests.get(imgu, stream=True).raw)
  173. im= im.convert("RGB")
  174. im.save(dir_photo+name_hash+"/"+str(img_num)+".jpg")
  175. img_num+=1
  176. #make mp3
  177. text_parser = parser()
  178. txt_idx = 0
  179. for txt in text_content:
  180. rep_list = text_parser.replace_list(txt)
  181. for reptxt in rep_list:
  182. txt = txt.replace(reptxt,'')
  183. if lang!='zh' or multiLang==1:
  184. if lang!='zh':
  185. tts = gTTS(txt)
  186. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  187. else:
  188. tts = gTTS(txt,lang='zh-tw')
  189. tts.save(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  190. #speed up
  191. ff = ffmpy.FFmpeg(inputs={dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3": None}
  192. , outputs={dir_sound+name_hash+"/"+str(txt_idx)+".mp3": ["-filter:a", "atempo=1.2"]})
  193. ff.run()
  194. os.remove(dir_sound+name_hash+"/"+str(txt_idx)+"raw.mp3")
  195. else:
  196. print('use zhtts')
  197. tts = zhtts.TTS()
  198. tts.text2wav(txt,dir_sound+name_hash+"/"+str(txt_idx)+".mp3")
  199. txt_idx+=1
  200. print("mp3 file made")
  201. #make title as image
  202. txt2image_title(name, dir_title+name_hash+".png",lang)
  203. def txt2image(content, save_target,lang='zh'):
  204. unicode_text = trim_punctuation(content)
  205. font = ''
  206. if lang=='zh':
  207. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=38)
  208. else :
  209. font = ImageFont.truetype(font="font/arial.ttf", size=38)
  210. text_width, text_height = font.getsize(unicode_text)
  211. canvas = Image.new('RGBA', (700, 500), (255, 0, 0, 0) )
  212. draw = ImageDraw.Draw(canvas)
  213. text= unicode_text
  214. draw.text((5,5), text, (255, 255, 0), font)
  215. canvas.save(save_target, "PNG")
  216. def txt2image_title(content, save_target, lang='zh'):
  217. unicode_text = trim_punctuation(content)
  218. font = ''
  219. if lang=='zh':
  220. font = ImageFont.truetype(font="font/DFT_B7.ttc", size=22)
  221. else :
  222. font = ImageFont.truetype(font="font/arial.ttf", size=22)
  223. text_width, text_height = font.getsize(unicode_text)
  224. canvas = Image.new('RGBA', (510, 500), (255, 0, 0, 0) )
  225. draw = ImageDraw.Draw(canvas)
  226. text= unicode_text
  227. draw.text((5,5), text, (17, 41, 167), font)
  228. canvas.save(save_target, "PNG")
def call_anchor(fileName,avatar):
    """Produce the anchor video for one speech track via the remote rpyc host.

    Steps, all over a classic rpyc connection to 192.168.1.105:18812:
      1. copy ``dir_sound + fileName + ".mp3"`` to ``/tmp/output.mp3`` remotely;
      2. run ``./p<avatar>.sh <val> &`` in ``/home/jared/to_video`` where
         ``val`` is a random 7-digit number;
      3. poll every 5 seconds until ``/tmp/results/<val>`` exists;
      4. copy ``/tmp/results/<val>.mp4`` to ``dir_anchor + fileName + ".mp4"``.

    Args:
        fileName: path stem relative to ``dir_sound`` / ``dir_anchor``
            (callers pass ``"<name_hash>/<idx>"``).
        avatar: value interpolated into the remote script name.
    """
    conn = rpyc.classic.connect("192.168.1.105",18812)
    ros = conn.modules.os
    rsys = conn.modules.sys  # not used below
    fr=open(dir_sound+fileName+".mp3",'rb')# voice
    # Warning: the remote path is fixed, so the file may be replaced by another process.
    fw=conn.builtins.open('/tmp/output.mp3','wb')
    # Upload in 1 KiB chunks until the local file is exhausted.
    while True:
        b=fr.read(1024)
        if b:
            fw.write(b)
        else:
            break
    fr.close()
    fw.close()
    # Random id used by the polling and download steps to locate the result.
    val=random.randint(1000000,9999999)
    ros.chdir('/home/jared/to_video')
    ros.system('./p'+str(avatar)+'.sh '+str(val)+' &')
    # Poll for the result path; there is no timeout.
    while True:
        print('waiting...')
        if ros.path.exists('/tmp/results/'+str(val)):
            break
        time.sleep(5)
        print('waiting...')
    # Download the rendered video in 1 KiB chunks.
    fr=conn.builtins.open('/tmp/results/'+str(val)+'.mp4','rb')
    fw=open(dir_anchor+fileName+".mp4",'wb')
    while True:
        b=fr.read(1024)
        if b:
            fw.write(b)
        else:
            break
    fr.close()
    fw.close()
  263. def syllable_count(word):
  264. word = word.lower()
  265. count = 0
  266. vowels = "aeiouy"
  267. if word[0] in vowels:
  268. count += 1
  269. for index in range(1, len(word)):
  270. if word[index] in vowels and word[index - 1] not in vowels:
  271. count += 1
  272. if word.endswith("e"):
  273. count -= 1
  274. if count == 0:
  275. count += 1
  276. return count
def split_sentence(in_str, maxLen):
    """Split *in_str* into pieces and give each a share of the total time.

    Characters strictly between U+4E00 and U+9FFF are handled one by one;
    every other non-space character is grouped into runs of consecutive
    indices that are kept together as one token.

    Args:
        in_str: sentence to split.
        maxLen: a new piece is started once ``len(piece content)`` plus the
            next token's syllable count reaches this value.

    Returns:
        A list of ``{'content': str, 'time_ratio': float}`` dicts. The ratio
        of each finished piece is its syllable total divided by the syllable
        total of the whole input; the last piece receives the remainder so
        the ratios sum to 1.
    """
    re.findall(r'[\u4e00-\u9fff]+', in_str)  # result is discarded
    zh_idx = []
    eng_idx= []
    # Classify every index as CJK (zh_idx) or other (eng_idx).
    for i in range(len(in_str)):
        if in_str[i] > u'\u4e00' and in_str[i] < u'\u9fff':
            zh_idx.append(i)
        else:
            eng_idx.append(i)
    # Spaces are separators, not part of any non-CJK run.
    space_index = [m.start() for m in re.finditer(' ', in_str)]
    for idx in space_index:
        eng_idx.remove(idx)
    # Group consecutive non-CJK indices into runs (index minus position is
    # constant inside a run).
    eng_range_list = []
    for k, g in groupby(enumerate(eng_idx), lambda ix : ix[0] - ix[1]):
        eng_range = list(map(itemgetter(1), g))
        eng_range_list.append(eng_range)
    # Total weight: each run counts its syllables plus 0.5, each CJK char 1.
    total_syllable = 0
    for i in range(len(eng_range_list)):
        total_syllable += (syllable_count(in_str[eng_range_list[i][0]:eng_range_list[i][-1]+1])+0.5)
    for i in range(len(zh_idx)):
        total_syllable+=1
    # Build the token list in reading order: an int for a single CJK
    # character, a list of indices for a non-CJK run.
    zh_eng_idx_list = []
    i = 0
    while i < len(in_str):
        if in_str[i]==' ':
            i+=1
        if i in zh_idx:
            zh_eng_idx_list.append(i)
            i+=1
        if i in eng_idx:
            for ls in eng_range_list:
                if i in ls:
                    zh_eng_idx_list.append(ls)
                    i = ls[-1]+1
                    break
    zh_eng_dict_list = [{'content':'','time_ratio':0}]
    idx = 0
    current_len = 0
    sen_idx = 0
    while idx < len(zh_eng_idx_list):
        str_from_idx = ''
        sylla_cnt = 1
        if type(zh_eng_idx_list[idx])==type([]):
            # Non-CJK run: take the slice plus a trailing space.
            str_from_idx = in_str[zh_eng_idx_list[idx][0]:zh_eng_idx_list[idx][-1]+1]+' '
            sylla_cnt = syllable_count(str_from_idx)
        else:
            str_from_idx = in_str[zh_eng_idx_list[idx]]
        if len(zh_eng_dict_list[sen_idx]['content'])+sylla_cnt>=maxLen:
            # Current piece is full: record its ratio and open a new piece.
            # idx is not advanced, so the same token is retried next pass.
            # NOTE(review): a token whose own count is >= maxLen would never
            # be consumed here — confirm this cannot occur.
            zh_eng_dict_list[sen_idx]['time_ratio'] = current_len/total_syllable
            zh_eng_dict_list.append({'content':'','time_ratio':0})
            sen_idx+=1
            current_len = 0
        else:
            current_len += sylla_cnt
            zh_eng_dict_list[sen_idx]['content'] += str_from_idx
            idx+=1
    # The last piece gets whatever share is left.
    total_ratio = 0
    for obj in zh_eng_dict_list:
        total_ratio+=obj['time_ratio']
    zh_eng_dict_list[-1]['time_ratio'] = 1-total_ratio
    return zh_eng_dict_list
def parse_script(file_path,gt_list):
    """Turn a generated subtitle file into timed, length-limited subtitle entries.

    Args:
        file_path: UTF-8 subtitle file; each entry is read as four lines with
            the ``start --> stop`` timing at offset 1 (assumes an SRT-like
            layout — TODO confirm).
        gt_list: ground-truth sentences used to correct the recognised text
            via ``adjustSub_by_text_similarity``.

    Returns:
        A list of dicts with keys ``index``, ``start``, ``content``,
        ``duration`` and, when the source sentence carried an image tag,
        ``image_obj`` (``{'start': ..., 'idx': ...}``).
    """
    with open(file_path, 'r',encoding="utf-8") as f:
        raw_lines = [line.strip() for line in f]
    lines = adjustSub_by_text_similarity(gt_list,raw_lines)
    text_parser = parser()
    #make dict
    dict_list = []
    for idx in range(len(lines)):
        script={}
        print(lines[idx])
        rep_ls = text_parser.replace_list(lines[idx])
        print(rep_ls)
        line_content = lines[idx]
        # Strip every substring reported by the parser from the content.
        for reptxt in rep_ls:
            line_content = line_content.replace(reptxt,'')
        if len(rep_ls)!=0:
            # First reported substring, braces removed, is the image index.
            script['image_idx'] = int(rep_ls[0].replace('{','').replace('}',''))
        script['content'] = line_content
        # Timing line "H:M:S,mmm --> H:M:S,mmm" converted to seconds.
        time_raw = raw_lines[idx * 4 +1 ].split(' --> ')
        start = time_raw[0].split(':')
        stop = time_raw[1].split(':')
        script['start'] = float(start[0])*3600 + float(start[1])*60 + float(start[2].replace(',','.'))
        script['stop'] = float(stop[0])*3600 + float(stop[1])*60 + float(stop[2].replace(',','.'))
        dict_list.append(script)
    #merge duplicated sentences
    script_not_dup_list = []
    for idx in range(len(dict_list)):
        # Indices of all entries sharing this entry's content.
        dup_list = []
        for idx_inner in range(len(dict_list)):
            if dict_list[idx_inner]['content']==dict_list[idx]['content']:
                dup_list.append(idx_inner)
        for dup_idx in dup_list:
            if dup_idx == min(dup_list):
                dict_list[dup_idx]['type'] = 'lead_sentence'
            else:
                dict_list[dup_idx]['type'] = 'duplicated'
        # The first occurrence is extended to the stop time of the last one.
        dict_list[dup_list[0]]['stop'] = dict_list[dup_list[-1]]['stop']
        if dict_list[idx]['type'] == 'lead_sentence':
            script_not_dup_list.append(dict_list[idx])
    #avoid subtitle overlapping ? Timeline overlapping not found currently
    #cut by max length----> eng separated problem {eng_idx}
    #ENG counts, zh counts, space counts
    new_idx = 0
    splitted_dict = []
    for dic in script_not_dup_list:
        dic_idx = 0  # not used below
        accumulated_duration = 0
        duration = dic['stop']-dic['start']
        # Split the sentence with maxLen 13 and divide its duration by ratio.
        for sub_dic in split_sentence(dic['content'],13):
            new_dic = {}
            new_dic['index'] = new_idx
            if 'image_idx' in dic:
                new_dic['image_obj'] = {'start':dic['start'],'idx':dic['image_idx']}
            new_idx+=1
            ind_duration = duration * sub_dic['time_ratio']
            new_dic['start'] = dic['start'] + accumulated_duration
            accumulated_duration += ind_duration
            new_dic['content'] = sub_dic['content']
            # Only 70% of the allotted slot is stored as the duration.
            new_dic['duration'] = ind_duration*0.7
            splitted_dict.append(new_dic)
    return splitted_dict
def adjustSub_by_text_similarity(gts_in,gens_raw):
    """Replace each recognised subtitle line with its closest ground-truth text.

    Args:
        gts_in: ground-truth sentences (may contain parser tags).
        gens_raw: stripped lines of the generated subtitle file; the text of
            entry ``i`` is read from index ``i*4 + 2``.

    Returns:
        A list with one string per generated entry, each taken from
        ``gts_in`` or from a concatenation of two or three consecutive
        ``gts_in`` sentences.
    """
    # Work on a copy so the caller's list is not modified.
    gts = gts_in[:]
    text_parser = parser()
    # Strip the parser's replace-list substrings from the working copy.
    for i in range(len(gts)):
        rep_ls = text_parser.replace_list(gts[i])
        for reptxt in rep_ls:
            gts[i] = gts[i].replace(reptxt,'')
    print(gts)
    gens = []
    for idx in range(int((len(gens_raw)+1)/4)):
        gens.append(gens_raw[idx*4+2])
    # Candidates: single sentences plus joins of 2 and 3 neighbours.
    combine2 = [''.join([i,j]) for i,j in zip(gts, gts[1:])]
    combine3 = [''.join([i,j,k]) for i,j,k in zip(gts, gts[1:], gts[2:])]
    alls = gts + combine2 + combine3
    adjusted = [None]*len(gens)
    duplicated_list = []
    for idx in range(len(gens)):
        match_text = difflib.get_close_matches(gens[idx], alls, cutoff=0.1)
        # NOTE(review): match_text[0] raises IndexError when nothing clears
        # the cutoff — confirm inputs always produce a match.
        if match_text[0] in duplicated_list:
            # Best match already used: take the first candidate that equals
            # the previous line's choice or has not been used yet.
            for mt in match_text:
                if mt == adjusted[idx-1] or mt not in duplicated_list:
                    adjusted[idx] = mt
                    break
        else:
            adjusted[idx] = match_text[0]
            duplicated_list.append(match_text[0])
    # Map the tag-free choices back to the original (tagged) sentences.
    combine2_tag = [''.join([i,j]) for i,j in zip(gts_in, gts_in[1:])]
    combine3_tag = [''.join([i,j,k]) for i,j,k in zip(gts_in, gts_in[1:], gts_in[2:])]
    alls_tag = gts_in + combine2_tag + combine3_tag
    for idx in range(len(adjusted)):
        match_text = difflib.get_close_matches(adjusted[idx], alls_tag, cutoff=0.1)
        adjusted[idx] = match_text[0]
    return adjusted
  435. def trim_punctuation(s):
  436. pat_block = u'[^\u4e00-\u9fff0-9a-zA-Z]+';
  437. pattern = u'([0-9]+{0}[0-9]+)|{0}'.format(pat_block)
  438. res = re.sub(pattern, lambda x: x.group(1) if x.group(1) else u" " ,s)
  439. return res
  440. def splitter(s):
  441. for sent in re.findall(u'[^!?,。\!\?]+[!? 。\!\?]?', s, flags=re.U):
  442. yield sent
  443. def split_by_pun(s):
  444. res = list(splitter(s))
  445. return res
  446. def generate_subtitle_image_from_dict(name_hash, sub_dict):
  447. for script in sub_dict:
  448. sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
  449. sub = script['content']
  450. txt2image(sub,sv_path)
  451. def generate_subtitle_image(name_hash,text_content):
  452. img_list = [None]*len(text_content)
  453. for idx in range(len(text_content)):
  454. img_list[idx]=[]
  455. senList = split_by_pun(text_content[idx])
  456. for inner_idx in range(len(senList)):
  457. sv_path = dir_subtitle + name_hash +'/'+str(idx)+ str(inner_idx) +'.png'
  458. sub = senList[inner_idx]
  459. txt2image(sub,sv_path)
  460. img_list[idx]+=[{"count":len(sub),"path":sv_path}]
  461. return img_list
  462. def generate_subtitle_image_ENG(name_hash,text_content):
  463. img_list = [None]*len(text_content)
  464. for idx in range(len(text_content)):
  465. sv_path = dir_subtitle + name_hash +'/'+str(idx)+'.png'
  466. sub = text_content[idx]
  467. txt2image(sub, sv_path,lang='eng')
  468. img_list[idx] = sv_path
  469. return img_list
  470. def video_writer_init(path):
  471. w = openshot.FFmpegWriter(path)
  472. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  473. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  474. openshot.Fraction(1, 1), False, False, 3000000)
  475. return w
def video_gen(name_hash,name,text_content, image_urls,multiLang,avatar):
    """Render an anchor video with auto-generated subtitles in two passes.

    Pass 1 builds a timeline (opening logo, speech track 0, ending logo,
    tiled background, title) and writes ``tmp_video/<name_hash>raw.mp4``.
    Subtitles are then generated from that file with ``Ctr_Autosub``, aligned
    to ``text_content[0]`` by ``parse_script`` and rendered to PNGs.
    Pass 2 overlays the subtitle images, the downloaded media and the anchor
    video on the raw video and writes ``tmp_video/<name_hash>.mp4``; the raw
    video and the script file are removed afterwards.

    Args:
        name_hash: job identifier used for all folder and file names.
        name: title text; also used in progress messages.
        text_content: text paragraphs; only index 0 is used for the speech
            track, the anchor clip and subtitle alignment.
        image_urls: media URLs downloaded by ``file_prepare_long``.
        multiLang: forwarded to ``file_prepare_long``.
        avatar: forwarded to ``call_anchor``.
    """
    file_prepare_long(name, name_hash, text_content,image_urls,multiLang)
    # One anchor video is requested per paragraph.
    for fname in range(len(text_content)):
        call_anchor(name_hash+"/"+str(fname),avatar)
    print('called............................................')
    # Chroma-key effects for the background footage and the anchor video.
    ck=cKey(0,254,0,270)
    ck_anchor=cKey(0,255,1,320)
    t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
    t.Open()
    # main_timer tracks the running end position (seconds) of the timeline.
    main_timer = 0
    LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
    LOGO_OP.Open() # Open the reader
    head_duration = LOGO_OP.info.duration
    LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=head_duration
            ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
    t.AddClip(LOGO_OP_clip)
    bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
    bg_head.Open()
    bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
    t.AddClip(bg_head_clip)
    main_timer += head_duration
    bg_head.Close()
    LOGO_OP.Close()
    # The anchor reader is only used here for its duration; the anchor clip
    # itself is added in the second pass.
    anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
    anchor.Open()
    #anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
    # location_x=0.35,location_y=0.25,position=main_timer, end=anchor.info.duration,ck=ck_anchor,audio=False)
    #t.AddClip(anchor_clip)
    speech = openshot.FFmpegReader(dir_sound+name_hash+"/0.mp3")
    speech.Open()
    speech_clip = openshot.Clip(speech)
    speech_clip.Position(main_timer)
    speech_clip.End(anchor.info.duration)
    t.AddClip(speech_clip)
    main_timer += anchor.info.duration
    anchor.Close()
    speech.Close()
    LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
    LOGO_ED.Open()
    LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration
            ,location_x=0.005,location_y=-0.031, scale_x=0.8,scale_y=0.6825)
    t.AddClip(LOGO_ED_clip)
    main_timer += LOGO_ED.info.duration
    LOGO_ED.Close()
    # Tile the background: bg_times full copies plus one partial copy of
    # length left_time, starting right after the opening.
    bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
    bg.Open()
    bg_times = math.floor(main_timer/bg.info.duration)
    left_time = (main_timer) % bg.info.duration
    bg_clip_list = [None] * bg_times
    bg_list = [None] * bg_times
    bg.Close()
    bg_timer = head_duration
    for idx in range(bg_times):
        bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
        bg_list[idx].Open()
        bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer,end=bg_list[idx].info.duration,ck=ck)
        t.AddClip(bg_clip_list[idx])
        bg_timer += bg_list[idx].info.duration
        bg_list[idx].Close()
    bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
    bg_left.Open()
    bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
    t.AddClip(bg_left_clip)
    bg_left.Close()
    title = openshot.QtImageReader(dir_title+name_hash+".png")
    title.Open() # Open the reader
    title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
    t.AddClip(title_clip)
    # Render pass 1 frame by frame.
    w = video_writer_init(tmp_video_dir+name_hash+"raw.mp4")
    w.Open()
    frames = int(t.info.fps)*int(main_timer)
    for n in range(frames):
        f=t.GetFrame(n)
        w.WriteFrame(f)
    t.Close()
    w.Close()
    print(name+"RAW DONE : www.choozmo.com:8168/"+tmp_video_dir+name_hash+"raw.mp4")
    #start adding sub
    #add sub
    Ctr_Autosub.init()
    Ctr_Autosub.generate_subtitles(tmp_video_dir+name_hash+"raw.mp4",'zh',listener_progress,output=tmp_video_dir+name_hash+"script.txt",concurrency=DEFAULT_CONCURRENCY,subtitle_file_format=DEFAULT_SUBTITLE_FORMAT)
    # Align the recognised subtitles with the first paragraph's sentences.
    sub_dict = parse_script(tmp_video_dir+name_hash+"script.txt",split_by_pun(text_content[0]))
    for subd in sub_dict:
        print(subd)
    generate_subtitle_image_from_dict(name_hash, sub_dict)
    #sv_path = dir_subtitle + name_hash + '/' + str(script['index'])+'.png'
    # Pass 2: a fresh timeline with the raw video as the base layer.
    t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
    t.Open()
    raw = openshot.FFmpegReader(tmp_video_dir+name_hash+"raw.mp4")
    raw.Open()
    raw_clip = video_photo_clip(vid=raw,layer=2,position=0, end=raw.info.duration)
    t.AddClip(raw_clip)
    sub_img_list = [None] * len(sub_dict)
    sub_clip_list = [None] * len(sub_dict)
    for sub_obj in sub_dict:
        idx = int(sub_obj['index'])
        sub_img_list[idx] = openshot.QtImageReader(dir_subtitle + name_hash + '/' + str(idx)+'.png')
        sub_img_list[idx].Open()
        sub_clip_list[idx] = video_photo_clip(vid=sub_img_list[idx], layer=6,location_x=0.069, location_y=0.89,position=sub_obj['start'],end=math.ceil(sub_obj['duration']))
        t.AddClip(sub_clip_list[idx])
        sub_img_list[idx].Close()
    tp = parser()
    img_dict_ls = tp.image_clip_info(sub_dict)
    #if 'image_idx' in dic:
    # new_dic['image_obj'] = {'start':dic['start'],'idx':dic['image_idx']}
    img_clip_list = [None]*len(text_content)
    img_list = [None]*len(text_content)
    # NOTE(review): idx is not updated in this loop (it keeps the last value
    # from the subtitle loop above), and int(p) is applied to a directory
    # entry although file_prepare_long saves "<n>.jpg" / "<n>.mp4" — verify.
    for p in listdir(dir_photo+name_hash):
        img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
        img_list[idx].Open()
        img_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
                ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=img_dict_ls[int(p)+1]['start'],end=img_dict_ls[int(p)+1]['duration'],audio=False)
        t.AddClip(img_clip_list[idx])
        img_list[idx].Close()
    anchor = openshot.FFmpegReader(dir_anchor+name_hash+"/0.mp4")
    anchor.Open()
    anchor_clip = video_photo_clip(vid=anchor,layer=4,scale_x=0.65,scale_y=0.65,
            location_x=0.35,location_y=0.25,position=head_duration, end=anchor.info.duration,ck=ck_anchor,audio=False)
    t.AddClip(anchor_clip)
    # Render pass 2 and remove the intermediate files.
    w = video_writer_init(tmp_video_dir+name_hash+".mp4")
    w.Open()
    frames = int(t.info.fps)*int(main_timer)
    for n in range(frames):
        f=t.GetFrame(n)
        w.WriteFrame(f)
    t.Close()
    w.Close()
    os.remove(tmp_video_dir+name_hash+"raw.mp4")
    os.remove(tmp_video_dir+name_hash+"script.txt")
    print(name+"ALL DONE : www.choozmo.com:8168/"+video_sub_folder+name_hash+"raw.mp4")
  606. def anchor_video_v2(name_hash,name,text_content, image_urls,multiLang,avatar):
  607. print(os.getcwd())
  608. print('sub image made')
  609. print(multiLang)
  610. file_prepare(name, name_hash, text_content,image_urls,multiLang)
  611. sub_list=generate_subtitle_image(name_hash,text_content)
  612. for fname in range(len(text_content)):
  613. call_anchor(name_hash+"/"+str(fname),avatar)
  614. print('step finish')
  615. print('called............................................')
  616. ck=cKey(0,254,0,270)
  617. ck_anchor=cKey(0,255,1,320)
  618. duration = 0
  619. #average layer level is 3
  620. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  621. t.Open()
  622. main_timer = 0
  623. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  624. LOGO_OP.Open() # Open the reader
  625. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=LOGO_OP.info.duration
  626. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  627. t.AddClip(LOGO_OP_clip)
  628. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  629. bg_head.Open()
  630. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  631. t.AddClip(bg_head_clip)
  632. main_timer += LOGO_OP.info.duration
  633. head_duration = LOGO_OP.info.duration
  634. bg_head.Close()
  635. LOGO_OP.Close()
  636. clip_duration=0
  637. photo_clip_list = [None]*len(text_content)
  638. img_list = [None]*len(text_content)
  639. anchor_clip_list = [None] * len(text_content)
  640. anchor_list = [None] * len(text_content)
  641. audio_clip_list = [None] * len(text_content)
  642. audio_list = [None] * len(text_content)
  643. sub_clip_list = [None] * len(text_content)
  644. sub_img_list = [None] * len(text_content)
  645. idx = 0
  646. for p in listdir(dir_photo+name_hash):
  647. anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
  648. clip_duration = anchor_list[idx].info.duration
  649. anchor_list[idx].Open()
  650. anchor_clip_list[idx] = video_photo_clip(vid=anchor_list[idx],layer=4,scale_x=0.65,scale_y=0.65,
  651. location_x=0.35,location_y=0.25,position=main_timer, end=clip_duration,ck=ck_anchor,audio=False)
  652. t.AddClip(anchor_clip_list[idx])
  653. img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
  654. img_list[idx].Open()
  655. photo_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
  656. ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=main_timer,end=clip_duration,audio=False)
  657. t.AddClip(photo_clip_list[idx])
  658. img_list[idx].Close()
  659. audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
  660. audio_list[idx].Open()
  661. audio_clip_list[idx] = openshot.Clip(audio_list[idx])
  662. audio_clip_list[idx].Position(main_timer)
  663. audio_clip_list[idx].End(clip_duration)
  664. t.AddClip(audio_clip_list[idx])
  665. img_list[idx].Close()
  666. anchor_list[idx].Close()
  667. audio_list[idx].Close()
  668. sub_img_list[idx] = [None] * len(sub_list[idx])
  669. sub_clip_list[idx] = [None] * len(sub_list[idx])
  670. sub_timer = 0
  671. for sub_idx in range(len(sub_list[idx])):
  672. sub_img_list[idx][sub_idx] = openshot.QtImageReader(sub_list[idx][sub_idx]['path'])
  673. sub_img_list[idx][sub_idx].Open()
  674. sub_duration = 0.205*sub_list[idx][sub_idx]['count']
  675. sub_clip_list[idx][sub_idx] = video_photo_clip(vid=sub_img_list[idx][sub_idx], layer=6,location_x=0.069, location_y=0.89,position=main_timer+sub_timer,end=sub_duration)
  676. t.AddClip(sub_clip_list[idx][sub_idx])
  677. sub_img_list[idx][sub_idx].Close()
  678. sub_timer += sub_duration
  679. print(sub_list[idx][sub_idx]['path'])
  680. main_timer += clip_duration
  681. idx+=1
  682. LOGO_ED = openshot.FFmpegReader(dir_video+"LOGO_ED.avi")
  683. LOGO_ED.Open()
  684. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration+2
  685. ,location_x=0.005,location_y=-0.031
  686. ,scale_x=0.8,scale_y=0.6825)
  687. t.AddClip(LOGO_ED_clip)
  688. ED_duration = LOGO_ED.info.duration
  689. LOGO_ED.Close()
  690. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  691. bg.Open()
  692. bg_times = math.floor(main_timer+ED_duration/bg.info.duration)
  693. left_time = (main_timer+ED_duration) % bg.info.duration
  694. bg_clip_list = [None] * bg_times
  695. bg_list = [None] * bg_times
  696. bg.Close()
  697. bg_timer = head_duration
  698. for idx in range(bg_times):
  699. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  700. bg_list[idx].Open()
  701. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer
  702. ,end=bg_list[idx].info.duration,ck=ck)
  703. t.AddClip(bg_clip_list[idx])
  704. bg_timer += bg_list[idx].info.duration
  705. bg_list[idx].Close()
  706. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  707. bg_left.Open()
  708. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  709. t.AddClip(bg_left_clip)
  710. bg_left.Close()
  711. title = openshot.QtImageReader(dir_title+name_hash+".png")
  712. title.Open() # Open the reader
  713. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  714. t.AddClip(title_clip)
  715. ####start building
  716. w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
  717. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  718. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  719. openshot.Fraction(1, 1), False, False, 3000000)
  720. w.Open()
  721. #may change duration into t.info.duration
  722. frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
  723. for n in range(frames):
  724. f=t.GetFrame(n)
  725. w.WriteFrame(f)
  726. #notify_group(name+"的影片已經產生完成囉! www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  727. t.Close()
  728. w.Close()
  729. print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  730. def anchor_video_eng(name_hash,name,text_content, image_urls,sub_titles,avatar):
  731. file_prepare(name, name_hash, text_content,image_urls,'eng')
  732. sub_list=generate_subtitle_image_ENG(name_hash,sub_titles)
  733. for fname in range(len(text_content)):
  734. call_anchor(name_hash+"/"+str(fname),avatar)
  735. print('step finish')
  736. print('called............................................')
  737. ck=cKey(0,254,0,270)
  738. ck_anchor=cKey(0,255,1,320)
  739. duration = 0
  740. #average layer level is 3
  741. t = openshot.Timeline(1280, 720, openshot.Fraction(30000, 1000), 44100, 2, openshot.LAYOUT_STEREO)
  742. t.Open()
  743. main_timer = 0
  744. #add logo
  745. LOGO_OP = openshot.FFmpegReader(dir_video+"LOGO_OP_4.mp4")
  746. LOGO_OP.Open() # Open the reader
  747. LOGO_OP_clip = video_photo_clip(vid=LOGO_OP,layer=4,position=0,end=LOGO_OP.info.duration
  748. ,location_y=-0.03,scale_x=0.8,scale_y=0.704)
  749. t.AddClip(LOGO_OP_clip)
  750. #add background video (head is different)
  751. bg_head = openshot.FFmpegReader(dir_video+"complete_head_aispokesgirl.mp4")
  752. bg_head.Open()
  753. bg_head_clip = video_photo_clip(vid=bg_head,layer=2,position=0,end=LOGO_OP.info.duration,ck=ck)
  754. t.AddClip(bg_head_clip)
  755. main_timer += LOGO_OP.info.duration
  756. head_duration = LOGO_OP.info.duration
  757. bg_head.Close()
  758. LOGO_OP.Close()
  759. #prepare empty list
  760. clip_duration=0
  761. photo_clip_list = [None]*len(text_content)
  762. img_list = [None]*len(text_content)
  763. anchor_clip_list = [None] * len(text_content)
  764. anchor_list = [None] * len(text_content)
  765. audio_clip_list = [None] * len(text_content)
  766. audio_list = [None] * len(text_content)
  767. sub_clip_list = [None] * len(text_content)
  768. #openshot image holder
  769. sub_img_list = [None] * len(text_content)
  770. idx = 0
  771. for p in listdir(dir_photo+name_hash):
  772. anchor_list[idx] = openshot.FFmpegReader(dir_anchor+name_hash+"/"+str(idx)+".mp4")
  773. clip_duration = anchor_list[idx].info.duration
  774. anchor_list[idx].Open()
  775. anchor_clip_list[idx] = video_photo_clip(vid=anchor_list[idx],layer=4,scale_x=0.65,scale_y=0.65,
  776. location_x=0.35,location_y=0.25,position=main_timer, end=clip_duration,ck=ck_anchor,audio=False)
  777. t.AddClip(anchor_clip_list[idx])
  778. #insert image
  779. img_list[idx] = openshot.FFmpegReader(dir_photo+name_hash+'/'+p)
  780. img_list[idx].Open()
  781. photo_clip_list[idx] = video_photo_clip(vid=img_list[idx],layer=3
  782. ,scale_x=0.81,scale_y=0.68,location_y=-0.03,position=main_timer,end=clip_duration,audio=False)
  783. t.AddClip(photo_clip_list[idx])
  784. img_list[idx].Close()
  785. #insert audio (speech)
  786. audio_list[idx] = openshot.FFmpegReader(dir_sound+name_hash+"/"+str(idx)+".mp3")
  787. audio_list[idx].Open()
  788. audio_clip_list[idx] = openshot.Clip(audio_list[idx])
  789. audio_clip_list[idx].Position(main_timer)
  790. audio_clip_list[idx].End(clip_duration)
  791. t.AddClip(audio_clip_list[idx])
  792. #insert subtitle
  793. sub_img_list[idx] = openshot.QtImageReader(sub_list[idx])
  794. sub_img_list[idx].Open()
  795. sub_clip_list[idx] = video_photo_clip(vid=sub_img_list[idx], layer=6,location_x=0.069, location_y=0.89,position=main_timer,end=clip_duration)
  796. t.AddClip(sub_clip_list[idx])
  797. img_list[idx].Close()
  798. anchor_list[idx].Close()
  799. audio_list[idx].Close()
  800. sub_img_list[idx].Close()
  801. main_timer += clip_duration
  802. idx+=1
  803. LOGO_ED = openshot.FFmpegReader(dir_video+"ED_ENG.mp4")
  804. LOGO_ED.Open()
  805. LOGO_ED_clip = video_photo_clip(vid=LOGO_ED,layer=4,position=main_timer,end=LOGO_ED.info.duration+2
  806. ,location_x=0.005,location_y=-0.031
  807. ,scale_x=0.8,scale_y=0.6825)
  808. t.AddClip(LOGO_ED_clip)
  809. ED_duration = LOGO_ED.info.duration
  810. LOGO_ED.Close()
  811. bg = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  812. bg.Open()
  813. bg_times = math.floor(main_timer+ED_duration/bg.info.duration)
  814. left_time = (main_timer+ED_duration) % bg.info.duration
  815. bg_clip_list = [None] * bg_times
  816. bg_list = [None] * bg_times
  817. bg.Close()
  818. bg_timer = head_duration
  819. for idx in range(bg_times):
  820. bg_list[idx] = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  821. bg_list[idx].Open()
  822. bg_clip_list[idx] = video_photo_clip(bg_list[idx],layer=2,position=bg_timer
  823. ,end=bg_list[idx].info.duration,ck=ck)
  824. t.AddClip(bg_clip_list[idx])
  825. bg_timer += bg_list[idx].info.duration
  826. bg_list[idx].Close()
  827. bg_left = openshot.FFmpegReader(dir_video+"complete_double_aispokesgirl.mp4")
  828. bg_left.Open()
  829. bg_left_clip = video_photo_clip(bg_left,layer=2,position=bg_timer,end=left_time,ck=ck)
  830. t.AddClip(bg_left_clip)
  831. bg_left.Close()
  832. title = openshot.QtImageReader(dir_title+name_hash+".png")
  833. title.Open() # Open the reader
  834. title_clip = video_photo_clip(vid=title, layer=4,location_x=-0.047, location_y=0.801,position=0,end=head_duration+main_timer)
  835. t.AddClip(title_clip)
  836. ####start building
  837. w = openshot.FFmpegWriter(tmp_video_dir+name_hash+".mp4")
  838. w.SetAudioOptions(True, "aac", 44100, 2, openshot.LAYOUT_STEREO, 3000000)
  839. w.SetVideoOptions(True, "libx264", openshot.Fraction(30000, 1000), 1280, 720,
  840. openshot.Fraction(1, 1), False, False, 3000000)
  841. w.Open()
  842. #may change duration into t.info.duration
  843. frames = int(t.info.fps)*int(head_duration+main_timer+ED_duration)
  844. for n in range(frames):
  845. f=t.GetFrame(n)
  846. w.WriteFrame(f)
  847. #notify_group(name+"(ENG)的影片已經產生完成囉! www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  848. t.Close()
  849. w.Close()
  850. print("video at : www.choozmo.com:8168/"+video_sub_folder+name_hash+".mp4")
  851. #line notifs
  852. import pyttsx3
  853. def make_speech(text):
  854. engine = pyttsx3.init()
  855. #voices = engine.getProperty('voices')
  856. engine.setProperty('voice', 'Mandarin')
  857. engine.save_to_file(text, '/app/speech.mp3')
  858. engine.runAndWait()
  859. class video_service(rpyc.Service):
  860. def exposed_call_video(self,name_hash,name,text_content, image_urls,multiLang,avatar):
  861. print('ML:'+str(multiLang))
  862. anchor_video_v2(name_hash,name,text_content, image_urls,multiLang,avatar)
  863. def exposed_call_video_eng(self,name_hash,name,text_content, image_urls,sub_titles,avatar):
  864. anchor_video_eng(name_hash,name,text_content, image_urls,sub_titles,avatar)
  865. def exposed_call_video_gen(self,name_hash,name,text_content, image_urls,multiLang,avatar):
  866. print('ML:'+str(multiLang))#this is long video version,
  867. video_gen(name_hash,name,text_content, image_urls,multiLang,avatar)
  868. def exposed_make_speech(self,text):
  869. make_speech(text)
  870. from rpyc.utils.server import ThreadedServer
  871. t = ThreadedServer(video_service, port=8858)
  872. print('service started')
  873. t.start()