解决视频库 加载问题
import imageio
imageio.plugins.ffmpeg.download()
1 2 3 4 5 | Imageio: 'ffmpeg.win32.exe' was not found on your computer; downloading it now. Try 1. Download from https: / / github.com / imageio / imageio - binaries / raw / master / ffmpeg / ffmpeg.win32.exe ( 27.4 MB) Downloading: 8192 / 28781056 bytes ( 0.0 % ) 24576 / 28781056 bytes ( 0.1 % ) 32768 / 28781056 bytes ( 0.1 % ) |
目的是拿到播放时间长
1 2 3 4 5 6 7 | import imageio imageio.plugins.ffmpeg.download() from moviepy.editor import VideoFileClip f = 'g3dbliukeyuanCAKE_whole_parag3uidliukeyuanCAKE_whole_para1523498532saveVideo.b.avi' clip = VideoFileClip(f) print ( clip.duration ) # seconds |
1 2 3 4 5 6 7 | f = 'g3dbCAKEg3uidnoBRBlankLine.08.mp3' import mutagen.id3 from mutagen.easyid3 import EasyID3 from mutagen.mp3 import MP3 EasyID3.valid_keys[ "comment" ] = "COMM::'XXX'" id3info = MP3(f, ID3 = EasyID3) |
视频 音频 文件信息
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 | # 设置分句的标志符号;可以根据实际需要进行修改 # cutlist = "。!?".decode('utf-8') cutlist = [ '\n' , '\t' , '。' , ';' , '?' , '.' , ';' , '?' , '...' , '、、、' , ':' ] # cutlist = [ '。', ';', '?', '.', ';', '?', '...', '、、、',':',':',','] # cutlist = [ '。', ';', '?', '.', ';', '?', '...', '、、、',':',',','、'] # 检查某字符是否分句标志符号的函数;如果是,返回True,否则返回False def FindToken(cutlist, char): if char in cutlist: return True else : return False # 进行分句的核心函数 def Cut(cutlist, lines): # 参数1:引用分句标志符;参数2:被分句的文本,为一行中文字符 l = [] # 句子列表,用于存储单个分句成功后的整句内容,为函数的返回值 line = [] # 临时列表,用于存储捕获到分句标志符之前的每个字符,一旦发现分句符号后,就会将其内容全部赋给l,然后就会被清空 for i in lines: # 对函数参数2中的每一字符逐个进行检查 (本函数中,如果将if和else对换一下位置,会更好懂) if FindToken(cutlist, i): # 如果当前字符是分句符号 line.append(i) # 将此字符放入临时列表中 l.append(''.join(line)) # 并把当前临时列表的内容加入到句子列表中 line = [] # 将符号列表清空,以便下次分句使用 else : # 如果当前字符不是分句符号,则将该字符直接放入临时列表中 line.append(i) return l r_s = [] # 以下为调用上述函数实现从文本文件中读取内容并进行分句。 # with open('mybaidu.parp.b.txt','r',encoding='utf-8') as fr : # for lines in fr: # l = Cut(list(cutlist), list(lines)) # for line in l: # if len(line.replace(' ', '')) == 0: # continue # if line.strip() != "": # line=line.strip() # r_s.append(line) # # # li = line.strip().split() # # for sentence in li: # # r_s.append(sentence) str_ = '' # cutlist = [ '。', ';', '?', '.', ';', '?', '...', '、、、',':',':',',','\n'] with open ( 'mybaidu.parp.b.txt' , 'r' , encoding = 'utf-8' ) as fr: for lines in fr: if len (lines.replace( ' ' , '')) = = 0 : continue # str_='{}{}'.format(str_,lines.replace('\n','')) # if len(lines.replace(' ','').replace('\n',''))==0: # continue str_ = '{}{}' . format (str_, lines) # l = Cut(list(cutlist), list(lines)) # for line in l: # if line.strip() != "": # line=line.strip() from aip import AipSpeech bd_k_l = [ '11059852' , '5Kk01GtG2fjCwpzEkwdn0mjw' , 'bp6Wyx377Elq7RsCQZzTBgGUFzLm8G2A' ] APP_ID, API_KEY, SECRET_KEY = bd_k_l mp3_dir = 'C:\\Users\\sas\\PycharmProjects\\produce_video\\result_liukeyun\\' client = AipSpeech(APP_ID, API_KEY, SECRET_KEY) # result = client.synthesis(str_, 'zh', 1, { # 'vol': 5, # }) uid = 'liukeyuanCAKE_whole_para' # 识别正确返回语音二进制 错误则返回dict 参照下面错误码 f_w = '{}{}{}{}{}' . format (mp3_dir, 'g3db' , uid, 'g3uid' , '.mp3' ) # # if not isinstance(result, dict): # # f_w = '{}{}{}{}'.format(mp3_dir, 'g3uid', uid, '.mp3') # f_w = '{}{}{}{}{}'.format(mp3_dir, 'g3db', uid, 'g3uid', '.mp3') # # ,'g3db',uid,'g3uid' # # with open('auido.b.mp3', 'wb') as f: # with open(f_w, 'wb') as f: # f.write(result) sentence_l, sentence_l_chk = Cut( list (cutlist), list (str_)), [] for i in sentence_l: chk_br = i.replace( '\n' , '') # del sentence_l[sentence_l.index(i)] if len (chk_br) > 0 : sentence_l_chk.append(chk_br) sentence_l_chk = [i.replace( ' ' , '') for i in sentence_l_chk] import os import os, time, glob import cv2 os_sep = os.sep this_file_abspath = os.path.abspath(__file__) this_file_dirname, this_file_name = os.path.dirname(this_file_abspath), os.path.abspath(__file__).split(os_sep)[ - 1 ] f_img_d = '{}{}{}{}{}' . format (this_file_dirname, os_sep, 'mypng' , os_sep, '*.jpg' ) imgs, img_size_d = glob.glob(f_img_d), {} for i in imgs: img = cv2.imread(i) w_h_s = '{},{}' . format (img.shape[ 1 ], img.shape[ 0 ]) if w_h_s not in img_size_d: img_size_d[w_h_s] = 1 else : img_size_d[w_h_s] + = 1 mode_img_size_wh = [ int (i) for i in sorted (img_size_d.items(), key = lambda mytuple: mytuple[ 1 ], reverse = True )[ 0 ][ 0 ].split( ',' )] import os os_sep = os.sep this_file_abspath = os.path.abspath(__file__) this_file_dirname, this_file_name = os.path.dirname(this_file_abspath), os.path.abspath(__file__).split(os_sep)[ - 1 ] f_mp3 = '{}{}{}' . format (this_file_dirname, os_sep, 'auido.mp3' ) from playsound import playsound import time import math this_time = time.time() f_mp3 = f_w # # playsound(f_mp3) # # # t_spend = time.time() - this_time # # t_spend = 58.777058839797974 # # 音频的秒数 # # t_spend = 115.18474054336548 # # t_spend = 420.18474054336548 # # t_spend = 337.18474054336548 # t_spend = 362.5 # t_spend = 335.5 # #937 # t_spend = 577 # t_spend = math.ceil(t_spend) f_mp3 = 'g3dbCAKEg3uidnoBRBlankLine.08.mp3' import mutagen.id3 from mutagen.easyid3 import EasyID3 from mutagen.mp3 import MP3 EasyID3.valid_keys[ "comment" ] = "COMM::'XXX'" id3info = MP3(f_mp3, ID3 = EasyID3) t_spend = id3info.info.length import cv2 import glob ''' python+opencv视频图像相互转换 - CSDN博客 https://blog.csdn.net/m0_37733057/article/details/79023693 链接:https://www.zhihu.com/question/49558804/answer/343058915 OpenCV: Drawing Functions in OpenCV https://docs.opencv.org/3.1.0/dc/da5/tutorial_py_drawing_functions.html ''' # 每秒传输帧数(Frames Per Second) fps = 100 # 保存视频的FPS,可以适当调整 FPS是图像领域中的定义,是指画面每秒传输帧数,通俗来讲就是指动画或视频的画面数。FPS是测量用于保存、显示动态视频的信息数量。每秒钟帧数愈多,所显示的动作就会愈流畅。通常,要避免动作不流畅的最低是30。某些计算机视频格式,每秒只能提供15帧。 f_img_d = '{}{}{}{}{}' . format (this_file_dirname, os_sep, 'mypng' , os_sep, '*.jpg' ) imgs = glob.glob(f_img_d) """ 用图片总数均分音频时间 """ f, l = 'mybaidu.parp.b.txt' , [] with open (f, 'r' , encoding = 'utf-8' ) as fr: for i in fr: ii = i.replace( '\n' , '') l.append(ii) char_loop_l = [] for i in l: mystr, le = '', len (i) for ii in range (le): iii = i[ii] # print('-----', iii) mystr = '{}{}' . format (mystr, iii) # print(mystr) char_loop_l.append(iii) # # from fontTools.ttLib import TTFont # myfont = TTFont('simhei.ttf') def resize_rescale_pilimg(img_f, w_h_tuple = (mode_img_size_wh[ 0 ], mode_img_size_wh[ 1 ]), mid_factor = 1 ): # print(img_f) img_n, img_type = img_f.split( '.' )[ - 2 ], img_f.split( '.' )[ - 1 ] # print(img_n) img_n_resize_rescale_pilimg_dir = '{}{}{}' . format (os_sep.join(img_n.split(os_sep)[: - 1 ]), 'resize_rescale_pilimg' , os_sep, img_n.split(os_sep)[ - 1 ], os_sep) img_n_resize_rescale_pilimg = '{}{}{}' . format (img_n_resize_rescale_pilimg_dir, img_n.split(os_sep)[ - 1 ], '.PNG' ) # print(img_n_resize_rescale_pilimg) img_type = 'PNG' # img_f_new = '{}{}{}{}'.format(img_n, int(time.time()), 'resize_rescale.', img_type) img_f_new = img_n_resize_rescale_pilimg mid_icon = Image. open (img_f) mid_icon_w, mid_icon_h = w_h_tuple[ 0 ] * mid_factor, w_h_tuple[ 1 ] * mid_factor mid_icon = mid_icon.resize((mid_icon_w, mid_icon_h), Image.ANTIALIAS) mid_icon.save(img_n_resize_rescale_pilimg, img_type) return img_f_new def compute_video_playtime(f): # Create a VideoCapture object and read from input file # If the input is the camera, pass 0 instead of the video file name cap = cv2.VideoCapture(f) # Check if camera opened successfully if (cap.isOpened() = = False ): print ( "Error opening video stream or file" ) # Read until video is completed while (cap.isOpened()): # Capture frame-by-frame ret, frame = cap.read() if ret = = True : # Display the resulting frame cv2.imshow( 'Frame' , frame) # Press Q on keyboard to exit if cv2.waitKey( 25 ) & 0xFF = = ord ( 'q' ): break # Break the loop else : break # When everything done, release the video capture object cap.release() # Closes all the frames cv2.destroyAllWindows() return time.time() - this_time from PIL import Image, ImageDraw, ImageFont # myfont = ImageFont.truetype("simhei.ttf", 50, encoding="utf-8") myfont = ImageFont.truetype( "simhei.ttf" , encoding = "utf-8" ) import cv2 import numpy as np l = sentence_l_chk char_loop_l = sentence_l_chk # 2个空格有别于1个空格 # char_loop_l_len = len(''.join(sentence_l_chk).replace(' ', '')) + 2*len(char_loop_l) # char_loop_l_len = 3*len(char_loop_l) char_loop_l_len = len (char_loop_l) char_loop_l_len = len (''.join(sentence_l_chk)) char_loop_l_len = len (' '.join(sentence_l_chk).replace(' ', ' ')) # char_loop_l_len=len(char_loop_l) ''' ''' # l=sentence_l_chk # char_loop_l=sentence_l_chk # #2个空格有别于1个空格 # char_loop_l_len=len(char_loop_l) # # import imageio imageio.plugins.ffmpeg.download() from moviepy.editor import VideoFileClip # f='g3dbliukeyuanCAKE_whole_parag3uidliukeyuanCAKE_whole_para1523498532saveVideo.b.avi' # # clip = VideoFileClip(f) def gen_video(os_delay_factor = 0.245 , mystep = 0.01 , bear_error_second = 1 , audio_spend = t_spend, step_para = 1 ): f_v = '{}{}' . format ( int (time.time()), 'saveVideo.b.avi' ) f_v = '{}{}{}{}{}{}{}' . format ( 'D:\\myv\\', ' g3db ', uid, ' g3uid ', uid, int(time.time()), ' saveVideo.b.avi') fps, fourcc = 15 , cv2.VideoWriter_fourcc( 'M' , 'J' , 'P' , 'G' ) # fourcc = cv2.VideoWriter_fourcc('M', 'J', 'P', 'G') # opencv3.0 videoWriter = cv2.VideoWriter(f_v, fourcc, fps, (mode_img_size_wh[ 0 ], mode_img_size_wh[ 1 ])) # f_v = '{}{}'.format(int(time.time()), 'saveVideo.b.avi') for i in l: myinterval = t_spend / (char_loop_l_len * 1 ) * os_delay_factor i_index = l.index(i) img_index = i_index % len (imgs) imgname = imgs[img_index] mystr = '' le = len (i) br_step = 34 br_times = math.ceil(le / br_step) l_tmp = [] for i_br_loop in range (br_times): i_br = i[i_br_loop * br_step:i_br_loop * br_step + br_step] l_tmp.append(i_br) mystr = '\n' .join(l_tmp) print (mystr) this_time = time.time() ''' !!!!!!!!!!!!!!!! ''' # myinterval*=le myinterval * = len (mystr.replace( ' ' , ' ').replace(' \n ', ' ')) while time.time() - this_time < myinterval: frame = cv2.imread(imgname) del_f = False if (frame.shape[ 1 ], frame.shape[ 0 ]) ! = (mode_img_size_wh[ 0 ], mode_img_size_wh[ 1 ]): imgname = resize_rescale_pilimg(imgname) frame = cv2.imread(imgname) del_f = True else : pass frame_cv2 = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB) frame_pil = Image.fromarray(frame_cv2) # 转为PIL的图片格式 # font = ImageFont.truetype("simhei.ttf", 50, encoding="utf-8") font = ImageFont.truetype( "simhei.ttf" , encoding = "utf-8" ) ImageDraw.Draw(frame_pil).text(( 100 , 20 ), mystr, ( 0 , 0 , 255 ), font) frame_cv2 = cv2.cvtColor(np.array(frame_pil), cv2.COLOR_RGB2BGR) img = frame_cv2 videoWriter.write(img) # 换图 延迟 # videoWriter.write(img) # if del_f: # if os.path.exists(imgname): # print(imgname) # print('del') # # 删除文件,可使用以下两种方法。 # os.remove(imgname) # # os.unlink(my_file) # else: # pass videoWriter.release() time.sleep( 1 ) # video_playtime = compute_video_playtime(f_v) # f = 'g3dbliukeyuanCAKE_whole_parag3uidliukeyuanCAKE_whole_para1523498532saveVideo.b.avi' video_playtime = VideoFileClip(f_v).duration if video_playtime - audio_spend > bear_error_second: # os_delay_factor -= mystep os_delay_factor * = t_spend / video_playtime gen_video(os_delay_factor = os_delay_factor, mystep = 0.005 , audio_spend = t_spend) elif audio_spend - video_playtime > bear_error_second: # os_delay_factor += mystep os_delay_factor * = t_spend / video_playtime gen_video(os_delay_factor = os_delay_factor, mystep = 0.005 , audio_spend = t_spend) else : os._exit( 123 ) mycom = 0.19928228783504076 * 577 / 615 # gen_video(os_delay_factor=1, mystep=0.003, bear_error_second=0.5, audio_spend=t_spend) mycom = 577 / 1030 * 0.3 mycom = 577 / 1025 * 0.17858123692538752 mycom = 577 / 328 * 0.10052816946921814 gen_video(os_delay_factor = mycom, mystep = 0.003 , bear_error_second = 0.5 , audio_spend = t_spend) |
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· AI与.NET技术实操系列:向量存储与相似性搜索在 .NET 中的实现
· 基于Microsoft.Extensions.AI核心库实现RAG应用
· Linux系列:如何用heaptrack跟踪.NET程序的非托管内存泄露
· 开发者必知的日志记录最佳实践
· SQL Server 2025 AI相关能力初探
· winform 绘制太阳,地球,月球 运作规律
· 震惊!C++程序真的从main开始吗?99%的程序员都答错了
· 【硬核科普】Trae如何「偷看」你的代码?零基础破解AI编程运行原理
· 超详细:普通电脑也行Windows部署deepseek R1训练数据并当服务器共享给他人
· 上周热点回顾(3.3-3.9)
2017-04-12 WikiMedia system architecture
2017-04-12 沙箱机制
2017-04-12 Open System Interconnection
2017-04-12 丢包 ICMP