# File size: 5,825 Bytes
# 37efd00
import os
import re
import sentencepiece
from pytube import YouTube
from youtube_transcript_api import YouTubeTranscriptApi
from transformers import MarianMTModel, MarianTokenizer
import torch
from TTS.api import TTS
from moviepy.editor import VideoFileClip
from pydub import AudioSegment
import subprocess
from moviepy.editor import *
def tov(input, output, text):
    """Overlay ``text`` on a video and write the result to ``output``.

    The text is rendered in white at font size 24, centred, and shown for
    the full duration of the source video.

    Args:
        input: Path of the source video file. (The name shadows the builtin
            ``input``; it is kept so existing keyword callers still work.)
        output: Path of the video file to write.
        text: Text to draw on top of the video.
    """
    video = VideoFileClip(input)
    try:
        txt_clip = (
            TextClip(text, fontsize=24, color='white')
            .set_position('center')
            .set_duration(video.duration)
        )
        result = CompositeVideoClip([video, txt_clip])
        result.write_videofile(output, codec='libx264', audio_codec='aac', remove_temp=True)
    finally:
        # Release the reader held by the source clip even if rendering fails.
        video.close()
def video_audio(video_file_path, new_audio_file_path, output_video_file_path, translated_text,new_video_path):
    """Replace the audio track of a video and write the result to disk.

    Args:
        video_file_path: Path of the source video.
        new_audio_file_path: Path of the audio file to use as the new track.
        output_video_file_path: Path of the video file to write.
        translated_text: Unused here; kept for interface compatibility.
        new_video_path: Unused here; kept for interface compatibility.

    A failure while writing the output is reported on stdout and not raised.
    """
    video = VideoFileClip(video_file_path)
    new_audio = AudioFileClip(new_audio_file_path)
    try:
        # Never cut past the end of the audio: a synthesized track may be
        # shorter than the video it is attached to.
        clip_end = min(video.duration, new_audio.duration)
        trimmed_audio = new_audio.subclip(0, clip_end)
        dubbed_video = video.set_audio(trimmed_audio)
        # NOTE(review): the `try:` matching the `except` below was missing
        # from the source; it is placed around the write because the message
        # talks about writing -- confirm against the original file.
        try:
            dubbed_video.write_videofile(output_video_file_path, codec="libx264", audio_codec="aac", remove_temp=True)
        except Exception as e:
            print("Error writing video file:", e)
    finally:
        # Release the file readers held by the source clips.
        new_audio.close()
        video.close()
def tos(translated_text_file_path, video_path):
    """Synthesize speech for a translated text file and dub it onto a video.

    The whole text file is spoken with the French Tacotron2 model into
    ``CS370-M5/audio/<name>.wav``; that audio is then attached to
    ``video_path`` via ``video_audio`` and written to
    ``CS370-M5/videos/<name>.mp4``, where ``<name>`` is the text file's base
    name without extension.

    Args:
        translated_text_file_path: Path of the UTF-8 text file to speak.
        video_path: Path of the video whose audio track is replaced.

    Returns:
        The path of the dubbed video. ``video_audio`` only prints write
        errors, so the path is returned even if writing failed.
    """
    device = "cuda" if torch.cuda.is_available() else "cpu"
    tts = TTS("tts_models/fr/mai/tacotron2-DDC").to(device)

    output_audio_dir = 'CS370-M5/audio'
    os.makedirs(output_audio_dir, exist_ok=True)
    file_name_only = os.path.splitext(os.path.basename(translated_text_file_path))[0]
    output_file_path = os.path.join(output_audio_dir, f"{file_name_only}.wav")

    with open(translated_text_file_path, 'r', encoding='utf-8') as file:
        # NOTE(review): the right-hand side was missing in the source;
        # reading the whole file is the reconstruction -- confirm.
        translated_text = file.read()

    tts.tts_to_file(text=translated_text, file_path=output_file_path)

    output = f"CS370-M5/videos/{file_name_only}.mp4"
    new_video_path = f"CS370-M5/videos/{file_name_only}_new.mp4"
    # Make sure the target directory exists when this is called on its own.
    os.makedirs(os.path.dirname(output), exist_ok=True)
    video_audio(video_path, output_file_path, output, translated_text, new_video_path)
    return output
def translate(input_text_path, output_text_path, source_lang='en', target_lang='fr', model_name="Helsinki-NLP/opus-mt-en-fr", batch_size=8):
    """Translate a text file line by line with a MarianMT model.

    Args:
        input_text_path: Path of the UTF-8 file to translate, one item per line.
        output_text_path: Path the translated lines are written to.
        source_lang: Prefixed to every line as ``"<source_lang>: "`` before
            tokenization.
        target_lang: Not used by this function; the translation direction is
            determined by ``model_name``.
        model_name: Name of the pretrained Marian model and tokenizer to load.
        batch_size: Number of lines translated per ``generate`` call.

    Returns:
        The translated lines, in input order.
    """
    model = MarianMTModel.from_pretrained(model_name)
    tokenizer = MarianTokenizer.from_pretrained(model_name)

    def translate_batch(sentences):
        # NOTE(review): this prefix is tokenized as ordinary text; confirm the
        # chosen model actually expects a "<lang>: " marker.
        prefixed = [f"{source_lang}: {sentence}" for sentence in sentences]
        encoded = tokenizer(prefixed, return_tensors="pt", padding=True, truncation=True)
        # Pass the attention mask as well so padded positions are ignored.
        translation_ids = model.generate(
            input_ids=encoded["input_ids"],
            attention_mask=encoded["attention_mask"],
        )
        return tokenizer.batch_decode(translation_ids, skip_special_tokens=True)

    with open(input_text_path, 'r', encoding='utf-8') as file:
        input_lines = file.readlines()

    translated_lines = []
    for start in range(0, len(input_lines), batch_size):
        chunk = input_lines[start:start + batch_size]
        # The chunk gets its own name so it cannot rebind the helper, and the
        # results are accumulated instead of being dropped.
        translated_lines.extend(translate_batch(chunk))

    with open(output_text_path, 'w', encoding='utf-8') as file:
        file.writelines(f"{line}\n" for line in translated_lines)
    return translated_lines
def downloading(video_url, target_lang='fr'):
    """Download a YouTube video, caption it, translate it and dub it.

    Steps: extract the video id from the ``v=`` query parameter, download
    the highest-resolution stream into ``CS370-M5/videos``, fetch an
    auto-generated transcript, write it with ``MM:SS`` timestamps to
    ``CS370-M5/captions/<title>_original.txt``, translate that file with
    ``translate`` and produce a dubbed video with ``tos``.

    Args:
        video_url: YouTube URL containing a ``v=<id>`` parameter.
        target_lang: Language code forwarded to ``translate``.

    Returns:
        A 5-tuple ``(original_captions, translated_captions,
        original_filename, translated_text_filename, new_video_path)``.
        All five are ``None`` when the id cannot be found, no transcript is
        available, or any step raises.
    """
    failure = (None, None, None, None, None)
    try:
        # NOTE(review): the `re.search(` call and the `.group(0)` below were
        # lost in the source; this is the reconstruction -- confirm.
        id_match = re.search(r"(?<=v=)[\w-]+", video_url)
        if not id_match:
            print("video id not found.")
            return failure
        video_id = id_match.group(0)

        yt = YouTube(video_url)
        stream = yt.streams.get_highest_resolution()
        modified_title = yt.title.replace(" ", "_")

        download_path = 'CS370-M5/videos'
        captions_path = 'CS370-M5/captions'
        os.makedirs(download_path, exist_ok=True)
        os.makedirs(captions_path, exist_ok=True)

        # NOTE(review): the download call was garbled in the source; this
        # assumes the video is saved as <download_path>/<title>.mp4 -- confirm.
        video_file = stream.download(output_path=download_path, filename=modified_title + '.mp4')

        transcript_list = YouTubeTranscriptApi.list_transcripts(video_id)
        for available in transcript_list:
            print(f"Language: {available.language}")

        # Use the first auto-generated transcript that can be fetched.
        transcript = None
        last_error = None
        for source_lang in ['en', 'auto']:
            try:
                transcript = transcript_list.find_generated_transcript([source_lang]).fetch()
                break
            except Exception as e:
                last_error = e
        if transcript is None:
            print("Error: no auto-generated transcript found:", last_error)
            return failure

        # One "MM:SS text" line per transcript entry.
        caption_lines = []
        for line in transcript:
            start_time = line['start']
            formatted_time = f"{int(start_time // 60):02d}:{int(start_time % 60):02d}"
            caption_lines.append(f"{formatted_time} {line['text']}\n")
        original_captions = "".join(caption_lines)

        original_filename = f'{captions_path}/{modified_title}_original.txt'
        with open(original_filename, 'w', encoding='utf-8') as file:
            file.write(original_captions)

        # Translation part
        # The output path is defined before the call that needs it.
        # NOTE(review): the remaining arguments of the translate call were
        # truncated in the source -- confirm.
        translated_text_filename = f'{captions_path}/{modified_title}_translated.txt'
        translated_captions = translate(original_filename, translated_text_filename, target_lang=target_lang)

        new_video_path = tos(translated_text_filename, video_file)
        return original_captions, translated_captions, original_filename, translated_text_filename, new_video_path
    except Exception as e:
        print("Error:", e)
        return failure