# translatevideo.py

# ==================================================================================
# Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.

# Permission is hereby granted, free of charge, to any person obtaining a copy of this
# software and associated documentation files (the "Software"), to deal in the Software
# without restriction, including without limitation the rights to use, copy, modify,
# merge, publish, distribute, sublicense, and/or sell copies of the Software, and to
# permit persons to whom the Software is furnished to do so.

# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
# INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A
# PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
# HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
# OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
# ==================================================================================
#
# translatevideo.py
# by: Rob Dachowski
# For questions or feedback, please contact robdac@amazon.com
# 
# Edited by: Md. Farhan Memon
# For questions or feedback, please contact md.farhanmemon@gmail.com
# 
# Purpose: This code drives the process to create a transcription job, translate it into another language,
#          create subtitles, use Amazon Polly to synthesize an alternate audio track, and finally put it all together
#          into a new video.
#
# Change Log:
#          06/29/2018: Initial version
#          09/04/2018: Added optional params to skip audio/video files
#
# ==================================================================================


import argparse
import sys
from transcribeUtils import *
from srtUtils import *
import time
from videoUtils import *
from audioUtils import *

# Job statuses for which the transcription result is not yet available.
# NOTE(review): assumes the helpers in transcribeUtils return the Amazon Transcribe
# job description unchanged (QUEUED / IN_PROGRESS / FAILED / COMPLETED) -- confirm.
PENDING_JOB_STATUSES = ("QUEUED", "IN_PROGRESS")


def parseArguments(argv = None):
	"""Parse and validate the command line arguments.

	argv: list of argument strings; None makes argparse read sys.argv[1:].

	Returns the argparse namespace.  Exits with status 2 (via parser.error) when
	-av/--videofiles is supplied without all of the output options.
	"""
	parser = argparse.ArgumentParser(prog = 'translatevideo.py', description = 'Process a video found in the input file, process it, and write it out to the output file')
	parser.add_argument('-r', '--region', required = True, help = "The AWS region containing the S3 buckets")
	parser.add_argument('-ib', '--inbucket', required = True, help = 'The S3 bucket containing the input file')
	parser.add_argument('-if', '--infile', required = True, help = 'The input file to process')
	parser.add_argument('-ol', '--outlang', required = True, nargs = '+', help = 'The language codes for the desired output.  E.g. en = English, de = German')
	parser.add_argument('-av', '--videofiles', required = False, help = '"true" if you want audio and video files alongwith translated subtitles')
	parser.add_argument('-ofn', '--outfilename', required = False, help = 'The file name without the extension, required if -av present')
	parser.add_argument('-ob', '--outbucket', required = False, help = 'The S3 bucket to contain the output file, required if -av present')
	parser.add_argument('-oft', '--outfiletype', required = False, help = 'The output file type.  E.g. mp4, mov, required if -av present')
	args = parser.parse_args(argv)

	# The output options are conditionally required.  Checking the parsed value
	# (rather than looking for the literal '-av' in sys.argv) also covers the long
	# form --videofiles, which previously slipped through and crashed later on
	# a None + str concatenation.
	if args.videofiles is not None:
		outputOptions = (
			('-ofn/--outfilename', args.outfilename),
			('-ob/--outbucket', args.outbucket),
			('-oft/--outfiletype', args.outfiletype),
		)
		missing = [flag for flag, value in outputOptions if value is None]
		if missing:
			parser.error('the following arguments are required when -av/--videofiles is given: ' + ', '.join(missing))

	return args


def waitForTranscription(response):
	"""Poll the transcription job every 15 seconds until it leaves the pending states.

	response: the job description returned by createTranscribeJob.

	Returns the final job description when the status is COMPLETED.  Exits the
	program with an error message for any other final status (e.g. FAILED), since
	the completion time and transcript URI read by the caller would be missing.
	"""
	job = response["TranscriptionJob"]

	while job["TranscriptionJobStatus"] in PENDING_JOB_STATUSES:
		# progress indicator while waiting
		sys.stdout.write('. ')
		sys.stdout.flush()
		time.sleep(15)
		response = getTranscriptionJobStatus(job["TranscriptionJobName"])
		job = response["TranscriptionJob"]

	if job["TranscriptionJobStatus"] != "COMPLETED":
		# NOTE(review): FailureReason is the field Amazon Transcribe uses for failed
		# jobs; assumed to be passed through by transcribeUtils -- confirm.
		reason = str(job.get("FailureReason", "no failure reason reported"))
		sys.exit("\n==> Transcription Job " + str(job["TranscriptionJobName"]) + " ended with status " + str(job["TranscriptionJobStatus"]) + ": " + reason)

	return response


def main(argv = None):
	"""Drive the whole process: transcribe, write subtitles, translate, and optionally build audio/video.

	argv: optional list of command line arguments (defaults to sys.argv[1:]).
	"""
	args = parseArguments(argv)
	# Audio/video output is only produced when the flag value is exactly "true"
	wantVideo = args.videofiles == 'true'

	# print out parameters and key header information for the user
	print("==> translatevideo.py:\n")
	print("==> Parameters: ")
	print("\tInput bucket/object: " + args.inbucket + '/' + args.infile)
	if wantVideo:
		print("\tOutput bucket/object: " + args.outbucket + '/' + args.outfilename + "." + args.outfiletype)

	print("\n==> Target Language Translation Output: ")
	if wantVideo:
		for lang in args.outlang:
			# bucket and object name are separated by '/', matching the lines above
			print("\t" + args.outbucket + '/' + args.outfilename + "-" + lang + "." + args.outfiletype)

	# Create Transcription Job
	response = createTranscribeJob(args.region, args.inbucket, args.infile)

	# loop until the job successfully completes
	print("\n==> Transcription Job: " + response["TranscriptionJob"]["TranscriptionJobName"] + "\n\tIn Progress")
	response = waitForTranscription(response)

	print("\n==> Job Complete")
	print("\tStart Time: " + str(response["TranscriptionJob"]["CreationTime"]))
	print("\tEnd Time: "  + str(response["TranscriptionJob"]["CompletionTime"]))
	print("\tTranscript URI: " + str(response["TranscriptionJob"]["Transcript"]["TranscriptFileUri"]))

	# Now get the transcript JSON from AWS Transcribe
	transcript = getTranscript(str(response["TranscriptionJob"]["Transcript"]["TranscriptFileUri"]))

	# Create the SRT File for the original transcript and write it out.
	writeTranscriptToSRT(transcript, 'en', "subtitles-en.srt")
	if wantVideo:
		# NOTE(review): "audio-en.mp3" is never created by this script; the trailing
		# True presumably tells createVideo to keep the original audio -- confirm in videoUtils.
		createVideo(args.infile, "subtitles-en.srt", args.outfilename + "-en." + args.outfiletype, "audio-en.mp3", True)

	# Now write out the translation to the transcript for each of the target languages
	for lang in args.outlang:
		writeTranslationToSRT(transcript, 'en', lang, "subtitles-" + lang + ".srt", args.region, args.videofiles)

		if wantVideo:
			# Now that we have the subtitle files, let's create the audio track
			createAudioTrackFromTranslation(args.region, transcript, 'en', lang, "audio-" + lang + ".mp3")

			# Finally, create the composited video
			createVideo(args.infile, "subtitles-" + lang + ".srt", args.outfilename + "-" + lang + "." + args.outfiletype, "audio-" + lang + ".mp3", False)


if __name__ == '__main__':
	main()