def main(args=None):
    """Command-line entry point: parse arguments, pair the inputs, run miau.

    Every pattern in ``<input_files>`` is glob-expanded and each match is
    classified by its file extension: a name whose extension is a key of
    ``extensions_dict`` is treated as media, anything else as a
    transcript/subtitle.  Media and transcripts are paired by position, so
    both lists must come out in the same order.  For example, for a folder
    holding the video ``macri_gato.mp4`` and its transcription
    ``macri_gato.txt``, any of these inputs is accepted::

        *.mp4 *.txt
        macri_gato.*
        macri_gato.mp4 macri_gato.txt

    Args:
        args: Argument list forwarded to docopt as ``argv`` (default
            ``None``).

    Returns:
        Whatever ``miau`` returns for the collected inputs.

    Raises:
        DocoptExit: If no media file was found, if the number of media
            files and transcripts differs, or if ``miau`` raises
            ``ValueError`` (its message is re-used).
    """
    args = docopt(__doc__, argv=args, version=VERSION)

    media = []
    transcripts = []
    for pattern in args['<input_files>']:
        # glob returns matches in arbitrary (directory-listing) order.  Since
        # media and transcripts are paired positionally, sort the matches of
        # each pattern -- as a shell would -- so that e.g. ``*.mp4 *.txt``
        # lines up the files deterministically.  Pattern order is preserved.
        for filename in sorted(glob.glob(pattern)):
            # Extension without the leading dot ('' when there is none).
            extension = os.path.splitext(filename)[1][1:]
            if extension in extensions_dict:
                media.append(filename)
            else:
                transcripts.append(filename)

    media_str = ' \n'.join(media)
    transcripts_str = ' \n'.join(transcripts)
    info = "Audio/Video:\n {}\nTranscripts/subtitle:\n {}".format(media_str, transcripts_str)
    logging.info(info)

    # Each media file needs exactly one transcript, and at least one pair
    # is required.
    if not media or len(media) != len(transcripts):
        raise DocoptExit(
            "Input mismatch: the quantity of inputs and transcriptions differs"
        )

    try:
        return miau(
            media,
            transcripts,
            args['--remix'],
            args['--output'],
            args['--dump'],
            debug=args['--debug'],
            force_language=args['--lang']
        )
    except ValueError as e:
        # Surface miau's validation errors as a usage error.
        raise DocoptExit(str(e))
评论列表
文章目录