Added script for adding spoken lead-in messages to mp3 files

2025-08-23 01:13:22 +02:00 · 2019-04-02 10:14:11 +02:00
parent 92fe3f4440
commit 75fa9a53a8
1 changed files with 141 additions and 0 deletions
--- a/add_lead_in_messages.py
+++ b/add_lead_in_messages.py
@@ -0,0 +1,141 @@
 #!/usr/bin/python
 # Adds a lead-in message to each mp3 file of a directory, storing the result in another directory.
 # So - when played e.g. on a TonUINO - you will first hear the title of the track, then the track itself.
 import argparse, base64, json, os, re, subprocess, sys
 class PatchedArgumentParser(argparse.ArgumentParser):
    """ArgumentParser that prints the full help text whenever an error is reported."""
    def error(self, message):
        """Write `message` to stderr, print the help text and exit with status 2."""
        errorText = 'error: %s\n\n' % message
        sys.stderr.write(errorText)
        self.print_help()
        raise SystemExit(2)
 def argFormatter(prog):
    # Help formatter with max_help_position=27 and a line width of 100.
    return argparse.HelpFormatter(prog, max_help_position=27, width=100)
 # Command line definition; parsing errors print the full help (see PatchedArgumentParser).
 argparser = PatchedArgumentParser(
    usage='%(prog)s -i my/source/dir -o my/output/dir [optional arguments...]',
    description=(
        'Adds a lead-in message to each mp3 file of a directory storing the result in another directory.\n'
        'So - when played e.g. on a TonUINO - you first will hear the title of the track, then the track itself.'
    ),
    formatter_class=argFormatter,
 )
 # Required: where to read from and where to write to.
 argparser.add_argument(
    '-i', '--input',
    type=str,
    required=True,
    help="The input directory or mp3 file to process (input won't be changed)",
 )
 argparser.add_argument(
    '-o', '--output',
    type=str,
    required=True,
    help='The output directory where to write the mp3 files (will be created if not existing)',
 )
 # Optional: speech synthesis settings.
 argparser.add_argument(
    '--lang',
    choices=['de', 'en'],
    default='de',
    help='The language',
 )
 argparser.add_argument(
    '--google-key',
    type=str,
    default=None,
    help="The API key of the Google text-to-speech account to use. If missing the MacOS tool `say` will be used.",
 )
 # Optional: how the spoken title is derived from the file name.
 argparser.add_argument(
    '--file-regex',
    type=str,
    default=None,
    help="The regular expression to use for parsing the mp3 file name. If missing the whole file name except a leading number will be used as track title.",
 )
 argparser.add_argument(
    '--title-pattern',
    type=str,
    default=None,
    help="The pattern to use as track title. May contain groups of `--file-regex`, e.g. '\\1'",
 )
 # Optional: output naming and dry-run switch.
 argparser.add_argument(
    '--add-numbering',
    action='store_true',
    help='Whether to add a three-digit number to the mp3 files (suitable for DFPlayer Mini)',
 )
 argparser.add_argument(
    '--dry-run',
    action='store_true',
    help='Dry run: Only prints what the script would do, without actually creating files',
 )
 args = argparser.parse_args()
 # Voice settings sent as 'voice' in the Google text-to-speech request, keyed by the --lang value.
 googleVoiceByLang = dict(
    de=dict(languageCode='de-DE', name='de-DE-Wavenet-C'),
    en=dict(languageCode='en-US', name='en-US-Wavenet-D'),
 )
 # Voice name passed to the `say` tool via -v, keyed by the --lang value.
 sayVoiceByLang = dict(de='Anna', en='Samantha')
 # Without --file-regex: skip any leading digits and capture the rest of the file name.
 fileRegex = re.compile(r'\d*(.*)' if args.file_regex is None else args.file_regex)
 # Without --title-pattern: the title is the first capture group of fileRegex.
 titlePattern = r'\1' if args.title_pattern is None else args.title_pattern
 # Counter used by --add-numbering for the numeric prefix of output files.
 mp3FileIndex = 0
 def fail(msg):
    """Print `msg` prefixed with 'ERROR: ' and terminate the script with exit status 1."""
    errorLine = 'ERROR: ' + msg
    print(errorLine)
    raise SystemExit(1)
 def postJson(url, postBody):
    """Send `postBody` as JSON to `url` using the `curl` command and return the parsed JSON reply.

    Raises subprocess.CalledProcessError if `curl` exits with a non-zero status.
    """
    payload = json.dumps(postBody).encode('utf-8')
    curlCommand = [
        'curl',
        '--header', 'Content-Type: application/json; charset=utf-8',
        '--data', payload,
        url,
    ]
    rawReply = subprocess.check_output(curlCommand)
    return json.loads(rawReply)
 def textToSpeech(text, targetFile):
    """Synthesize `text` as speech and write the result to `targetFile` as mp3.

    With --google-key the Google text-to-speech API is used; otherwise the
    `say` tool renders an AIFF file that `ffmpeg` converts to mp3.

    Raises subprocess.CalledProcessError if `say` or `ffmpeg` exits with a
    non-zero status. Exits via fail() if the Google reply contains no audio.
    """
    if args.google_key:
        responseJson = postJson(
            'https://texttospeech.googleapis.com/v1beta1/text:synthesize?key=' + args.google_key,
            {
                'audioConfig': {
                    'audioEncoding': 'MP3',
                    'speakingRate': 1.0,
                    'pitch': 2.0,  # Default is 0.0
                    'sampleRateHertz': 44100,
                    'effectsProfileId': [ 'small-bluetooth-speaker-class-device' ]
                },
                'voice': googleVoiceByLang[args.lang],
                'input': { 'text': text }
            }
        )
        if 'audioContent' not in responseJson:
            # Show what the API answered instead of dying with a bare KeyError.
            fail('Google text-to-speech returned no audio: ' + json.dumps(responseJson))
        mp3Data = base64.b64decode(responseJson['audioContent'])
        with open(targetFile, 'wb') as f:
            f.write(mp3Data)
    else:
        aiffFile = 'temp.aiff'
        try:
            # check_call: stop at the first failing tool instead of converting a missing/broken file.
            subprocess.check_call([ 'say', '-v', sayVoiceByLang[args.lang], '-o', aiffFile, text ])
            subprocess.check_call([ 'ffmpeg', '-y', '-i', aiffFile, '-acodec', 'libmp3lame', '-ab', '128k', '-ac', '1', targetFile ])
        finally:
            # Always clean up the intermediate file; it may not exist if `say` failed.
            if os.path.exists(aiffFile):
                os.remove(aiffFile)
 def addLeadInMessage(inputPath, outputPath):
    """Prepend a spoken title to `inputPath` and write the result to `outputPath`.

    If `inputPath` is a directory, it is processed recursively (children in
    sorted order) and `outputPath` is created as a directory when missing.
    Files without an `.mp3` extension are ignored and existing output files are
    skipped. With --dry-run only the planned actions are printed.

    inputPath:  existing mp3 file or directory (never modified).
    outputPath: target file, or target directory when `inputPath` is a directory.

    Exits via fail() if the input does not exist or if the input is a
    directory while the output is an existing non-directory.
    """
    global mp3FileIndex
    if not os.path.exists(inputPath):
        fail('Input does not exist: ' + os.path.abspath(inputPath))
    if os.path.isdir(inputPath):
        if os.path.exists(outputPath):
            if not os.path.isdir(outputPath):
                fail('Input is a directory, but output isn\'t: ' + os.path.abspath(outputPath))
        elif not args.dry_run:
            os.mkdir(outputPath)
        # Numbering restarts in every directory. Remember the enclosing directory's
        # counter so files sorted after a subdirectory continue with the right number.
        outerIndex = mp3FileIndex
        mp3FileIndex = 0
        for child in sorted(os.listdir(inputPath)):
            addLeadInMessage(os.path.join(inputPath, child), os.path.join(outputPath, child))
        mp3FileIndex = outerIndex
        return
    inputFileName, inputFileExt = os.path.splitext(os.path.basename(inputPath))
    if inputFileExt.lower() != '.mp3':
        print('Ignoring {} (no mp3 file)'.format(os.path.abspath(inputPath)))
        return
    if args.add_numbering:
        # Prefix the output file name with a zero-padded, 1-based three-digit number.
        outputDir, outputName = os.path.split(outputPath)
        outputPath = os.path.join(outputDir, '{:0>3}_{}'.format(mp3FileIndex + 1, outputName))
        mp3FileIndex += 1
    if os.path.isfile(outputPath):
        print('Skipping {} (file already exists)'.format(os.path.abspath(outputPath)))
        return
    # Derive the spoken title from the file name; underscores are read as spaces.
    text = re.sub(fileRegex, titlePattern, inputFileName).replace('_', ' ').strip()
    print('Adding lead-in "{}" to {}'.format(text, os.path.abspath(outputPath)))
    if not args.dry_run:
        tempLeadInFile = 'temp-lead-in.mp3'
        try:
            textToSpeech(text, tempLeadInFile)
            # NOTE(review): '-map_metadata' is given after the output file name; ffmpeg
            # presumably treats it as a trailing option and ignores it - confirm.
            # NOTE(review): the concat protocol separates inputs with '|', so a '|' in
            # inputPath would presumably break the command - confirm.
            exitCode = subprocess.call([ 'ffmpeg', '-i', 'concat:{}|{}'.format(tempLeadInFile, inputPath), '-acodec', 'copy', outputPath, '-map_metadata', '0:1' ])
        finally:
            # Never leave the temporary lead-in behind; it may be missing if synthesis failed.
            if os.path.exists(tempLeadInFile):
                os.remove(tempLeadInFile)
        if exitCode != 0:
            # Keep processing the remaining files, but do not hide the failure.
            print('ERROR: ffmpeg failed with exit code {} for {}'.format(exitCode, os.path.abspath(outputPath)))
        print('\n')
 # A missing output path is only created one level deep later on, so its parent must already exist.
 if not os.path.exists(args.output) and not args.dry_run:
    # Resolve to an absolute path first: os.path.dirname('out') is '' and
    # os.path.dirname('out/') is 'out', so the plain dirname rejected valid
    # relative output paths whose parent is the current directory.
    outputParent = os.path.dirname(os.path.abspath(args.output))
    if not os.path.isdir(outputParent):
        fail('Parent of output is no directory: ' + outputParent)
 addLeadInMessage(args.input, args.output)