feat: better splitting for common markdown syntaxes
- list items - multiple new lines - stamements ending with punctuations
This commit is contained in:
parent
8f6c46f638
commit
a5a32903e0
1 changed files with 13 additions and 1 deletions
14
tts.py
14
tts.py
|
@ -143,7 +143,19 @@ def main():
|
||||||
name = name.replace("\\", "_")
|
name = name.replace("\\", "_")
|
||||||
name = name.replace("/", "_")
|
name = name.replace("/", "_")
|
||||||
|
|
||||||
generator = pipeline(text, voice=voice, split_pattern=r'[:.?!;]\n+|\n[*-]')
|
'''
|
||||||
|
Split patterns:
|
||||||
|
- only multiple consecutive new line (to handle wrapped statements)
|
||||||
|
- statements ending in punctuations (:.?!;)
|
||||||
|
- list items starting in '-' or '*'
|
||||||
|
- numbered items starting with a digit followed by a dot '.'
|
||||||
|
'''
|
||||||
|
generator = pipeline(
|
||||||
|
text,
|
||||||
|
voice=voice,
|
||||||
|
split_pattern=r'\n{2,}|[:.?!;]\n+|\n[\*\-(\d+\.)]'
|
||||||
|
)
|
||||||
|
|
||||||
output_files = generate_audio(generator, name, voice, args.device)
|
output_files = generate_audio(generator, name, voice, args.device)
|
||||||
directory, output_file_name = os.path.split(output_files[0])
|
directory, output_file_name = os.path.split(output_files[0])
|
||||||
if args.skip_play:
|
if args.skip_play:
|
||||||
|
|
Loading…
Reference in a new issue