diff options
Diffstat (limited to 'bin')
| -rwxr-xr-x | bin/pdf2mp3 | 32 | 
1 files changed, 32 insertions, 0 deletions
#!/usr/bin/env python3
"""pdf2mp3: extract the text of a PDF and save it as spoken audio (MP3).

Text extraction goes through ``tika.parser`` and speech synthesis through
``gTTS``.

Setup, before running the script:

    docker run -p 9977:9998 apache/tika:2.0.0
    export TIKA_SERVER_ENDPOINT="http://127.0.0.1:9977"

Then:

    pdf2mp3 --pdf path/to/file.pdf [--out out.mp3]
"""
import argparse
import sys

from gtts import gTTS
from tika import parser


class Argparser:
    """Parse the command-line options and expose them as ``self.args``."""

    def __init__(self, argv=None):
        """Build the option parser and parse ``argv``.

        Args:
            argv: Argument list to parse. ``None`` (the default) makes
                argparse read ``sys.argv[1:]``, which is the original
                behaviour.
        """
        # Named ``arg_parser`` so it does not shadow the module-level
        # ``parser`` imported from tika.
        arg_parser = argparse.ArgumentParser(
            description="Convert the text of a PDF into an MP3 file.")
        arg_parser.add_argument(
            "--pdf",
            type=str,
            # Without a path there is nothing to convert; fail at parse time
            # with a usage message instead of handing None to tika.
            required=True,
            help="path to the pdf")
        arg_parser.add_argument(
            "--out",
            type=str,
            default="out.mp3",
            help="path of the mp3 file to write (default: out.mp3)")
        # Unused by the script; kept so existing invocations still parse.
        arg_parser.add_argument("--bool", action="store_true",
                                help="bool", default=False)
        self.args = arg_parser.parse_args(argv)


def main() -> None:
    """Extract text from the PDF, print it, and write the spoken MP3.

    Raises:
        SystemExit: if no text could be extracted from the PDF.
    """
    argparser = Argparser()
    raw = parser.from_file(argparser.args.pdf)

    # tika reports ``content`` as None when it extracts no text (for example
    # an image-only PDF); gTTS would then fail on an internal assertion, so
    # stop here with a readable message instead.
    text = raw.get("content")
    if not text or not text.strip():
        sys.exit(
            f"pdf2mp3: no text could be extracted from "
            f"{argparser.args.pdf!r}")

    print(text)
    tts = gTTS(text)
    tts.save(argparser.args.out)


if __name__ == "__main__":
    main()
