Warning: this is an htmlized version!
The original is here, and the conversion rules are here. |
####### # # E-scripts on programs that do speech synthesis and speech-to-text. # # Note 1: use the eev command (defined in eev.el) and the # ee alias (in my .zshrc) to execute parts of this file. # Executing this file as a whole makes no sense. # An introduction to eev can be found here: # # (find-eev-quick-intro) # http://angg.twu.net/eev-intros/find-eev-quick-intro.html # # Note 2: be VERY careful and make sure you understand what # you're doing. # # Note 3: If you use a shell other than zsh things like |& # and the for loops may not work. # # Note 4: I always run as root. # # Note 5: some parts are too old and don't work anymore. Some # never worked. # # Note 6: the definitions for the find-xxxfile commands are on my # .emacs. # # Note 7: if you see a strange command check my .zshrc -- it may # be defined there as a function or an alias. # # Note 8: the sections without dates are always older than the # sections with dates. # # This file is at <http://angg.twu.net/e/speech.e> # or at <http://angg.twu.net/e/speech.e.html>. # See also <http://angg.twu.net/emacs.html>, # <http://angg.twu.net/.emacs[.html]>, # <http://angg.twu.net/.zshrc[.html]>, # <http://angg.twu.net/escripts.html>, # and <http://angg.twu.net/>. 
# ####### # «.speech-dispatcher» (to "speech-dispatcher") # «.spd-say» (to "spd-say") # «.spd-say-ipa» (to "spd-say-ipa") # «.speechd-git» (to "speechd-git") # «.speechd-mailing-list» (to "speechd-mailing-list") # «.mbrola» (to "mbrola") # «.openai-whisper» (to "openai-whisper") # «.aeneas» (to "aeneas") # https://askubuntu.com/questions/501910/how-to-text-to-speech-output-using-command-line # https://blends.debian.org/accessibility/tasks/speechsynthesis ##### # # speech-dispatcher in debian # 2019dec17 # ##### # «speech-dispatcher» (to ".speech-dispatcher") # (find-zsh "installeddebs | sort | grep speech-dispatcher") # (find-zsh "availabledebs | sort | grep speech-dispatcher") # (find-status "speech-dispatcher") # (find-vldifile "speech-dispatcher.list") # (find-udfile "speech-dispatcher/") * (eepitch-shell) * (eepitch-kill) * (eepitch-shell) # (find-man "8 apt-cache") apt-cache show speech-dispatcher apt-cache search speech-dispatcher apt-cache depends speech-dispatcher apt-cache rdepends speech-dispatcher apt-cache showpkg speech-dispatcher # (find-node "(spd-say)Top") # (find-node "(speech-dispatcher)Top") # (find-node "(ssip)Top") ##### # # spd-say # 2019dec17 # ##### # «spd-say» (to ".spd-say") # (find-man "1 spd-say") # (find-man "1 spd-say" "-l, --language" "Set the language (iso code)") # https://askubuntu.com/questions/842447/how-can-i-a-language-to-spd-say # (find-sh "spd-say -L") # https://en.wikipedia.org/wiki/List_of_ISO_639-1_codes * (eepitch-shell) * (eepitch-kill) * (eepitch-shell) spd-say Hello spd-say -l en Hello spd-say -l pt viagem spd-say -l fr fromage spd-say "/zoʊˈtɛroʊ/" ##### # # spd-say-ipa # 2019dec17 # ##### # «spd-say-ipa» (to ".spd-say-ipa") # https://mail.google.com/mail/ca/u/0/#sent/KtbxLrjCNKlqTSzjswftLsdrzpwGhXnVbq # https://en.wikipedia.org/wiki/International_Phonetic_Alphabet Hi, beginner question here... Is there a way to make spd-say pronounce text in IPA? 
I mean, (some hack that would behave) like this: spd-say -l ipa "/zoʊˈtɛroʊ/" Thanks in advance! Eduardo Ochs http://angg.twu.net/ http://angg.twu.net/emacsconf2019.html ##### # # speechd from git # 2019dec17 # ##### # «speechd-git» (to ".speechd-git") # http://devel.freebsoft.org/speechd # https://github.com/brailcom/speechd.git * (eepitch-shell) * (eepitch-kill) * (eepitch-shell) # rm -Rfv ~/usrc/speechd/ cd ~/usrc/ git clone https://github.com/brailcom/speechd.git cd ~/usrc/speechd/ git branch --list -a git for-each-ref PAGER=cat git log --oneline --graph --all -20 # (find-fline "~/usrc/") # (find-fline "~/usrc/speechd/") # (find-gitk "~/usrc/speechd/") # (code-c-d "speechd" "~/usrc/speechd/") # (find-speechdfile "") # (find-speechdgrep "grep --color -niRH --null -e languages *") # https://freebsoft.org/speechd-el # https://freebsoft.org/speechd-in-detail ##### # # speechd-mailing-list # 2019dec17 # ##### # «speechd-mailing-list» (to ".speechd-mailing-list") # https://lists.nongnu.org/mailman/listinfo/speechd-discuss # https://lists.nongnu.org/archive/html/speechd-discuss/ ##### # # MBROLA # 2020apr03 # ##### # «mbrola» (to ".mbrola") # https://english.stackexchange.com/questions/264239/is-there-any-online-tool-to-read-pronounce-ipa-and-apa-written-words # http://www.lfsag.unito.it/ipa/converter_en.html # https://en.wikipedia.org/wiki/MBROLA # https://github.com/numediart/MBROLA ##### # # openai-whisper # 2023aug02 # ##### # «openai-whisper» (to ".openai-whisper") # (find-angg "WHISPER/test1.py") # https://emacsconf.org/captioning/ # (find-fline "~/LOGS/2023aug02.emacs") # (find-fline "~/LOGS/2023aug02.emacs" "openai whisper") # (find-fline "~/LOGS/2023aug02.emacs" "Mozilla Deepspeech") # (find-pip3-links "assemblyai") # (find-importlib-links "assemblyai") # (find-pypi-links "assemblyai") # (find-pip3spfile "assemblyai/__init__.py") # https://github.com/AssemblyAI/assemblyai-python-sdk # (find-gitk "~/usrc/assemblyai-python-sdk/") # (code-c-d "aaipythonsdk"
"~/usrc/assemblyai-python-sdk/") # (find-aaipythonsdkfile "") # (find-aaipythonsdkgrep "grep --color=auto -niRH --null -e language *") # (find-aaipythonsdkgrep "grep --color=auto -nRH --null -e LanguageCode *") # (find-aaipythonsdkgrep "grep --color=auto -nRH --null -e language_detection *") # (find-aaipythonsdkfile "assemblyai/types.py" "def language_code(self) ->") # (find-aaipythonsdkfile "assemblyai/types.py" "language_detection: Optional[bool]") # (find-aaipythonsdkfile "setup.py" "Natural Language :: English") # (find-aaipythonsdkfile "tests/unit/test_transcriber.py" "language_code=None") # (find-aaipythonsdkfile "tests/unit/factories.py" "language_code = aai.LanguageCode.en") # https://www.assemblyai.com/dashboard/activation # https://www.assemblyai.com/docs/Guides/generating_subtitles_for_videos * (eepitch-shell) * (eepitch-kill) * (eepitch-shell) cd /tmp/ scp -v 2023mateus.mp3 $LINP/tmp/m.mp3 * (eepitch-python) * (eepitch-kill) * (eepitch-python) import assemblyai as aai aai.settings.api_key = "45a318aad48d46f7a2ec55978f6674b1" transcriber = aai.Transcriber() print(aai.LanguageCode.en) print(aai.LanguageCode.pt) print(aai.LanguageCode.foo) print(transcriber) print(transcriber.language_code()) # transcript = transcriber.transcribe("https://storage.googleapis.com/aai-web-samples/news.mp4") transcript = transcriber.transcribe("/tmp/2023mateus.mp3") print(transcript.text) print(transcript.export_subtitles_srt()) print(transcript.export_subtitles_vtt()) * (eepitch-shell) * (eepitch-kill) * (eepitch-shell) pip3 install assemblyai https://github.com/openai/whisper https://www.google.com/search?q=how+do+I+set+the+language+in+openai+whisper&oq=how+do+I+set+the+language+in+openai+whisper ##### # # aeneas # 2024dec30 # ##### # «aeneas» (to ".aeneas") # https://sachachua.com/blog/category/subed/ # (find-fline "~/2024dec29.emacs" "https://github.com/readbeyond/aeneas") # (find-sh "espeak -s 130 -vfr 'maison voiture nappe'") 
https://itinerarium.github.io/phoneme-synthesis/ https://github.com/itinerarium/phoneme-synthesis/ https://en.wikipedia.org/wiki/International_Phonetic_Alphabet https://packages.debian.org/sid/transcriber http://trans.sourceforge.net/en/presentation.php http://transag.sourceforge.net/ https://en.wikipedia.org/wiki/P%C3%A1draig https://en.wikipedia.org/wiki/Help:IPA/Irish https://lists.gnu.org/archive/html/emacs-tangents/2021-01/msg00076.html Devin Prater https://wiki.hyperbola.info/doku.php?id=en:main:downloads&redirect=1#hypertalking_live_image https://per.quest/ https://news.ycombinator.com/item?id=28170609 Show HN: Instantly listen to any URL (per.quest) https://emacspeak.blogspot.com/2021/11/emacspeak-in-age-of-cloud-computing.html http://emacspeak.sourceforge.net/raman/publications/bc-emacspeak/ https://emacspeak.blogspot.com/2022/04/announcing-emacspeak-560-agiledog.html https://emacspeak.blogspot.com/2022/06/emacspeak-complete-audio-desktop-under.html https://news.ycombinator.com/item?id=33278785 Buzz: Transcribe audio from your microphones in real-time using OpenAI's Whisper (github.com/chidiwilliams) - speech https://github.com/chidiwilliams/buzz https://github.com/openai/whisper#setup https://openai.com/blog/whisper/ https://news.ycombinator.com/item?id=34211457 Ask HN: Are there any good open source text-to-speech tools? https://news.ycombinator.com/item?id=34229502 Ask HN: Alternatives to Scratch for a blind child? 
https://news.ycombinator.com/item?id=34361651 This Voice Doesn't Exist – Generative Voice AI (elevenlabs.io) https://news.ycombinator.com/item?id=35365399 Universal Speech Model (research.google) https://github.com/huggingface/distil-whisper https://news.ycombinator.com/item?id=38093353 Distil-Whisper: distilled version of Whisper that is 6 times faster, 49% smaller (github.com/huggingface) https://github.com/abus-aikorea/voice-pro https://news.ycombinator.com/item?id=42261909 Show HN: Voice-Pro – AI Voice Cloning Magic: Transform Any Voice in 15 Seconds (github.com/abus-aikorea) # Local Variables: # coding: utf-8-unix # End: