| /* |
| * skeleton0.c - Trivial module example |
| * |
| * Copyright (C) 2020-2022, 2025 Samuel Thibault <samuel.thibault@ens-lyon.org> |
| * All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * 1. Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * 2. Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in the |
| * documentation and/or other materials provided with the distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY Samuel Thibault AND CONTRIBUTORS ``AS IS'' AND |
| * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE |
| * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL |
| * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS |
| * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) |
| * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT |
| * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY |
| * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF |
| * SUCH DAMAGE. |
| */ |
| |
| /* |
| * This module is based on skeleton0, and shows how it can be completed easily |
| * to run Espeak-NG asynchronously, with server-side audio. |
| */ |
| |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <unistd.h> |
| #include <string.h> |
| #include <stdint.h> |
| |
| #include <espeak-ng/espeak_ng.h> |
| #include <espeak-ng/speak_lib.h> |
| |
| #include "spd_module_main.h" |
| |
| static char *voicetype; |
| static char *voicename; |
| static char *language; |
| |
| int module_config(const char *configfile) |
| { |
| /* Optional: Open and parse configfile */ |
| fprintf(stderr, "opening %s\n", configfile); |
| |
| return 0; |
| } |
| |
| static int callback(short *, int, espeak_EVENT*); |
| |
| int module_init(char **msg) |
| { |
| /* Actually initialize synthesizer */ |
| fprintf(stderr, "initializing\n"); |
| |
| espeak_ng_ERROR_CONTEXT context = NULL; |
| espeak_ng_STATUS result; |
| |
| espeak_ng_InitializePath(NULL); |
| result = espeak_ng_Initialize(&context); |
| |
| if (result == ENS_OK) { |
| fprintf(stderr, "initialized, opening audio output\n"); |
| result = espeak_ng_InitializeOutput(0, 0, NULL); |
| } |
| |
| if (result == ENS_OK) { |
| espeak_SetSynthCallback(callback); |
| } |
| |
| if (result != ENS_OK) { |
| char buf[128]; |
| espeak_ng_GetStatusCodeMessage(result, buf, sizeof(buf)); |
| fprintf(stderr, "espeak-ng initialization failed: '%s'\n", buf); |
| *msg = strdup(buf); |
| return -1; |
| } |
| |
| *msg = strdup("ok!"); |
| |
| return 0; |
| } |
| |
| SPDVoice **module_list_voices(void) |
| { |
| /* Return list of voices */ |
| SPDVoice **ret = malloc(3*sizeof(*ret)); |
| |
| ret[0] = malloc(sizeof(*(ret[0]))); |
| ret[0]->name = strdup("English (America)"); |
| ret[0]->language = strdup("en"); |
| ret[0]->variant = NULL; |
| |
| ret[1] = malloc(sizeof(*(ret[0]))); |
| ret[1]->name = strdup("French (France)"); |
| ret[1]->language = strdup("fr"); |
| ret[1]->variant = NULL; |
| |
| ret[2] = NULL; |
| |
| return ret; |
| } |
| |
| |
| int module_set(const char *var, const char *val) |
| { |
| /* Optional: accept parameter */ |
| espeak_ng_STATUS result; |
| |
| fprintf(stderr,"got var '%s' to be set to '%s'\n", var, val); |
| |
| if (!strcmp(var, "voice")) { |
| free(voicetype); |
| voicetype = strdup(val); |
| return 0; |
| } else if (!strcmp(var, "synthesis_voice")) { |
| free(voicename); |
| voicename = strdup(val); |
| return 0; |
| } else if (!strcmp(var, "language")) { |
| free(language); |
| language = strdup(val); |
| return 0; |
| } else if (!strcmp(var, "rate")) { |
| /* TODO */ |
| return 0; |
| } else if (!strcmp(var, "pitch")) { |
| /* convert from [-100, 100] to [0, 100] */ |
| int pitch = (atoi(val) + 100) / 2; |
| result = espeak_SetParameter(espeakPITCH, pitch, 0); |
| if (result != ENS_OK) { |
| espeak_ng_PrintStatusCodeMessage(result, stderr, NULL); |
| return -1; |
| } |
| return 0; |
| } else if (!strcmp(var, "pitch_range")) { |
| /* TODO */ |
| return 0; |
| } else if (!strcmp(var, "volume")) { |
| /* TODO */ |
| return 0; |
| } else if (!strcmp(var, "punctuation_mode")) { |
| /* TODO */ |
| return 0; |
| } else if (!strcmp(var, "spelling_mode")) { |
| /* TODO */ |
| return 0; |
| } else if (!strcmp(var, "cap_let_recogn")) { |
| /* TODO */ |
| return 0; |
| } |
| return -1; |
| } |
| |
| int module_audio_set(const char *var, const char *val) |
| { |
| /* Optional: interpret audio parameter */ |
| if (!strcmp(var, "audio_output_method")) { |
| /* Only server-side audio supported */ |
| if (strcmp(val, "server") != 0) |
| return -1; |
| return 0; |
| } |
| return -1; |
| } |
| |
| int module_audio_init(char **status) |
| { |
| /* Optional: open audio */ |
| return 0; |
| } |
| |
| int module_loglevel_set(const char *var, const char *val) |
| { |
| /* Optional: accept loglevel change */ |
| return 0; |
| } |
| |
| int module_debug(int enable, const char *file) |
| { |
| /* Optional: if enable == 1, open file to dump debugging */ |
| /* Otherwise close it */ |
| return 0; |
| } |
| |
| int module_loop(void) |
| { |
| /* Main loop */ |
| fprintf(stderr, "main loop\n"); |
| |
| /* Let module_process run the protocol */ |
| /* You may want to monitor STDIN_FILENO yourself, to be able to also |
| * monitor other FDs. */ |
| int ret = module_process(STDIN_FILENO, 1); |
| |
| if (ret != 0) |
| fprintf(stderr, "Broken pipe, exiting...\n"); |
| |
| return ret; |
| } |
| |
| static void set_voice(void) |
| { |
| espeak_ng_STATUS result; |
| |
| if (voicetype || language) { |
| fprintf(stderr, "setting voice type %s language %s\n", voicetype ? voicetype : "none", language ? language : "none"); |
| |
| espeak_VOICE voice_select; |
| memset(&voice_select, 0, sizeof(voice_select)); |
| |
| if (voicetype) { |
| if (!strncmp(voicetype, "male", 4)) { |
| voice_select.gender = 1; |
| voice_select.variant = atoi(voicetype+4) - 1; |
| } else if (!strncmp(voicetype, "female", 6)) { |
| voice_select.gender = 2; |
| voice_select.variant = atoi(voicetype+6) - 1; |
| } else if (!strncmp(voicetype, "child_male", 10)) { |
| voice_select.gender = 1; |
| voice_select.age = 10; |
| } else if (!strncmp(voicetype, "child_female", 12)) { |
| voice_select.gender = 2; |
| voice_select.age = 10; |
| } |
| } |
| |
| if (language) { |
| voice_select.languages = language; |
| } |
| |
| result = espeak_ng_SetVoiceByProperties(&voice_select); |
| if (result != ENS_OK) |
| espeak_ng_PrintStatusCodeMessage(result, stderr, NULL); |
| } |
| |
| if (voicename && strcmp(voicename, "NULL") != 0) { |
| fprintf(stderr, "setting voice name %s\n", voicename); |
| |
| result = espeak_ng_SetVoiceByName(voicename); |
| if (result != ENS_OK) |
| espeak_ng_PrintStatusCodeMessage(result, stderr, NULL); |
| } |
| } |
| |
| static int began; |
| /* Asynchronous version, when the synthesis implements asynchronous |
| * processing in another thread. */ |
| int module_speak(char *data, size_t bytes, SPDMessageType msgtype) |
| { |
| set_voice(); |
| |
| /* Speak the provided data asynchronously in another thread */ |
| fprintf(stderr, "speaking '%s'\n", data); |
| |
| began = 0; |
| espeak_Synth(data, strlen(data) + 1, 0, POS_CHARACTER, 0, |
| espeakCHARS_AUTO | espeakPHONEMES | espeakENDPAUSE | espeakSSML, |
| NULL, NULL); |
| |
| return 1; |
| } |
| |
| void send_samples(short *wav, int len, int rate) |
| { |
| if (!len) |
| return; |
| |
| AudioTrack track = { |
| .bits = 16, |
| .num_channels = 1, |
| .sample_rate = rate, |
| .num_samples = len, |
| .samples = wav, |
| }; |
| module_tts_output_server(&track, SPD_AUDIO_LE); |
| } |
| |
| /* This is getting called in the espeak-ng thread */ |
| static int callback(short *wav, int numsamples, espeak_EVENT *events) |
| { |
| espeak_EVENT *cur = events; |
| int rate = espeak_ng_GetSampleRate(); |
| int done = 0; |
| |
| if (!began) { |
| began = 1; |
| /* We started producing audio */ |
| module_report_event_begin(); |
| } |
| while (cur->type != espeakEVENT_LIST_TERMINATED) |
| { |
| fprintf(stderr, "got event %d from synth\n", cur->type); |
| |
| /* First send pending audio */ |
| switch (cur->type) { |
| case espeakEVENT_MARK: |
| case espeakEVENT_PLAY: |
| { |
| int64_t pos = cur->audio_position; |
| int sample = pos * rate / 1000; |
| if (sample > numsamples) |
| sample = numsamples; |
| |
| send_samples(wav + done, sample - done, rate); |
| |
| done = sample; |
| } |
| default: |
| break; |
| } |
| |
| /* Then process event */ |
| switch (cur->type) { |
| case espeakEVENT_MARK: |
| module_report_index_mark(cur->id.name); |
| break; |
| case espeakEVENT_PLAY: |
| module_report_icon(cur->id.name); |
| break; |
| case espeakEVENT_MSG_TERMINATED: |
| /* We have finished the synth, tell the server so it can send us the next message. */ |
| module_report_event_end(); |
| break; |
| default: |
| break; |
| } |
| cur++; |
| } |
| |
| send_samples(wav + done, numsamples - done, rate); |
| |
| return 0; |
| } |
| |
| size_t module_pause(void) |
| { |
| /* Pause playing */ |
| fprintf(stderr, "pausing\n"); |
| |
| /* Only supports stopping */ |
| espeak_Cancel(); |
| |
| module_report_event_stop(); |
| |
| return 0; |
| } |
| |
| int module_stop(void) |
| { |
| /* Stop any current synth */ |
| fprintf(stderr, "stopping\n"); |
| |
| espeak_Cancel(); |
| |
| module_report_event_stop(); |
| |
| return 0; |
| } |
| |
| int module_close(void) |
| { |
| /* Deinitialize synthesizer */ |
| fprintf(stderr, "closing\n"); |
| |
| espeak_ng_Terminate(); |
| |
| return 0; |
| } |