/* src/modules/skeleton0_espeak-ng-async-server.c - external/github.com/brailcom/speechd - Git at Google */

 /*
  * skeleton0.c - Trivial module example
  *
  * Copyright (C) 2020-2022, 2025 Samuel Thibault <samuel.thibault@ens-lyon.org>
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY Samuel Thibault AND CONTRIBUTORS ``AS IS'' AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  * SUCH DAMAGE.
  */

 /*
  * This module is based on skeleton0, and shows how it can be completed easily
  * to run Espeak-NG asynchronously, with server-side audio.
  */

 #include <stdio.h>
 #include <stdlib.h>
 #include <unistd.h>
 #include <string.h>
 #include <stdint.h>

 #include <espeak-ng/espeak_ng.h>
 #include <espeak-ng/speak_lib.h>

 #include "spd_module_main.h"

 static char *voicetype;
 static char *voicename;
 static char *language;

 /*
  * Configuration hook: currently only logs the configuration file name on
  * stderr; the file itself is not opened or parsed.
  *
  * Always returns 0.
  */
 int module_config(const char *configfile)
 {
 	const int status = 0;

 	fprintf(stderr, "opening %s\n", configfile);

 	return status;
 }

 /* Synthesis callback, declared early because module_init() registers it
  * before its definition further down. */
 static int callback(short *, int, espeak_EVENT*);

 /*
  * Bring up the Espeak-NG synthesizer: initialize the library, open its
  * output, then register the synthesis callback.
  *
  * msg: receives a strdup()ed status text ("ok!" or the Espeak-NG error
  *      message).
  * Returns 0 on success, -1 if any initialization step failed.
  */
 int module_init(char **msg)
 {
 	espeak_ng_ERROR_CONTEXT context = NULL;
 	espeak_ng_STATUS result;
 	char buf[128];

 	fprintf(stderr, "initializing\n");

 	espeak_ng_InitializePath(NULL);
 	result = espeak_ng_Initialize(&context);
 	if (result != ENS_OK)
 		goto failed;

 	fprintf(stderr, "initialized, opening audio output\n");
 	result = espeak_ng_InitializeOutput(0, 0, NULL);
 	if (result != ENS_OK)
 		goto failed;

 	/* Everything is up: audio will now be delivered through callback() */
 	espeak_SetSynthCallback(callback);
 	*msg = strdup("ok!");
 	return 0;

 failed:
 	/* Turn the status code into text for both the log and the caller */
 	espeak_ng_GetStatusCodeMessage(result, buf, sizeof(buf));
 	fprintf(stderr, "espeak-ng initialization failed: '%s'\n", buf);
 	*msg = strdup(buf);
 	return -1;
 }

 /*
  * Build the list of voices this module advertises.
  *
  * Returns a newly allocated, NULL-terminated array of newly allocated
  * SPDVoice entries whose name and language are strdup()ed copies, or NULL
  * if any allocation failed (nothing is leaked in that case).
  * NOTE(review): assumes the caller treats NULL as "cannot list voices" --
  * confirm against the module framework.
  */
 SPDVoice **module_list_voices(void)
 {
 	static const struct {
 		const char *name;
 		const char *language;
 	} known[] = {
 		{ "English (America)", "en" },
 		{ "French (France)", "fr" },
 	};
 	const size_t count = sizeof(known) / sizeof(known[0]);

 	/* calloc zero-fills, so the terminating NULL entry is already in place */
 	SPDVoice **ret = calloc(count + 1, sizeof(*ret));
 	if (!ret)
 		return NULL;

 	for (size_t i = 0; i < count; i++) {
 		ret[i] = calloc(1, sizeof(*ret[i]));
 		if (ret[i]) {
 			ret[i]->name = strdup(known[i].name);
 			ret[i]->language = strdup(known[i].language);
 			ret[i]->variant = NULL;
 		}

 		if (!ret[i] || !ret[i]->name || !ret[i]->language) {
 			/* Undo everything built so far, including the partial entry */
 			for (size_t j = 0; j <= i; j++) {
 				if (!ret[j])
 					continue;
 				free(ret[j]->name);
 				free(ret[j]->language);
 				free(ret[j]);
 			}
 			free(ret);
 			return NULL;
 		}
 	}

 	return ret;
 }


 /*
  * Apply one synthesis parameter.
  *
  * var: parameter name; val: its value as text.
  * "voice", "synthesis_voice" and "language" are stored for set_voice();
  * "pitch" is applied to Espeak-NG immediately; a few other names are
  * accepted but not implemented yet.
  *
  * Returns 0 when the parameter was accepted, -1 when it is unknown, when
  * memory ran out, or when Espeak-NG rejected the value.
  */
 int module_set(const char *var, const char *val)
 {
 	/* Recognised parameters that are not acted upon yet (TODO) */
 	static const char *const ignored[] = {
 		"rate", "pitch_range", "volume",
 		"punctuation_mode", "spelling_mode", "cap_let_recogn",
 	};
 	char **slot = NULL;

 	fprintf(stderr,"got var '%s' to be set to '%s'\n", var, val);

 	if (!strcmp(var, "voice"))
 		slot = &voicetype;
 	else if (!strcmp(var, "synthesis_voice"))
 		slot = &voicename;
 	else if (!strcmp(var, "language"))
 		slot = &language;

 	if (slot) {
 		/* Duplicate first so a failed allocation keeps the previous value */
 		char *copy = strdup(val);
 		if (!copy)
 			return -1;
 		free(*slot);
 		*slot = copy;
 		return 0;
 	}

 	if (!strcmp(var, "pitch")) {
 		long requested = strtol(val, NULL, 10);

 		/* Keep the request inside the documented [-100, 100] input range */
 		if (requested < -100)
 			requested = -100;
 		if (requested > 100)
 			requested = 100;

 		/* convert from [-100, 100] to [0, 100] */
 		int pitch = (int)((requested + 100) / 2);

 		/* The espeak_ng_ variant returns an espeak_ng_STATUS, which is what
 		 * ENS_OK and espeak_ng_PrintStatusCodeMessage() expect. */
 		espeak_ng_STATUS result = espeak_ng_SetParameter(espeakPITCH, pitch, 0);
 		if (result != ENS_OK) {
 			espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
 			return -1;
 		}
 		return 0;
 	}

 	for (size_t i = 0; i < sizeof(ignored) / sizeof(ignored[0]); i++) {
 		if (!strcmp(var, ignored[i]))
 			return 0;
 	}

 	return -1;
 }

 /*
  * Interpret one audio parameter.
  *
  * Only "audio_output_method" is known, and only the value "server" is
  * accepted for it.
  * Returns 0 when accepted, -1 for any other name or value.
  */
 int module_audio_set(const char *var, const char *val)
 {
 	if (strcmp(var, "audio_output_method") != 0)
 		return -1;

 	/* Only server-side audio supported */
 	return strcmp(val, "server") == 0 ? 0 : -1;
 }

 /*
  * Audio-open hook. Nothing is opened here; status is left untouched and
  * 0 is always returned.
  */
 int module_audio_init(char **status)
 {
 	(void)status;

 	return 0;
 }

 /*
  * Log-level hook. Both arguments are ignored; every request is accepted
  * by returning 0.
  */
 int module_loglevel_set(const char *var, const char *val)
 {
 	(void)var;
 	(void)val;

 	return 0;
 }

 /*
  * Debug hook. A full implementation would open `file` for debug dumps
  * when enable == 1 and close it otherwise; this one ignores both
  * arguments and returns 0.
  */
 int module_debug(int enable, const char *file)
 {
 	(void)enable;
 	(void)file;

 	return 0;
 }

 /*
  * Main loop: hands STDIN_FILENO to module_process() and lets it run the
  * protocol.
  *
  * Returns whatever module_process() returned; a non-zero value is also
  * logged on stderr.
  */
 int module_loop(void)
 {
 	fprintf(stderr, "main loop\n");

 	/* An implementation that needs to watch other FDs as well would
 	 * monitor STDIN_FILENO itself instead of delegating here. */
 	const int status = module_process(STDIN_FILENO, 1);
 	if (status == 0)
 		return 0;

 	fprintf(stderr, "Broken pipe, exiting...\n");
 	return status;
 }

 /*
  * Push the stored voice settings to Espeak-NG.
  *
  * When a voice type or a language is stored, a voice is selected by
  * properties; when a voice name other than "NULL" is stored, that voice is
  * then selected by name. Espeak-NG errors are only printed on stderr.
  */
 static void set_voice(void)
 {
 	/* Recognised voice type prefixes and the properties they map to */
 	static const struct {
 		const char *prefix;
 		int gender;
 		int age;	/* 0 keeps the zeroed default */
 		int numbered;	/* non-zero: digits after the prefix pick the variant */
 	} kinds[] = {
 		{ "male",         1,  0, 1 },
 		{ "female",       2,  0, 1 },
 		{ "child_male",   1, 10, 0 },
 		{ "child_female", 2, 10, 0 },
 	};
 	espeak_ng_STATUS result;

 	if (voicetype != NULL || language != NULL) {
 		fprintf(stderr, "setting voice type %s language %s\n", voicetype ? voicetype : "none", language ? language : "none");

 		espeak_VOICE voice_select;
 		memset(&voice_select, 0, sizeof(voice_select));

 		if (voicetype != NULL) {
 			for (size_t i = 0; i < sizeof(kinds) / sizeof(kinds[0]); i++) {
 				const size_t len = strlen(kinds[i].prefix);

 				if (strncmp(voicetype, kinds[i].prefix, len) != 0)
 					continue;

 				voice_select.gender = kinds[i].gender;
 				voice_select.age = kinds[i].age;
 				if (kinds[i].numbered)
 					voice_select.variant = atoi(voicetype + len) - 1;
 				break;
 			}
 		}

 		if (language != NULL)
 			voice_select.languages = language;

 		result = espeak_ng_SetVoiceByProperties(&voice_select);
 		if (result != ENS_OK)
 			espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
 	}

 	/* The literal string "NULL" is treated as "no voice name given" */
 	if (voicename == NULL || strcmp(voicename, "NULL") == 0)
 		return;

 	fprintf(stderr, "setting voice name %s\n", voicename);

 	result = espeak_ng_SetVoiceByName(voicename);
 	if (result != ENS_OK)
 		espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
 }

 /* Cleared by module_speak() for each message and set by callback() once it has
  * reported the begin event, so that event is sent only once per message. */
 static int began;
 /*
  * Asynchronous speak: applies the stored voice settings, then queues the
  * text with Espeak-NG, which synthesizes it in another thread and delivers
  * the audio through callback().
  *
  * data:    NUL-terminated text, passed with the SSML flag set.
  * bytes:   unused; the length is taken from strlen(data).
  * msgtype: unused.
  *
  * Returns 1 once the text has been queued, -1 if Espeak-NG refused it.
  * NOTE(review): assumes the module framework treats a non-positive return
  * as "could not speak" -- confirm against spd_module_main.h.
  */
 int module_speak(char *data, size_t bytes, SPDMessageType msgtype)
 {
 	espeak_ng_STATUS result;

 	(void)bytes;
 	(void)msgtype;

 	set_voice();

 	/* Speak the provided data asynchronously in another thread */
 	fprintf(stderr, "speaking '%s'\n", data);

 	/* Reset first so the first callback for this message reports "begin" */
 	began = 0;

 	/* Same arguments as espeak_Synth(), but the espeak_ng_STATUS result can
 	 * be checked against ENS_OK and printed. */
 	result = espeak_ng_Synthesize(data, strlen(data) + 1, 0, POS_CHARACTER, 0,
 				      espeakCHARS_AUTO | espeakPHONEMES | espeakENDPAUSE | espeakSSML,
 				      NULL, NULL);
 	if (result != ENS_OK) {
 		/* No callback will ever run for this message, so do not claim success */
 		espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
 		return -1;
 	}

 	return 1;
 }

 /*
  * Forward a run of synthesized samples to the server as one audio track.
  *
  * wav:  first sample to send.
  * len:  number of samples.
  * rate: sample rate to announce for the track.
  *
  * The track is described as 16-bit, single channel, and is handed to
  * module_tts_output_server() with SPD_AUDIO_LE. Nothing is sent when
  * there is no buffer or no (or a negative number of) samples.
  */
 void send_samples(short *wav, int len, int rate)
 {
 	if (!wav || len <= 0)
 		return;

 	AudioTrack track = {
 		.bits = 16,
 		.num_channels = 1,
 		.sample_rate = rate,
 		.num_samples = len,
 		.samples = wav,
 	};
 	module_tts_output_server(&track, SPD_AUDIO_LE);
 }

 /*
  * Synthesis callback; this is getting called in the espeak-ng thread.
  *
  * wav:        samples produced since the previous call.
  * numsamples: number of samples in wav.
  * events:     event list ending with espeakEVENT_LIST_TERMINATED.
  *
  * Reports the begin event on the first call for a message, then walks the
  * events: for marks and sound icons the audio preceding the event is sent
  * first, then the event itself is reported. Whatever audio remains is sent
  * at the end. Always returns 0.
  */
 static int callback(short *wav, int numsamples, espeak_EVENT *events)
 {
 	const int rate = espeak_ng_GetSampleRate();
 	int done = 0;	/* samples of wav already sent */

 	if (!began) {
 		began = 1;
 		/* We started producing audio */
 		module_report_event_begin();
 	}

 	for (espeak_EVENT *cur = events;
 	     cur->type != espeakEVENT_LIST_TERMINATED; cur++) {
 		fprintf(stderr, "got event %d from synth\n", cur->type);

 		/* First send pending audio */
 		if (cur->type == espeakEVENT_MARK || cur->type == espeakEVENT_PLAY) {
 			/* Convert the position from milliseconds to samples in
 			 * 64 bits, and clamp before narrowing to int. */
 			int64_t pos = (int64_t)cur->audio_position * rate / 1000;
 			int sample;

 			if (pos > numsamples)
 				sample = numsamples;
 			else
 				sample = (int)pos;
 			/* Never move backwards: that audio has been sent already */
 			if (sample < done)
 				sample = done;

 			if (wav && sample > done)
 				send_samples(wav + done, sample - done, rate);

 			done = sample;
 		}

 		/* Then process event */
 		switch (cur->type) {
 			case espeakEVENT_MARK:
 				module_report_index_mark(cur->id.name);
 				break;
 			case espeakEVENT_PLAY:
 				module_report_icon(cur->id.name);
 				break;
 			case espeakEVENT_MSG_TERMINATED:
 				/* We have finished the synth, tell the server so it can send us the next message. */
 				module_report_event_end();
 				break;
 			default:
 				break;
 		}
 	}

 	/* Send whatever audio follows the last event */
 	if (wav && numsamples > done)
 		send_samples(wav + done, numsamples - done, rate);

 	return 0;
 }

 /*
  * Pause request. Pausing is implemented as stopping: the current
  * synthesis is cancelled and a stop event is reported.
  *
  * Always returns 0.
  */
 size_t module_pause(void)
 {
 	fputs("pausing\n", stderr);

 	/* Only supports stopping */
 	espeak_Cancel();
 	module_report_event_stop();

 	return 0;
 }

 /*
  * Stop request: cancels any current synthesis and reports a stop event.
  *
  * Always returns 0.
  */
 int module_stop(void)
 {
 	fputs("stopping\n", stderr);

 	espeak_Cancel();
 	module_report_event_stop();

 	return 0;
 }

 /*
  * Shut the synthesizer down by terminating Espeak-NG.
  *
  * Always returns 0.
  */
 int module_close(void)
 {
 	fputs("closing\n", stderr);

 	espeak_ng_Terminate();

 	return 0;
 }
	/*
	* skeleton0.c - Trivial module example
	*
	* Copyright (C) 2020-2022, 2025 Samuel Thibault <samuel.thibault@ens-lyon.org>
	* All rights reserved.
	*
	* Redistribution and use in source and binary forms, with or without
	* modification, are permitted provided that the following conditions
	* are met:
	* 1. Redistributions of source code must retain the above copyright
	* notice, this list of conditions and the following disclaimer.
	* 2. Redistributions in binary form must reproduce the above copyright
	* notice, this list of conditions and the following disclaimer in the
	* documentation and/or other materials provided with the distribution.
	*
	* THIS SOFTWARE IS PROVIDED BY Samuel Thibault AND CONTRIBUTORS ``AS IS'' AND
	* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
	* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
	* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
	* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
	* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
	* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
	* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
	* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
	* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
	* SUCH DAMAGE.
	*/

	/*
	* This module is based on skeleton0, and shows how it can be completed easily
	* to run Espeak-NG asynchronously, with server-side audio.
	*/

	#include <stdio.h>
	#include <stdlib.h>
	#include <unistd.h>
	#include <string.h>
	#include <stdint.h>

	#include <espeak-ng/espeak_ng.h>
	#include <espeak-ng/speak_lib.h>

	#include "spd_module_main.h"

	static char *voicetype;
	static char *voicename;
	static char *language;

	/*
	 * Configuration hook: currently only logs the configuration file name on
	 * stderr; the file itself is not opened or parsed.
	 *
	 * Always returns 0.
	 */
	int module_config(const char *configfile)
	{
		const int status = 0;

		fprintf(stderr, "opening %s\n", configfile);

		return status;
	}

	/* Synthesis callback, declared early because module_init() registers it
	 * before its definition further down. The pointer declarators, lost in
	 * this copy of the text, are restored. */
	static int callback(short *wav, int numsamples, espeak_EVENT *events);

	/*
	 * Bring up the Espeak-NG synthesizer: initialize the library, open its
	 * output, then register the synthesis callback.
	 *
	 * msg: receives a strdup()ed status text ("ok!" or the Espeak-NG error
	 *      message).
	 * Returns 0 on success, -1 if any initialization step failed.
	 */
	int module_init(char **msg)
	{
		espeak_ng_ERROR_CONTEXT context = NULL;
		espeak_ng_STATUS result;
		char buf[128];

		fprintf(stderr, "initializing\n");

		espeak_ng_InitializePath(NULL);
		result = espeak_ng_Initialize(&context);
		if (result != ENS_OK)
			goto failed;

		fprintf(stderr, "initialized, opening audio output\n");
		result = espeak_ng_InitializeOutput(0, 0, NULL);
		if (result != ENS_OK)
			goto failed;

		/* Everything is up: audio will now be delivered through callback() */
		espeak_SetSynthCallback(callback);
		*msg = strdup("ok!");
		return 0;

	failed:
		/* Turn the status code into text for both the log and the caller */
		espeak_ng_GetStatusCodeMessage(result, buf, sizeof(buf));
		fprintf(stderr, "espeak-ng initialization failed: '%s'\n", buf);
		*msg = strdup(buf);
		return -1;
	}

	SPDVoice **module_list_voices(void)
	{
	/* Return list of voices */
	SPDVoice *ret = malloc(3sizeof(*ret));

	ret[0] = malloc(sizeof(*(ret[0])));
	ret[0]->name = strdup("English (America)");
	ret[0]->language = strdup("en");
	ret[0]->variant = NULL;

	ret[1] = malloc(sizeof(*(ret[0])));
	ret[1]->name = strdup("French (France)");
	ret[1]->language = strdup("fr");
	ret[1]->variant = NULL;

	ret[2] = NULL;

	return ret;
	}


	/*
	 * Apply one synthesis parameter.
	 *
	 * var: parameter name; val: its value as text.
	 * "voice", "synthesis_voice" and "language" are stored for set_voice();
	 * "pitch" is applied to Espeak-NG immediately; a few other names are
	 * accepted but not implemented yet.
	 *
	 * Returns 0 when the parameter was accepted, -1 when it is unknown, when
	 * memory ran out, or when Espeak-NG rejected the value.
	 */
	int module_set(const char *var, const char *val)
	{
		/* Recognised parameters that are not acted upon yet (TODO) */
		static const char *const ignored[] = {
			"rate", "pitch_range", "volume",
			"punctuation_mode", "spelling_mode", "cap_let_recogn",
		};
		char **slot = NULL;

		fprintf(stderr,"got var '%s' to be set to '%s'\n", var, val);

		if (!strcmp(var, "voice"))
			slot = &voicetype;
		else if (!strcmp(var, "synthesis_voice"))
			slot = &voicename;
		else if (!strcmp(var, "language"))
			slot = &language;

		if (slot) {
			/* Duplicate first so a failed allocation keeps the previous value */
			char *copy = strdup(val);
			if (!copy)
				return -1;
			free(*slot);
			*slot = copy;
			return 0;
		}

		if (!strcmp(var, "pitch")) {
			long requested = strtol(val, NULL, 10);

			/* Keep the request inside the documented [-100, 100] input range */
			if (requested < -100)
				requested = -100;
			if (requested > 100)
				requested = 100;

			/* convert from [-100, 100] to [0, 100] */
			int pitch = (int)((requested + 100) / 2);

			/* The espeak_ng_ variant returns an espeak_ng_STATUS, which is what
			 * ENS_OK and espeak_ng_PrintStatusCodeMessage() expect. */
			espeak_ng_STATUS result = espeak_ng_SetParameter(espeakPITCH, pitch, 0);
			if (result != ENS_OK) {
				espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
				return -1;
			}
			return 0;
		}

		for (size_t i = 0; i < sizeof(ignored) / sizeof(ignored[0]); i++) {
			if (!strcmp(var, ignored[i]))
				return 0;
		}

		return -1;
	}

	/*
	 * Interpret one audio parameter.
	 *
	 * Only "audio_output_method" is known, and only the value "server" is
	 * accepted for it.
	 * Returns 0 when accepted, -1 for any other name or value.
	 */
	int module_audio_set(const char *var, const char *val)
	{
		/* Optional: interpret audio parameter */
		if (!strcmp(var, "audio_output_method")) {
			/* Only server-side audio supported */
			if (strcmp(val, "server") != 0)
				return -1;
			return 0;
		}
		return -1;
	}

	/*
	 * Audio-open hook. Nothing is opened here; status is left untouched and
	 * 0 is always returned.
	 */
	int module_audio_init(char **status)
	{
		(void)status;

		return 0;
	}

	/*
	 * Log-level hook. Both arguments are ignored; every request is accepted
	 * by returning 0.
	 */
	int module_loglevel_set(const char *var, const char *val)
	{
		/* Optional: accept loglevel change */
		(void)var;
		(void)val;

		return 0;
	}

	/*
	 * Debug hook. A full implementation would open `file` for debug dumps
	 * when enable == 1 and close it otherwise; this one ignores both
	 * arguments and returns 0.
	 */
	int module_debug(int enable, const char *file)
	{
		(void)enable;
		(void)file;

		return 0;
	}

	/*
	 * Main loop: hands STDIN_FILENO to module_process() and lets it run the
	 * protocol.
	 *
	 * Returns whatever module_process() returned; a non-zero value is also
	 * logged on stderr.
	 */
	int module_loop(void)
	{
		fprintf(stderr, "main loop\n");

		/* An implementation that needs to watch other FDs as well would
		 * monitor STDIN_FILENO itself instead of delegating here. */
		const int status = module_process(STDIN_FILENO, 1);
		if (status == 0)
			return 0;

		fprintf(stderr, "Broken pipe, exiting...\n");
		return status;
	}

	/*
	 * Push the stored voice settings to Espeak-NG.
	 *
	 * When a voice type or a language is stored, a voice is selected by
	 * properties; when a voice name other than "NULL" is stored, that voice is
	 * then selected by name. Espeak-NG errors are only printed on stderr.
	 */
	static void set_voice(void)
	{
		/* Recognised voice type prefixes and the properties they map to */
		static const struct {
			const char *prefix;
			int gender;
			int age;	/* 0 keeps the zeroed default */
			int numbered;	/* non-zero: digits after the prefix pick the variant */
		} kinds[] = {
			{ "male",         1,  0, 1 },
			{ "female",       2,  0, 1 },
			{ "child_male",   1, 10, 0 },
			{ "child_female", 2, 10, 0 },
		};
		espeak_ng_STATUS result;

		if (voicetype != NULL || language != NULL) {
			fprintf(stderr, "setting voice type %s language %s\n", voicetype ? voicetype : "none", language ? language : "none");

			espeak_VOICE voice_select;
			memset(&voice_select, 0, sizeof(voice_select));

			if (voicetype != NULL) {
				for (size_t i = 0; i < sizeof(kinds) / sizeof(kinds[0]); i++) {
					const size_t len = strlen(kinds[i].prefix);

					if (strncmp(voicetype, kinds[i].prefix, len) != 0)
						continue;

					voice_select.gender = kinds[i].gender;
					voice_select.age = kinds[i].age;
					if (kinds[i].numbered)
						voice_select.variant = atoi(voicetype + len) - 1;
					break;
				}
			}

			if (language != NULL)
				voice_select.languages = language;

			result = espeak_ng_SetVoiceByProperties(&voice_select);
			if (result != ENS_OK)
				espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
		}

		/* The literal string "NULL" is treated as "no voice name given" */
		if (voicename == NULL || strcmp(voicename, "NULL") == 0)
			return;

		fprintf(stderr, "setting voice name %s\n", voicename);

		result = espeak_ng_SetVoiceByName(voicename);
		if (result != ENS_OK)
			espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
	}

	/* Cleared by module_speak() for each message and set by callback() once it has
	 * reported the begin event, so that event is sent only once per message. */
	static int began;
	/*
	 * Asynchronous speak: applies the stored voice settings, then queues the
	 * text with Espeak-NG, which synthesizes it in another thread and delivers
	 * the audio through callback().
	 *
	 * data:    NUL-terminated text, passed with the SSML flag set.
	 * bytes:   unused; the length is taken from strlen(data).
	 * msgtype: unused.
	 *
	 * Returns 1 once the text has been queued, -1 if Espeak-NG refused it.
	 * NOTE(review): assumes the module framework treats a non-positive return
	 * as "could not speak" -- confirm against spd_module_main.h.
	 */
	int module_speak(char *data, size_t bytes, SPDMessageType msgtype)
	{
		espeak_ng_STATUS result;

		(void)bytes;
		(void)msgtype;

		set_voice();

		/* Speak the provided data asynchronously in another thread */
		fprintf(stderr, "speaking '%s'\n", data);

		/* Reset first so the first callback for this message reports "begin" */
		began = 0;

		/* Same arguments as espeak_Synth(), but the espeak_ng_STATUS result can
		 * be checked against ENS_OK and printed. */
		result = espeak_ng_Synthesize(data, strlen(data) + 1, 0, POS_CHARACTER, 0,
					      espeakCHARS_AUTO | espeakPHONEMES | espeakENDPAUSE | espeakSSML,
					      NULL, NULL);
		if (result != ENS_OK) {
			/* No callback will ever run for this message, so do not claim success */
			espeak_ng_PrintStatusCodeMessage(result, stderr, NULL);
			return -1;
		}

		return 1;
	}

	/*
	 * Forward a run of synthesized samples to the server as one audio track.
	 *
	 * wav:  first sample to send.
	 * len:  number of samples.
	 * rate: sample rate to announce for the track.
	 *
	 * The track is described as 16-bit, single channel, and is handed to
	 * module_tts_output_server() with SPD_AUDIO_LE. Nothing is sent when
	 * there is no buffer or no (or a negative number of) samples.
	 */
	void send_samples(short *wav, int len, int rate)
	{
		if (!wav || len <= 0)
			return;

		AudioTrack track = {
			.bits = 16,
			.num_channels = 1,
			.sample_rate = rate,
			.num_samples = len,
			.samples = wav,
		};
		module_tts_output_server(&track, SPD_AUDIO_LE);
	}

	/*
	 * Synthesis callback; this is getting called in the espeak-ng thread.
	 *
	 * wav:        samples produced since the previous call.
	 * numsamples: number of samples in wav.
	 * events:     event list ending with espeakEVENT_LIST_TERMINATED.
	 *
	 * Reports the begin event on the first call for a message, then walks the
	 * events: for marks and sound icons the audio preceding the event is sent
	 * first, then the event itself is reported. Whatever audio remains is sent
	 * at the end. Always returns 0.
	 */
	static int callback(short *wav, int numsamples, espeak_EVENT *events)
	{
		const int rate = espeak_ng_GetSampleRate();
		int done = 0;	/* samples of wav already sent */

		if (!began) {
			began = 1;
			/* We started producing audio */
			module_report_event_begin();
		}

		for (espeak_EVENT *cur = events;
		     cur->type != espeakEVENT_LIST_TERMINATED; cur++) {
			fprintf(stderr, "got event %d from synth\n", cur->type);

			/* First send pending audio */
			if (cur->type == espeakEVENT_MARK || cur->type == espeakEVENT_PLAY) {
				/* Convert the position from milliseconds to samples in
				 * 64 bits, and clamp before narrowing to int. */
				int64_t pos = (int64_t)cur->audio_position * rate / 1000;
				int sample;

				if (pos > numsamples)
					sample = numsamples;
				else
					sample = (int)pos;
				/* Never move backwards: that audio has been sent already */
				if (sample < done)
					sample = done;

				if (wav && sample > done)
					send_samples(wav + done, sample - done, rate);

				done = sample;
			}

			/* Then process event */
			switch (cur->type) {
				case espeakEVENT_MARK:
					module_report_index_mark(cur->id.name);
					break;
				case espeakEVENT_PLAY:
					module_report_icon(cur->id.name);
					break;
				case espeakEVENT_MSG_TERMINATED:
					/* We have finished the synth, tell the server so it can send us the next message. */
					module_report_event_end();
					break;
				default:
					break;
			}
		}

		/* Send whatever audio follows the last event */
		if (wav && numsamples > done)
			send_samples(wav + done, numsamples - done, rate);

		return 0;
	}

	/*
	 * Pause request. Pausing is implemented as stopping: the current
	 * synthesis is cancelled and a stop event is reported.
	 *
	 * Always returns 0.
	 */
	size_t module_pause(void)
	{
		fputs("pausing\n", stderr);

		/* Only supports stopping */
		espeak_Cancel();
		module_report_event_stop();

		return 0;
	}

	/*
	 * Stop request: cancels any current synthesis and reports a stop event.
	 *
	 * Always returns 0.
	 */
	int module_stop(void)
	{
		fputs("stopping\n", stderr);

		espeak_Cancel();
		module_report_event_stop();

		return 0;
	}

	/*
	 * Shut the synthesizer down by terminating Espeak-NG.
	 *
	 * Always returns 0.
	 */
	int module_close(void)
	{
		fputs("closing\n", stderr);

		espeak_ng_Terminate();

		return 0;
	}