mirror of
https://github.com/jambonz/jambonz-feature-server.git
synced 2025-12-19 04:17:44 +00:00
* feat fallback speech * feat fallback speech * feat fallback speech * gather verb * fix * wip * wip * wip * wip * wip * transcribe * transcribe * fix * wip * wip * wip * wip * fix * wip * fix
351 lines
13 KiB
JavaScript
351 lines
13 KiB
JavaScript
const Task = require('./task');
|
|
const {TaskName, TaskPreconditions} = require('../utils/constants');
|
|
const { normalizeJambones } = require('@jambonz/verb-specifications');
|
|
|
|
/**
 * Task that connects the caller's media endpoint to an AWS Lex bot.
 *
 * The task starts the bot on the endpoint (`aws_lex_start`), listens for the
 * `lex::*` custom events raised on that endpoint, optionally relays them to the
 * application's `eventHook`, and plays the bot's responses - either the audio
 * file announced by the bot, or (when a `tts` section was supplied) audio
 * synthesized locally from the bot's text response.
 */
class Lex extends Task {
  /**
   * @param {object} logger - logger exposing debug/info/error
   * @param {object} opts - verb payload; read back through `this.data`
   *   (presumably assigned by the Task base constructor - defined outside this file)
   */
  constructor(logger, opts) {
    super(logger, opts);
    this.preconditions = TaskPreconditions.Endpoint;

    if (this.data.credentials) {
      this.awsAccessKeyId = this.data.credentials.accessKey;
      this.awsSecretAccessKey = this.data.credentials.secretAccessKey;
    }
    this.bot = this.data.botId;
    this.alias = this.data.botAlias;
    this.region = this.data.region;
    this.locale = this.data.locale || 'en_US';
    this.intent = this.data.intent || {};
    this.metadata = this.data.metadata;
    this.welcomeMessage = this.data.welcomeMessage;
    this.bargein = this.data.bargein || false;
    this.passDtmf = this.data.passDtmf || false;
    // noInputTimeout is multiplied by 1000 because it is later sent as a "-ms" channel variable
    if (this.data.noInputTimeout) this.noInputTimeout = this.data.noInputTimeout * 1000;
    if (this.data.tts) {
      // 'default' is a placeholder that init() replaces with the call session's settings
      this.vendor = this.data.tts.vendor || 'default';
      this.language = this.data.tts.language || 'default';
      this.voice = this.data.tts.voice || 'default';
      this.speechCredentialLabel = this.data.tts.label || 'default';

      // fallback tts
      this.fallbackVendor = this.data.tts.fallbackVendor || 'default';
      this.fallbackLanguage = this.data.tts.fallbackLanguage || 'default';
      // was mistakenly read from tts.fallbackLanguage, so a configured fallback voice was ignored
      this.fallbackVoice = this.data.tts.fallbackVoice || 'default';
      this.fallbackLabel = this.data.tts.fallbackLabel || 'default';
    }

    this.botName = `${this.bot}:${this.alias}:${this.region}`;
    if (this.data.eventHook) this.eventHook = this.data.eventHook;
    // events are only relayed when an eventHook was provided
    this.events = this.eventHook ?
      [
        'intent',
        'transcription',
        'dtmf',
        'start-play',
        'stop-play',
        'play-interrupted',
        'response-text'
      ] : [];
    if (this.data.actionHook) this.actionHook = this.data.actionHook;
  }

  get name() { return TaskName.Lex; }

  /**
   * Start the bot on the endpoint and wait until the task is signalled done.
   * Errors are logged rather than propagated to the caller.
   * @param {*} cs - call session
   * @param {object} resources
   * @param {*} resources.ep - media server endpoint
   */
  async exec(cs, {ep}) {
    await super.exec(cs);

    try {
      await this.init(cs, ep);

      // kick it off
      const obj = {};
      let cmd = `${this.ep.uuid} ${this.bot} ${this.alias} ${this.region} ${this.locale} `;

      if (this.metadata) Object.assign(obj, this.metadata);
      if (this.intent.name) {
        cmd += this.intent.name;
        if (this.intent.slots) Object.assign(obj, {slots: this.intent.slots});
      }

      // metadata and slots, when present, are appended as a single-quoted JSON argument
      if (Object.keys(obj).length > 0) cmd += ` '${JSON.stringify(obj)}'`;

      this.logger.debug({cmd}, `starting lex bot ${this.botName} with locale ${this.locale}`);
      // deliberately not awaited: a failure to start simply ends the task
      this.ep.api('aws_lex_start', cmd)
        .catch((err) => {
          this.logger.error({err}, `Error starting lex bot ${this.botName}`);
          this.notifyTaskDone();
        });

      await this.awaitTaskDone();
    } catch (err) {
      this.logger.error({err}, 'Lex:exec error');
    }
  }

  /**
   * Stop the task: detach the listeners added in init(), report the result to
   * the action hook, stop any audio in progress and signal completion.
   * @param {*} cs - call session
   */
  async kill(cs) {
    super.kill(cs);
    // this.ep is only assigned in init(); guard against kill() arriving before that
    if (this.ep && this.ep.connected) {
      this.logger.debug('Lex:kill');
      this.ep.removeCustomEventListener('lex::intent');
      this.ep.removeCustomEventListener('lex::transcription');
      this.ep.removeCustomEventListener('lex::audio_provided');
      this.ep.removeCustomEventListener('lex::text_response');
      this.ep.removeCustomEventListener('lex::playback_interruption');
      this.ep.removeCustomEventListener('lex::error');
      this.ep.removeAllListeners('dtmf');

      this.performAction({lexResult: 'caller hungup'})
        .catch((err) => this.logger.error({err}, 'lex - error w/ action webook'));

      await this.ep.api('uuid_break', this.ep.uuid).catch((err) => this.logger.info(err, 'Error killing audio'));
    }
    this.notifyTaskDone();
  }

  /**
   * Resolve tts defaults from the call session, attach the lex/dtmf event
   * listeners and push the channel variables that configure the bot.
   * @param {*} cs - call session
   * @param {*} ep - media server endpoint
   * @throws rethrows any error raised while setting up (after logging it)
   */
  async init(cs, ep) {
    this.ep = ep;
    try {
      if (this.vendor === 'default') {
        this.vendor = cs.speechSynthesisVendor;
        this.language = cs.speechSynthesisLanguage;
        this.voice = cs.speechSynthesisVoice;
        this.speechCredentialLabel = cs.speechSynthesisLabel;
      }
      if (this.fallbackVendor === 'default') {
        this.fallbackVendor = cs.fallbackSpeechSynthesisVendor;
        this.fallbackLanguage = cs.fallbackSpeechSynthesisLanguage;
        this.fallbackVoice = cs.fallbackSpeechSynthesisVoice;
        this.fallbackLabel = cs.fallbackSpeechSynthesisLabel;
      }

      this.ttsCredentials = cs.getSpeechCredentials(this.vendor, 'tts', this.speechCredentialLabel);

      this.ep.addCustomEventListener('lex::intent', this._onIntent.bind(this, ep, cs));
      this.ep.addCustomEventListener('lex::transcription', this._onTranscription.bind(this, ep, cs));
      this.ep.addCustomEventListener('lex::audio_provided', this._onAudioProvided.bind(this, ep, cs));
      this.ep.addCustomEventListener('lex::text_response', this._onTextResponse.bind(this, ep, cs));
      this.ep.addCustomEventListener('lex::playback_interruption', this._onPlaybackInterruption.bind(this, ep, cs));
      this.ep.addCustomEventListener('lex::error', this._onError.bind(this, ep, cs));
      this.ep.on('dtmf', this._onDtmf.bind(this, ep, cs));

      const channelVars = {};
      if (this.bargein) {
        Object.assign(channelVars, {'x-amz-lex:barge-in-enabled': 1});
      }
      if (this.noInputTimeout) {
        Object.assign(channelVars, {'x-amz-lex:audio:start-timeout-ms': this.noInputTimeout});
      }
      if (this.awsAccessKeyId && this.awsSecretAccessKey) {
        Object.assign(channelVars, {
          AWS_ACCESS_KEY_ID: this.awsAccessKeyId,
          AWS_SECRET_ACCESS_KEY: this.awsSecretAccessKey
        });
      }
      // a tts vendor means text responses are synthesized here (see _onTextResponse)
      if (this.vendor) Object.assign(channelVars, {LEX_USE_TTS: 1});
      //if (this.intent.name) Object.assign(channelVars, {LEX_WELCOME_INTENT: this.intent});
      if (this.welcomeMessage && this.welcomeMessage.length) {
        Object.assign(channelVars, {LEX_WELCOME_MESSAGE: this.welcomeMessage});
      }
      if (Object.keys(channelVars).length) await this.ep.set(channelVars);

    } catch (err) {
      this.logger.error({err}, 'Error setting listeners');
      throw err;
    }
  }

  /**
   * An intent has been returned; relay it to the event hook if one is configured.
   * @param {*} ep - media server endpoint
   * @param {*} cs - call session
   * @param {*} evt - event data
   */
  _onIntent(ep, cs, evt) {
    this.logger.debug({evt}, `got intent for ${this.botName}`);
    if (this.events.includes('intent')) {
      this._performHook(cs, this.eventHook, {event: 'intent', data: evt});
    }
  }

  /**
   * A transcription has been returned; relay it to the event hook if one is configured.
   * @param {*} ep - media server endpoint
   * @param {*} cs - call session
   * @param {*} evt - event data
   */
  _onTranscription(ep, cs, evt) {
    this.logger.debug({evt}, `got transcription for ${this.botName}`);
    if (this.events.includes('transcription')) {
      this._performHook(cs, this.eventHook, {event: 'transcription', data: evt});
    }
  }

  /**
   * Synthesize `msg` with the primary tts vendor, retrying with the fallback
   * vendor (when one is set) if the primary attempt throws.
   * @param {*} cs - call session
   * @param {string} msg - text to synthesize
   * @param {*} stats - stats object handed through to synthAudio
   * @param {Function} synthAudio - async (stats, opts) => ({filePath})
   * @returns {Promise<string|undefined>} path of the audio file, or undefined
   *   when neither vendor produced audio
   */
  async _fallbackSynthAudio(cs, msg, stats, synthAudio) {
    try {
      const {filePath} = await synthAudio(stats, {
        account_sid: cs.accountSid,
        text: msg,
        vendor: this.vendor,
        language: this.language,
        voice: this.voice,
        salt: cs.callSid,
        credentials: this.ttsCredentials
      });

      return filePath;
    } catch (error) {
      this.logger.info({error}, 'failed to synth audio from primary vendor');
      if (this.fallbackVendor) {
        try {
          const credential = cs.getSpeechCredentials(this.fallbackVendor, 'tts', this.fallbackLabel);
          const {filePath} = await synthAudio(stats, {
            account_sid: cs.accountSid,
            text: msg,
            vendor: this.fallbackVendor,
            language: this.fallbackLanguage,
            voice: this.fallbackVoice,
            salt: cs.callSid,
            credentials: credential
          });
          return filePath;
        } catch (err) {
          this.logger.info({err}, 'failed to synth audio from fallback vendor');
        }
      }
    }
  }

  /**
   * The bot returned a text response. When a tts vendor is configured, the
   * first PlainText/SSML message is synthesized and played, after which the
   * bot is told playback finished (`aws_lex_play_done`).
   * @param {*} ep - media server endpoint
   * @param {*} cs - call session
   * @param {*} evt - event data; `evt.messages` is read as an array of {type, msg}
   */
  async _onTextResponse(ep, cs, evt) {
    this.logger.debug({evt}, `got text response for ${this.botName}`);
    const messages = evt.messages;
    if (this.events.includes('response-text')) {
      this._performHook(cs, this.eventHook, {event: 'response-text', data: evt});
    }
    if (this.vendor && Array.isArray(messages) && messages.length) {
      const msg = messages[0].msg;
      const type = messages[0].type;
      if (['PlainText', 'SSML'].includes(type) && msg) {
        const {srf} = cs;
        const {stats} = srf.locals;
        const {synthAudio} = srf.locals.dbHelpers;

        try {
          this.logger.debug(`tts with ${this.vendor} ${this.voice}`);
          const filePath = await this._fallbackSynthAudio(cs, msg, stats, synthAudio);
          if (!filePath) {
            // both primary and fallback synthesis failed: there is nothing to play,
            // so do not announce start-play or hand an undefined path to ep.play()
            this.logger.error(`Lex:_onTextResponse - no audio synthesized for ${this.botName}, skipping playback`);
            return;
          }
          cs.trackTmpFile(filePath);

          if (this.events.includes('start-play')) {
            this._performHook(cs, this.eventHook, {event: 'start-play', data: {path: filePath}});
          }
          await ep.play(filePath);
          if (this.events.includes('stop-play')) {
            this._performHook(cs, this.eventHook, {event: 'stop-play', data: {path: filePath}});
          }
          this.logger.debug(`finished tts, sending play_done ${this.vendor} ${this.voice}`);
          this.ep.api('aws_lex_play_done', this.ep.uuid)
            .catch((err) => {
              this.logger.error({err}, `Error sending play_done ${this.botName}`);
            });
        } catch (err) {
          this.logger.error({err}, 'Lex:_onTextResponse - error playing tts');
        }
      }
    }
  }

  /**
   * The bot signalled a playback interruption. Only acted upon when barge-in
   * is enabled: the event is relayed and the audio being played is stopped.
   * @param {*} ep - media server endpoint
   * @param {*} cs - call session
   * @param {*} evt - event data
   */
  _onPlaybackInterruption(ep, cs, evt) {
    this.logger.debug({evt}, `got playback interruption for ${this.botName}`);
    if (this.bargein) {
      if (this.events.includes('play-interrupted')) {
        this._performHook(cs, this.eventHook, {event: 'play-interrupted', data: {}});
      }
      this.ep.api('uuid_break', this.ep.uuid)
        .catch((err) => this.logger.info(err, 'Lex::_onPlaybackInterruption - Error killing audio'));
    }
  }

  /**
   * Lex has returned an error of some kind; it is only logged.
   * @param {*} ep - media server endpoint
   * @param {*} cs - call session
   * @param {*} evt - event data
   */
  _onError(ep, cs, evt) {
    this.logger.error({evt}, `got error for bot ${this.botName}`);
  }

  /**
   * Audio has been received from lex and written to a file at `evt.path`.
   * Ignored when a tts vendor is configured (the text response is synthesized
   * instead); otherwise the file is played and the bot is told when playback
   * has finished.
   * @param {*} ep - media server endpoint
   * @param {*} cs - call session
   * @param {*} evt - event data
   */
  async _onAudioProvided(ep, cs, evt) {
    if (this.vendor) return;

    this.waitingForPlayStart = false;
    this.logger.debug({evt}, `got audio file for bot ${this.botName}`);

    try {
      if (this.events.includes('start-play')) {
        this._performHook(cs, this.eventHook, {event: 'start-play', data: {path: evt.path}});
      }
      await ep.play(evt.path);
      if (this.events.includes('stop-play')) {
        this._performHook(cs, this.eventHook, {event: 'stop-play', data: {path: evt.path}});
      }
      this.logger.debug({evt}, `done playing audio file for bot ${this.botName}`);
      this.ep.api('aws_lex_play_done', this.ep.uuid)
        .catch((err) => {
          this.logger.error({err}, `Error sending play_done ${this.botName}`);
        });
    } catch (err) {
      this.logger.error({err}, `Error playing file ${evt.path} for both ${this.botName}`);
    }

  }

  /**
   * Receive a dtmf entry from the caller: relay it to the event hook and,
   * when passDtmf is set, forward the digit to the bot.
   * @param {*} ep - media server endpoint
   * @param {*} cs - call session
   * @param {*} evt - event data; `evt.dtmf` is the digit forwarded to the bot
   */
  _onDtmf(ep, cs, evt) {
    this.logger.debug({evt}, 'Lex:_onDtmf');
    if (this.events.includes('dtmf')) {
      this._performHook(cs, this.eventHook, {event: 'dtmf', data: evt});
    }
    if (this.passDtmf) {
      this.ep.api('aws_lex_dtmf', `${this.ep.uuid} ${evt.dtmf}`)
        .catch((err) => {
          this.logger.error({err}, `Error sending dtmf ${evt.dtmf} ${this.botName}`);
        });
    }
  }

  /**
   * Send an event to the application's hook. If the hook answers with an
   * array of verbs, the running application is replaced by those verbs.
   *
   * Callers invoke this without awaiting it, so every failure is caught and
   * logged here instead of surfacing as an unhandled promise rejection.
   * @param {*} cs - call session
   * @param {*} hook - hook to invoke
   * @param {object} results - payload sent to the hook
   */
  async _performHook(cs, hook, results) {
    try {
      const b3 = this.getTracingPropagation();
      const httpHeaders = b3 && {b3};
      const json = await this.cs.requestor.request('verb:hook', hook, results, httpHeaders);
      if (json && Array.isArray(json)) {
        // required lazily, as in the original code (presumably to avoid a circular require - confirm)
        const makeTask = require('./make_task');
        const tasks = normalizeJambones(this.logger, json).map((tdata) => makeTask(this.logger, tdata));
        if (tasks && tasks.length > 0) {
          this.logger.info({tasks: tasks}, `${this.name} replacing application with ${tasks.length} tasks`);
          // still fire-and-forget, but a rejection is logged rather than left unhandled
          Promise.resolve(this.performAction({lexResult: 'redirect'}, false))
            .catch((err) => this.logger.error({err}, 'Lex:_performHook - error w/ action webhook'));
          cs.replaceApplication(tasks);
        }
      }
    } catch (err) {
      this.logger.error({err, hook}, `Lex:_performHook - error invoking hook for ${this.botName}`);
    }
  }

}
|
|
|
|
module.exports = Lex;
|