在 Skype 上使用 Bing 语音识别 API 和 node.js Bot Framework

Using Bing Speech Recognition API with node.js Bot Framework on Skype

在 Skype 中向我的 node.js 聊天机器人发送音频附件时,我想使用 Bing 语音识别 API 将语音转换为文本。我曾尝试使用 BotBuilder-Samples intelligence-SpeechToText 中的代码,但语音识别仅适用于模拟器。在 Skype 中发送 audio/wave 文件时,机器人根本没有响应,而是 "You said: What’s the weather like?".

我怀疑问题可能是由于需要 JWT 令牌才能访问 Skype 中的附件。因此,我尝试使用 BotBuilder-Samples core-ReceiveAttachment 中的代码访问 Skype 中的音频附件,该代码使用 request-promise 而不是 needle 来发出 HTTP 请求。但是,request-promise 的结果不是流,函数无法处理 getTextFromAudioStream().

我想问一下如何让语音识别与 Skype 中的音频附件一起工作。

谢谢并致以最诚挚的问候!

// Add your requirements
var restify = require("restify");
var builder = require("botbuilder");
var fs = require("fs");
var needle = require("needle");
var request = require("request");
var speechService = require("./speech-service.js");
var Promise = require('bluebird');
var request = require('request-promise').defaults({ encoding: null });

//=========================================================
// Bot Setup
//=========================================================

// Setup Restify Server
var server = restify.createServer();
server.listen(process.env.PORT || 3000, function() {
   console.log("%s listening to %s", server.name, server.url); 
});

// Create chat bot
var connector = new builder.ChatConnector ({
    appId: process.env.MICROSOFT_APP_ID,
    appPassword: process.env.MICROSOFT_APP_PASSWORD
});

server.post("/api/messages", connector.listen());

var bot = new builder.UniversalBot(connector);

//=========================================================
// Bots Middleware
//=========================================================

// Anytime the major version is incremented any existing conversations will be restarted.
bot.use(builder.Middleware.dialogVersion({ version: 1.0, resetCommand: /^reset/i }));

//=========================================================
// Bots Dialogs
//=========================================================

bot.dialog("/", [
    function (session, results, next) {
        var msg = session.message;

        if (hasAudioAttachment(msg)) {
            // Message with attachment, proceed to download it.
            // Skype attachment URLs are secured by a JwtToken, so we need to pass the token from our bot.
            var attachment = msg.attachments[0];
            var fileDownload = isSkypeMessage(msg)
                ? requestWithToken(attachment.contentUrl)
                : request(attachment.contentUrl);

            fileDownload.then(
                function (response) {
                    // Send reply with attachment type & size
                    var reply = new builder.Message(session)
                        .text('Attachment from %s of %s type and size of %s bytes received.', msg.source, attachment.contentType, response.length);
                    session.send(reply);
                }).catch(function (err) {
                    console.log('Error downloading attachment:', { statusCode: err.statusCode, message: err.response.statusMessage });
            });

            var stream = isSkypeMessage(msg)
                ? getAudioStreamWithToken(attachment)
                : getAudioStream(attachment);

            speechService.getTextFromAudioStream(stream)
                .then(text => {
                    session.send("You said: " + text);
                })
                .catch(error => {
                    session.send("Oops! Something went wrong. Try again later.");
                    console.error(error);
                });
        }
        else {
            session.send("Did you upload an audio file? I'm more of an audible person. Try sending me a wav file");
        }
    }
]);

function getAudioStream(attachment) {
    return needle.get(attachment.contentUrl, { headers: {'Content-Type': "audio/wav"} });
}

function getAudioStreamWithToken(attachment) {
    var headers = {};

    connector.getAccessToken((error, token) => {
        headers['Authorization'] = 'Bearer ' + token;
    });

    headers['Content-Type'] = attachment.contentType;

    return needle.get(attachment.contentUrl, { headers: headers });
}

// Request file with Authentication Header
function requestWithToken(url) {
    return obtainToken().then(function (token) {
        return request({
            url: url,
            headers: {
                'Authorization': 'Bearer ' + token,
                'Content-Type': 'application/octet-stream'
            }
        });
    });
};

// Promise for obtaining JWT Token (requested once)
var obtainToken = Promise.promisify(connector.getAccessToken.bind(connector));

function isSkypeMessage(message) {
    return message.source === "skype";
};

示例中的代码在访问附件时已经考虑了 Skype(请参阅 here)。我认为您遇到的问题是因为样本中的密钥超出了配额。昨天一个新的 Bing Speech Key 被添加到示例中,所以我建议你再试一次。

另外,示例的更新版本即将添加。代码目前在code review.