智能语音计算器

Posted wzqstudy

tags:

篇首语:本文由小常识网(cha138.com)小编为大家整理,主要介绍了智能语音计算器相关的知识,希望对你有一定的参考价值。

这边来说界面的实现,个人觉得该模块实现有点乱,因为其中包括了录音功能,还需要改进。

#ifndef CALCULATORUI_H
#define CALCULATORUI_H

#include <qt5/QtWidgets/QWidget>
#include <qt5/QtWidgets/QLineEdit>
#include <qt5/QtWidgets/QPushButton>
#include <qt5/QtCore/QFile>
#include <qt5/QtMultimedia/QAudioInput>
#include <qt5/QtCore/QDebug>
#include <qt5/QtCore/QProcess>
#include <qt5/QtCore/QString>
#include <iostream>

#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <unistd.h>

#include <qt5/QtCore/QString>
#include "ICalculator.h"
#include "CalculatorASR.h"


#include <unistd.h>

using namespace std;

#define RET_SIZE 100
/*
QT       += core gui
QT       += widgets
QT       += multimedia

LIBS += -L./libs/x64 -lmsc
*/
class CalculatorUI : public QWidget
{
    Q_OBJECT
public:
    static CalculatorUI* newInstance();
    ~CalculatorUI();
    void show();
    void setCalculator(ICalculator* cal);
    ICalculator *getCalculator();
   

    qint64 addWavHeader(QString catheFileName,QString wavFileName);

    void startASR();
    void getResult();
    string changeResult(string &str);

private:
    CalculatorUI();
    bool Construct();

    private slots:
        void onCalculate();
        void onRecording();

private:
    QLineEdit *m_edit;
    QPushButton *m_start_record;
    QPushButton *m_buttons[20];
    ICalculator *m_cal;

    QAudioInput *m_audioInput;
    bool m_isRecord;
    QFile destinationFile;

    QProcess *caller;
    CalculatorASR *cal_asr=NULL;
    string ASRret;
};

#endif

界面是手写代码实现的,没有选择用designer设计器。

原因之一是界面不是很复杂,还有就是因为connect时更简洁。

#include "CalculatorUI.h"
#include <qt5/QtWidgets/QMessageBox>


#define RAW_RECORD_FIKENAME "./audio/test.raw"  //录音文件名
#define WAV_RECORD_FIKENAME "./audio/test.wav"  //录音文件转wav格式文件名

const qint64 TIME_TRANSFORM = 1000 * 1000;      //微秒转秒

struct WAVFILEHEADER
{
    char RiffName[4];
    unsigned long nRiffLength;

    char WavName[4];

    char FmtName[4];
    unsigned long nFmtLength;

    unsigned short nAudioFormat;
    unsigned short nChannleNumber;
    unsigned long nSampleRate;
    unsigned long nBytesPerSecond;
    unsigned short nBytesPerSample;
    unsigned short nBitsPerSample;

    char DATANAME[4];
    unsigned long nDataLength;
};

CalculatorUI::CalculatorUI() : QWidget()
{
    m_cal = NULL;
    m_audioInput = NULL;
    m_isRecord = false;
    cal_asr = new CalculatorASR();
    if(cal_asr!=NULL)
    {
        cal_asr->myLogin();
    }
}

CalculatorUI* CalculatorUI::newInstance()
{
    CalculatorUI *ret = new CalculatorUI();
    if(NULL == ret || !ret->Construct())
    {
        delete ret;
        ret = NULL;
    }
    return ret;
}

CalculatorUI::~CalculatorUI()
{
     cal_asr->myLogOut();
}

void CalculatorUI::show()
{
    QWidget::show();
    setFixedSize(width(),height());
}

bool CalculatorUI::Construct()
{
    bool ret = true;
    m_edit = new QLineEdit(this);
    if(m_edit!=NULL)
    {
        m_edit->move(10,10);
        m_edit->resize(200,30);
        m_edit->setReadOnly(true);
    }
    else
    {
        ret = false;
    }
    m_start_record = new QPushButton(this);
    if(m_start_record!=NULL)
    {
        m_start_record->move(210,10);
        m_start_record->resize(40,30);
        m_start_record->setText("录音");
        connect(m_start_record,SIGNAL(clicked()),this,SLOT(onRecording()));
    }
    else
    {
        ret = false;
    }

    const char* buttontext[20] = 
    {
        "7","8","9","+","(",
        "4","5","6","-",")",
        "1","2","3","*","<-",
        "0",".","=","/","C"
    };
    for(int i = 0;(i<4)&&ret;i++)
    {
        for(int j = 0;(j<5)&&ret;j++)
        {
            m_buttons[5*i + j] = new QPushButton(this);
            if(m_buttons[5*i + j]!=NULL)
            {
                m_buttons[5*i + j]->move(10 + (10 + 40)*j,50 + (10 + 40)*i);
                m_buttons[5*i + j]->resize(40,40);
                m_buttons[5*i + j]->setText(buttontext[5*i + j]);
                connect(m_buttons[5*i + j],SIGNAL(clicked()),this,SLOT(onCalculate()));
            }
            else
            {
                ret = false;
            }
        }
    }
    return ret;
}

void CalculatorUI::setCalculator(ICalculator* cal)
{
    m_cal = cal;
}

ICalculator* CalculatorUI::getCalculator()
{
    return m_cal;
}

void CalculatorUI::onCalculate()
{
    QPushButton* button = dynamic_cast<QPushButton*>(sender());

    if(button!=NULL)
    {
        QString buttontext = button->text();

        if(buttontext == "<-")
        {
            QString text = m_edit->text();

            if(text.length() > 0)
            {
                text.remove(text.length()-1,1);
                m_edit->setText(text);
            }
        }
        else if(buttontext == "C")
        {
            m_edit->setText("");
        }
        else if(buttontext =="=")
        {
            if(m_cal != NULL)
            {
                m_cal->expression(m_edit->text());
                m_edit->setText(m_cal->result());
            }
        }
        else
        {
            m_edit->setText(m_edit->text() + buttontext);
        }
    }
}

qint64 CalculatorUI::addWavHeader(QString catheFileName,QString wavFileName)
{
        //开始设置WAV的头文件
    WAVFILEHEADER WavFileHeader;
    qstrcpy(WavFileHeader.RiffName,"RIFF");
    qstrcpy(WavFileHeader.WavName,"WAVE");
    qstrcpy(WavFileHeader.FmtName,"fmt");
    qstrcpy(WavFileHeader.DATANAME,"data");

    WavFileHeader.nFmtLength = 16;
    WavFileHeader.nAudioFormat = 1;
    WavFileHeader.nChannleNumber =1;
    WavFileHeader.nSampleRate = 8000;

    WavFileHeader.nBytesPerSample = 2;
    WavFileHeader.nBytesPerSecond = 16000;

    WavFileHeader.nBitsPerSample = 16;

    QFile cacheFile(catheFileName);
    QFile wavFile(wavFileName);

    if(!cacheFile.open(QIODevice::ReadWrite))
    {
        return -1;
    }
    if(!wavFile.open(QIODevice::WriteOnly))
    {
        return -2;
    }

    int nSize = sizeof(WavFileHeader);
    qint64 nFileLen = cacheFile.bytesAvailable();

    WavFileHeader.nRiffLength = nFileLen - 8 + nSize;
    WavFileHeader.nDataLength = nFileLen;

    wavFile.write((char *)&WavFileHeader,nSize);
    wavFile.write(cacheFile.readAll());

    cacheFile.close();
    wavFile.close();

    return nFileLen;
}

void CalculatorUI::onRecording()
{
    
    //如果当前没有开始录音则允许录音
    if(!m_isRecord)
    {
        m_isRecord = true;
        m_start_record->setText("结束");
        //判断本地设备是否支持该格式
        QAudioDeviceInfo audioDeveiceInfo = QAudioDeviceInfo::defaultInputDevice();
        //判断本地是否有录音设备
        if(!audioDeveiceInfo.isNull())
        {
            m_isRecord = true;
            destinationFile.setFileName(RAW_RECORD_FIKENAME);
            destinationFile.open(QIODevice::WriteOnly | QIODevice::Truncate);

            //设置音频文件格式
            QAudioFormat format;
            format.setSampleRate(8000);
            format.setChannelCount(1);
            format.setSampleSize(16);
            format.setCodec("audio/pcm");
            format.setByteOrder(QAudioFormat::LittleEndian);
            format.setSampleType(QAudioFormat::SignedInt);

            //判断当前设备是否支持该音频格式
            if(!audioDeveiceInfo.isFormatSupported(format))
            {
                qDebug() << "Default format not supported,trying to use the nearest.";
                format = audioDeveiceInfo.nearestFormat(format);
            }
            //开始录音
            m_audioInput = new QAudioInput(format,this);
            m_audioInput->start(&destinationFile);
        }
        else
        {
        //没有录音设备
        QMessageBox::information(NULL,tr("Record"),tr("Current No Record Device"));
        }
    }
    else
    {
        m_isRecord = false;
        m_start_record->setText("录音");
        if(m_audioInput!=NULL)
        {
            m_audioInput->stop();
            destinationFile.close();
            delete m_audioInput;
            m_audioInput = NULL;
        }

        //将生成的.raw文件转成.wav格式文件:
        if(addWavHeader(RAW_RECORD_FIKENAME,WAV_RECORD_FIKENAME)>0)
        {
           // QMessageBox::information(NULL,tr("save"),tr("RecordFile Save Success"));
        }

        //启动语音识别引擎
        startASR();
        //获取识别结果
        getResult();
        
        m_edit->setText(QString::fromStdString(ASRret));

        if(m_cal != NULL)
            {
                m_cal->expression(m_edit->text());
                m_edit->setText(m_edit->text() + "=" + m_cal->result());
            }
    }
}

void CalculatorUI::startASR()
{
    const char* session_begin_params    =    "sub = iat, domain = iat, language = zh_cn, accent = mandarin, sample_rate = 16000, result_type = plain, result_encoding = utf8";
    cal_asr->run_iat(WAV_RECORD_FIKENAME, session_begin_params);
}

void CalculatorUI::getResult()
{
    string str = cal_asr->getResult();
    CalculatorUI::ASRret = changeResult(str);
    std::cout << ASRret << endl;
}

string CalculatorUI::changeResult(string &str)
{
    string ret;
    int num = str.size();
    int i = 0;
    while(i<num)
    {
        int size = 1;
        if(str[i] & 0x80)
        {
            char temp = str[i];
            temp <<= 1;
            do
            {
                temp <<= 1;
                ++size;
            }while(temp & 0x80);
        }
        string subWord;
        subWord = str.substr(i,size);
        if(subWord == "÷")
            ret += "/";
        else if(subWord == "×")
            ret += "*";
        else if(subWord == "")
                        ;
        else
            ret += subWord;
        i += size;
    }
    return ret;
}

这里重点说一下

string CalculatorUI::changeResult(string &str);
这个问题困扰了我好长时间,因为语音引擎返回的是中文,而我计算引擎中对字符串的处理都是英文,所以这里需要处理一些从语音引擎得到的结果。
这种方法我也是在博客上看到的,所有还是要感谢乐于分享知识的人们。
如果代码没有看明白,可以私信联系我,互相学习。



以上是关于智能语音计算器的主要内容,如果未能解决你的问题,请参考以下文章

自然语言处理NLP之文本蕴涵智能问答语音识别对话系统文本分类情感计算

人工智能代码实战:AI李白如何创作诗词

智能语音技术:从哪儿来?往何处去?

音频技术智能语音

音频技术智能语音

音频技术智能语音