ARM-software
/
CMSIS_5
oglindă de https://github-proxy.rt-thread.io/ARM-software/CMSIS_5.git


			
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352
							/* ----------------------------------------------------------------------
 * Project:      CMSIS DSP Library
 * Title:        AppNodes.h
 * Description:  Application nodes for the C compute graph
 *
 * $Date:        16 March 2022
 *
 * Target Processor: Cortex-M and Cortex-A cores
 * -------------------------------------------------------------------- */
/*
 * Copyright (C) 2010-2022 ARM Limited or its affiliates. All rights reserved.
 *
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the License); you may
 * not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an AS IS BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */


#ifndef _APPNODES_H_
#define _APPNODES_H_

#include <hal/nrf_pdm.h>
#include "coef.h"

#include <Arduino.h>
#include <HardwareSerial.h>

// When enabled, lots of additional trace is generated
//#define DEBUG

// Buffer to read samples into, each sample is 16-bits
// This is written by the PDM driver
extern short sampleBuffer[AUDIOBUFFER_LENGTH];

// Number of audio samples available in the audio buffer
extern volatile int samplesRead;

// Sink node. It is just printing the recognized word
template<typename IN, int inputSize> class Sink;

template<int inputSize>
class Sink<q15_t, inputSize>: public GenericSink<q15_t, inputSize>
{
public:
    Sink(FIFOBase<q15_t> &src):GenericSink<q15_t,inputSize>(src){};

    int run()
    {
        #if defined(DEBUG)
        Serial.println("==== Sink");
        #endif

        q15_t *b=this->getReadBuffer();

        if (b[0]==-1)
        {
            Serial.println("Unknown");
        };
        
        if (b[0]==0)
        {
            Serial.println("Yes");
        };

        return(0);
    };

};


// Source node. It is getting audio data from the PDM driver
template<typename OUT, int outputSize> class Source;

template<int outputSize>
class Source<q15_t,outputSize>: public GenericSource<q15_t,outputSize>
{
public:
    Source(FIFOBase<q15_t> &dst):GenericSource<q15_t,outputSize>(dst)
    {

    };

    int run(){
       
        #if defined(DEBUG)
        Serial.println("==== Source"); 
        #endif 
        q15_t *b=this->getWriteBuffer();

        // We wait until enough samples are available.
        // In a future version we may experiment with sleeping the board
        while(samplesRead<outputSize)
        {
            #if defined(DEBUG)
              Serial.print("Sample reads ");  
              Serial.println(samplesRead);  
            #endif
        };
        
        #if defined(DEBUG)
        Serial.println("Received");  
        #endif
       
        // We get the samples and update the 
        // sampleBuffer.
        // Since this buffer is also accessed by the IRQ, we need to disable it
        NVIC_DisableIRQ(PDM_IRQn);
        memcpy(b,sampleBuffer,sizeof(q15_t)*outputSize);
        if ((samplesRead-outputSize) > 0)
        {
            memmove(sampleBuffer,sampleBuffer+outputSize,sizeof(q15_t)*(samplesRead-outputSize));
        }
        samplesRead = samplesRead - outputSize;
        NVIC_EnableIRQ(PDM_IRQn);

        #if defined(DEBUG)
        Serial.print("After read : Sample reads ");  
        Serial.println(samplesRead);
        #endif
        

        return(0);
    };


};

template<typename IN, int inputSize,typename OUT,int outputSize> class FIR;


// FIR node
template<int inputSize>
class FIR<q15_t,inputSize,q15_t,inputSize>: public GenericNode<q15_t,inputSize,q15_t,inputSize>
{
public:
    FIR(FIFOBase<q15_t> &src,FIFOBase<q15_t> &dst):GenericNode<q15_t,inputSize,q15_t,inputSize>(src,dst){
        int blockSize=inputSize;
        int numTaps=10;
        int stateLength = numTaps + blockSize - 1;

        state=(q15_t*)malloc(stateLength * sizeof(q15_t*));
    };

    int run(){
        #if defined(DEBUG)
        Serial.println("==== FIR");
        #endif
        q15_t *a=this->getReadBuffer();
        q15_t *b=this->getWriteBuffer();
        int blockSize=inputSize;
        int stateLength = NUMTAPS + blockSize - 1;

        arm_status status=arm_fir_init_q15(&(this->firq15),NUMTAPS,fir_coefs,state,blockSize);

        arm_fir_q15(&(this->firq15),a,b,blockSize);
        return(0);
    };

arm_fir_instance_q15 firq15;
q15_t *state;

};

/* Not available in the older CMSIS-DSP version provided with Arduino.
So we copy the definition here */

arm_status arm_divide_q15(q15_t numerator,
  q15_t denominator,
  q15_t *quotient,
  int16_t *shift)
{
  int16_t sign=0;
  q31_t temp;
  int16_t shiftForNormalizing;

  *shift = 0;

  sign = (numerator>>15) ^ (denominator>>15);

  if (denominator == 0)
  {
     if (sign)
     {
        *quotient = 0x8000;
     }
     else
     {
        *quotient = 0x7FFF;
     }
     return(ARM_MATH_NANINF);
  }

  numerator = abs(numerator);
  denominator = abs(denominator);
  
  temp = ((q31_t)numerator << 15) / ((q31_t)denominator);

  shiftForNormalizing= 17 - __CLZ(temp);
  if (shiftForNormalizing > 0)
  {
     *shift = shiftForNormalizing;
     temp = temp >> shiftForNormalizing;
  }

  if (sign)
  {
    temp = -temp;
  }

  *quotient=temp;

  return(ARM_MATH_SUCCESS);
}


// We similar to the Python implementation
q15_t dsp_zcr_q15(q15_t *w,int blockSize)
{
    q15_t m;
    arm_mean_q15(w,blockSize,&m);

    // Negate can saturate so we use CMSIS-DSP function which is working on array (and we have a scalar)
    arm_negate_q15(&m,&m,1);
    arm_offset_q15(w,m,w,blockSize);
    
    int k=0;
    for(int i=0;i<blockSize-1;i++)
    {
         int f = w[i];
         int g = w[i+1];
         if ((((f>0) && (g<0)) || ((f<0) && (g>0))) && g>f)
         {
            k++;
         }
    }

    
    // k < len(f) so shift should be 0 except when k == len(f)
    // When k==len(f) normally quotient is 0x4000 and shift 1 and we convert
    // this to 0x7FFF

    q15_t quotient;
    int16_t shift;

    arm_status status=arm_divide_q15(k,blockSize-1,&quotient,&shift);

    if (shift==1)
    {
        arm_shift_q15(&quotient,shift,&quotient,1);
        return(quotient);
    }
    else
    {
        return(quotient);
    }
};

template<typename IN, int inputSize,typename OUT,int outputSize> class Feature;

template<int inputSize>
class Feature<q15_t,inputSize,q15_t,1>: public GenericNode<q15_t,inputSize,q15_t,1>
{
public:
    Feature(FIFOBase<q15_t> &src,FIFOBase<q15_t> &dst,const q15_t *window):
       GenericNode<q15_t,inputSize,q15_t,1>(src,dst),mWindow(window){
    };

    int run(){
        #if defined(DEBUG)
        Serial.println("==== Feature");
        #endif
        q15_t *a=this->getReadBuffer();
        q15_t *b=this->getWriteBuffer();

        arm_mult_q15(a,this->mWindow,a,inputSize);

        b[0] = dsp_zcr_q15(a,inputSize);

        return(0);
    };

const q15_t* mWindow;

};

template<typename IN, int inputSize,typename OUT,int outputSize> class KWS;

template<int inputSize>
class KWS<q15_t,inputSize,q15_t,1>: public GenericNode<q15_t,inputSize,q15_t,1>
{
public:
    KWS(FIFOBase<q15_t> &src,FIFOBase<q15_t> &dst,
    const q15_t* coef_q15,
    const int coef_shift,
    const q15_t intercept_q15,
    const int intercept_shift):GenericNode<q15_t,inputSize,q15_t,1>(src,dst),
    mCoef_q15(coef_q15),
    mCoef_shift(coef_shift),
    mIntercept_q15(intercept_q15),
    mIntercept_shift(intercept_shift)
    {
         
    };

    int run(){
        #if defined(DEBUG)
        Serial.println("==== KWS");
        #endif
        q15_t *a=this->getReadBuffer();
        q15_t *b=this->getWriteBuffer();

        q63_t res;
        arm_dot_prod_q15(this->mCoef_q15,a,inputSize,&res);
    
        q15_t scaled;
        arm_shift_q15(&(this->mIntercept_q15),this->mIntercept_shift-this->mCoef_shift,&scaled,1);
        // Because dot prod output is in Q34.30
        // and ret is on 64 bits
        q63_t scaled_Q30 = (q63_t)(scaled) << 15; 
    
        res = res + scaled_Q30;
    
        if (res<0)
        {
            b[0]=-1;
        }
        else
        {
            b[0]=0;
        }
        

        return(0);
    };

const q15_t* mCoef_q15;
const int mCoef_shift;
const q15_t mIntercept_q15;
const int mIntercept_shift;

};
#endif