usr/src/cmd/audio/utilities/AudioGain.cc

root/usr/src/cmd/audio/utilities/AudioGain.cc
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License, Version 1.0 only
 * (the "License").  You may not use this file except in compliance
 * with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2004 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

#include <stdio.h>
#include <malloc.h>
#include <math.h>
#include <errno.h>
#include <memory.h>
#include <sys/param.h>
#include <sys/types.h>
#include <sys/ioctl.h>

#include <AudioGain.h>
#include <AudioTypePcm.h>

// Convert a floating-point value to int by truncation toward zero.
// The argument is parenthesized so that an expression argument is cast as
// a whole, rather than having the cast bind to its first operand only.
#define irint(d)        ((int)(d))


// Initialize constants for instantaneous gain normalization.
// process_instant() subtracts LoSigInstantRange from the log-scaled level
// and then scales by HiSigInstantRange to get a value between 0 and 1.
const double    AudioGain::LoSigInstantRange    = .008;
const double    AudioGain::HiSigInstantRange    = .48;

// Initialize constants for weighted gain normalization.
// NoSigWeight is the 'no signal' floor subtracted from the weighted values;
// values at or above HiSigWeightRange (after the floor) normalize to 1.
// NOTE(review): LoSigWeightRange is not referenced by the code in this file.
const double    AudioGain::NoSigWeight          = .0000;
const double    AudioGain::LoSigWeightRange     = .001;
const double    AudioGain::HiSigWeightRange     = .050;

// u-law max value converted to floating point.
// process_dcfilter() treats samples at or beyond +/-PeakSig as peaks when
// counting clipped samples.
const double    AudioGain::PeakSig              = .9803765;

// XXX - patchable dc time constant:  TC = 1 / (sample rate / DCfreq)
// DCfreq is read by process_dcfilter() on every call.
// NOTE(review): DCtimeconstant is not referenced by the code in this file.
int DCfreq = 500;
const double    AudioGain::DCtimeconstant       = .1;

// Patchable debugging flag: when non-zero, process_instant() prints the
// averaged, log-scaled and normalized levels for each buffer.
int debug_agc = 0;


// Constructor
// Starts with all gain statistics cleared and no gain cache allocated.
AudioGain::
AudioGain():
        clipcnt(0), DCaverage(0.), instant_gain(0.),
        weighted_peaksum(0.), weighted_sum(0.),
        weighted_avgsum(0.), weighted_cnt(0),
        gain_cache(NULL)
{
        // WeightedPeak() reads the cache size, and it may be called before
        // process_weighted() has ever set it; give it a defined value.
        // Assigned in the body because the member declaration order is
        // not visible from this file.
        gain_cache_size = 0.;
}

// Destructor
// Releases the gain cache, if one was allocated.
AudioGain::
~AudioGain()
{
        // The cache is allocated with new[] in process_weighted(), so it
        // must be released with delete[] (scalar delete on an array is
        // undefined behavior).  delete[] on a NULL pointer is a no-op.
        delete[] gain_cache;
}

// Report whether data described by the given header can be handled.
// The answer is delegated to the floating-point converter.
Boolean AudioGain::
CanConvert(
        const AudioHdr& hdr) const
{
        Boolean         supported;

        supported = float_convert.CanConvert(hdr);
        return (supported);
}

// Return the instantaneous gain stored by the most recent
// process_instant() pass.
double AudioGain::
InstantGain()
{
        double          latest;

        latest = (double)instant_gain;
        return (latest);
}

// Return the latest weighted gain, normalized to the range 0 to 1.
// Returns 0 when no sums have been accumulated or the cache size is not
// positive.
double AudioGain::
WeightedGain()
{
        double          level;

        // Without accumulated sums or a cache there is nothing to average
        if (!(weighted_cnt > 0) || !(gain_cache_size > 0.))
                return (0.);

        // Accumulated sum is averaged by the cache size and number of sums
        level = weighted_avgsum / gain_cache_size;
        level /= weighted_cnt;

        // Remove the 'no signal' floor, then scale into the 0..1 range
        level -= NoSigWeight;
        if (level < 0.)
                return (0.);
        if (level > HiSigWeightRange)
                return (1.);
        return (level / HiSigWeightRange);
}

// Return the latest weighted peak, normalized to the range 0 to 1.
// The stored peak is always cleared, ready for the next calculation.
double AudioGain::
WeightedPeak()
{
        double          peak;

        // Latch the accumulated peak and clear it for the next interval
        peak = weighted_peaksum;
        weighted_peaksum = 0.;

        if (!(gain_cache_size > 0.))
                return (0.);

        // Peak sum is averaged by the cache size
        peak /= gain_cache_size;

        // Remove the 'no signal' floor, then scale into the 0..1 range
        peak -= NoSigWeight;
        if (peak < 0.)
                return (0.);
        if (peak > HiSigWeightRange)
                return (1.);
        return (peak / HiSigWeightRange);
}

// Report whether clipping was detected in the last processed buffer
// (the clip count is recomputed by each process_dcfilter() pass).
Boolean AudioGain::
Clipped()
{
        return (clipcnt > 0);
}

// Flush gain state
// Clears every accumulated statistic and releases the gain cache, so the
// next process_weighted() call allocates a fresh one.
void AudioGain::
Flush()
{
        clipcnt = 0;
        DCaverage = 0.;
        instant_gain = 0.;
        weighted_peaksum = 0.;
        weighted_sum = 0.;
        weighted_avgsum = 0.;
        weighted_cnt = 0;

        // The cache is allocated with new[] in process_weighted(), so it
        // must be released with delete[]; delete[] on NULL is a no-op.
        delete[] gain_cache;
        gain_cache = NULL;
}

// Analyze an input buffer, updating the gain statistics selected by the
// 'type' flags (AUDIO_GAIN_INSTANT and/or AUDIO_GAIN_WEIGHTED).
// The input buffer is consumed if the reference count is zero!
// Returns AUDIO_SUCCESS, or an error code when the buffer pointer is NULL,
// its length is undefined, or it cannot be converted to floating point.
AudioError AudioGain::
Process(
        AudioBuffer*    inbuf,
        int             type)
{
        AudioHdr        floathdr;
        AudioError      status;
        Boolean         failed;

        if (inbuf == NULL)
                return (AUDIO_ERR_BADARG);

        // Validation and conversion; any 'break' leaves 'failed' set
        failed = TRUE;
        do {
                if (Undefined(inbuf->GetLength())) {
                        status = AUDIO_ERR_BADARG;
                        break;
                }

                // Set up to convert to floating point;
                // verify all header formats
                floathdr = inbuf->GetHeader();
                if (!float_convert.CanConvert(floathdr)) {
                        status = AUDIO_ERR_HDRINVAL;
                        break;
                }
                floathdr.encoding = FLOAT;
                floathdr.bytes_per_unit = 8;
                if ((status = floathdr.Validate()) ||
                    !float_convert.CanConvert(floathdr)) {
                        status = AUDIO_ERR_HDRINVAL;
                        break;
                }

                // Convert to floating-point up front, if necessary
                if (inbuf->GetHeader() != floathdr) {
                        status = float_convert.Convert(inbuf, floathdr);
                        if (status)
                                break;
                }
                failed = FALSE;
        } while (0);

        if (failed) {
                // report error and toss the buffer if it is not referenced
                inbuf->RaiseError(status);
                inbuf->Reference();
                inbuf->Dereference();
                return (status);
        }

        // Hold a reference while analyzing; the matching Dereference()
        // below makes sure the buffer gets ditched afterwards
        inbuf->Reference();

        // run through highpass filter to reject DC
        process_dcfilter(inbuf);

        if (type & AUDIO_GAIN_INSTANT)
                process_instant(inbuf);

        if (type & AUDIO_GAIN_WEIGHTED)
                process_weighted(inbuf);

        inbuf->Dereference();
        return (AUDIO_SUCCESS);
}

// Run the buffer through a simple, dc filter.
// Buffer is assumed to be floating-point double PCM
//
// A running weighted average of the signal (DCaverage, which persists
// across calls) is subtracted from each first-channel sample, and the
// result is clamped to [-1, 1] and written back in place.  The clip count
// is recomputed on every call: a sample counts as clipped when both it and
// the sample before it reach +/-PeakSig.
void AudioGain::
process_dcfilter(
        AudioBuffer*    inbuf)
{
        size_t          i;      // unsigned, to match the frame count
        Boolean         lastpeak;
        double          val;
        double          dcweight;
        double          timeconstant;
        AudioHdr        inhdr;
        double          *inptr;
        size_t          frames;

        inhdr = inbuf->GetHeader();
        inptr = (double *)inbuf->GetAddress();
        frames = (size_t)inhdr.Time_to_Samples(inbuf->GetLength());
        clipcnt = 0;
        lastpeak = FALSE;

        // Time constant corresponds to the number of samples for DCfreq
        // (500Hz unless patched)
        timeconstant = 1. / (inhdr.sample_rate / (double)DCfreq);
        dcweight = 1. - timeconstant;

        // loop through the input buffer, rewriting with weighted data
        // XXX - should deal with multi-channel data!
        // XXX - for now, check first channel only
        for (i = 0; i < frames; i++, inptr += inhdr.channels) {
                val = *inptr;

                // Two max values in a row constitutes clipping
                if ((val >= PeakSig) || (val <= -PeakSig)) {
                        if (lastpeak) {
                                clipcnt++;
                        } else {
                                lastpeak = TRUE;
                        }
                } else {
                        lastpeak = FALSE;
                }

                // Add in this value to weighted average
                DCaverage = (DCaverage * dcweight) + (val * timeconstant);

                // Remove the DC estimate and keep the result in range
                val -= DCaverage;
                if (val > 1.)
                        val = 1.;
                else if (val < -1.)
                        val = -1.;
                *inptr = val;
        }
}

// Calculate a single energy value averaged from the input buffer
// Buffer is assumed to be floating-point double PCM
//
// The mean absolute value of the first-channel samples is log-scaled and
// normalized to the range 0 to 1, and the result is stored in instant_gain.
// An empty buffer yields a gain of 0.
void AudioGain::
process_instant(
        AudioBuffer*    inbuf)
{
        size_t          i;      // unsigned, to match the frame count
        double          val;
        double          sum;
        double          sv;
        AudioHdr        inhdr;
        double          *inptr;
        size_t          frames;

        inhdr = inbuf->GetHeader();
        inptr = (double *)inbuf->GetAddress();
        frames = (size_t)inhdr.Time_to_Samples(inbuf->GetLength());

        // loop through the input buffer, calculating gain
        // XXX - should deal with multi-channel data!
        // XXX - for now, check first channel only
        sum = 0.;
        for (i = 0; i < frames; i++, inptr += inhdr.channels) {
                // Get absolute value
                sum += fabs(*inptr);
        }

        // An empty buffer carries no energy: skip the divide so that the
        // average stays 0 instead of becoming 0/0 (NaN), which would
        // otherwise propagate into instant_gain.
        if (frames > 0)
                sum /= (double)frames;

        // calculate level meter value (between 0 & 1)
        val = log10(1. + (9. * sum));
        sv = val;       // keep the un-normalized value for debug output

        // Normalize to within a reasonable range
        val -= LoSigInstantRange;
        if (val > HiSigInstantRange) {
                val = 1.;
        } else if (val < 0.) {
                val = 0.;
        } else {
                val /= HiSigInstantRange;
        }
        instant_gain = val;

        if (debug_agc != 0) {
                printf("audio_amplitude: avg = %7.5f  log value = %7.5f, "
                    "adjusted = %7.5f\n", sum, sv, val);
        }
}

// Calculate a weighted gain for agc computations
// Buffer is assumed to be floating-point double PCM
//
// The gain cache holds the squared value last seen at each buffer position.
// It is sized from the first non-empty buffer processed; later buffers
// that are longer are only examined up to the cache size.  Updates
// weighted_sum, weighted_peaksum, weighted_avgsum and weighted_cnt.
void AudioGain::
process_weighted(
        AudioBuffer*    inbuf)
{
        size_t          i;      // unsigned, to match the frame count
        double          val;
        double          nosig;
        AudioHdr        inhdr;
        double          *inptr;
        size_t          frames;
        Double          sz;

        inhdr = inbuf->GetHeader();
        inptr = (double *)inbuf->GetAddress();
        frames = (size_t)inhdr.Time_to_Samples(inbuf->GetLength());
        sz = (Double) frames;

        // Allocate gain cache...all calls will hopefully be the same length
        if (gain_cache == NULL) {
                if (frames == 0) {
                        // Do not size the cache from an empty buffer: a
                        // zero-length cache would clamp every later
                        // buffer to zero frames until the next Flush().
                        gain_cache_size = 0.;
                        return;
                }
                gain_cache = new double[frames];
                for (i = 0; i < frames; i++) {
                        gain_cache[i] = 0.;
                }
                gain_cache_size = sz;
        } else if (sz > gain_cache_size) {
                // Never index past the end of the existing cache
                frames = (size_t)irint(gain_cache_size);
        }
        // Scale up the 'no signal' level to avoid a divide in the inner loop
        nosig = NoSigWeight * gain_cache_size;

        // For each sample:
        //   calculate the sum of squares for a window around the sample;
        //   save the peak sum of squares;
        //   keep a running average of the sum of squares
        //
        // XXX - should deal with multi-channel data!
        // XXX - for now, check first channel only

        for (i = 0; i < frames; i++, inptr += inhdr.channels) {
                val = *inptr;
                val *= val;
                weighted_sum += val;
                weighted_sum -= gain_cache[i];
                gain_cache[i] = val;            // save value to subtract later
                if (weighted_sum > weighted_peaksum)
                        weighted_peaksum = weighted_sum;        // save peak

                // Only count this sample towards the average if it is
                // above threshold (this attempts to keep the volume
                // from pumping up when there is no input signal).
                if (weighted_sum > nosig) {
                        weighted_avgsum += weighted_sum;
                        weighted_cnt++;
                }
        }
}
Illumos