Вперед Назад

DemonstrateConvolution.c

/*

        File: DemonstrateConvolution.c

    Abstract: Demonstration of vDSP convolution routine.

     Version: 1.2

    Disclaimer: IMPORTANT:  This Apple software is supplied to you by Apple

    Inc. ("Apple") in consideration of your agreement to the following

    terms, and your use, installation, modification or redistribution of

    this Apple software constitutes acceptance of these terms.  If you do

    not agree with these terms, please do not use, install, modify or

    redistribute this Apple software.

    In consideration of your agreement to abide by the following terms, and

    subject to these terms, Apple grants you a personal, non-exclusive

    license, under Apple's copyrights in this original Apple software (the

    "Apple Software"), to use, reproduce, modify and redistribute the Apple

    Software, with or without modifications, in source and/or binary forms;

    provided that if you redistribute the Apple Software in its entirety and

    without modifications, you must retain this notice and the following

    text and disclaimers in all such redistributions of the Apple Software.

    Neither the name, trademarks, service marks or logos of Apple Inc. may

    be used to endorse or promote products derived from the Apple Software

    without specific prior written permission from Apple.  Except as

    expressly stated in this notice, no other rights or licenses, express or

    implied, are granted by Apple herein, including but not limited to any

    patent rights that may be infringed by your derivative works or by other

    works in which the Apple Software may be incorporated.

    The Apple Software is provided by Apple on an "AS IS" basis.  APPLE

    MAKES NO WARRANTIES, EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION

    THE IMPLIED WARRANTIES OF NON-INFRINGEMENT, MERCHANTABILITY AND FITNESS

    FOR A PARTICULAR PURPOSE, REGARDING THE APPLE SOFTWARE OR ITS USE AND

    OPERATION ALONE OR IN COMBINATION WITH YOUR PRODUCTS.

    IN NO EVENT SHALL APPLE BE LIABLE FOR ANY SPECIAL, INDIRECT, INCIDENTAL

    OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

    SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

    INTERRUPTION) ARISING IN ANY WAY OUT OF THE USE, REPRODUCTION,

    MODIFICATION AND/OR DISTRIBUTION OF THE APPLE SOFTWARE, HOWEVER CAUSED

    AND WHETHER UNDER THEORY OF CONTRACT, TORT (INCLUDING NEGLIGENCE),

    STRICT LIABILITY OR OTHERWISE, EVEN IF APPLE HAS BEEN ADVISED OF THE

    POSSIBILITY OF SUCH DAMAGE.

    Copyright (C) 2012 Apple Inc. All Rights Reserved.

    This is a sample module to illustrate the use of vDSP_conv for

    convolution and correlation.  This module also times the vDSP_conv.

    Copyright (C) 2007 Apple Inc.  All rights reserved.

*/

#include <stdio.h>

#include <stdlib.h>

#include <Accelerate/Accelerate.h>

#include "Demonstrate.h"

#define Iterations 1000 // How many iterations to use in the timer loop.

// Demonstrate vDSP_conv.

void DemonstrateConvolution(void)

    /*  Define strides for the arrays being passed to the convolution.

        In many applications, the strides are one and are passed to the

        vDSP routine as constants.  We give them names here just so

        that the routine call is more illustrative, showing the

        arguments by name.

*/

    const vDSP_Stride

        SignalStride = 1,

        FilterStride = 1,

        ResultStride = 1;

    /*  Lengths tend to differ more than strides, although it is might

        not be unusual to have constants in a particular application.

        (For example, your filter length might be a constant because

        the code is written specially for a very specific filter.  The

        result length is more likely to be a named constant at least,

        representing a frame size.)

        The signal length is padded a bit.  This length is not actually

        passed to the vDSP_conv routine; it is the number of elements

        that the signal array must contain.  The SignalLength defined

        below is used to allocate space, and it is the filter length

        rounded up to a multiple of four elements and added to the

        result length.  The extra elements give the vDSP_conv routine

        leeway to perform vector-load instructions, which load multiple

        elements even if they are not all used.  If the caller did not

        guarantee that memory beyond the values used in the signal

        array were accessible, a memory access violation might result.

*/

    vDSP_Length

        FilterLength = 256,

        ResultLength = 2048,

        SignalLength = (FilterLength+3 & -4u) + ResultLength;

    // Define pointers to the arrays we will use.

    float *Signal, *Filter, *Result;

    // Define a variable for a loop iterator.

    vDSP_Length i;

    // Define some variables used to time the routine.

    ClockData t0, t1;

    float Time, Gigaflops;

    printf("Begin %s.\n\n", __func__);

    // Allocate memory for the arrays.

    Signal = malloc(SignalLength * SignalStride * sizeof *Signal);

    Filter = malloc(FilterLength * FilterStride * sizeof *Filter);

    Result = malloc(ResultLength * ResultStride * sizeof *Result);

    if (Signal == NULL || Filter == NULL || Result == NULL)

        fprintf(stderr, "Error, failed to allocate memory.\n");

        exit(EXIT_FAILURE);

    /*  Initialize the input signal.  In a real application, data would

        of course be provided from an image file, sensors, or other

        source.

*/

    for (i = 0; i < SignalLength; i++)

        Signal[i*SignalStride] = 1.0;

    /*  Initialize the filter.  A real application would have different

        filter coefficients.

*/

    for (i = 0; i < FilterLength; i++)

        Filter[i*FilterStride] = 1.0;

    // Perform a correlation.

    vDSP_conv(Signal, SignalStride, Filter, FilterStride,

        Result, ResultStride, ResultLength, FilterLength);

    /*  Perform a convolution by using the filter backward.  To do

        this, we pass -1 for the filter stride and pass vDSP_conv a

        pointer to the first element of the backward filter, which is

        the last element of the forward filter.

*/

    vDSP_conv(Signal, SignalStride, Filter + FilterLength - 1, -1,

        Result, ResultStride, ResultLength, FilterLength);

    /*  The above calls show how to use the vDSP_conv routine.  Now we

        will see how fast it is.

*/

    t0 = Clock();

    for (i = 0; i < Iterations; i++)

        vDSP_conv(Signal, SignalStride, Filter, FilterStride,

            Result, ResultStride, ResultLength, FilterLength);

    t1 = Clock();

    // Average the time over all the loop iterations.

    Time = ClockToSeconds(t1, t0) / Iterations;

    /*  For each result element, a convolution takes a multiply for

        each filter element and an addition for each element after the

        first.  So there are ResultLength * (2 * FilterLength - 1)

        floating-point operations in this convolution.  We divide that

        by the number of seconds it takes to do the convolution to get

        floating-point operations per second and then scale by 1e-9 to

        get gigaflops.

*/

    Gigaflops = ResultLength * (2 * FilterLength - 1) / Time * 1e-9;

    printf("\tA %lu * %lu convolution takes %g microseconds,\n"

        "\twhich is a performance of %g gigaflops.\n\n",

        (unsigned long) ResultLength, (unsigned long) FilterLength,

        Time * 1e6, Gigaflops);

    // Free allocated memory.

    free(Signal);

    free(Filter);

    free(Result);

    printf("End %s.\n\n\n", __func__);

Вперед Назад