Revision 9a94756d01d9071ff1610bfc4cb170bd47f701a8 authored by Alexander Root on 21 July 2022, 15:01:16 UTC, committed by GitHub on 21 July 2022, 15:01:16 UTC
* use pmaddubsw 8-bit horizontal widening adds * add SSE3 versions too * add pmaddubsw tests
1 parent 967c3bf
BoundSmallAllocations.h
#ifndef HALIDE_BOUND_SMALL_ALLOCATIONS
#define HALIDE_BOUND_SMALL_ALLOCATIONS
#include "Expr.h"
/** \file
* Defines the lowering pass that attempts to rewrite small
* allocations to have constant size.
*/
namespace Halide {
namespace Internal {
/** Use bounds analysis to attempt to bound the sizes of small
 * allocations. Inside GPU kernels this is necessary in order to
 * compile. On the CPU this is also useful, because it prevents malloc
 * calls for (provably) tiny allocations.
 *
 * \param s The statement to process; taken by const reference.
 * \return A Stmt, returned by value. Presumably the input statement
 * with the allocations that could be bounded rewritten to have
 * constant size -- the definition is not visible from this header,
 * so confirm against the implementation.
 */
Stmt bound_small_allocations(const Stmt &s);
} // namespace Internal
} // namespace Halide
#endif
![swh spinner](/static/img/swh-spinner.gif)
Computing file changes ...