// Source: https://github.com/halide/Halide
// Tip revision: 65c26cba6a3eca2d08a0bccf113ca28746012cc3 authored by
// Steven Johnson on 26 August 2019, 21:49:31 UTC
// (Merge pull request #4174 from halide/srj-tidy)
// File: LowerWarpShuffles.h
#ifndef HALIDE_LOWER_WARP_SHUFFLES_H
#define HALIDE_LOWER_WARP_SHUFFLES_H

/** \file
 * Defines the lowering pass that injects CUDA warp shuffle
 * instructions to access storage outside of a GPULane loop.
 */

#include "IR.h"

namespace Halide {
namespace Internal {

/** Rewrite access to things stored outside the loop over GPU lanes to
 * use NVIDIA's warp shuffle instructions.
 *
 * \param s The statement to rewrite; it is passed by value.
 * \return The rewritten statement.
 *
 * NOTE(review): only the declaration is visible in this header. How
 * statements that contain no loop over GPU lanes are handled (presumably
 * returned unchanged) should be confirmed against the definition. */
Stmt lower_warp_shuffles(Stmt s);

}  // namespace Internal
}  // namespace Halide

#endif
back to top