mirror of
https://github.com/tensorflow/tensorflow.git
synced 2024-11-21 21:05:19 +00:00
904e48fc27
This allows us to better isolate the special build flags that DUCC requires in order to enable exceptions and RTTI. PiperOrigin-RevId: 575358706
148 lines
6.1 KiB
C++
148 lines
6.1 KiB
C++
/* Copyright 2023 The TensorFlow Authors. All Rights Reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
==============================================================================*/
|
|
#include "ducc/google/fft.h"
|
|
|
|
#include <complex>
|
|
#include <cstddef>
|
|
#include <cstdlib>
|
|
#include <exception>
|
|
#include <iostream>
|
|
#include <ostream>
|
|
#include <vector>
|
|
|
|
#include "ducc/google/threading.h"
|
|
#include "ducc/src/ducc0/fft/fft.h"
|
|
#include "ducc/src/ducc0/fft/fft1d_impl.h" // IWYU pragma: keep, DUCC definitions.
|
|
#include "ducc/src/ducc0/fft/fftnd_impl.h" // IWYU pragma: keep, DUCC definitions.
|
|
#include "ducc/src/ducc0/infra/mav.h"
|
|
#include "ducc/src/ducc0/infra/threading.h"
|
|
#include "unsupported/Eigen/CXX11/ThreadPool"
|
|
|
|
namespace ducc0 {
|
|
|
|
// Wrappers around DUCC calls.
|
|
namespace google {
|
|
|
|
using Shape = std::vector<std::size_t>;
|
|
using Stride = std::vector<std::ptrdiff_t>;
|
|
|
|
template <typename RealScalar>
|
|
void c2c(const std::complex<RealScalar>* in, const Shape& in_shape,
|
|
const Stride& in_stride, std::complex<RealScalar>* out,
|
|
const Shape& out_shape, const Stride& out_stride, const Shape& axes,
|
|
bool forward, RealScalar scale,
|
|
Eigen::ThreadPoolInterface* thread_pool) {
|
|
ducc0::cfmav<std::complex<RealScalar>> m_in(in, in_shape, in_stride);
|
|
ducc0::vfmav<std::complex<RealScalar>> m_out(out, out_shape, out_stride);
|
|
|
|
try {
|
|
if (thread_pool == nullptr) {
|
|
// Use a fake threadpool.
|
|
ducc0::google::NoThreadPool no_thread_pool;
|
|
ducc0::detail_threading::ScopedUseThreadPool thread_pool_guard(
|
|
no_thread_pool);
|
|
ducc0::c2c(m_in, m_out, axes, forward, scale, 1);
|
|
} else {
|
|
EigenThreadPool eigen_thread_pool(*thread_pool);
|
|
ducc0::detail_threading::ScopedUseThreadPool thread_pool_guard(
|
|
eigen_thread_pool);
|
|
ducc0::c2c(m_in, m_out, axes, forward, scale,
|
|
eigen_thread_pool.nthreads());
|
|
}
|
|
} catch (const std::exception& ex) {
|
|
std::cerr << "DUCC FFT c2c failed: " << ex.what() << std::endl;
|
|
std::abort();
|
|
}
|
|
}
|
|
|
|
template <typename RealScalar>
|
|
void r2c(const RealScalar* in, const Shape& in_shape, const Stride& in_stride,
|
|
std::complex<RealScalar>* out, const Shape& out_shape,
|
|
const Stride& out_stride, const Shape& axes, bool forward,
|
|
RealScalar scale, Eigen::ThreadPoolInterface* thread_pool) {
|
|
ducc0::cfmav<RealScalar> m_in(in, in_shape, in_stride);
|
|
ducc0::vfmav<std::complex<RealScalar>> m_out(out, out_shape, out_stride);
|
|
|
|
try {
|
|
if (thread_pool == nullptr) {
|
|
// Use a fake threadpool.
|
|
ducc0::google::NoThreadPool no_thread_pool;
|
|
ducc0::detail_threading::ScopedUseThreadPool thread_pool_guard(
|
|
no_thread_pool);
|
|
ducc0::r2c(m_in, m_out, axes, forward, scale, 1);
|
|
} else {
|
|
EigenThreadPool eigen_thread_pool(*thread_pool);
|
|
ducc0::detail_threading::ScopedUseThreadPool thread_pool_guard(
|
|
eigen_thread_pool);
|
|
ducc0::r2c(m_in, m_out, axes, forward, scale,
|
|
eigen_thread_pool.nthreads());
|
|
}
|
|
} catch (const std::exception& ex) {
|
|
std::cerr << "DUCC FFT r2c failed: " << ex.what() << std::endl;
|
|
std::abort();
|
|
}
|
|
}
|
|
|
|
template <typename RealScalar>
|
|
void c2r(const std::complex<RealScalar>* in, const Shape& in_shape,
|
|
const Stride& in_stride, RealScalar* out, const Shape& out_shape,
|
|
const Stride& out_stride, const Shape& axes, bool forward,
|
|
RealScalar scale, Eigen::ThreadPoolInterface* thread_pool) {
|
|
ducc0::cfmav<std::complex<RealScalar>> m_in(in, in_shape, in_stride);
|
|
ducc0::vfmav<RealScalar> m_out(out, out_shape, out_stride);
|
|
|
|
try {
|
|
if (thread_pool == nullptr) {
|
|
// Use a fake threadpool.
|
|
ducc0::google::NoThreadPool no_thread_pool;
|
|
ducc0::detail_threading::ScopedUseThreadPool thread_pool_guard(
|
|
no_thread_pool);
|
|
ducc0::c2r(m_in, m_out, axes, forward, scale, 1);
|
|
} else {
|
|
EigenThreadPool eigen_thread_pool(*thread_pool);
|
|
ducc0::detail_threading::ScopedUseThreadPool thread_pool_guard(
|
|
eigen_thread_pool);
|
|
ducc0::c2r(m_in, m_out, axes, forward, scale,
|
|
eigen_thread_pool.nthreads());
|
|
}
|
|
} catch (const std::exception& ex) {
|
|
std::cerr << "DUCC FFT c2r failed: " << ex.what() << std::endl;
|
|
std::abort();
|
|
}
|
|
}
|
|
|
|
#define FFT_DEFINITIONS(RealScalar) \
|
|
template void c2c<RealScalar>( \
|
|
const std::complex<RealScalar>* in, const Shape& in_shape, \
|
|
const Stride& in_stride, std::complex<RealScalar>* out, \
|
|
const Shape& out_shape, const Stride& out_stride, const Shape& axes, \
|
|
bool forward, RealScalar scale, \
|
|
Eigen::ThreadPoolInterface* thread_pool); \
|
|
template void r2c<RealScalar>( \
|
|
const RealScalar* in, const Shape& in_shape, const Stride& in_stride, \
|
|
std::complex<RealScalar>* out, const Shape& out_shape, \
|
|
const Stride& out_stride, const Shape& axes, bool forward, \
|
|
RealScalar scale, Eigen::ThreadPoolInterface* thread_pool); \
|
|
template void c2r(const std::complex<RealScalar>* in, const Shape& in_shape, \
|
|
const Stride& in_stride, RealScalar* out, \
|
|
const Shape& out_shape, const Stride& out_stride, \
|
|
const Shape& axes, bool forward, RealScalar scale, \
|
|
Eigen::ThreadPoolInterface* thread_pool)
|
|
FFT_DEFINITIONS(float);
|
|
FFT_DEFINITIONS(double);
|
|
#undef FFT_DEFINITIONS
|
|
|
|
} // namespace google
|
|
} // namespace ducc0
|