// Copyright (c) Meta Platforms, Inc. and affiliates. // All rights reserved. // // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. #pragma once #include #include #include #include #include "FFMPEGCommon.h" #include "Frame.h" extern "C" { #include #include } namespace facebook::torchcodec { // Pytorch can only handle up to 128 GPUs. // https://github.com/pytorch/pytorch/blob/e30c55ee527b40d67555464b9e402b4b7ce03737/c10/cuda/CUDAMacros.h#L44 constexpr int MAX_CUDA_GPUS = 128; void initializeCudaContextWithPytorch(const torch::Device& device); // Unique pointer type for NPP stream context using UniqueNppContext = std::unique_ptr; torch::Tensor convertNV12FrameToRGB( UniqueAVFrame& avFrame, const torch::Device& device, const UniqueNppContext& nppCtx, at::cuda::CUDAStream nvdecStream, std::optional preAllocatedOutputTensor = std::nullopt); UniqueNppContext getNppStreamContext(const torch::Device& device); void returnNppStreamContextToCache( const torch::Device& device, UniqueNppContext nppCtx); void validatePreAllocatedTensorShape( const std::optional& preAllocatedOutputTensor, const UniqueAVFrame& avFrame); int getDeviceIndex(const torch::Device& device); } // namespace facebook::torchcodec