mirror of
https://git.rwth-aachen.de/acs/public/villas/node/
synced 2025-03-30 00:00:11 +01:00
147 lines
4.3 KiB
C++
147 lines
4.3 KiB
C++
/** GPU unit tests.
|
|
*
|
|
* @author Steffen Vogel <post@steffenvogel.de>
|
|
* @copyright 2017-2022, Steffen Vogel
|
|
* @license GNU General Public License (version 3)
|
|
*
|
|
* VILLASfpga
|
|
*
|
|
* This program is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
* any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*********************************************************************************/
|
|
|
|
#include <criterion/criterion.h>
|
|
|
|
#include <map>
|
|
#include <string>
|
|
|
|
#include <villas/log.hpp>
|
|
#include <villas/fpga/card.hpp>
|
|
#include <villas/fpga/ips/dma.hpp>
|
|
#include <villas/fpga/ips/bram.hpp>
|
|
|
|
#include <villas/utils.hpp>
|
|
|
|
#include "global.hpp"
|
|
|
|
#include <villas/memory.hpp>
|
|
#include <villas/gpu.hpp>
|
|
|
|
using namespace villas;
|
|
|
|
// cppcheck-suppress unknownMacro
|
|
Test(fpga, gpu_dma, .description = "GPU DMA tests")
|
|
{
|
|
auto logger = logging.get("unit-test:dma");
|
|
|
|
auto &card = state.cards.front();
|
|
|
|
auto gpuPlugin = Plugin::Registry<GpuFactory>("cuda");
|
|
cr_assert_not_null(gpuPlugin, "No GPU plugin found");
|
|
|
|
auto gpus = gpuPlugin->make();
|
|
cr_assert(gpus.size() > 0, "No GPUs found");
|
|
|
|
// Just get first cpu
|
|
auto &gpu = gpus.front();
|
|
|
|
size_t count = 0;
|
|
for (auto &ip : card->ips) {
|
|
// Skip non-dma IPs
|
|
if (*ip != fpga::Vlnv("xilinx.com:ip:axi_bram_ctrl:"))
|
|
continue;
|
|
|
|
logger->info("Testing {}", *ip);
|
|
|
|
auto bram = dynamic_cast<fpga::ip::Bram*>(ip.get());
|
|
cr_assert_not_null(bram, "Couldn't find BRAM");
|
|
|
|
count++;
|
|
|
|
size_t len = 4 * (1 << 10);
|
|
|
|
// Allocate memory to use with DMA
|
|
|
|
auto bram0 = bram->getAllocator().allocate<char>(len);
|
|
auto bram1 = bram->getAllocator().allocate<char>(len);
|
|
|
|
gpu->makeAccessibleFromPCIeOrHostRam(bram0.getMemoryBlock());
|
|
gpu->makeAccessibleFromPCIeOrHostRam(bram1.getMemoryBlock());
|
|
|
|
auto hostRam0 = HostRam::getAllocator().allocate<char>(len);
|
|
auto hostRam1 = HostRam::getAllocator().allocate<char>(len);
|
|
|
|
gpu->makeAccessibleFromPCIeOrHostRam(hostRam0.getMemoryBlock());
|
|
gpu->makeAccessibleFromPCIeOrHostRam(hostRam1.getMemoryBlock());
|
|
|
|
auto dmaRam0 = HostDmaRam::getAllocator().allocate<char>(len);
|
|
auto dmaRam1 = HostDmaRam::getAllocator().allocate<char>(len);
|
|
|
|
gpu->makeAccessibleFromPCIeOrHostRam(dmaRam0.getMemoryBlock());
|
|
gpu->makeAccessibleFromPCIeOrHostRam(dmaRam1.getMemoryBlock());
|
|
|
|
auto gpuMem0 = gpu->getAllocator().allocate<char>(64 << 10);
|
|
auto gpuMem1 = gpu->getAllocator().allocate<char>(64 << 10);
|
|
|
|
gpu->makeAccessibleToPCIeAndVA(gpuMem0.getMemoryBlock());
|
|
gpu->makeAccessibleToPCIeAndVA(gpuMem1.getMemoryBlock());
|
|
|
|
// auto &src = bram0;
|
|
// auto &dst = bram1;
|
|
|
|
// auto &src = hostRam0;
|
|
// auto &dst = hostRam1;
|
|
|
|
auto &src = dmaRam0;
|
|
// auto &dst = dmaRam1;
|
|
|
|
// auto &src = gpuMem0;
|
|
auto &dst = gpuMem1;
|
|
|
|
std::list<std::pair<std::string, std::function<void()>>> memcpyFuncs = {
|
|
{"cudaMemcpy", [&]() {gpu->memcpySync(src.getMemoryBlock(), dst.getMemoryBlock(), len);}},
|
|
{"CUDA kernel", [&]() {gpu->memcpyKernel(src.getMemoryBlock(), dst.getMemoryBlock(), len);}},
|
|
};
|
|
|
|
auto dmaIp = card->lookupIp(fpga::Vlnv("xilinx.com:ip:axi_dma:"));
|
|
auto dma = std::dynamic_pointer_cast<fpga::ip::Dma>(dmaIp);
|
|
|
|
if (dma != nullptr and dma->connectLoopback()) {
|
|
memcpyFuncs.push_back({
|
|
"DMA memcpy", [&] (){
|
|
dma->makeAccesibleFromVA(src.getMemoryBlock());
|
|
dma->makeAccesibleFromVA(dst.getMemoryBlock());
|
|
dma->memcpy(src.getMemoryBlock(), dst.getMemoryBlock(), len);
|
|
}});
|
|
}
|
|
|
|
for (auto& [name, memcpyFunc] : memcpyFuncs) {
|
|
logger->info("Testing {}", name);
|
|
|
|
// Get new random data
|
|
const size_t lenRandom = utils::read_random(&src, len);
|
|
cr_assert(len == lenRandom, "Failed to get random data");
|
|
|
|
memcpyFunc();
|
|
const bool success = memcmp(&src, &dst, len) == 0;
|
|
|
|
logger->info(" {}", success ?
|
|
CLR_GRN("Passed") :
|
|
CLR_RED("Failed"));
|
|
}
|
|
|
|
MemoryManager::getGraph().dump();
|
|
}
|
|
|
|
cr_assert(count > 0, "No BRAM found");
|
|
}
|