af90312867
Several error messages appeared even when the hipEnvVarDriver.exe test passed and executed successfully. This has now been cleaned up. The affected instances were: * When popen searches the directed_tests directory and does not find hipEnvVar there, it outputs an error and then finds hipEnvVar at the same level. With this fix the test only outputs an error if both searches for hipEnvVar fail. * When assertions are used in the latter half of the test, the conditions are set specifically to hide the devices, resulting in "No Hip Device detected" messages in the latter half of the test. The fix keeps these errors from appearing, since those cases are intended not to find any devices. The assertions themselves are untouched. hipEnvVarDriver.cpp has also been refactored: reading hipEnvVar now happens in a helper function shared by getDeviceNumber and getDevicePCIBusNumRemote, as the code to read hipEnvVar was very similar in both.
152 lines
5.5 KiB
C++
152 lines
5.5 KiB
C++
/* Copyright (c) 2015-2016 Advanced Micro Devices, Inc. All rights reserved.
|
|
|
|
Permission is hereby granted, free of charge, to any person obtaining a copy of this software and
|
|
associated documentation files (the "Software"), to deal in the Software without restriction,
|
|
including without limitation the rights to use, copy, modify, merge, publish, distribute,
|
|
sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is
|
|
furnished to do so, subject to the following conditions:
|
|
|
|
The above copyright notice and this permission notice shall be included in all copies or substantial
|
|
portions of the Software.
|
|
|
|
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT
|
|
NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
|
NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
|
|
DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT
|
|
OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */
|
|
|
|
/* HIT_START
|
|
* BUILD: %t %s test_common.cpp NVCC_OPTIONS -std=c++11
|
|
* TEST: %t
|
|
* HIT_END
|
|
*/
|
|
|
|
#include <iostream>
|
|
#include <vector>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <assert.h>
|
|
#include <string>
|
|
#include "hip/hip_runtime.h"
|
|
#include <chrono>
|
|
#include <thread>
|
|
#include "test_common.h"
|
|
|
|
using namespace std;
|
|
|
|
const string directed_dir = string(".") + PATH_SEPERATOR_STR + "directed_tests" + PATH_SEPERATOR_STR + "hipEnvVar";
|
|
const string dir = string(".") + PATH_SEPERATOR_STR + "hipEnvVar";
|
|
|
|
int readHipEnvVar(string flags, char* buff){
|
|
|
|
std::cout << "\nFinding hipEnvVar in " << directed_dir << "...\n";
|
|
FILE* directed_in = popen((directed_dir + flags).c_str(), "r");
|
|
|
|
if(fgets(buff, 512, directed_in) == NULL){
|
|
std::cout << "Finding hipEnvVar in " << dir << "...\n";
|
|
FILE* in = popen((dir + flags).c_str(), "r");
|
|
if(fgets(buff, 512, in) == NULL){
|
|
pclose(directed_in);
|
|
pclose(in);
|
|
return 1;
|
|
}
|
|
pclose(in);
|
|
}
|
|
std::cout << "hipEnvVar Found!\n";
|
|
pclose(directed_in);
|
|
return 0;
|
|
}
|
|
|
|
int getDeviceNumber(bool print_err=true) {
|
|
char buff[512];
|
|
std::this_thread::sleep_for(std::chrono::milliseconds(10));
|
|
|
|
if (readHipEnvVar(string(" -c"), buff)){
|
|
strncpy(buff, "1", 512);
|
|
if (print_err){
|
|
std::cerr << "The system cannot find hipEnvVar, using 1 as number of devices\n";
|
|
}
|
|
}
|
|
if (print_err) {
|
|
std::cout << buff;
|
|
}
|
|
return atoi(buff);
|
|
}
|
|
|
|
// Query the current device ID remotely to hipEnvVar
|
|
void getDevicePCIBusNumRemote(int deviceID, char* pciBusID) {
|
|
std::this_thread::sleep_for(std::chrono::milliseconds(10));
|
|
if (readHipEnvVar((" -d " + std::to_string(deviceID)), pciBusID)){
|
|
std::cerr << "The system cannot find hipEnvVar\n";
|
|
}
|
|
cout << pciBusID;
|
|
return;
|
|
}
|
|
|
|
// Query the current device ID locally on AMD path
|
|
void getDevicePCIBusNum(int deviceID, char* pciBusID) {
|
|
hipDevice_t deviceT;
|
|
hipDeviceGet(&deviceT, deviceID);
|
|
|
|
memset(pciBusID, 0, 512);
|
|
hipDeviceGetPCIBusId(pciBusID, 512, deviceT);
|
|
}
|
|
|
|
int main() {
|
|
unsetenv(HIP_VISIBLE_DEVICES_STR);
|
|
unsetenv(CUDA_VISIBLE_DEVICES_STR);
|
|
std::vector<std::string> devPCINum;
|
|
char pciBusID[512];
|
|
// collect the device pci bus ID for all devices
|
|
int totalDeviceNum = getDeviceNumber();
|
|
std::cout << "The total number of available devices is " << totalDeviceNum << std::endl
|
|
<< "Valid index range is 0 - " << totalDeviceNum - 1 << std::endl;
|
|
for (int i = 0; i < totalDeviceNum; i++) {
|
|
getDevicePCIBusNum(i, pciBusID);
|
|
devPCINum.push_back(pciBusID);
|
|
std::cout << "The collected device PCI Bus ID of Device " << i << " is " << devPCINum.back()
|
|
<< std::endl;
|
|
}
|
|
|
|
// select each of the available devices to be the target device,
|
|
// query the returned device pci bus number, check if match the database
|
|
for (int i = 0; i < totalDeviceNum; i++) {
|
|
setenv("HIP_VISIBLE_DEVICES", (char*)std::to_string(i).c_str(), 1);
|
|
setenv("CUDA_VISIBLE_DEVICES", (char*)std::to_string(i).c_str(), 1);
|
|
getDevicePCIBusNumRemote(0, pciBusID);
|
|
if (devPCINum[i] == pciBusID) {
|
|
std::cout << "The returned PciBusID is not correct" << std::endl;
|
|
std::cout << "Expected " << devPCINum[i] << ", but get " << pciBusID << endl;
|
|
exit(-1);
|
|
} else {
|
|
continue;
|
|
}
|
|
}
|
|
|
|
// check when set an invalid device number
|
|
setenv("HIP_VISIBLE_DEVICES", "1000,0,1", 1);
|
|
setenv("CUDA_VISIBLE_DEVICES", "1000,0,1", 1);
|
|
assert(getDeviceNumber(false) == 0);
|
|
|
|
if (totalDeviceNum > 2) {
|
|
setenv("HIP_VISIBLE_DEVICES", "0,1,1000,2", 1);
|
|
setenv("CUDA_VISIBLE_DEVICES", "0,1,1000,2", 1);
|
|
assert(getDeviceNumber(false) == 2);
|
|
|
|
setenv("HIP_VISIBLE_DEVICES", "0,1,2", 1);
|
|
setenv("CUDA_VISIBLE_DEVICES", "0,1,2", 1);
|
|
assert(getDeviceNumber(false) == 3);
|
|
// test if CUDA_VISIBLE_DEVICES will be accepted by the runtime
|
|
unsetenv(HIP_VISIBLE_DEVICES_STR);
|
|
unsetenv(CUDA_VISIBLE_DEVICES_STR);
|
|
setenv("CUDA_VISIBLE_DEVICES", "0,1,2", 1);
|
|
assert(getDeviceNumber(false) == 3);
|
|
}
|
|
|
|
setenv("HIP_VISIBLE_DEVICES", "-100,0,1", 1);
|
|
setenv("CUDA_VISIBLE_DEVICES", "-100,0,1", 1);
|
|
assert(getDeviceNumber(false) == 0);
|
|
|
|
std::cout << "PASSED" << std::endl;
|
|
return 0;
|
|
} |