diff --git a/Samples/p2pBandwidthLatencyTest/p2pBandwidthLatencyTest.cu b/Samples/p2pBandwidthLatencyTest/p2pBandwidthLatencyTest.cu index 181785124..7b83e392d 100644 --- a/Samples/p2pBandwidthLatencyTest/p2pBandwidthLatencyTest.cu +++ b/Samples/p2pBandwidthLatencyTest/p2pBandwidthLatencyTest.cu @@ -277,10 +277,9 @@ void outputBandwidthMatrix(int numGPUs, bool p2p, P2PDataTransfer p2p_method) { cudaCheckError(); cudaStreamDestroy(stream[d]); cudaCheckError(); + cudaDeviceReset(); + cudaCheckError(); } - - cudaFreeHost((void *)flag); - cudaCheckError(); } void outputBidirectionalBandwidthMatrix(int numGPUs, bool p2p) { @@ -433,10 +432,9 @@ void outputBidirectionalBandwidthMatrix(int numGPUs, bool p2p) { cudaCheckError(); cudaStreamDestroy(stream1[d]); cudaCheckError(); + cudaDeviceReset(); + cudaCheckError(); } - - cudaFreeHost((void *)flag); - cudaCheckError(); } void outputLatencyMatrix(int numGPUs, bool p2p, P2PDataTransfer p2p_method) { @@ -586,12 +584,11 @@ void outputLatencyMatrix(int numGPUs, bool p2p, P2PDataTransfer p2p_method) { cudaCheckError(); cudaStreamDestroy(stream[d]); cudaCheckError(); + cudaDeviceReset(); + cudaCheckError(); } sdkDeleteTimer(&stopWatch); - - cudaFreeHost((void *)flag); - cudaCheckError(); } int main(int argc, char **argv) {