# Register every perf-test source in this directory, one invocation per line.
# CMake requires each command invocation to end with a newline, so the calls
# must not share a line.
#
# NOTE(review): nvshmem_add_perftest() is defined outside this file;
# presumably it creates one perf-test target per source file passed to it --
# confirm against its definition.
nvshmem_add_perftest(bw.cpp)
nvshmem_add_perftest(latency.cpp)
nvshmem_add_perftest(stream_latency.cu)