# Register every source file in this directory with nvshmem_add_perftest().
# NOTE(review): nvshmem_add_perftest is defined elsewhere in the project;
# presumably it creates one perftest target per source file -- confirm against
# its definition. The files are passed one per call, in the order listed.
foreach(_nvshmem_perftest_src IN ITEMS
    bw.cpp
    latency.cpp
    stream_latency.cu
)
  nvshmem_add_perftest(${_nvshmem_perftest_src})
endforeach()