// Initialize input vectors for (int i = 0; i < n; i++) h_a[i] = rand() / (float)RAND_MAX; h_b[i] = rand() / (float)RAND_MAX;
# Build the program if it is out of date, then execute it from the current
# directory. `run` names an action, not a file, so it is declared phony.
.PHONY: run
run: $(TARGET)
	./$(TARGET)
# Compile and link every source file into the target binary.
# SOURCES, NVCC and NVCC_FLAGS are expected to be defined elsewhere in this
# file. $@ expands to the target name and $^ to the full prerequisite list.
# NOTE(review): presumably requires the CUDA toolkit (which provides nvcc) to
# be installed — confirm and document in the project README.
$(TARGET): $(SOURCES)
	$(NVCC) $(NVCC_FLAGS) -o $@ $^
std::cout << (correct ? "SUCCESS" : "FAILURE") << std::endl; // Initialize input vectors for (int i =
// Copy result back to host cudaMemcpy(h_c, d_c, bytes, cudaMemcpyDeviceToHost); i++) h_a[i] = rand() / (float)RAND_MAX
# Aggregate target: building `all` builds the program binary.
# Declared phony so that a stray file named `all` cannot mask the target.
.PHONY: all
all: $(TARGET)
# Remove the built binary. `-f` keeps the recipe from failing when the file
# does not exist. Declared phony so a file named `clean` cannot disable it.
.PHONY: clean
clean:
	rm -f $(TARGET)