瀏覽代碼

Merge pull request #34 from jeng1220/bugfix_stdpar

Bugfix for stdpar
Bharatkumar Sharma 4 年之前
父節點
當前提交
20ec4c4746

+ 5 - 2
hpc/nways/nways_labs/nways_MD/English/C/jupyter_notebook/stdpar/nways_stdpar.ipynb

@@ -160,7 +160,10 @@
    "outputs": [],
    "source": [
     "#Compile the code for multicore\n",
-    "!cd ../../source_code/stdpar && nvc++ -std=c++17 -stdpar=multicore -o rdf rdf.cpp -ltbb"
+    "!cd ../../source_code/stdpar && nvc++ -std=c++17 -stdpar=multicore \\\n",
+    "-I/opt/nvidia/hpc_sdk/Linux_x86_64/21.3/cuda/11.2/include \\\n",
+    "-o rdf rdf.cpp -fopenmp \\\n",
+    "-L/opt/nvidia/hpc_sdk/Linux_x86_64/21.3/cuda/11.2/lib64 -lnvToolsExt"
    ]
   },
   {
@@ -232,7 +235,7 @@
    "outputs": [],
    "source": [
     "#compile for Tesla GPU\n",
-    "!cd ../../source_code/stdpar && nvc++ -std=c++17 -DUSE_COUNTING_ITERATIOR  -stdpar=gpu -o rdf rdf.cpp "
+    "!cd ../../source_code/stdpar && nvc++ -std=c++17 -DUSE_COUNTING_ITERATOR  -stdpar=gpu -o rdf rdf.cpp "
    ]
   },
   {

+ 1 - 1
hpc/nways/nways_labs/nways_MD/English/C/source_code/stdpar/rdf.cpp

@@ -12,7 +12,7 @@
 #include <algorithm>
 #include <vector>
 #include <atomic>
-#include </opt/nvidia/hpc_sdk/Linux_x86_64/21.3/cuda/11.2/include>
+#include <nvtx3/nvToolsExt.h>
 
 //Note: The addition of execution header file
 #include <execution>