fix tutorial

This commit is contained in:
Dun Liang 2020-03-22 10:51:44 +08:00
parent c6b40bb485
commit 212862980f
2 changed files with 2 additions and 2 deletions

View File

@@ -204,7 +204,7 @@ for i0 in range(shape[0]):
for i4 in range(shape[4]):
for i5 in range(shape[5]):
for i6 in range(shape[6]):
-y[i0,i1,i2,i6] += yy[i0,i1,i2,i3,i4,i5,i6]
+y[i0,i1,i2,i6] += x[i0,i1+i3,i2+i4,i5] * w[i3,i4,i5,i6]
```
**After loop fusion:**

View File

@@ -691,7 +691,7 @@ def check_cuda():
return
global cc_flags, has_cuda, core_link_flags, cuda_dir, cuda_lib, cuda_include
cuda_dir = os.path.dirname(get_full_path_of_executable(nvcc_path))
-assert cuda_dir.endswith("bin") and "cuda" in cuda_dir, f"Wrong cuda_dir: {cuda_dir}"
+assert cuda_dir.endswith("bin") and "cuda" in cuda_dir.lower(), f"Wrong cuda_dir: {cuda_dir}"
cuda_include = os.path.abspath(os.path.join(cuda_dir, "..", "include"))
cuda_lib = os.path.abspath(os.path.join(cuda_dir, "..", "lib64"))
cuda_include2 = os.path.join(jittor_path, "extern","cuda","inc")