summary refs log tree commit diff stats
path: root/docs
diff options
context:
space:
mode:
author: Yong He <yonghe@outlook.com> 2023-03-29 10:00:48 -0700
committer: GitHub <noreply@github.com> 2023-03-29 10:00:48 -0700
commit: a862f5b7007ef50b5def30506f0cea138b73c710 (patch)
tree: b45a82fc5668f6652ba3f2f17b326c5be9a678a2 /docs
parent: bbf12c20dfa7d835a430decc4e029ad467293f20 (diff)
Update a1-02-slangpy.md
Diffstat (limited to 'docs')
-rw-r--r-- docs/user-guide/a1-02-slangpy.md 4
1 files changed, 2 insertions, 2 deletions
diff --git a/docs/user-guide/a1-02-slangpy.md b/docs/user-guide/a1-02-slangpy.md
index 6ee039d43..6a9b8baa3 100644
--- a/docs/user-guide/a1-02-slangpy.md
+++ b/docs/user-guide/a1-02-slangpy.md
@@ -37,7 +37,7 @@ void square_fwd_kernel(TensorView<float> input, TensorView<float> output)
{
uint3 globalIdx = cudaBlockIdx() * cudaBlockDim() + cudaThreadIdx();
- if (globalIdx.x > input.size(0) || globalIdx.x > input.size(1))
+ if (globalIdx.x > input.size(0) || globalIdx.y > input.size(1))
return;
float result = square(input[globalIdx.xy]);
output[globalIdx.xy] = result;
@@ -134,7 +134,7 @@ void square_bwd_kernel(TensorView<float> input, TensorView<float> grad_out, Tens
{
uint3 globalIdx = cudaBlockIdx() * cudaBlockDim() + cudaThreadIdx();
- if (globalIdx.x > input.size(0) || globalIdx.x > input.size(1))
+ if (globalIdx.x > input.size(0) || globalIdx.y > input.size(1))
return;
DifferentialPair<float> dpInput = diffPair(input[globalIdx.xy]);