<?xml version="1.0"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="en">
		<id>http://mars.merhot.dk/w/index.php?action=history&amp;feed=atom&amp;title=CUDA_example_1</id>
		<title>CUDA example 1 - Revision history</title>
		<link rel="self" type="application/atom+xml" href="http://mars.merhot.dk/w/index.php?action=history&amp;feed=atom&amp;title=CUDA_example_1"/>
		<link rel="alternate" type="text/html" href="http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;action=history"/>
		<updated>2026-04-30T21:54:29Z</updated>
		<subtitle>Revision history for this page on the wiki</subtitle>
		<generator>MediaWiki 1.29.0</generator>

	<entry>
		<id>http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11918&amp;oldid=prev</id>
		<title>Heth at 10:05, 16 May 2010</title>
		<link rel="alternate" type="text/html" href="http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11918&amp;oldid=prev"/>
				<updated>2010-05-16T10:05:38Z</updated>
		
		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;table class=&quot;diff diff-contentalign-left&quot; data-mw=&quot;interface&quot;&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;tr style='vertical-align: top;' lang='en'&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;← Older revision&lt;/td&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;Revision as of 10:05, 16 May 2010&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot; id=&quot;mw-diff-left-l1&quot; &gt;Line 1:&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;Line 1:&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;source lang=&lt;del class=&quot;diffchange diffchange-inline&quot;&gt;C&lt;/del&gt;&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;source lang=&lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;CUDA&lt;/ins&gt;&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;// includes, system&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;// includes, system&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;#include &amp;lt;stdio.h&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;#include &amp;lt;stdio.h&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Heth</name></author>	</entry>

	<entry>
		<id>http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11915&amp;oldid=prev</id>
		<title>Heth at 10:04, 16 May 2010</title>
		<link rel="alternate" type="text/html" href="http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11915&amp;oldid=prev"/>
				<updated>2010-05-16T10:04:07Z</updated>
		
		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;table class=&quot;diff diff-contentalign-left&quot; data-mw=&quot;interface&quot;&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;tr style='vertical-align: top;' lang='en'&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;← Older revision&lt;/td&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;Revision as of 10:04, 16 May 2010&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot; id=&quot;mw-diff-left-l98&quot; &gt;Line 98:&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;Line 98:&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;}&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;}&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/source&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/source&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot;&gt;&amp;#160;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;[[Category:CUDA]]&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Heth</name></author>	</entry>

	<entry>
		<id>http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11913&amp;oldid=prev</id>
		<title>Heth: CUDA notes 1 moved to CUDA example 1</title>
		<link rel="alternate" type="text/html" href="http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11913&amp;oldid=prev"/>
				<updated>2010-05-16T09:53:51Z</updated>
		
		<summary type="html">&lt;p&gt;&lt;a href=&quot;/w/index.php/CUDA_notes_1&quot; class=&quot;mw-redirect&quot; title=&quot;CUDA notes 1&quot;&gt;CUDA notes 1&lt;/a&gt; moved to &lt;a href=&quot;/w/index.php/CUDA_example_1&quot; title=&quot;CUDA example 1&quot;&gt;CUDA example 1&lt;/a&gt;&lt;/p&gt;
&lt;table class=&quot;diff diff-contentalign-left&quot; data-mw=&quot;interface&quot;&gt;
				&lt;tr style='vertical-align: top;' lang='en'&gt;
				&lt;td colspan='1' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;← Older revision&lt;/td&gt;
				&lt;td colspan='1' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;Revision as of 09:53, 16 May 2010&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan='2' style='text-align: center;' lang='en'&gt;&lt;div class=&quot;mw-diff-empty&quot;&gt;(No difference)&lt;/div&gt;
&lt;/td&gt;&lt;/tr&gt;&lt;/table&gt;</summary>
		<author><name>Heth</name></author>	</entry>

	<entry>
		<id>http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11912&amp;oldid=prev</id>
		<title>Heth: New page: &lt;source lang=C&gt; // includes, system #include &lt;stdio.h&gt; #include &lt;assert.h&gt;  // Simple utility function to check for CUDA runtime errors void checkCUDAError(const char* msg);  // Part3: imp...</title>
		<link rel="alternate" type="text/html" href="http://mars.merhot.dk/w/index.php?title=CUDA_example_1&amp;diff=11912&amp;oldid=prev"/>
				<updated>2010-05-16T09:53:37Z</updated>
		
		<summary type="html">&lt;p&gt;New page: &amp;lt;source lang=C&amp;gt; // includes, system #include &amp;lt;stdio.h&amp;gt; #include &amp;lt;assert.h&amp;gt;  // Simple utility function to check for CUDA runtime errors void checkCUDAError(const char* msg);  // Part3: imp...&lt;/p&gt;
&lt;p&gt;&lt;b&gt;New page&lt;/b&gt;&lt;/p&gt;&lt;div&gt;&amp;lt;source lang=C&amp;gt;&lt;br /&gt;
// includes, system&lt;br /&gt;
#include &amp;lt;stdio.h&amp;gt;&lt;br /&gt;
#include &amp;lt;assert.h&amp;gt;&lt;br /&gt;
&lt;br /&gt;
// Simple utility function to check for CUDA runtime errors&lt;br /&gt;
void checkCUDAError(const char* msg);&lt;br /&gt;
&lt;br /&gt;
// Part3: implement the kernel&lt;br /&gt;
__global__ void reverseArrayBlock(int *d_out, int *d_in)&lt;br /&gt;
{&lt;br /&gt;
    int inOffset  = blockDim.x * blockIdx.x;&lt;br /&gt;
    int outOffset = blockDim.x * (gridDim.x - 1 - blockIdx.x);&lt;br /&gt;
    int in  = inOffset + threadIdx.x;&lt;br /&gt;
    int out = outOffset + (blockDim.x - 1 - threadIdx.x);&lt;br /&gt;
    d_out[out] = d_in[in];&lt;br /&gt;
}&lt;br /&gt;
/////////////////////////////////////////////////////////////////////&lt;br /&gt;
// Program main&lt;br /&gt;
/////////////////////////////////////////////////////////////////////&lt;br /&gt;
int main( int argc, char** argv) &lt;br /&gt;
{&lt;br /&gt;
    // pointer for host memory and size&lt;br /&gt;
    int *h_a;&lt;br /&gt;
    int dimA = 256 * 1024; // 256K elements (1MB total)&lt;br /&gt;
&lt;br /&gt;
    // pointer for device memory&lt;br /&gt;
    int *d_b, *d_a;&lt;br /&gt;
&lt;br /&gt;
    // define grid and block size&lt;br /&gt;
    int numThreadsPerBlock = 256;&lt;br /&gt;
&lt;br /&gt;
    // Part 1: compute number of blocks needed based on &lt;br /&gt;
    // array size and desired block size&lt;br /&gt;
    int numBlocks = dimA / numThreadsPerBlock;  &lt;br /&gt;
&lt;br /&gt;
    // allocate host and device memory&lt;br /&gt;
    size_t memSize = numBlocks * numThreadsPerBlock * sizeof(int);&lt;br /&gt;
    h_a = (int *) malloc(memSize);&lt;br /&gt;
    cudaMalloc( (void **) &amp;amp;d_a, memSize );&lt;br /&gt;
    cudaMalloc( (void **) &amp;amp;d_b, memSize );&lt;br /&gt;
&lt;br /&gt;
    // Initialize input array on host&lt;br /&gt;
    for (int i = 0; i &amp;lt; dimA; ++i)&lt;br /&gt;
    {&lt;br /&gt;
        h_a[i] = i;&lt;br /&gt;
    }&lt;br /&gt;
&lt;br /&gt;
    // Copy host array to device array&lt;br /&gt;
    cudaMemcpy( d_a, h_a, memSize, cudaMemcpyHostToDevice );&lt;br /&gt;
&lt;br /&gt;
    // launch kernel&lt;br /&gt;
    dim3 dimGrid(numBlocks);&lt;br /&gt;
    dim3 dimBlock(numThreadsPerBlock);&lt;br /&gt;
    reverseArrayBlock&amp;lt;&amp;lt;&amp;lt; dimGrid, dimBlock &amp;gt;&amp;gt;&amp;gt;( d_b, d_a );&lt;br /&gt;
&lt;br /&gt;
    // block until the device has completed&lt;br /&gt;
    cudaThreadSynchronize();&lt;br /&gt;
&lt;br /&gt;
    // check if kernel execution generated an error&lt;br /&gt;
    // Check for any CUDA errors&lt;br /&gt;
    checkCUDAError(&amp;quot;kernel invocation&amp;quot;);&lt;br /&gt;
&lt;br /&gt;
    // device to host copy&lt;br /&gt;
    cudaMemcpy( h_a, d_b, memSize, cudaMemcpyDeviceToHost );&lt;br /&gt;
&lt;br /&gt;
    // Check for any CUDA errors&lt;br /&gt;
    checkCUDAError(&amp;quot;memcpy&amp;quot;);&lt;br /&gt;
&lt;br /&gt;
    // verify the data returned to the host is correct&lt;br /&gt;
    for (int i = 0; i &amp;lt; dimA; i++)&lt;br /&gt;
    {&lt;br /&gt;
        assert(h_a[i] == dimA - 1 - i );&lt;br /&gt;
    }&lt;br /&gt;
&lt;br /&gt;
    // free device memory&lt;br /&gt;
    cudaFree(d_a);&lt;br /&gt;
    cudaFree(d_b);&lt;br /&gt;
&lt;br /&gt;
    // free host memory&lt;br /&gt;
    free(h_a);&lt;br /&gt;
&lt;br /&gt;
    // If the program makes it this far, then the results are &lt;br /&gt;
    // correct and there are no run-time errors.  Good work!&lt;br /&gt;
    printf(&amp;quot;Correct!\n&amp;quot;);&lt;br /&gt;
&lt;br /&gt;
    return 0;&lt;br /&gt;
}&lt;br /&gt;
void checkCUDAError(const char *msg)&lt;br /&gt;
{&lt;br /&gt;
    cudaError_t err = cudaGetLastError();&lt;br /&gt;
    if( cudaSuccess != err) &lt;br /&gt;
    {&lt;br /&gt;
        fprintf(stderr, &amp;quot;Cuda error: %s: %s.\n&amp;quot;, msg, &lt;br /&gt;
                                  cudaGetErrorString( err) );&lt;br /&gt;
        exit(EXIT_FAILURE);&lt;br /&gt;
    }                         &lt;br /&gt;
}&lt;br /&gt;
&amp;lt;/source&amp;gt;&lt;/div&gt;</summary>
		<author><name>Heth</name></author>	</entry>

	</feed>