Base64 Encoding on a GPU

Nick Kopp

Rate me:

4.89/5 (26 votes)

16 Sep 2013 · LGPL3 · 10 min read

64.3K

1.8K

Performing base64 encoding on a graphics processing unit using CUDAfy.NET (CUDA in .NET).

Base64EncodingOnGPU_src-noexe.zip
- Base64EncodingOnGPU
  - Base64EncodingOnGPU.sln
  - Base64EncodingOnGPU
    - app.config
    - Base64EncodingOnGPU.csproj
    - GPUConvert.cs
    - Program.cs
    - Properties
      - AssemblyInfo.cs
  - CudafyV1.26
    - bin
      - Cudafy.NET.xml
    - CUDA.NET.Readme.txt
    - CUDAfy API Documentation.url
    - CUDAfy_User_Manual_1_22.pdf
    - CudafyByExample
      - app.config
      - chapter03
        
        enum_gpu.cs
        
        hello_world.cs
        
        simple_kernel.cs
        
        simple_kernel_params.cs
      - chapter04
        
        add_loop_cpu.cs
        
        add_loop_gpu.cs
        
        add_loop_gpu_alt.cs
        
        add_loop_long.cs
        
        cuComplex.cs
        
        julia_cpu.cs
        
        julia_cpu.Designer.cs
        
        julia_cpu.resx
        
        julia_gpu.cs
      - chapter05
        
        add_loop_blocks.cs
        
        add_loop_long_blocks.cs
        
        dot.cs
        
        ripple.cs
        
        ripple.Designer.cs
        
        ripple.resx
        
        ripple_gpu.cs
      - chapter06
        
        ray.cs
        
        ray_gui.cs
        
        ray_gui.Designer.cs
        
        ray_gui.resx
        
        ray_noconst.cs
        
        ray_opencl.cs
        
        ray_opencl_const.cs
      - chapter09
        
        hist_gpu_shmem_atomics.cs
      - chapter10
        
        basic_double_stream_correct.cs
        
        copy_timed.cs
      - CudafyByExample.csproj
      - CudafyByExample.sln
      - Program.cs
      - Properties
        
        AssemblyInfo.cs
    - CUDAfy-License.txt
    - ILSpy-license.txt
    - README.txt
    - Visit www.hybriddsp.com for full CUDAfy.NET SDK.txt
Base64EncodingOnGPU_src.zip
- Base64EncodingOnGPU.sln
- .svn
  - app.config
  - Base64EncodingOnGPU.csproj
  - GPUConvert.cs
  - Program.cs
  - AssemblyInfo.cs
  - Cudafy.NET.dll
  - Cudafy.NET.xml
  - CUDA.NET.Readme.txt
  - CUDAfy API Documentation.url
  - CUDAfy_User_Manual_1_22.pdf
  - app.config
  - enum_gpu.cs
  - hello_world.cs
  - simple_kernel.cs
  - simple_kernel_params.cs
  - add_loop_cpu.cs
  - add_loop_gpu.cs
  - add_loop_gpu_alt.cs
  - add_loop_long.cs
  - cuComplex.cs
  - julia_cpu.cs
  - julia_cpu.Designer.cs
  - julia_cpu.resx
  - julia_gpu.cs
  - add_loop_blocks.cs
  - add_loop_long_blocks.cs
  - dot.cs
  - ripple.cs
  - ripple.Designer.cs
  - ripple.resx
  - ripple_gpu.cs
  - ray.cs
  - ray_gui.cs
  - ray_gui.Designer.cs
  - ray_gui.resx
  - ray_noconst.cs
  - ray_opencl.cs
  - ray_opencl_const.cs
  - hist_gpu_shmem_atomics.cs
  - basic_double_stream_correct.cs
  - copy_timed.cs
  - CudafyByExample.csproj
  - CudafyByExample.sln
  - Program.cs
  - AssemblyInfo.cs
  - CUDAfy-License.txt
  - ILSpy-license.txt
  - README.txt
  - Visit www.hybriddsp.com for full CUDAfy.NET SDK.txt

/* 
 * This software is based upon the book CUDA By Example by Sanders and Kandrot
 * and source code provided by NVIDIA Corporation.
 * It is a good idea to read the book while studying the examples!
*/
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Threading;
using System.Runtime.InteropServices;
using Cudafy;
using Cudafy.Host;
using Cudafy.Translator;

namespace CudafyByExample
{
    /// <summary>
    /// Description of a single sphere as passed to the ray-tracing kernel:
    /// a colour, a radius and a centre position.
    /// </summary>
    /// <remarks>
    /// NOTE(review): the struct is marked [Cudafy] and copied to the device as an
    /// array, so the field order presumably defines the device-side layout —
    /// confirm before reordering or inserting fields.
    /// </remarks>
    [Cudafy]
    public struct SphereOpenCL
    {
        // Colour components; the kernel multiplies each by a shading factor and
        // writes them as the red, green and blue bytes of a pixel.
        // Note the declaration order is r, b, g (not r, g, b).
        public float r;
        public float b;
        public float g;
        // Sphere radius, used by hit() for the intersection test.
        public float radius;
        // Sphere centre. x and y are compared against the pixel coordinates;
        // z is added to the computed depth so nearer spheres win.
        public float x;
        public float y;
        public float z;
    }

    /// <summary>
    /// Ray-tracing sample: renders <see cref="SPHERES"/> randomly generated spheres
    /// into a 4-bytes-per-pixel bitmap using a Cudafy kernel.
    /// </summary>
    public class ray_opencl
    {
        public const int RAND_MAX = Int32.MaxValue;

        /// <summary>
        /// Depth sentinel: <c>-INF</c> is returned by <see cref="hit"/> for a miss and
        /// is the initial "nearest depth" in the kernel.
        /// </summary>
        public const float INF = 2e10f;

        /// <summary>
        /// Returns <paramref name="x"/> scaled by a pseudo-random factor drawn from
        /// <see cref="rand"/> (<see cref="Random.NextDouble"/>).
        /// </summary>
        /// <param name="x">Upper scale of the random value.</param>
        /// <returns><paramref name="x"/> multiplied by the random factor.</returns>
        public static float rnd(float x)
        {
            return x * (float)rand.NextDouble();
        }

        /// <summary>Shared random source used by <see cref="rnd"/>; seeded from the clock.</summary>
        public static Random rand = new Random((int)DateTime.Now.Ticks);

        /// <summary>Number of spheres generated on the host and tested per pixel in the kernel.</summary>
        public const int SPHERES = 20;

        // Threads per block along each axis of the launch configuration.
        private const int BlockSide = 16;

        // The kernel writes four bytes (three colour bytes plus 255) per pixel.
        private const int BytesPerPixel = 4;

        /// <summary>
        /// Tests whether the ray through pixel (<paramref name="ox1"/>, <paramref name="oy1"/>),
        /// travelling along the z axis, hits sphere <paramref name="s"/>.
        /// </summary>
        /// <param name="s">Sphere to test.</param>
        /// <param name="ox1">Ray x coordinate.</param>
        /// <param name="oy1">Ray y coordinate.</param>
        /// <param name="n1">
        /// On a hit, receives the shading factor <c>dz / sqrt(radius^2)</c>;
        /// left untouched on a miss.
        /// </param>
        /// <returns>The depth <c>dz + s.z</c> of the hit point, or <c>-INF</c> on a miss.</returns>
        [Cudafy]
        public static float hit(SphereOpenCL s, float ox1, float oy1, ref float n1)
        {
            float dx = ox1 - s.x;
            float dy = oy1 - s.y;
            if (dx * dx + dy * dy < s.radius * s.radius)
            {
                float dz = GMath.Sqrt(s.radius * s.radius - dx * dx - dy * dy);
                n1 = dz / GMath.Sqrt(s.radius * s.radius);
                return dz + s.z;
            }

            // Same value as the former literal -2e10f; kept in sync with the
            // kernel's initial maxz through the shared constant.
            return -INF;
        }

        /// <summary>
        /// Kernel: each thread shades one pixel by finding the nearest sphere hit by
        /// the ray through that pixel and writing its scaled colour into
        /// <paramref name="ptr"/>.
        /// </summary>
        /// <param name="thread">Cudafy thread context providing thread/block/grid indices.</param>
        /// <param name="s">Sphere array; the first <see cref="SPHERES"/> entries are read.</param>
        /// <param name="ptr">Output bitmap, four bytes per pixel.</param>
        [Cudafy]
        public static void thekernel(GThread thread, SphereOpenCL[] s, byte[] ptr)
        {
            // The previously declared shared arrays were never read or written,
            // so they have been removed.

            // map from threadIdx/BlockIdx to pixel position
            int x = thread.threadIdx.x + thread.blockIdx.x * thread.blockDim.x;
            int y = thread.threadIdx.y + thread.blockIdx.y * thread.blockDim.y;
            int offset = x + y * thread.blockDim.x * thread.gridDim.x;

            // Shift the origin to the image centre.
            float ox = (x - ray_gui.DIM / 2);
            float oy = (y - ray_gui.DIM / 2);

            // Pixels that hit no sphere stay black.
            float r = 0, g = 0, b = 0;
            float maxz = -INF;
            for (int i = 0; i < SPHERES; i++)
            {
                float n = 0;
                float t = hit(s[i], ox, oy, ref n);
                if (t > maxz)
                {
                    // Nearest hit so far: take this sphere's colour, scaled by
                    // the shading factor reported by hit().
                    float fscale = n;
                    r = s[i].r * fscale;
                    g = s[i].g * fscale;
                    b = s[i].b * fscale;
                    maxz = t;
                }
            }

            ptr[offset * 4 + 0] = (byte)(r * 255);
            ptr[offset * 4 + 1] = (byte)(g * 255);
            ptr[offset * 4 + 2] = (byte)(b * 255);
            ptr[offset * 4 + 3] = 255;
        }

        /// <summary>
        /// Builds a random scene, renders it on the device selected by
        /// <c>CudafyModes</c>, copies the image into <paramref name="bitmap"/> and
        /// prints the elapsed time to the console.
        /// </summary>
        /// <param name="bitmap">
        /// Destination buffer; must hold at least four bytes for every pixel the
        /// launch covers.
        /// </param>
        /// <exception cref="ArgumentNullException"><paramref name="bitmap"/> is null.</exception>
        /// <exception cref="ArgumentException"><paramref name="bitmap"/> is too small for the launched grid.</exception>
        public static void Execute(byte[] bitmap)
        {
            if (bitmap == null)
            {
                throw new ArgumentNullException("bitmap");
            }

            // Each launched thread writes BytesPerPixel bytes with no bounds check,
            // so a short buffer would be overrun on the device. Reject it up front.
            long pixelsPerSide = (ray_gui.DIM / BlockSide) * BlockSide;
            long requiredBytes = pixelsPerSide * pixelsPerSide * BytesPerPixel;
            if (bitmap.Length < requiredBytes)
            {
                throw new ArgumentException(
                    "bitmap must contain at least " + requiredBytes + " bytes.", "bitmap");
            }

            // Reuse the cached translated module when it is still valid.
            CudafyModule km = CudafyModule.TryDeserialize();
            if (km == null || !km.TryVerifyChecksums())
            {
                km = CudafyTranslator.Cudafy(typeof(SphereOpenCL), typeof(ray_opencl));
                km.TrySerialize();
            }

            GPGPU gpu = CudafyHost.GetDevice(CudafyModes.Target, CudafyModes.DeviceId);
            gpu.LoadModule(km);

            try
            {
                // capture the start time
                gpu.StartTimer();

                // allocate memory on the GPU for the bitmap (same size as bitmap)
                byte[] dev_bitmap = gpu.Allocate(bitmap);

                // allocate device memory for the Sphere dataset
                SphereOpenCL[] s = gpu.Allocate<SphereOpenCL>(SPHERES);

                // build the scene on the host and copy it into the device buffer
                // allocated above (an ordinary allocation, not constant memory)
                SphereOpenCL[] temp_s = CreateRandomSpheres();
                gpu.CopyToDevice(temp_s, s);

                // generate a bitmap from our sphere data
                dim3 grids = new dim3(ray_gui.DIM / BlockSide, ray_gui.DIM / BlockSide);
                dim3 threads = new dim3(BlockSide, BlockSide);
                gpu.Launch(grids, threads, ((Action<GThread, SphereOpenCL[], byte[]>)thekernel), s, dev_bitmap); // Strongly typed

                // copy our bitmap back from the GPU for display
                gpu.CopyFromDevice(dev_bitmap, bitmap);

                // get stop time, and display the timing results
                float elapsedTime = gpu.StopTimer();
                Console.WriteLine("Time to generate: {0} ms", elapsedTime);
            }
            finally
            {
                // Release device allocations even when allocation, copy or launch throws.
                gpu.FreeAll();
            }
        }

        // Generates SPHERES spheres with random colour, position and radius on the host.
        private static SphereOpenCL[] CreateRandomSpheres()
        {
            SphereOpenCL[] spheres = new SphereOpenCL[SPHERES];
            for (int i = 0; i < SPHERES; i++)
            {
                // The order of rnd() calls is kept as in the original so a given
                // random sequence produces the same scene.
                spheres[i].r = rnd(1.0f);
                spheres[i].g = rnd(1.0f);
                spheres[i].b = rnd(1.0f);

                spheres[i].x = rnd(1000.0f) - 500;
                spheres[i].y = rnd(1000.0f) - 500;
                spheres[i].z = rnd(1000.0f) - 500;
                spheres[i].radius = rnd(100.0f) + 20;
            }
            return spheres;
        }
    }
}

By viewing downloads associated with this article you agree to the Terms of Service and the article's licence.

If a file you wish to view isn't highlighted, and is a text file (not binary), please let us know and we'll add colourisation support for it.

License

This article, along with any associated source code and files, is licensed under The GNU Lesser General Public License (LGPLv3)

Written By

Nick Kopp

Systems Engineer Hybrid DSP Systems

Netherlands

Nick is co-owner of Hybrid DSP, a company specializing in high-speed data acquisition, processing and storage.

CUDAfy.NET took considerable effort to develop and we ask nothing in return from users of the LGPL library other than that you please consider donating to Harmony through Education. This small charity helps handicapped children in developing countries by providing suitable schooling.

Base64 Encoding on a GPU

License

Comments and Discussions