CUDA

The document contains code for performing vector addition and matrix multiplication on a GPU using CUDA. For vector addition, two arrays are copied to the GPU memory and a kernel is launched to add the corresponding elements of the arrays and store the results in a third array. For matrix multiplication, two matrices are copied to the GPU and a kernel is launched that calculates the dot product of each row of the first matrix with each column of the second matrix to produce the output matrix. The results are then copied back from the GPU to CPU memory and printed.

Uploaded by

killua gojo

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

17 views

CUDA

Uploaded by

killua gojo

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 3

HPC ASSIGNMENT 4

VECTOR ADDITION

%%cu
#include<stdio.h>
#include<cuda.h>
/*
 * Element-wise addition kernel: z[i] = x[i] + y[i].
 *
 * The element index is taken from blockIdx.x only, so the kernel expects to
 * be launched with one block per array element (e.g. <<<count,1>>>).
 * x, y and z must be device pointers holding at least gridDim.x ints each;
 * there is no bounds check inside the kernel.
 */
__global__ void arradd(int *x,int *y, int *z)
{
    /* blockIdx.x is the zero-based index of this block within the grid */
    const int elem = blockIdx.x;
    const int lhs = x[elem];
    const int rhs = y[elem];
    z[elem] = lhs + rhs;
}
/*
 * Reports a failed CUDA runtime call on stderr.
 * Returns 1 when err signals a failure and 0 when it is cudaSuccess, so the
 * caller can branch directly on the result.
 */
static int vecAddCudaFailed(cudaError_t err, const char *what)
{
    if (err == cudaSuccess)
        return 0;
    fprintf(stderr, "CUDA error during %s: %s\n", what, cudaGetErrorString(err));
    return 1;
}

/*
 * Vector addition driver: reads two six-element arrays, adds them on the GPU
 * with arradd (one block per element) and prints the sums.
 * Returns 0 on success and 1 if any CUDA call fails.
 */
int main()
{
    enum { N = 6 };                       /* number of elements per array */
    const size_t bytes = N * sizeof(int);
    /* The initializers act as fallback values: elements that cannot be read
       from stdin keep them (unlisted elements are zero). */
    int a[N]={1,2,4,5,6};
    int b[N]={2,3,4,5};
    int c[N];
    int *d=NULL,*e=NULL,*f=NULL;          /* device copies of a, b and c */
    int i;
    int status=1;                         /* flipped to 0 only on full success */

    printf("\n Enter six elements of first array\n");
    for(i=0;i<N;i++)
    {
        /* Once a read fails every later read on the same stream fails too,
           so stop early and keep the remaining fallback values. */
        if(scanf("%d",&a[i])!=1)
            break;
    }
    printf("\n Enter six elements of second array\n");
    for(i=0;i<N;i++)
    {
        if(scanf("%d",&b[i])!=1)
            break;
    }

    /* cudaMalloc() allocates memory from global memory on the GPU */
    if(vecAddCudaFailed(cudaMalloc((void **)&d,bytes),"cudaMalloc(d)")) goto cleanup;
    if(vecAddCudaFailed(cudaMalloc((void **)&e,bytes),"cudaMalloc(e)")) goto cleanup;
    if(vecAddCudaFailed(cudaMalloc((void **)&f,bytes),"cudaMalloc(f)")) goto cleanup;

    /* cudaMemcpy(dst,src,...) copies from source to destination. Here the
       destination is the GPU (d,e) and the source is the CPU (a,b). */
    if(vecAddCudaFailed(cudaMemcpy(d,a,bytes,cudaMemcpyHostToDevice),"copy a to device")) goto cleanup;
    if(vecAddCudaFailed(cudaMemcpy(e,b,bytes,cudaMemcpyHostToDevice),"copy b to device")) goto cleanup;

    /* Kernel call: N blocks, 1 thread per block; d,e,f are the arguments */
    arradd<<<N,1>>>(d,e,f);
    /* A launch does not return an error itself; query it explicitly. */
    if(vecAddCudaFailed(cudaGetLastError(),"arradd launch")) goto cleanup;

    /* Copy the result from GPU (device) to CPU (host). This copy blocks until
       the kernel has finished, so execution errors surface here as well. */
    if(vecAddCudaFailed(cudaMemcpy(c,f,bytes,cudaMemcpyDeviceToHost),"copy result to host")) goto cleanup;

    printf("\nSum of two arrays:\n ");
    for(i=0;i<N;i++)
    {
        printf("%d\t",c[i]);
    }
    status=0;

cleanup:
    /* Free the device memory; cudaFree() accepts NULL, so this is safe on
       every path that reaches here. */
    cudaFree(d);
    cudaFree(e);
    cudaFree(f);
    return status;
}

OUTPUT:-
Enter six elements of first array

Enter six elements of second array

Sum of two arrays:

3 5 8 10 6 0

MATRIX MULTIPLICATION

%%cu
#include<stdio.h>
#include<cuda.h>
#define row1 2 /* Number of rows of first matrix */
#define col1 3 /* Number of columns of first matrix */
#define row2 3 /* Number of rows of second matrix */
#define col2 2 /* Number of columns of second matrix */

/*
 * Matrix product kernel: n = l * m for row-major integer matrices, where
 * l has col1 columns and m and n both have col2 columns (file-level macros).
 *
 * Launch layout: one block per output element, with blockIdx.x selecting the
 * output column and blockIdx.y the output row (e.g. dim3 grid(col2,row1) and
 * one thread per block). l, m and n must be device pointers; there is no
 * bounds check, so the grid must match the output dimensions exactly.
 * n is expected not to alias l or m.
 */
__global__ void matproduct(int *l,int *m, int *n)
{
    int x=blockIdx.x;   /* output column */
    int y=blockIdx.y;   /* output row */
    int k;
    int sum=0;          /* accumulate locally, store to global memory once */

    /* dot product of row y of l with column x of m */
    for(k=0;k<col1;k++)
    {
        sum+=l[col1*y+k]*m[col2*k+x];
    }
    n[col2*y+x]=sum;
}

/* The inner dimensions must agree for the product a*b to be defined. */
#if col1 != row2
#error "matrix multiplication requires col1 == row2"
#endif

/*
 * Reports a failed CUDA runtime call on stderr.
 * Returns 1 when err signals a failure and 0 when it is cudaSuccess, so the
 * caller can branch directly on the result.
 */
static int matMulCudaFailed(cudaError_t err, const char *what)
{
    if (err == cudaSuccess)
        return 0;
    fprintf(stderr, "CUDA error during %s: %s\n", what, cudaGetErrorString(err));
    return 1;
}

/*
 * Matrix multiplication driver: multiplies the fixed row1 x col1 matrix a by
 * the row2 x col2 matrix b on the GPU with matproduct and prints the
 * row1 x col2 result.
 * Returns 0 on success and 1 if any CUDA call fails.
 */
int main()
{
    int a[row1][col1] = { 10, 11, 12, 13, 14, 15};
    int b[row2][col2] = { 10, 11, 12, 13, 14, 15};
    int c[row1][col2];
    int *d=NULL,*e=NULL,*f=NULL;   /* device copies of a, b and c */
    int i,j;
    int status=1;                  /* flipped to 0 only on full success */
    /* Two-dimensional grid (collection of blocks), one block per output
       element. Syntax is dim3 grid(no. of columns,no. of rows). */
    dim3 grid(col2,row1);

    if(matMulCudaFailed(cudaMalloc((void **)&d,row1*col1*sizeof(int)),"cudaMalloc(d)")) goto cleanup;
    if(matMulCudaFailed(cudaMalloc((void **)&e,row2*col2*sizeof(int)),"cudaMalloc(e)")) goto cleanup;
    if(matMulCudaFailed(cudaMalloc((void **)&f,row1*col2*sizeof(int)),"cudaMalloc(f)")) goto cleanup;

    if(matMulCudaFailed(cudaMemcpy(d,a,row1*col1*sizeof(int),cudaMemcpyHostToDevice),"copy a to device")) goto cleanup;
    if(matMulCudaFailed(cudaMemcpy(e,b,row2*col2*sizeof(int),cudaMemcpyHostToDevice),"copy b to device")) goto cleanup;

    matproduct<<<grid,1>>>(d,e,f);
    /* A launch does not return an error itself; query it explicitly. */
    if(matMulCudaFailed(cudaGetLastError(),"matproduct launch")) goto cleanup;

    /* This copy blocks until the kernel has finished, so execution errors
       surface here as well. */
    if(matMulCudaFailed(cudaMemcpy(c,f,row1*col2*sizeof(int),cudaMemcpyDeviceToHost),"copy result to host")) goto cleanup;

    printf("\nProduct of two matrices:\n ");
    for(i=0;i<row1;i++)
    {
        for(j=0;j<col2;j++)
        {
            printf("%d\t",c[i][j]);
        }
        printf("\n");
    }
    status=0;

cleanup:
    /* cudaFree() accepts NULL, so this is safe on every path. */
    cudaFree(d);
    cudaFree(e);
    cudaFree(f);

    return status;
}

OUTPUT:-
Product of two matrices:
400 433
508 550

Roots of Polynomials Integral Topic Assessment
100% (2)
Roots of Polynomials Integral Topic Assessment
6 pages
GNG1106 Final 2008 Solutions PDF
No ratings yet
GNG1106 Final 2008 Solutions PDF
11 pages
1.1 Equivalence Relations
100% (1)
1.1 Equivalence Relations
17 pages
38 - Matrix True False
No ratings yet
38 - Matrix True False
4 pages
Mulmatrix Cu
No ratings yet
Mulmatrix Cu
3 pages
Input: Output: 1. Sub String Program
No ratings yet
Input: Output: 1. Sub String Program
8 pages
20 Quiz 14
No ratings yet
20 Quiz 14
12 pages
Sem II C++ Programs
No ratings yet
Sem II C++ Programs
40 pages
Program 9: Create A Database Regarding Its Indoor Patients
No ratings yet
Program 9: Create A Database Regarding Its Indoor Patients
13 pages
CS200 Final Exam Fall 2023 SOLUTION
No ratings yet
CS200 Final Exam Fall 2023 SOLUTION
13 pages
C++
No ratings yet
C++
15 pages
Pointers Example22
No ratings yet
Pointers Example22
1 page
Program To Calculate 100!
No ratings yet
Program To Calculate 100!
25 pages
Task Intermediate
No ratings yet
Task Intermediate
15 pages
DPC LAB MANUAL For Print
No ratings yet
DPC LAB MANUAL For Print
29 pages
1prac Cgr Merged
No ratings yet
1prac Cgr Merged
24 pages
sample_answer_end_sem_IC100_2024
No ratings yet
sample_answer_end_sem_IC100_2024
11 pages
C/C++ Source Codes: Programme For E.G. of Width and Setew Functions
No ratings yet
C/C++ Source Codes: Programme For E.G. of Width and Setew Functions
10 pages
2 Ques
No ratings yet
2 Ques
2 pages
C Assignment
No ratings yet
C Assignment
30 pages
1 C++Answer
No ratings yet
1 C++Answer
9 pages
Gedung 3dimensi Visual Studio
No ratings yet
Gedung 3dimensi Visual Studio
13 pages
Week 3 - Prog2 - Two Dimensional Array
No ratings yet
Week 3 - Prog2 - Two Dimensional Array
12 pages
Program
No ratings yet
Program
7 pages
CPP LABPGM 1- 12
No ratings yet
CPP LABPGM 1- 12
20 pages
Oop Practicals 1-14
No ratings yet
Oop Practicals 1-14
36 pages
ArraysString
No ratings yet
ArraysString
35 pages
2d Array - Prod - Add
No ratings yet
2d Array - Prod - Add
3 pages
KNC Asic
No ratings yet
KNC Asic
10 pages
DS Programs
No ratings yet
DS Programs
29 pages
Program #1 Implementation of Line Generation Using DDA Algorithms
No ratings yet
Program #1 Implementation of Line Generation Using DDA Algorithms
27 pages
CGR
No ratings yet
CGR
32 pages
PROGRAM 1
No ratings yet
PROGRAM 1
9 pages
Unit 4 & 5
No ratings yet
Unit 4 & 5
17 pages
Computer Graphics Lab
No ratings yet
Computer Graphics Lab
43 pages
Program: / Implementing Class With Static Data Member
No ratings yet
Program: / Implementing Class With Static Data Member
49 pages
Menu Driven Program For Creation, Deletion, Insertion
No ratings yet
Menu Driven Program For Creation, Deletion, Insertion
9 pages
Department of Computer Engineering BE Laboratory Practice-I A.Y 2021-22 SEM1
No ratings yet
Department of Computer Engineering BE Laboratory Practice-I A.Y 2021-22 SEM1
45 pages
CodeISM Class 4 (STL Pair, Sort, Structure)
No ratings yet
CodeISM Class 4 (STL Pair, Sort, Structure)
9 pages
Assignment 1 To 7 With Output
No ratings yet
Assignment 1 To 7 With Output
30 pages
HPC (Pra 04)
No ratings yet
HPC (Pra 04)
11 pages
DAy 2 DSA Vivek
No ratings yet
DAy 2 DSA Vivek
14 pages
C++ Program
No ratings yet
C++ Program
17 pages
Data Structures Lab Using C
No ratings yet
Data Structures Lab Using C
86 pages
By Shahbaz Alvi Awan
No ratings yet
By Shahbaz Alvi Awan
26 pages
Lab Manual CG
No ratings yet
Lab Manual CG
24 pages
DSP Code Not Run Yet
No ratings yet
DSP Code Not Run Yet
4 pages
MCS02
No ratings yet
MCS02
167 pages
Partial Code
No ratings yet
Partial Code
14 pages
10 Programs
No ratings yet
10 Programs
21 pages
Mid Term 1 - Solution
No ratings yet
Mid Term 1 - Solution
4 pages
Untitled
No ratings yet
Untitled
8 pages
Data Structure in C Book Programs
No ratings yet
Data Structure in C Book Programs
210 pages
Kuldeep Trivedi (CG)ada
No ratings yet
Kuldeep Trivedi (CG)ada
28 pages
MMTE-001 P 1
No ratings yet
MMTE-001 P 1
35 pages
Bezier-Surfaces C++ Code
No ratings yet
Bezier-Surfaces C++ Code
9 pages
Koch Fractal - One of The Easiest Algorithms With Graphics
No ratings yet
Koch Fractal - One of The Easiest Algorithms With Graphics
4 pages
Java Experiments
No ratings yet
Java Experiments
32 pages
C++ 4th Sem Pgms
No ratings yet
C++ 4th Sem Pgms
24 pages
Assignment 3 PF
No ratings yet
Assignment 3 PF
9 pages
Exercise 1 (1pt) : Master M1 SMA Computer Programming Class 2012/13. Exam. 2 Hours, Open Book
No ratings yet
Exercise 1 (1pt) : Master M1 SMA Computer Programming Class 2012/13. Exam. 2 Hours, Open Book
11 pages
Computer Network Lab Manual 2024 5 Pro
No ratings yet
Computer Network Lab Manual 2024 5 Pro
16 pages
150+ C Pattern Programs
From Everand
150+ C Pattern Programs
Hernando Abella
No ratings yet
FALLSEM2024-25 MVLD601L TH VL2024250106607 2024-07-22 Reference-Material-I
No ratings yet
FALLSEM2024-25 MVLD601L TH VL2024250106607 2024-07-22 Reference-Material-I
12 pages
Numerical Solution of Ordinary Differential Equations: Dr. Abdul Muis, ST - Meng. Dr. Ir. Feri Yusivar Meng
No ratings yet
Numerical Solution of Ordinary Differential Equations: Dr. Abdul Muis, ST - Meng. Dr. Ir. Feri Yusivar Meng
24 pages
Report On The Applications of DFS and BFS
No ratings yet
Report On The Applications of DFS and BFS
7 pages
False Position Method
No ratings yet
False Position Method
7 pages
Discrete Hartley Transform
No ratings yet
Discrete Hartley Transform
5 pages
Function? ( (2, - 3), (4, 6), (3, - 1), (6, 6), (2, 3) ) : Domain and Range
No ratings yet
Function? ( (2, - 3), (4, 6), (3, - 1), (6, 6), (2, 3) ) : Domain and Range
17 pages
Trigonometry Formulas
No ratings yet
Trigonometry Formulas
5 pages
CAPE Unit 1 Trig Notes
No ratings yet
CAPE Unit 1 Trig Notes
19 pages
Relations and Functions: Module 1 Lesson 1
No ratings yet
Relations and Functions: Module 1 Lesson 1
24 pages
Difference Equation
No ratings yet
Difference Equation
8 pages
1 Math
No ratings yet
1 Math
67 pages
CH 8 - Trigonometry Class X PDF
No ratings yet
CH 8 - Trigonometry Class X PDF
2 pages
Partitions Exercise
No ratings yet
Partitions Exercise
2 pages
DAY 1 Illustrating Polynomial Functions
No ratings yet
DAY 1 Illustrating Polynomial Functions
15 pages
24 - Inverse Trigonometric Functions
No ratings yet
24 - Inverse Trigonometric Functions
36 pages
19MAT209 3 MVUO Geometrical AnalyticalSolns
No ratings yet
19MAT209 3 MVUO Geometrical AnalyticalSolns
16 pages
2022 - 111 - Digital Syllabus
No ratings yet
2022 - 111 - Digital Syllabus
7 pages
LINEAR ALGEBRA AND COMPLEX ANALYSIS S3 B.Tech May 2019 R & S - Ktu Qbank
No ratings yet
LINEAR ALGEBRA AND COMPLEX ANALYSIS S3 B.Tech May 2019 R & S - Ktu Qbank
2 pages
John Patrick de Silva Quiz 2B Methods C2S2SY2122 I.C. ANSWERS PDF
No ratings yet
John Patrick de Silva Quiz 2B Methods C2S2SY2122 I.C. ANSWERS PDF
3 pages
Introduction To The Dfs and The DFT
No ratings yet
Introduction To The Dfs and The DFT
5 pages
Numerical Methods & Probability Theory (20A54402) : Lecture Notes
No ratings yet
Numerical Methods & Probability Theory (20A54402) : Lecture Notes
199 pages
Content Discussion: The Nature of Mathematics
No ratings yet
Content Discussion: The Nature of Mathematics
7 pages
QM Mar1 2024
No ratings yet
QM Mar1 2024
11 pages
Tutorialsheet 3
No ratings yet
Tutorialsheet 3
2 pages
Half Range Sine and Cosine Series
No ratings yet
Half Range Sine and Cosine Series
18 pages
5 Chapter 6 Network Model
No ratings yet
5 Chapter 6 Network Model
30 pages
CS3401 Algorithms Exps
No ratings yet
CS3401 Algorithms Exps
44 pages

CUDA

Uploaded by

CUDA

Uploaded by

HPC ASSIGNMENT 4

Enter six elements of second array

Sum of two arrays:

__global__ void matproduct(int *l,int *m, int *n)

int b[row2][col2] = { 10, 11, 12, 13, 14, 15};

You might also like

__global__ void matproduct(int *l,int *m, int *n)