0% found this document useful (0 votes)

19 views12 pages

Lab 02 - Compound Data Structures

The document provides a comprehensive overview of compound data structures in R, including vectors, matrices, lists, factors, and data frames. It covers creation, indexing, slicing, and operations on these structures, along with functions for data manipulation and analysis. Additionally, it discusses importing external datasets and performing data simulation.

Uploaded by

testingcode44

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

19 views12 pages

Lab 02 - Compound Data Structures

Uploaded by

testingcode44

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 12

Fundamentals-02 Compound Data Structures

Created by H. M. Samadhi Chathuranga Rathnayake

# Compound data structures
# Vectors
# Creating vectors with the c() function

# A numeric (double) vector
a <- c(12, 22, 23, 34, 35)
a

class(a)

# A character vector
b <- c("Dog", "Cat", "Rat")
b

class(b)

# Mixing numbers and strings: every element is coerced to character
x <- c(12, 22, 23, "Man", "Car")
x

# Coercion order: logical < integer < numeric < complex < character
class(x)

# Mixing logicals and numbers: TRUE/FALSE are coerced to 1/0
y <- c(TRUE, FALSE, 12)
y

class(y)

# Other ways of creating vectors

# Ascending integer sequence with the colon operator
d <- 1:10
d

# The colon operator counts downwards when the start exceeds the end
p <- 15:5
p

# Sequence defined by a step size
k <- seq(from = 10, to = 50, by = 5)
k

# Sequence defined by the number of equally spaced points
h <- seq(from = 10, to = 50, length.out = 20)
h

# Integers 1..20
f <- seq_len(20)
f

# replicate() evaluates the expression 10 times and simplifies the results;
# each result has length 2, so h becomes a 2 x 10 character matrix rather
# than a flat vector (rep() gives the flat form).
h <- replicate(10, c("Dog", "Cow"))
h

# Indexing & slicing vector elements

a <- c(23, 33, 34, 32, 45, 50, 65)

# Single element by position (positions start at 1)
a[1]

# Several positions at once
a[c(1, 3, 6)]

# Negative positions drop those elements and keep the rest
a[-c(1, 3, 6)]

# A contiguous range of positions
a[1:3]

# Logical mask: keep the elements where the mask is TRUE
a[c(TRUE, TRUE, TRUE, FALSE, TRUE, TRUE, FALSE)]

# Masks built from conditions on the vector itself
a[a > 40]

a[a %% 2 == 0]

# Element-wise operations on numeric vectors

a <- c(2, 3, 4, 6, 3)
b <- c(3, 4, 1, 6, 4)

# Vector with a scalar: the scalar is applied to every element
a + 10

a * 2

a / 3

a^2

a > 3

# Vector with a vector of the same length: elements are paired by position
a + b

a * b

a / b

a^b

a > b

# Membership: for each element of a, is it present anywhere in b?
a %in% b

# Element-wise operations with recycling
# The shorter vector is reused from its start until it covers the longer one.
# Here 5 is not a multiple of 3, so R also emits a warning.

p <- c(10, 20, 30, 40, 50)
q <- c(100, 200, 300)

p + q

# Vector properties with functions

a <- c(2, 3, 5, 3, 6, 7, 4, 5, 8, 1, 3, 4, 2)

# Basic summary functions

# Number of elements
length(a)

# Five-number summary plus the mean, then the internal structure
summary(a)
str(a)

# Extremes and total
min(a)

max(a)

sum(a)

# Centre
mean(a)

median(a)

# Spread (sample variance and standard deviation)
var(a)

sd(a)

# Minimum and maximum returned together
range(a)

# Cumulative functions: running result up to each position
cumsum(a)

cumprod(a)

cummin(a)

cummax(a)

# Vector operations with functions

# append(): add values at the end, or after a given position
a <- c(20, 30, 40)
b <- append(a, 100)
b

d <- append(x = a, values = 200, after = 2)

k <- append(x = a, values = c(100, 200, 300), after = 2)

# c() is another way of appending at the end
h <- c(a, 100, 200, 300)

# rep(): repeat the whole vector
a <- c(20, 30, 40)
rep(a, 3)

# all() / any(): does every / at least one element satisfy the condition?
b <- c(10, 20, 25, 30, 35, 40)
all(b > 20)

all(b < 50)

any(b > 20)

any(b > 50)

# Ordering helpers
b <- c(100, 50, 25, 30, 15, 40, 15, 40)
sort(b)  # values in ascending order
order(b) # positions that would sort the vector

rev(b)

unique(b)

# Random sampling without a seed: the result differs from run to run
h <- c(12, 22, 23, 34, 45, 43, 32, 33, 21, 23, 45, 56, 67, 56, 70)
s <- sample(h, 5)
s

# Fixing the seed makes the samples drawn after it reproducible
set.seed(1000)
h <- c(12, 22, 23, 34, 45, 43, 32, 33, 21, 23, 45, 56, 67, 56, 70)
s <- sample(h, 5)
s

# Sampling with replacement: the same element may be drawn more than once
p <- sample(h, 5, replace = TRUE)
p

# With replacement the sample may be larger than the source vector
f <- c(12, 22, 23)
q <- sample(f, 10, replace = TRUE)
q

# which(): positions that satisfy a condition, or hold the min / max
k <- c(20, 12, 25, 30, 32, 22, 33)
which(k >= 25)

which.min(k)

which.max(k)

# Remove every occurrence of a set of values
a <- c(12, 22, 23, 34, 45, 56, 43, 43, 33, 34)
idx <- which(a %in% c(22, 23, 34))
b <- a[-idx]
b

# Frequency table of a categorical vector
g <- c("Male", "Female", "Female", "Female", "Male")
table(g)

# replace() returns a modified copy; g itself is left unchanged
g <- c("Male", "Female", "Female", "Female", "Male")
replace(x = g, list = c(1, 5), values = "M")

# Matrices
# Matrix creation

# Filled column by column (the default)
a <- matrix(c(12, 23, 32, 33, 45, 43), nrow = 3, ncol = 2)
a

# Filled row by row
b <- matrix(c(12, 23, 32, 33, 45, 43), nrow = 3, ncol = 2, byrow = TRUE)
b

# array() with a two-element dim vector also yields a matrix.
# The variable is called c, like the function; calls such as c(1, 2) still
# work because R looks for a function when a name is used in a call.
c <- array(c(12, 23, 32, 33, 45, 43), dim = c(3, 2))
c

# A single value is recycled to fill the whole matrix
a <- matrix(10, nrow = 3, ncol = 2)
a

# Matrix properties
b <- matrix(c(12, 23, 32, 33, 45, 43), nrow = 3, ncol = 2, byrow = TRUE)
b

dim(b)

nrow(b)

ncol(b)

str(b)

summary(b)

# Merging matrices
a <- matrix(c(12, 23, 32, 33), nrow = 2, ncol = 2)
b <- matrix(c(22, 26, 37, 43), nrow = 2, ncol = 2)

# Side by side
c <- cbind(a, b)
c

# Stacked on top of each other
d <- rbind(a, b)
d

# Indexing & slicing matrices

a <- matrix(c(12, 23, 32, 33, 45, 43, 34, 55, 56), nrow = 3, ncol = 3)
a

# [row, column]; leaving one side empty selects everything on that side
a[1, 3]

a[1, ]

a[, 2]

a[c(1, 3), 2]

a[, 2:3]

# A logical matrix, and the values it selects (returned as a vector)
a > 40

a[a > 40]

# Matrix operations
a <- matrix(c(12, 23, 32, 33), nrow = 2, ncol = 2)
b <- matrix(c(22, 26, 37, 43), nrow = 2, ncol = 2)
c <- matrix(c(12, 23, 32, 33, 45, 43, 34, 55, 56), nrow = 3, ncol = 3)

b

# Element-wise arithmetic
a + b

a - b

a * b

a / b

# Matrix product
a %*% b

# Transpose, determinant, inverse and main diagonal
t(c)

det(c)

solve(c)

diag(c)

# Lists
# Creating a list: the items may have different types and sizes
a <- c(12, 22, 23, 34)
b <- c("Cat", "Dog")
c <- 100
d <- "Man"
m <- matrix(c(12, 22, 23, 34, 45, 32), nrow = 3, ncol = 2)

L <- list(a, b, c, d, m)
L

# Each item of the list can be given a name

names(L) <- c("Part1", "Part2", "Part3", "Part4", "Part5")
L

# Accessing items, and elements inside items

# The first item, by position and by name
L[[1]]

L$Part1

# The second element of the first item
L[[1]][2]

# Adding an item: assign to a name that does not exist yet

L$Part6 <- "Cow"
L

# Removing an item: assign NULL to it

L$Part3 <- NULL
L

# Convert a list into a vector (everything is flattened and coerced to a
# common type)
v1 <- unlist(L)
v1

# Merge lists
L1 <- list("Man", c(12, 22, 23), TRUE)
L2 <- list(matrix(1:20, nrow = 4, ncol = 5), c("Cat", "Dog"))

L3 <- c(L1, L2)
L3

# Splitting a list
a <- c(12, 22, 23, 34)
b <- c("Cat", "Dog")
c <- 100
d <- "Man"
m <- matrix(c(12, 22, 23, 34, 45, 32), nrow = 3, ncol = 2)

L <- list(a, b, c, d, m)
L

# Single brackets keep the result a list
L1 <- L[1:2]
L2 <- L[3:5]
L1

# Factors
# Unordered factors
g <- c("Male", "Female", "Male", "Male", "Male", "Female")
g

fg <- factor(g)
fg

# Ordered factors
# Every string must sit on one line: a literal broken across lines contains a
# newline, matches none of the levels below and silently becomes NA.
h <- c(
  "first", "first", "fifth", "fourth", "second",
  "fifth", "third", "second", "fourth"
)
h

# Without explicit levels the levels are sorted alphabetically
fh <- factor(h)
fh

# levels fixes the order of the categories; ordered = TRUE is what makes the
# factor ordered, so that comparisons such as ofh < "third" are meaningful.
ofh <- factor(
  h,
  levels = c("first", "second", "third", "fourth", "fifth"),
  ordered = TRUE
)
ofh
# Data Frames
# Every string must sit on one line: a literal broken across lines would
# store a newline inside the name.
name <- c(
  "Kane", "Jane", "David", "Harry", "Larry", "Mary",
  "John", "Jessy", "Anne", "Lilly", "Julia", "Pale"
)
age <- c(23, 33, 34, 32, 21, 22, 23, 34, 32, 18, 21, 23)
marks <- c(89, 78, 88, 59, 67, 78, 88, 90, 59, 75, 77, 69)

# stringsAsFactors = FALSE keeps name as character on every R version, so a
# new name can be assigned below (it is already the default from R 4.0.0).
df <- data.frame(name, age, marks, stringsAsFactors = FALSE)
df

# Accessing columns in a data frame

df["name"] # Single brackets return a one-column data frame

df["age"]

df$name # $ returns the column itself as a vector

# attach() puts df on the search path so its columns can be referred to by
# bare name. Vectors called name, age and marks already exist in the global
# environment, which is searched first, so the bare names below resolve to
# those vectors and attach() reports them as masked. with(df, ...) avoids
# this ambiguity.
attach(df)

name

age

marks

detach(df) # Remove df from the search path again

# Selecting several columns

df[c("name", "age")]

# Accessing the elements in a data frame

df[1, 1] # First row, first column

df[1, "age"] # First row, age value

df[c(1, 5), "age"] # First and fifth rows, age value

df[2, ] # All values in the 2nd row

df[, 3] # All values in the 3rd column

df[, -3] # All columns except the 3rd

df[2:6, 2] # 2nd to 6th row of the 2nd column

df$name[1:5] # 1st to 5th name in the name column

# Change elements in a data frame

df[1, 1] <- "Sammie"
df
df[2:6, 2] <- rep(50, 5)
df

# Adding a new column

df$class <- c(
  "C1", "C2", "C3", "C4", "C5", "C6",
  "C1", "C2", "C3", "C4", "C5", "C6"
)
df

# Removing an existing column

df$age <- NULL
df

# Basic column operations

df$marks_new <- df$marks + 5
df

df$marks_diff <- df$marks_new - df$marks
df

# Checking conditions
df$marks >= 70 # TRUE for marks of 70 or more

# Boolean masking for data frames: keep the rows where the mask is TRUE

df_new <- df[df$marks >= 70, ]
df_new

# Data frame functions

# View() opens a spreadsheet-style viewer window, so it is only called when
# R is running interactively.
if (interactive()) {
  View(df)
}

head(df) # First rows (6 by default)

head(x = df, n = 8)

tail(df) # Last rows (6 by default)

tail(x = df, n = 8)

dim(df) # Dimensions: rows, columns

nrow(df)

ncol(df)

# Row and column names

row.names(df)

colnames(df)

# Each name must sit on one line: a literal broken across lines would put a
# newline inside the column name.
colnames(df) <- c(
  "Student_Name", "Previous_Marks", "Class", "New_Marks", "Marks_Difference"
)
df

# Column and row sums

colSums(df[c("Previous_Marks", "New_Marks")])
rowSums(df[c("Previous_Marks", "New_Marks")])

# Column and row means

colMeans(df[c("Previous_Marks", "New_Marks")])

rowMeans(df[c("Previous_Marks", "New_Marks")])

# edit() can be used for editing a data frame manually. It opens an editor
# window and returns the edited copy, so it too needs an interactive session.

if (interactive()) {
  df1 <- edit(df)
  print(df1)
}

# str() shows the data type of every column
str(df)

# summary() gives a per-column summary of the data frame

summary(df)

# which() returns the row indexes that satisfy a condition
which(df$Previous_Marks >= 70)

# table() gives the frequencies of a categorical column

table(df$Class)

# Factorize the categorical columns

# Numbers and strings must not be split across lines: "2" followed by "1" on
# the next line is a syntax error, not the value 21.
df <- data.frame(
  Name = c("Sam", "Kane", "Jane"),
  Gender = c("M", "M", "F"),
  Age = c(23, 32, 21),
  University_Year = c(2, 3, 1)
)
df

# Before the conversion University_Year is summarised as a number
str(df)

summary(df)

# Turn the categorical columns into factors; levels fixes the order of the
# university years
df$Gender <- factor(df$Gender)
df$University_Year <- factor(df$University_Year, levels = c(1, 2, 3))

# After the conversion the summary shows counts per category
str(df)

summary(df)

# Working with external data sets

# CSV files
# Importing CSV files

# Folder holding the workshop data sets. It is built once with file.path()
# so the long path is never broken across lines: a line break inside a
# quoted path becomes part of the path and the file is not found.
# Adjust this to the location of the data sets on your machine.
data_dir <- file.path(
  "D:", "Workshops", "R Programming for Data Science Workshop",
  "Part 01 - Fundamentals of R Programming", "Datasets"
)

# Option 1: read the file through its full path
data <- read.csv(file.path(data_dir, "default.CSV"))

# Option 2: make the folder the working directory, then use the file name
getwd()

setwd(data_dir)
data <- read.csv("default.CSV")
data

# Now we can treat this as a data frame
head(data)

dim(data)

colnames(data)

str(data)

table(data$Loan.Offered)

table(data$Own.house)

# Convert all categorical columns to factors in one step
categorical_cols <- c(
  "Gender", "Loan.Offered", "Job", "Status",
  "Credit.History", "Own.house", "Purpose"
)
data[categorical_cols] <- lapply(data[categorical_cols], factor)

str(data)

head(data)

summary(data)

# We can perform any data frame operation

# Row filters; the last two lines are two ways of writing a similar filter
data_male <- data[data$Gender == "Male", ]
data_female <- data[data$Gender == "Female", ]
data_female <- data[!data$Gender == "Male", ]

summary(data_female)

data_female$CS_Ex_Ratio <- data_female$Credit.Score / data_female$Work.Exp
head(data_female)

summary(data_male)

data_male$Exp_Level <- "Low"
head(data_male)

# Index the column, not a row subset of the data frame: this form also works
# when no row matches or when Work.Exp contains missing values.
data_male$Exp_Level[which(data_male$Work.Exp >= 15)] <- "High"
head(data_male)

# Data simulation
# No seed is set here, so every run draws different values.

# Standard normal distribution (mean 0, standard deviation 1)
datanorm <- rnorm(100)
datanorm

# Normal distribution with mean 20 and standard deviation 5
datanorm2 <- rnorm(n = 100, mean = 20, sd = 5)

datanorm2

# Uniform distribution on the interval from 10 to 20
datauni <- runif(n = 100, min = 10, max = 20)
datauni

# Poisson distribution with rate 5
datapois <- rpois(n = 100, lambda = 5)
datapois

# Binomial distribution with a single trial per draw, i.e. 0/1 outcomes
databin <- rbinom(n = 100, size = 1, prob = 0.5)

databin

# Further generators: rnbinom(), rgamma(), rhyper(), rbeta()

R File Code
No ratings yet
R File Code
16 pages
Data Science
No ratings yet
Data Science
20 pages
R - Tutorial: Matrices Are Vectors
No ratings yet
R - Tutorial: Matrices Are Vectors
13 pages
R Programming Basics for Beginners
No ratings yet
R Programming Basics for Beginners
2 pages
DMPA Codes
No ratings yet
DMPA Codes
16 pages
R Machine Learning Lab Guide
0% (1)
R Machine Learning Lab Guide
9 pages
Base R
No ratings yet
Base R
9 pages
Kiran R1
No ratings yet
Kiran R1
12 pages
Module 2.9
No ratings yet
Module 2.9
12 pages
Programming Foundation
No ratings yet
Programming Foundation
14 pages
R Commands
No ratings yet
R Commands
18 pages
R Basics for Beginners
No ratings yet
R Basics for Beginners
24 pages
An Introduction To R Language
No ratings yet
An Introduction To R Language
11 pages
R Studio
No ratings yet
R Studio
8 pages
R Study Material I
No ratings yet
R Study Material I
8 pages
Experiment 5
No ratings yet
Experiment 5
13 pages
R Programmimg Practical Journal All-1
No ratings yet
R Programmimg Practical Journal All-1
25 pages
Practical 1 - Basics of R
No ratings yet
Practical 1 - Basics of R
8 pages
Arunav Da Prac
No ratings yet
Arunav Da Prac
55 pages
Matrix, Dataframes, List
No ratings yet
Matrix, Dataframes, List
8 pages
Essential R Commands Guide
No ratings yet
Essential R Commands Guide
11 pages
Lecture 5 (Managing and Understanding Data)
No ratings yet
Lecture 5 (Managing and Understanding Data)
9 pages
SCIBD
No ratings yet
SCIBD
3 pages
R Programming Materials
No ratings yet
R Programming Materials
51 pages
Ba Ca4
No ratings yet
Ba Ca4
3 pages
R-Script 2
No ratings yet
R-Script 2
10 pages
R-Programming Record - Odd Sem 21-22
No ratings yet
R-Programming Record - Odd Sem 21-22
35 pages
All Codes
No ratings yet
All Codes
10 pages
Day 2
No ratings yet
Day 2
5 pages
Stastistics and Probability With R Programming Language: Lab Report
50% (2)
Stastistics and Probability With R Programming Language: Lab Report
44 pages
A Short List of Some Useful R Commands: Input and Display
No ratings yet
A Short List of Some Useful R Commands: Input and Display
2 pages
MLlab 5 TH
No ratings yet
MLlab 5 TH
17 pages
Applied Statistics MAT1011
No ratings yet
Applied Statistics MAT1011
22 pages
6 Working With Data Frames in R
No ratings yet
6 Working With Data Frames in R
8 pages
Unit - 3 Learning Notes
No ratings yet
Unit - 3 Learning Notes
8 pages
Practical 2 Kunal
No ratings yet
Practical 2 Kunal
6 pages
R Programming: © 2016 SMART Training Resources Pvt. LTD
No ratings yet
R Programming: © 2016 SMART Training Resources Pvt. LTD
28 pages
R Assignment
No ratings yet
R Assignment
9 pages
R Guru Cheat Sheet
No ratings yet
R Guru Cheat Sheet
2 pages
Model 1
No ratings yet
Model 1
14 pages
My R Report
No ratings yet
My R Report
52 pages
18 3 24 Upto Week 6 A B Latest 1
No ratings yet
18 3 24 Upto Week 6 A B Latest 1
25 pages
R Programing
No ratings yet
R Programing
32 pages
Dar Lecture 7
No ratings yet
Dar Lecture 7
24 pages
Network Analysis and Visualization With R and Igraph
No ratings yet
Network Analysis and Visualization With R and Igraph
62 pages
FE418 RLectureNotes1
No ratings yet
FE418 RLectureNotes1
15 pages
Assignment
No ratings yet
Assignment
4 pages
R Exam
No ratings yet
R Exam
18 pages
Simple Tutorial in R
No ratings yet
Simple Tutorial in R
15 pages
Experiment No 8
No ratings yet
Experiment No 8
11 pages
R Lecture 2-1
No ratings yet
R Lecture 2-1
28 pages
M2 Dar
No ratings yet
M2 Dar
46 pages
R Program
No ratings yet
R Program
22 pages
R Programming Essentials
No ratings yet
R Programming Essentials
27 pages
Teaching R
No ratings yet
Teaching R
15 pages
Dsda Manual
No ratings yet
Dsda Manual
64 pages
R Programming-Chapiter 4
No ratings yet
R Programming-Chapiter 4
16 pages
A Short List of The Most Useful R Commands
No ratings yet
A Short List of The Most Useful R Commands
8 pages
BIO259 Note
No ratings yet
BIO259 Note
55 pages
UG ComputerScience NEP
No ratings yet
UG ComputerScience NEP
48 pages
DSA Lecture 1
No ratings yet
DSA Lecture 1
16 pages
Array List - LAB1
No ratings yet
Array List - LAB1
20 pages
Data Structures and Algorithms With Python 100 Coding Q A Code of Code by Cakal Yasin 1
100% (2)
Data Structures and Algorithms With Python 100 Coding Q A Code of Code by Cakal Yasin 1
327 pages
RAG and Vector Database Guide
No ratings yet
RAG and Vector Database Guide
18 pages
DSU Important Questios
No ratings yet
DSU Important Questios
4 pages
Unit 5 IRS
No ratings yet
Unit 5 IRS
17 pages
Dsa Index
No ratings yet
Dsa Index
2 pages
A Novel Hybrid Quicksort Algorithm Vectorized Using AVX-512 On Intel Skylake (1704.08579)
No ratings yet
A Novel Hybrid Quicksort Algorithm Vectorized Using AVX-512 On Intel Skylake (1704.08579)
9 pages
MATLAB For Engineers 6th Edition Holly Moore - The Ebook Is Ready For Download With Just One Simple Click
83% (6)
MATLAB For Engineers 6th Edition Holly Moore - The Ebook Is Ready For Download With Just One Simple Click
65 pages
11-20 Programs Data Science and Computer Vision
No ratings yet
11-20 Programs Data Science and Computer Vision
8 pages
DS in 7 Hours
No ratings yet
DS in 7 Hours
346 pages
CSE215 Chapter 8 Multi-dim-Arrays
No ratings yet
CSE215 Chapter 8 Multi-dim-Arrays
26 pages
DSA Learning Roadmap C++
No ratings yet
DSA Learning Roadmap C++
3 pages
Cse IV Bcs403 Pue
No ratings yet
Cse IV Bcs403 Pue
3 pages
IIT M ES FOUNDATION FN EXAM FEF1 24 Dec 2023
No ratings yet
IIT M ES FOUNDATION FN EXAM FEF1 24 Dec 2023
89 pages
Python Data Visualization Guide
No ratings yet
Python Data Visualization Guide
55 pages
ML Unit 2
No ratings yet
ML Unit 2
25 pages
Instant Ebooks Textbook Beginning C++23 7th Edition Ivor Horton Download All Chapters
100% (3)
Instant Ebooks Textbook Beginning C++23 7th Edition Ivor Horton Download All Chapters
76 pages
B.Tech ECE - R23
No ratings yet
B.Tech ECE - R23
96 pages
Advance Notice June July 2025 16052025
No ratings yet
Advance Notice June July 2025 16052025
27 pages
Unit 2 - Array - Function - String
No ratings yet
Unit 2 - Array - Function - String
44 pages
REVISION 9 Arrays and Functions
No ratings yet
REVISION 9 Arrays and Functions
8 pages
2.enquiry Routines-R17
No ratings yet
2.enquiry Routines-R17
27 pages
Advanced Python & Data Science Programs
No ratings yet
Advanced Python & Data Science Programs
16 pages
BSIT Data Structures Syllabus
No ratings yet
BSIT Data Structures Syllabus
8 pages
II CSM B DS Unit-1
No ratings yet
II CSM B DS Unit-1
31 pages
Previous PPS EXTERNAL PAPERS
No ratings yet
Previous PPS EXTERNAL PAPERS
11 pages
B.Tech CSE & AIML Syllabus 2023
No ratings yet
B.Tech CSE & AIML Syllabus 2023
35 pages
Class Template Array
No ratings yet
Class Template Array
14 pages

Lab 02 - Compound Data Structures

Uploaded by

Lab 02 - Compound Data Structures

Uploaded by

Fundamentals-02 Compound Data Structures

Created by H. M. Samadhi Chathuranga Rathnayake

#Other ways of creating vectors

#Indexing & slicing vector elements

a[-c(1,3,6)] #All other elements except these indexes

a[c(T,T,T,F,T,T,F)] #Boolean masking

#Element wise operations in numerical vectors

a%in%b #This is the membership

#Element wise operations with the recycling property in vectors

#Vector properties with functions

#Basic summary functions

#Vector operations with functions

d=append(x = a,values = 200,after = 2)

k=append(x = a,values = c(100,200,300),after = 2)

h=c(a,100,200,300) #This another way of appending

#Indexing & slicing matrices

#A name can be given for each segment of the list

#Accessing items and elements in items inside the list

L[[1]][2] #Accessing elements inside the items

#Adding elements to a list

#Removing elements from a list

#Accessing columns in a data frame

df$name #This is giving the output as a vector

attach(df) #This will make these columns as global variables

detach(df) #Make them again local variables

#Selecting several columns

#Accessing the elements in a data frame

df[1,1] #First column first element

df[1,"age"] #First row age value

df[c(1,5),"age"] #First and fifth rows age value

df[2,] #All values in the 2nd row

df[,3] #All values in the 3rd column

df[,-3] #All values except 3rd column

df[2:6,2] #2nd to 6th row of 2nd column

df$name[1:5] #1st to 5th name in name column

#Change elements in a data frame

#Adding a new column

#Removing an existing column

#Basic column operations

#Boolean masking for data frames

#Data frame functions

head(df) #Top elements

tail(df) #Bottom elements

#Row and column names

#Column and row sums

#Column and row means

#edit function can be used for editing a data frame manually

#summary function will give a summary about the data frame

#table function will give frequencies in a categorical column

#Factorize the categorical columns

#Working with external data sets

setwd("D:\\Workshops\\R Programming for Data Science Workshop\\Part 01 -

#We can perform any data frame operation

datanorm2=rnorm(n = 100,mean = 20,sd = 5) #Standard normal distribution

databin=rbinom(n = 100,size = 1, prob = 0.5)

You might also like