Professional Documents
Culture Documents
MBA SectionD MBA20235 PranayGupta Assignment R
MBA SectionD MBA20235 PranayGupta Assignment R
Problem 1
a)
> 27*(38-17)
[1] 567
b)
> 14^7
[1] 105413504
c)
> sqrt(436/12)
[1] 6.027714
Problem 2
> a <- seq(5, 160, by=5) -(a sequence of numbers from 5 to 160 with an interval of 5)
>a
>b
[1] 87 86 85 84 83 82 81 80 79 78 77 76 75 74 73 72 71 70 69 68 67 66 65 64 63 62 61 60 59 58 57 56
> d= a*b
>d
[1] 435 860 1275 1680 2075 2460 2835 3200 3555 3900 4235 4560 4875 5180 5475 5760 6035 6300
6555 6800 7035 7260 7475 7680 7875 8060 8235 8400 8555 8700 8835 8960
a)
> d[19:21]
[1] 6555 6800 7035
b)
> d[d<2000]
[1] 435 860 1275 1680
Problem 3
a)
> sum(d)
[1] 175120
b)
> median(d)
[1] 5897.5
c)
> sd(d)
[1] 2608.563
Problem 4
a)
> student<- c("Pranay","Ankita","Himanshu","Harshit","Srishti","Nitesh","Ajay","Nisha","Anshul","Kamya")
b)
> age<-c(22,25,23,21,25,22,26,24,23,24)
c)
> student
[1] "Pranay" "Ankita" "Himanshu" "Harshit" "Srishti" "Nitesh" "Ajay" "Nisha" "Anshul" "Kamya"
> age
[1] 22 25 23 21 25 22 26 24 23 24
d)
> student[x]
e)
> rbind(student,age)
[,1] [,2] [,3] [,4] [,5] [,6] [,7] [,8] [,9] [,10]
student "Pranay" "Ankita" "Himanshu" "Harshit" "Srishti" "Nitesh" "Ajay" "Nisha" "Anshul" "Kamya"
age "22" "25" "23" "21" "25" "22" "26" "24" "23" "24"
f)
> subject<-c("WCTB","OB","FA","FM","ME","BS","IS","OB","ME","WOC")
> rbind(student,age,subject)
[,1] [,2] [,3] [,4] [,5] [,6] [,7] [,8] [,9] [,10]
student "Pranay" "Ankita" "Himanshu" "Harshit" "Srishti" "Nitesh" "Ajay" "Nisha" "Anshul" "Kamya"
age "22" "25" "23" "21" "25" "22" "26" "24" "23" "24"
subject "WCTB" "OB" "FA" "FM" "ME" "BS" "IS" "OB" "ME" "WOC"
g)
> student<-append(student,"Ankur")
> age<-append(age,26)
> subject<-append(subject,"WCTB")
> rbind(student,age,subject)
[,1] [,2] [,3] [,4] [,5] [,6] [,7] [,8] [,9] [,10] [,11]
student "Pranay" "Ankita" "Himanshu" "Harshit" "Srishti" "Nitesh" "Ajay" "Nisha" "Anshul" "Kamya" "Ankur"
age "22" "25" "23" "21" "25" "22" "26" "24" "23" "24" "26"
subject "WCTB" "OB" "FA" "FM" "ME" "BS" "IS" "OB" "ME" "WOC" "WCTB"
Problem 5
> vec
[[1]]
[1] 1
[[2]]
[1] 2
[[3]]
[1] 3
[[4]]
[1] 4
> char_vec
[[1]]
[1] "Hadoop"
[[2]]
[1] "Spark"
[[3]]
[1] "Flink"
[[4]]
[1] "Mahout"
> logic_vec
[[1]]
[1] TRUE
[[2]]
[1] FALSE
[[3]]
[1] TRUE
[[4]]
[1] FALSE
> char_vec[3]
[[1]]
[1] "Flink"
> fulllist<-list(vec,char_vec,logic_vec) -(a list of lists is created with the name “fulllist”)
> fulllist
[[1]]
[[1]][[1]]
[1] 1
[[1]][[2]]
[1] 2
[[1]][[3]]
[1] 3
[[1]][[4]]
[1] 4
[[2]]
[[2]][[1]]
[1] "Hadoop"
[[2]][[2]]
[1] "Spark"
[[2]][[3]]
[1] "Flink"
[[2]][[4]]
[1] "Mahout"
[[3]]
[[3]][[1]]
[1] TRUE
[[3]][[2]]
[1] FALSE
[[3]][[3]]
[1] TRUE
[[3]][[4]]
[1] FALSE
Problem 6
> getwd()
[1] "C:/Users/pranay/Downloads/WHO"
> str(WHO1) -(str() displays the structure of the data: the data type and the first few observations of every variable)
$ iso2 : chr "AF" "AF" "AF" "AF" ... -(chr: character data)
$ year : int 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 ...
$ e_inc_100k : num 190 189 189 189 189 189 189 189 189 189 ... -(num: numeric data)
$ e_inc_100k_lo : num 123 123 122 122 122 122 122 122 122 123 ...
$ e_inc_100k_hi : num 271 271 270 270 270 270 270 270 270 270 ...
$ e_inc_num : int 39000 41000 43000 45000 47000 48000 50000 51000 52000 54000 ...
$ e_inc_num_lo : int 26000 26000 28000 29000 30000 31000 32000 33000 34000 35000 ...
$ e_inc_num_hi : int 56000 58000 61000 64000 67000 69000 71000 73000 75000 77000 ...
$ e_tbhiv_prct : num 0.32 0.34 0.21 0.26 0.28 0.31 0.32 0.4 0.39 0.41 ...
$ e_tbhiv_prct_lo : num 0.11 0.12 0.08 0.1 0.11 0.12 0.13 0.17 0.17 0.19 ...
$ e_tbhiv_prct_hi : num 0.65 0.68 0.42 0.5 0.53 0.57 0.59 0.72 0.68 0.72 ...
$ e_inc_tbhiv_100k : num 0.61 0.65 0.41 0.49 0.53 0.58 0.61 0.75 0.73 0.78 ...
$ e_inc_tbhiv_100k_lo : num 0.17 0.19 0.12 0.16 0.18 0.2 0.21 0.28 0.28 0.3 ...
$ e_inc_tbhiv_100k_hi : num 1.3 1.4 0.86 1 1.1 1.2 1.2 1.5 1.4 1.5 ...
$ e_inc_tbhiv_num : int 130 140 92 120 130 150 160 200 200 220 ...
$ e_inc_tbhiv_num_hi : int 270 300 190 240 270 300 320 400 390 420 ...
$ e_mort_exc_tbhiv_num : int 14000 13000 13000 14000 13000 12000 11000 10000 11000 13000 ...
$ e_mort_exc_tbhiv_num_lo : int 8100 7800 7500 7900 7400 7100 6600 6200 6600 7400 ...
$ e_mort_exc_tbhiv_num_hi : int 22000 21000 20000 21000 19000 18000 17000 16000 17000 19000 ...
$ e_mort_tbhiv_100k : num 0.4 0.4 0.23 0.28 0.27 0.27 0.26 0.3 0.3 0.35 ...
$ e_mort_tbhiv_100k_lo : num 0.11 0.11 0.07 0.09 0.09 0.09 0.09 0.11 0.11 0.13 ...
$ e_mort_tbhiv_100k_hi : num 0.87 0.85 0.48 0.58 0.55 0.55 0.52 0.58 0.58 0.66 ...
$ e_mort_tbhiv_num_hi : int 180 180 110 140 140 140 140 160 160 190 ...
$ e_mort_num : int 14000 14000 13000 14000 13000 12000 11000 11000 11000 13000 ...
$ e_mort_num_lo : int 8200 7900 7500 8000 7500 7100 6700 6300 6700 7500 ...
$ e_mort_num_hi : int 22000 21000 20000 21000 19000 18000 17000 16000 17000 19000 ...
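> summary(WHO1) -(summary function: for each numeric variable it reports the minimum, 1st quartile, median, mean, 3rd quartile and maximum, plus the number of NA values; it does not report the mode)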
Mean :430.6
3rd Qu.:643.0
Max. :894.0
1st Qu.: 11.0 1st Qu.: 15.0 1st Qu.: 220 1st Qu.: 160
3rd Qu.:116.0 3rd Qu.: 221.0 3rd Qu.: 17000 3rd Qu.: 12000
1st Qu.: 280 1st Qu.: 1.20 1st Qu.: 0.460 1st Qu.: 2.80
3rd Qu.: 22000 3rd Qu.: 17.00 3rd Qu.:10.000 3rd Qu.: 26.00
1st Qu.: 0.29 1st Qu.: 0.11 1st Qu.: 0.71 1st Qu.: 16.2
Median : 2.10 Median : 0.92 Median : 3.90 Median : 210.0
3rd Qu.: 13.00 3rd Qu.: 6.50 3rd Qu.: 24.00 3rd Qu.: 1800.0
1st Qu.: 0.000 1st Qu.: 0.05 1st Qu.: 0 1st Qu.: 0
3rd Qu.: 1.000 3rd Qu.: 4.40 3rd Qu.: 330 3rd Qu.: 130
1st Qu.: 1 1st Qu.: 1.10 1st Qu.: 0.87 1st Qu.: 1.30
3rd Qu.: 580 3rd Qu.: 24.00 3rd Qu.: 17.00 3rd Qu.: 32.00
1st Qu.: 19 1st Qu.: 16 1st Qu.: 22 1st Qu.:0.070 1st Qu.:0.05
Median : 300 Median : 250 Median : 340 Median :0.100 Median :0.07
Mean : 9303 Mean : 7050 Mean : 11985 Mean :0.138 Mean :0.09
3rd Qu.: 2800 3rd Qu.: 1900 3rd Qu.: 3700 3rd Qu.:0.170 3rd Qu.:0.11
Max. :735000 Max. :622000 Max. :875000 Max. :0.740 Max. :0.61
1st Qu.:0.080 1st Qu.: 7.00 1st Qu.: 5.000 1st Qu.: 8.00 1st Qu.: 11
3rd Qu.:0.250 3rd Qu.:17.00 3rd Qu.:11.000 3rd Qu.:25.00 3rd Qu.: 97
Max. :0.940 Max. :74.00 Max. :61.000 Max. :94.00 Max. :949
NA's :3824 NA's :3824 NA's :3824 NA's :3824 NA's :150
-(The plot suggests a roughly direct (positive) relationship between the number of incident cases
and the mortality rate, barring a few exceptions.)
Problem 7
a)
> str(x)
$ Marks : num 35 75 45 30 85
> print(x)
1 Ron 35 Fail
2 Jake 75 Pass
3 Ava 45 Fail
4 Sophia 30 Fail
5 Mia 85 Pass
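b) “mymat” is a matrix whose numbers of rows and columns are set by the “nrow” and “ncol”
arguments. “i” is the row index and “j” is the column index. “dim(mymat)” returns the dimensions of
the matrix, so “dim(mymat)[2]” is its number of columns. Each cell [i, j] is assigned i*j, which
produces the multiplication table shown below.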
+ for(j in 1:dim(mymat)[2]) {
+ mymat[i,j] = i*j}}
[,1] [,2] [,3] [,4] [,5] [,6] [,7] [,8] [,9] [,10]
[1,] 1 2 3 4 5 6 7 8 9 10
[2,] 2 4 6 8 10 12 14 16 18 20
[3,] 3 6 9 12 15 18 21 24 27 30
[4,] 4 8 12 16 20 24 28 32 36 40
[5,] 5 10 15 20 25 30 35 40 45 50
[6,] 6 12 18 24 30 36 42 48 54 60
[7,] 7 14 21 28 35 42 49 56 63 70
[8,] 8 16 24 32 40 48 56 64 72 80
[9,] 9 18 27 36 45 54 63 72 81 90
[10,] 10 20 30 40 50 60 70 80 90 100