19 min to read
R in One Post
Learn R For Free
Getting Started
This tutorial is designed for the beginner who has some computer programming experience. Remember rule number one in programming:
Don't Panic
Download RStudio here: https://www.rstudio.com/products/rstudio/download/
Storing Values
Types of variables
integer <- 1
double <- 5.0
character <- "A"
string <- "ABCDEFGHIJKLMNOQRSTUVWXYZ"
boolean <- TRUE
data <- list(12,3.14,"Henry","Bernreuter")
data_1 <- list(dozen = 12, pi = 3.14, user = "henry", happy = TRUE )
print(double)
[1] 5
print(integer)
[1] 1
print(character)
[1] "A"
print(string)
[1] "ABCDEFGHIJKLMNOQRSTUVWXYZ"
print(data)
[[1]]
[1] 12
[[2]]
[1] 3.14
[[3]]
[1] "Henry"
[[4]]
[1] "Bernreuter"
print(data_1)
$`dozen`
[1] 12
$pi
[1] 3.14
$user
[1] "henry"
$happy
[1] TRUE
data_1$user
[1] "henry"
vector_months <- c("Jan","Feb","Mar","Apr")
vector_months[1]
[1] "Jan"
Performing operations
#Addition
2+2
[1] 4
#Subtraction
2-2
[1] 0
#Division
2/2
[1] 1
#Multiplication
2*2
[1] 4
#Exponent
3^2
[1] 9
#Modulus
22%%7
[1] 1
Testing Conditions
#Equaliy: 0 equals 0
0 == 0
[1] TRUE
#InEquality: 1 does not equal 0
1 != 0
[1] TRUE
#Greater Than: 1 is greater than 0
1 > 0
[1] TRUE
#Less Than: 0 is less than 1
0 < 1
[1] TRUE
#Less Than or Equal to: 0 is less than or equal to 1
0 <= 1
[1] TRUE
#Logical NOT: NOT TRUE equals FALSE
!TRUE
[1] FALSE
#Logical AND: TRUE and TRUE equals TRUE
TRUE && TRUE
[1] TRUE
#Logical OR: TRUE OR FALSE equals TRUE
TRUE || TRUE
[1] TRUE
Employing Functions
R has many built-in functions. You have already seen the print() function.
name = "Henry Bernreuter"
print(name)
[1] "Henry Bernreuter"
#Absolute Value
abs(-1)
[1] 1
#Square Root
sqrt(2)
[1] 1.414214
#Integer rounded up
ceiling(4.4)
[1] 5
#Integer rounded down
floor(4.6)
[1] 4
#Truncated
trunc(22/7)
[1] 3
#Round X to N decimal places
round(22/7, digits = 3 )
[1] 3.143
#Round X to N significant digits
signif(22/7, digits = 7)
[1] 3.142857
#Trigonometry
#cosign
cos(0)
[1] 1
#sin
sin(0)
[1] 0
#tangent
tan(0)
[1] 0
#arccos
acos(0)
[1] 1.570796
#arcsin
asin(0)
[1] 0
#arctan
atan(0)
[1] 0
#logarithm
log(10)
[1] 2.302585
#exponent
exp(0)
[1] 1
#String Functions
substr(string,0,25)
[1] "ABCDEFGHIJKLMNOQRSTUVWXYZ"
substr(string,0,3)
[1] "ABC"
#Make a string all uppercase
toupper(string)
[1] "ABCDEFGHIJKLMNOQRSTUVWXYZ"
#make a sting all lower
tolower(string)
[1] "abcdefghijklmnoqrstuvwxyz"
#substute one character for another in a string
sub('ABC','123',string)
[1] "123DEFGHIJKLMNOQRSTUVWXYZ"
#current date and time of computer
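# %e = day of month, space-padded (1-31) %d = day of month (01-31)
# %a = abbreviated day name %A = full day name
# %b = abbreviated month name %B = full month name
# %H = hour number (00-23)
# %M = minute number (00-59)
# %y = 2-digit year %Y = 4-digit year %X = time in the locale's format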
format(Sys.time(), "%A %b %d %X %Y")
[1] "Tuesday Jul 23 12:50:05 PM 2019"
#built in constants
print(LETTERS)
[1] "A" "B" "C" "D" "E" "F" "G" "H" "I" "J" "K" "L" "M" "N" "O" "P" "Q" "R" "S" "T" "U" "V" "W" "X" "Y"
[26] "Z"
print(letters)
[1] "a" "b" "c" "d" "e" "f" "g" "h" "i" "j" "k" "l" "m" "n" "o" "p" "q" "r" "s" "t" "u" "v" "w" "x" "y"
[26] "z"
print(month.name)
[1] "January" "February" "March" "April" "May" "June" "July" "August"
[9] "September" "October" "November" "December"
print(month.abb)
[1] "Jan" "Feb" "Mar" "Apr" "May" "Jun" "Jul" "Aug" "Sep" "Oct" "Nov" "Dec"
#Concatenate And Print
#is useful for producing output in user-defined functions.
#It converts its arguments to character vectors
#concatenates them to a single character vector
#appends the given sep function string(s) to each element and then outputs them.
half.year = month.abb[1:6]
cat("Constant", half.year)
Constant Jan Feb Mar Apr May Jun
#create a random number wih runif() function
random = runif(10)
random
[1] 0.8594901 0.2222176 0.6988373 0.7076233 0.8870411 0.2806615 0.3656753 0.7706948 0.6509018 0.4191367
#Creat a sample of number in a range
lottery_numbers = c(1:59)
cat("The winning lottery numbers are:", sample(lottery_numbers,6))
The winning lottery numbers are: 50 1 16 37 57 49
#random normally distrubieted numbers
rnorm(10)
[1] -2.08473016 0.03460206 0.57954210 1.56998413 0.44054716 -0.32980232 0.10264708 0.50898951
[9] -1.20265356 0.53597390
#randome generated numbers with a mean and standard deviation
normalNumbers = rnorm(10, mean = 1,sd = 1)
#To get the mean
mean(normalNumbers)
[1] 0.9155609
#To get the median
median(normalNumbers)
[1] 0.8837336
#To get the standard deviation
sd(normalNumbers)
[1] 0.8256223
#To get the qualtile
quantile(normalNumbers)
0% 25% 50% 75% 100%
-0.03241776 0.14866118 0.88373356 1.64802192 2.12232888
#To get the sum
sum(normalNumbers)
[1] 9.155609
#To get the range
range(normalNumbers)
[1] -0.03241776 2.12232888
#to get the max
max(normalNumbers)
[1] 2.122329
#to get the min
min(normalNumbers)
[1] -0.03241776
#First Plot
plot(1:10,normalNumbers,type = "o")
Create new functions with loops
#For Loops
half.year = month.abb[1:6]
for (month in half.year){
print(paste("The months of the year are", month))
}
[1] "The months of the year are Jan"
[1] "The months of the year are Feb"
[1] "The months of the year are Mar"
[1] "The months of the year are Apr"
[1] "The months of the year are May"
[1] "The months of the year are Jun"
#While loop
i = 1
while (i < 6) {
print(i)
i = i+1
}
[1] 1
[1] 2
[1] 3
[1] 4
[1] 5
#The standard function syntax is
# Function name = function(arg1, arg2, arg3)
#{
# statement to be executed
# return(object)
#}
# Convert a temperature from degrees Fahrenheit to degrees Celsius.
#   degrees: numeric value(s) in degrees Fahrenheit
#   returns: the same value(s) expressed in degrees Celsius
f2c <- function(degrees) {
  # The value of the last expression is what the function returns
  (degrees - 32) * 5 / 9
}
cat("Body Temperature 98.6F =",f2c(98.6), "C")
Body Temperature 98.6F = 37 C
Building matrices
data = seq(1:32)
table = matrix(data, nrow = 4, ncol = 8)
print(table)
[,1] [,2] [,3] [,4] [,5] [,6] [,7] [,8]
[1,] 1 5 9 13 17 21 25 29
[2,] 2 6 10 14 18 22 26 30
[3,] 3 7 11 15 19 23 27 31
[4,] 4 8 12 16 20 24 28 32
#Retrieve a cell value
cat("Cell 4,5 Contains", table[4,5])
Cell 4,5 Contains 20
#Replace the value with another value
table[4,5] = 10
cat("Cell 4,5 now Contains", table[4,5])
Cell 4,5 now Contains 10
#Spiral Matrix using a loop
i <- 1
j <- 1
i.start = 1
j.start <- 1
i.max <- 10
j.max <- 10
run <- 1
map <- matrix("MT",nrow = 10,ncol = 10)
while(i <= i.max & j <= j.max){
while (j <= j.max){
if(map[i,j] == "MT"){ #horizontal to the right
map[i,j] = run
run = run +1
j = j +1
}
}
j = j -1
while (i <= i.max) {
if(map[i,j] != "MT") i = i+1 #next row
else if(map[i,j] == "MT"){ #vertical to the bottom
map[i,j] = run
run = run +1
i = i+1
}
}
i = i -1
while(j <= j.max & j >= j.start){
if(map[i,j] != "MT") j = j-1 #previous column
else if (map[i,j] == "MT"){
map[i,j] = run
run = run +1
j = j -1
}
}
i = i -1
j = j.start #reset
while(i<= i.max & i > i.start){
if(map[i,j] == "MT"){
map[i,j] = run
i = i -1
}
}
i = i +1
j = j +1
i.start = i.start +1
j.start = j.start +1
i.max = i.max -1
j.max = j.max -1
}
map
[,1] [,2] [,3] [,4] [,5] [,6] [,7] [,8] [,9] [,10]
[1,] "1" "2" "3" "4" "5" "6" "7" "8" "9" "10"
[2,] "29" "29" "30" "31" "32" "33" "34" "35" "36" "11"
[3,] "29" "51" "51" "52" "53" "54" "55" "56" "37" "12"
[4,] "29" "51" "67" "67" "68" "69" "70" "57" "38" "13"
[5,] "29" "51" "67" "77" "77" "78" "71" "58" "39" "14"
[6,] "29" "51" "67" "77" "80" "79" "72" "59" "40" "15"
[7,] "29" "51" "67" "76" "75" "74" "73" "60" "41" "16"
[8,] "29" "51" "66" "65" "64" "63" "62" "61" "42" "17"
[9,] "29" "50" "49" "48" "47" "46" "45" "44" "43" "18"
[10,] "28" "27" "26" "25" "24" "23" "22" "21" "20" "19"
Plots
##Plotting matrices
### Make matrix with three vectors
ny = c(3.8,5.5,9.9,15.7,21.5,26.3)
la = c(19.5,19.4,19.7,20.8,21.3,22.7)
fw = c(13.7,15.4,20.0,24.6,28.5,32.7)
### bind all the vectors into a table
table = cbind(ny,la,fw)
### Change the names of the columns
colnames(table) = c("New York","Los Angeles","Fort Worth")
### Change the names of the rows
rownames(table) = month.abb[1:6]
### Check to see what it looks like
table
New York Los Angeles Fort Worth
Jan 3.8 19.5 13.7
Feb 5.5 19.4 15.4
Mar 9.9 19.7 20.0
Apr 15.7 20.8 24.6
May 21.5 21.3 28.5
Jun 26.3 22.7 32.7
###Plot with matplot function
### types : "p" = points "l" eguals lines "b" = both
### pch : eguals type of characters
### col : equals colors
matplot(table, type = "b", pch = 15:17, col = 2:4)
Data Frames
#Use the build in data frame know as mtcars
mtcars
#Extract frame subets
edge = mtcars[c(1,2,3),]
edge
# Retrieve a column from the table (column slice)
my_data1 <- mtcars$mpg
my_data2 <- mtcars[, 1] # retrieve a column by index. Column indices start from 1, not 0.
my_data3 <- mtcars[, c("mpg", "cyl", "hp")] # retrieve multiple columns by names
my_data1
[1] 21.0 21.0 22.8 21.4 18.7 18.1 14.3 24.4 22.8 19.2 17.8 16.4 17.3 15.2 10.4 10.4 14.7 32.4 30.4 33.9
[21] 21.5 15.5 15.2 13.3 19.2 27.3 26.0 30.4 15.8 19.7 15.0 21.4
my_data2
[1] 21.0 21.0 22.8 21.4 18.7 18.1 14.3 24.4 22.8 19.2 17.8 16.4 17.3 15.2 10.4 10.4 14.7 32.4 30.4 33.9
[21] 21.5 15.5 15.2 13.3 19.2 27.3 26.0 30.4 15.8 19.7 15.0 21.4
my_data3
#create new dataframes
newdataMTcars = mtcars[c(1,2,3,4,5,6)]
nextdataMtcars = mtcars[c(7,8,9,10)]
#Statistic Funciton in Dataframes
mean(mtcars$mpg)
[1] 20.09062
median(mtcars$mpg)
[1] 19.2
range(mtcars$mpg)
[1] 10.4 33.9
sd(mtcars$mpg)
[1] 6.026948
More Plots
qqnorm(mtcars$mpg)
qqline(mtcars$mpg)
qqplot(mtcars$mpg, mtcars$hp)
---
title: "R in One Post"
output: html_notebook
---


# Getting Started
This tutorial is designed for the beginner who has some computer programming experience. 
Remember rule number one in programming:

# Don't Panic
Download RStudio here: https://www.rstudio.com/products/rstudio/download/


# Storing Values
Types of variables
```{r}
# Scalar values of R's basic types.
# NOTE: the names integer, double and character shadow base R functions of
# the same name; they are kept because later parts of the tutorial refer to
# these variables.
integer <- 1L   # the L suffix creates a true integer; a bare 1 is a double
double <- 5.0
character <- "A"
# NOTE(review): the alphabet below has 25 letters ("P" is missing) -- confirm
# whether that is intentional.
string <- "ABCDEFGHIJKLMNOQRSTUVWXYZ"
boolean <- TRUE

# A list can hold values of different types; elements may be unnamed ...
data <- list(12, 3.14, "Henry", "Bernreuter")
# ... or named, in which case they can be reached with $name
data_1 <- list(dozen = 12, pi = 3.14, user = "henry", happy = TRUE)

print(double)
print(integer)
print(character)
print(string)
print(data)
print(data_1)
data_1$user

# A vector holds values of a single type; indexing starts at 1
vector_months <- c("Jan", "Feb", "Mar", "Apr")
vector_months[1]

```
# Performing operations
```{r}
# Addition
2 + 2
# Subtraction
2 - 2
# Division
2 / 2
# Multiplication
2 * 2
# Exponentiation
3^2
# Modulus: the remainder left after dividing 22 by 7
22 %% 7

```
# Testing Conditions
```{r}
# Equality: 0 equals 0
0 == 0
# Inequality: 1 does not equal 0
1 != 0
# Greater than: 1 is greater than 0
1 > 0
# Less than: 0 is less than 1
0 < 1
# Less than or equal to: 0 is less than or equal to 1
0 <= 1
# Logical NOT: NOT TRUE equals FALSE
!TRUE
# Logical AND: TRUE and TRUE equals TRUE
TRUE && TRUE
# Logical OR: TRUE or FALSE equals TRUE (only one side needs to be TRUE)
TRUE || FALSE

```
# Employing Functions
R has many built-in functions. You have already seen the `print()` function.
```{r}

name <- "Henry Bernreuter"
print(name)

# Absolute value
abs(-1)

# Square root
sqrt(2)

# Round up to the next whole number
ceiling(4.4)

# Round down to the previous whole number
floor(4.6)

# Truncate: drop the fractional part
trunc(22 / 7)

# Round to a given number of decimal places
round(22 / 7, digits = 3)

# Round to a given number of significant digits
signif(22 / 7, digits = 7)

# Trigonometry (angles are in radians)

# cosine
cos(0)
# sine
sin(0)
# tangent
tan(0)
# arc-cosine
acos(0)
# arc-sine
asin(0)
# arc-tangent
atan(0)
# natural logarithm (base e)
log(10)
# exponential function: e raised to the given power
exp(0)

# String functions
# substr(x, start, stop) extracts the characters from position start to stop.
# Positions are 1-based in R, so the first character is at position 1.
substr(string, 1, 25)
substr(string, 1, 3)

# Make a string all uppercase
toupper(string)
# Make a string all lowercase
tolower(string)

# Replace the first match of a pattern ("ABC") with a replacement ("123")
sub("ABC", "123", string)

# Current date and time of the computer, formatted with these codes:
#   %a = abbreviated day name      %A = full day name
#   %b = abbreviated month name    %B = full month name
#   %d = day of month (01-31)      %e = day of month, space-padded (1-31)
#   %H = hour (00-23)              %M = minute (00-59)
#   %X = time in the locale's format
#   %y = 2-digit year              %Y = 4-digit year
format(Sys.time(), format = "%A %b %d %X %Y")

# Built-in constants: the alphabet in upper and lower case, and the month
# names in full and abbreviated form
print(LETTERS)
print(letters)
print(month.name)
print(month.abb)

# cat(): concatenate and print.
# Useful for producing output in user-defined functions: it converts its
# arguments to character vectors, joins them into a single character vector,
# appends the separator string given by sep to each element, and writes the
# result out.

half.year <- head(month.abb, n = 6)
cat("Constant", half.year)

# Draw 10 random numbers between 0 and 1 with runif()
random <- runif(n = 10)
random

# Draw a random sample of 6 numbers from a range
lottery_numbers <- 1:59
cat("The winning lottery numbers are:", sample(x = lottery_numbers, size = 6))

# Normally distributed random numbers (default mean 0, standard deviation 1)
rnorm(n = 10)

# Normally distributed random numbers with a chosen mean and standard deviation
normalNumbers <- rnorm(n = 10, mean = 1, sd = 1)

# Mean
mean(normalNumbers)

# Median
median(normalNumbers)
# Standard deviation
sd(normalNumbers)
# Quantiles (0%, 25%, 50%, 75%, 100%)
quantile(normalNumbers)
# Sum
sum(normalNumbers)
# Range: smallest and largest value
range(normalNumbers)
# Largest value
max(normalNumbers)
# Smallest value
min(normalNumbers)

# First plot: the ten values against their position, drawn as points joined
# by lines (type = "o")
plot(x = 1:10, y = normalNumbers, type = "o")



```
# Create new functions with loops
```{r}
# for loop: run the body once for each element of a vector
half.year <- head(month.abb, n = 6)
for (month in half.year) {
  print(paste("The months of the year are", month))
}

# while loop: keep running the body for as long as the condition holds
i <- 1
while (i <= 5) {
  print(i)
  i <- i + 1
}
# General shape of a function definition:
#   function_name <- function(arg1, arg2, arg3) {
#     statements to be executed
#     value_to_return
#   }
# The value of the last expression evaluated is what the function returns.

# Convert a temperature from degrees Fahrenheit to degrees Celsius.
#   degrees: numeric value(s) in degrees Fahrenheit
#   returns: the same value(s) expressed in degrees Celsius
f2c <- function(degrees) {
  (degrees - 32) * 5 / 9
}
cat("Body Temperature 98.6F =", f2c(98.6), "C")

```
# Building matrices
```{r}
# Build a 4 x 8 matrix from the numbers 1 to 32; matrix() fills the cells
# column by column.
# NOTE: the names data and table shadow base R functions of the same name.
data <- seq_len(32)
table <- matrix(data, nrow = 4, ncol = 8)
print(table)

# Retrieve a cell value with [row, column]
cat("Cell 4,5 Contains", table[4, 5])

# Replace the value with another value
table[4, 5] <- 10
cat("Cell 4,5 now Contains", table[4, 5])



# Spiral matrix using loops
# Fill a 10 x 10 matrix with the numbers 1 to 100 in a clockwise spiral that
# starts in the top-left cell and winds inwards. "MT" marks a cell that has
# not been filled yet. Because the matrix is created from the string "MT",
# the numbers written into it are stored as character strings.
i <- 1         # current row
j <- 1         # current column
i.start <- 1   # first row of the ring being filled
j.start <- 1   # first column of the ring being filled
i.max <- 10    # last row of the ring being filled
j.max <- 10    # last column of the ring being filled
run <- 1       # next number to write
map <- matrix("MT", nrow = 10, ncol = 10)

# Each pass of the outer loop fills one ring and then shrinks the bounds.
# && is the scalar form of AND intended for loop and if conditions.
while (i <= i.max && j <= j.max) {

  # Top edge: left to right
  while (j <= j.max) {
    if (map[i, j] == "MT") {
      map[i, j] <- run
      run <- run + 1
    }
    j <- j + 1   # always advance so the loop cannot stall on a filled cell
  }

  j <- j - 1     # step back onto the last column of the ring

  # Right edge: top to bottom (the corner cell is already filled and skipped)
  while (i <= i.max) {
    if (map[i, j] == "MT") {
      map[i, j] <- run
      run <- run + 1
    }
    i <- i + 1
  }

  i <- i - 1     # step back onto the last row of the ring

  # Bottom edge: right to left
  while (j <= j.max && j >= j.start) {
    if (map[i, j] == "MT") {
      map[i, j] <- run
      run <- run + 1
    }
    j <- j - 1
  }

  i <- i - 1     # move up off the bottom edge
  j <- j.start   # reset to the first column of the ring

  # Left edge: bottom to top, stopping below the ring's first row
  while (i <= i.max && i > i.start) {
    if (map[i, j] == "MT") {
      map[i, j] <- run
      run <- run + 1   # without this every cell of the edge gets the same number
    }
    i <- i - 1
  }

  # Move to the top-left corner of the next ring and shrink the bounds
  i <- i + 1
  j <- j + 1
  i.start <- i.start + 1
  j.start <- j.start + 1
  i.max <- i.max - 1
  j.max <- j.max - 1

}


map
```
# Plots
```{r}
## Plotting matrices
### Three numeric vectors of six values each, one per city
ny <- c(3.8, 5.5, 9.9, 15.7, 21.5, 26.3)
la <- c(19.5, 19.4, 19.7, 20.8, 21.3, 22.7)
fw <- c(13.7, 15.4, 20.0, 24.6, 28.5, 32.7)
### Bind the vectors side by side into a matrix and name the columns
### NOTE: the name table shadows the base R function table()
table <- cbind("New York" = ny, "Los Angeles" = la, "Fort Worth" = fw)
### Name the rows after the first six months
rownames(table) <- head(month.abb, n = 6)
### Check to see what it looks like
table


### Plot with the matplot() function, which draws one series per column
###   type : "p" = points, "l" = lines, "b" = both
###   pch  : plotting symbol used for each column
###   col  : colour used for each column
matplot(table, type = "b", pch = 15:17, col = 2:4)


```
# Data Frames
```{r}
# Use the built-in data frame known as mtcars
mtcars

# Extract a subset of the frame: the first three rows, all columns
edge <- mtcars[1:3, ]
edge

# Retrieve columns from the table (column slices)
my_data1 <- mtcars[["mpg"]]                   # one column by name
my_data2 <- mtcars[, 1]                       # one column by index (indices start at 1, not 0)
my_data3 <- mtcars[, c("mpg", "cyl", "hp")]   # several columns by name
my_data1
my_data2
my_data3

# Create new data frames from ranges of columns
newdataMTcars <- mtcars[1:6]
nextdataMtcars <- mtcars[7:10]

# Statistics functions applied to a data frame column
mean(mtcars$mpg)

median(mtcars$mpg)

range(mtcars$mpg)

sd(mtcars$mpg)


```

# More Plots
```{r}
# Scatter plot of the cyl column against the mpg column
plot(x = mtcars$mpg, y = mtcars$cyl)
```
```{r}
# Histogram of the disp column
hist(x = mtcars$disp)
```
```{r}
# Dot chart of the mpg column, one labelled row per car; cex shrinks the text
dotchart(
  x = mtcars$mpg,
  labels = rownames(mtcars),
  cex = 0.7,
  xlab = "Miles Per Gallon"
)
```
```{r}
# Normal Q-Q plot of the mpg column, with a reference line added on top
qqnorm(y = mtcars$mpg)
qqline(y = mtcars$mpg)

# Q-Q plot comparing the mpg column with the hp column
qqplot(x = mtcars$mpg, y = mtcars$hp)
```
```{r}
# Bar plot with one bar per value of the hp column
barplot(height = mtcars$hp)
```


