R Basics

relative

# Print a character string to the console
print("hello world!")
## [1] "hello world!"
# Generate the whole numbers from 1 through 10
seq(from = 1, to = 10)
##  [1]  1  2  3  4  5  6  7  8  9 10
# Draw 100 values from a normal distribution with mean 10 and standard
# deviation 2. No seed is set in this script, so the values shown below are
# one example run and will differ every time.
rnorm(n = 100, mean = 10, sd = 2)
##   [1]  9.515524 10.387648  9.330865  9.937639 15.173624  9.755387 10.053197
##   [8] 12.026068 10.254522 11.311913  9.212438 10.772671 12.025905 12.143794
##  [15] 11.129311 15.235886  9.052250  7.623404 10.437346 12.569324  5.318555
##  [22] 13.704500  8.809425 10.038005 10.555874  9.972604 11.215663  9.093054
##  [29]  9.469838 10.131670 12.015468 11.627364 11.008364 12.992889  4.894744
##  [36] 11.473410 16.818322 13.561521  9.161741  9.445026 13.082480  9.380048
##  [43] 11.676142  8.981869 10.982992 11.117855  9.003581  9.453374  8.700419
##  [50] 11.374864  8.917515  8.697298 12.523493 12.933565 12.372217 10.081599
##  [57] 10.172981  9.052852  7.493094 10.489881  9.280688  9.094326 11.058797
##  [64]  6.837192  9.315553  7.769018 11.293130  9.782203  7.578923 11.371979
##  [71] 12.676619 11.055435 10.793742 10.138712 13.778246  9.922188 10.504992
##  [78] 10.159337  9.267272  9.916807 13.051147  9.035931 10.598369  9.134227
##  [85] 10.450397 12.727803 11.383838 12.139811  8.123777 11.633742 11.888562
##  [92] 10.651049  7.738851  7.080023  9.144406 11.606789 10.741442 13.062311
##  [99]  8.111122  9.642038
# Average of 100 standard-normal draws (a function call nested in another)
mean(x = rnorm(n = 100))
## [1] 0.1414498
# Sum of 100 standard-normal draws
sum(rnorm(n = 100))
## [1] -8.166785
# Store the result in a named object, then type its name to display it
my_random_sum <- sum(rnorm(n = 100))
my_random_sum
## [1] 4.49654
# Install packages from CRAN ----
# Only packages that are not yet available are installed, so re-running the
# script does not download and reinstall everything each time.
required_pkgs <- c("tidyverse", "sf", "mapview")
is_installed <- vapply(
  required_pkgs, requireNamespace, logical(1), quietly = TRUE
)
if (!all(is_installed)) {
  install.packages(required_pkgs[!is_installed])
}

# Attach the packages so their functions can be called by name
library("tidyverse")
library("sf")
library("mapview")
# Using the help command/shortcut
# When you know the name of a function
help("print") # Help on the print command
?print # Help on the print command using the `?` shortcut

# When you know the name of the package
help(package = "sf") # Help on the package `sf`

# Don't know the exact name or just part of it
apropos("print") # Returns the names of all available objects with "print" in the name
??print # shortcut for help.search(); also searches demos and vignettes in a formatted page
# Atomic vectors: one example for each of four basic types
dbl_var <- c(1, 2.5, 4.5)     # double (reported as "numeric" by class())
int_var <- c(1L, 6L, 10L)     # integer; the L suffix marks integer literals
# Spell out TRUE/FALSE: T and F are ordinary variables that can be reassigned
log_var <- c(TRUE, FALSE, TRUE, FALSE)
chr_var <- c("a", "b", "c")
class(dbl_var)
## [1] "numeric"
length(log_var)
## [1] 4
# taking the mean of a character vector
# (intentional mistake: returns NA with a warning, because the argument is
# neither numeric nor logical)
mean(chr_var)

# adding two numeric vectors of different lengths
# (intentional mistake: the shorter vector is recycled and R warns because
# length 4 is not a multiple of length 3)
vec1 <- c(1, 2, 3, 4)
vec2 <- c(2, 3, 5)
vec1 + vec2
# Build a data frame from three equal-length vectors; each vector becomes a
# column named after the object it came from
ltrs <- c("a", "b", "c")
nums <- c(1, 2, 3)
# TRUE/FALSE instead of T/F, which are reassignable variables
logs <- c(TRUE, FALSE, TRUE)
mydf <- data.frame(ltrs, nums, logs)
mydf
##   ltrs nums  logs
## 1    a    1  TRUE
## 2    b    2 FALSE
## 3    c    3  TRUE
# Import the two CSV files; the paths are relative to the working directory
fishdat <- read_csv(file = "data/fishdat.csv")
statloc <- read_csv(file = "data/statloc.csv")
# Inspect the two imported tables. Lines starting with `##` are console
# output recorded from one run of each call.

# get the dimensions (number of rows, then number of columns)
dim(fishdat)
## [1] 2844   12
dim(statloc)
## [1] 2173    3
# get the column names
names(fishdat)
##  [1] "OBJECTID"      "Reference"     "Sampling_Date" "yr"           
##  [5] "Gear"          "ExDate"        "Bluefish"      "Common Snook" 
##  [9] "Mullets"       "Pinfish"       "Red Drum"      "Sand Seatrout"
names(statloc)
## [1] "Reference" "Latitude"  "Longitude"
# see the first six rows (six is the default for head())
head(fishdat)
## # A tibble: 6 x 12
##   OBJECTID Reference     Sampling_Date    yr  Gear ExDate              Bluefish
##      <dbl> <chr>         <date>        <dbl> <dbl> <dttm>                 <dbl>
## 1  1550020 TBM1996032006 1996-03-20     1996   300 2018-04-12 10:27:38        0
## 2  1550749 TBM1996032004 1996-03-20     1996    22 2018-04-12 10:25:23        0
## 3  1550750 TBM1996032004 1996-03-20     1996    22 2018-04-12 10:25:23        0
## 4  1550762 TBM1996032207 1996-03-22     1996    20 2018-04-12 10:25:23        0
## 5  1550828 TBM1996042601 1996-04-26     1996   160 2018-04-12 10:25:23        0
## 6  1550838 TBM1996051312 1996-05-13     1996   300 2018-04-12 10:25:23        0
## # ... with 5 more variables: Common Snook <dbl>, Mullets <dbl>, Pinfish <dbl>,
## #   Red Drum <dbl>, Sand Seatrout <dbl>
head(statloc)
## # A tibble: 6 x 3
##   Reference     Latitude Longitude
##   <chr>            <dbl>     <dbl>
## 1 TBM1996032006     27.9     -82.6
## 2 TBM1996032004     27.9     -82.6
## 3 TBM1996032207     27.9     -82.5
## 4 TBM1996042601     28.0     -82.7
## 5 TBM1996051312     27.9     -82.6
## 6 TBM1996051407     27.9     -82.6
# get the overall structure (each column's name, type and first few values)
str(fishdat)
## spec_tbl_df[,12] [2,844 x 12] (S3: spec_tbl_df/tbl_df/tbl/data.frame)
##  $ OBJECTID     : num [1:2844] 1550020 1550749 1550750 1550762 1550828 ...
##  $ Reference    : chr [1:2844] "TBM1996032006" "TBM1996032004" "TBM1996032004" "TBM1996032207" ...
##  $ Sampling_Date: Date[1:2844], format: "1996-03-20" "1996-03-20" ...
##  $ yr           : num [1:2844] 1996 1996 1996 1996 1996 ...
##  $ Gear         : num [1:2844] 300 22 22 20 160 300 300 300 300 22 ...
##  $ ExDate       : POSIXct[1:2844], format: "2018-04-12 10:27:38" "2018-04-12 10:25:23" ...
##  $ Bluefish     : num [1:2844] 0 0 0 0 0 0 0 0 0 0 ...
##  $ Common Snook : num [1:2844] 0 0 0 0 0 0 0 0 0 0 ...
##  $ Mullets      : num [1:2844] 0 0 0 0 0 0 0 0 0 0 ...
##  $ Pinfish      : num [1:2844] 0 54 0 80 0 0 0 0 1 1 ...
##  $ Red Drum     : num [1:2844] 0 0 1 0 4 0 0 0 0 0 ...
##  $ Sand Seatrout: num [1:2844] 1 0 0 0 0 1 5 66 0 0 ...
##  - attr(*, "spec")=
##   .. cols(
##   ..   OBJECTID = col_double(),
##   ..   Reference = col_character(),
##   ..   Sampling_Date = col_date(format = ""),
##   ..   yr = col_double(),
##   ..   Gear = col_double(),
##   ..   ExDate = col_datetime(format = ""),
##   ..   Bluefish = col_double(),
##   ..   `Common Snook` = col_double(),
##   ..   Mullets = col_double(),
##   ..   Pinfish = col_double(),
##   ..   `Red Drum` = col_double(),
##   ..   `Sand Seatrout` = col_double()
##   .. )
str(statloc)
## spec_tbl_df[,3] [2,173 x 3] (S3: spec_tbl_df/tbl_df/tbl/data.frame)
##  $ Reference: chr [1:2173] "TBM1996032006" "TBM1996032004" "TBM1996032207" "TBM1996042601" ...
##  $ Latitude : num [1:2173] 27.9 27.9 27.9 28 27.9 ...
##  $ Longitude: num [1:2173] -82.6 -82.6 -82.5 -82.7 -82.6 ...
##  - attr(*, "spec")=
##   .. cols(
##   ..   Reference = col_character(),
##   ..   Latitude = col_double(),
##   ..   Longitude = col_double()
##   .. )
# Open each data set in the spreadsheet-style viewer. View() needs an
# interactive session, so it is skipped when the script runs
# non-interactively (for example through Rscript).
if (interactive()) {
  View(fishdat)
  View(statloc)
}
# Excel workbooks are imported with the readxl package. The path below is a
# placeholder: replace it with the location of a real .xlsx file.
library("readxl")
dat <- read_excel(path = "location/of/excel/file.xlsx")

R Basics

Lesson Outline

Lesson Exercises

Goals and Motivation

Why should I invest time in R?

RStudio

Open R and RStudio

RStudio projects

Scripting

Executing code in RStudio

Exercise 1

R language fundamentals

What is the environment?

Packages

CRAN

Installing packages

Exercise 2

Getting Help

Help from the console

Official R Resources

Google and StackOverflow

Other Resources

Data structures in R

Vectors (one-dimensional data)

2-dimensional data

Getting your data into R

The working directory

Exercise 3

Other ways to import data

Summary