a <- c(1,0,2,1) # Input vector (1-dimensional array)
a <- sort(a) # Sort vector
a

[1] 0 1 1 2


n <- length(a) # Calculate length of vector 'a'
n

[1] 4


m <- (n + 1) %/% 2 # Calculate mid-point, %/% is operator for integer division 
m

[1] 2


n %% 2 == 1 # Check whether the number of elements is odd, %% (modulo) gives remainder of division

[1] FALSE


# Even-length case: the median is the mean of the two middle elements.
# Parentheses are required: `:` binds tighter than `+`,
# so m:m+1 would be evaluated as (m:m) + 1 and select only a[m + 1]
mean(a[m:(m + 1)])

[1] 1


# Median of an odd-length vector: after sorting it is the single middle element
a <- c(1, 0, 2, 1, 100)
a <- sort(a)
n <- length(a)
m <- (n + 1) %/% 2 # Index of the middle element (integer division)
if (n %% 2 == 1) { # Only the odd-length case is handled here
  a[m]
}

[1] 1


# Median of a vector, handling both odd and even lengths
a <- c(1, 0, 2, 1)
a <- sort(a)
n <- length(a)
m <- (n + 1) %/% 2 # Index of the (lower) middle element
if (n %% 2 == 1) {
  # Odd length: the median is the single middle element
  a[m]
} else {
  # Even length: the median is the mean of the two middle elements.
  # Parentheses matter: `:` has higher precedence than `+`,
  # so m:m+1 would be evaluated as (m:m) + 1 and select only a[m + 1]
  mean(a[m:(m + 1)])
}

[1] 1


x <- 42
if (x > 0) {
  print("Positive")
} else if (x < 0) {
  print("Negative")
} else {
  print("Zero")
}

[1] "Positive"


# Ask for user input and cast as double
# NOTE: input that cannot be parsed as a number becomes NA,
# and `if` raises an error when its condition is NA
num <- as.double(readline("Please, enter a number:"))
if (num %% 2 == 0) {
  print("Even")
} else if (num %% 2 == 1) {
  print("Odd")
} else {
  # Remainder is neither 0 nor 1, i.e. the number has a fractional part
  print("This is a real number")
}

Please, enter a number:43
[1] "Odd"


num <- as.integer(readline("Please, enter a number:")) # Ask for user input and cast as integer
if (num > 0) {
  if (num %% 2 == 0) {
    print("Positive even")
  } else {
    print("Positive odd")  
  }    
} else if (num < 0) {
  if (num %% 2 == 0) {
    print("Negative even") # Notice that odd/even check appears twice    
  } else {
    print("Negative odd") # Consider abstracting this as a function 
  }
} else {
  print("Zero")  
}

Please, enter a number:-43
[1] "Negative odd"


num <- 1:10
num

 [1]  1  2  3  4  5  6  7  8  9 10


ifelse(num %% 2 == 0, "even", "odd")

 [1] "odd"  "even" "odd"  "even" "odd"  "even" "odd"  "even" "odd"  "even"


# Calculate a factorial with a decrementing counter
# E.g. 5! = 1 * 2 * 3 * 4 * 5 = 120
x <- 5
factorial <- 1 # Running product, starts at the multiplicative identity
while (x > 0) {
  factorial <- factorial * x
  x <- x - 1 # Decrement, so that the loop condition eventually becomes FALSE
}
factorial

[1] 120


x <- seq(5)
factorial <- 1
for (i in x) {
  factorial <- factorial * i
}
factorial

[1] 120


# Find maximum value in a vector with exhaustive enumeration
v <- c(3, 27, 9, 42, 10, 2, 5)
max_val <- v[1] # Start with the first element as the best candidate so far
for (i in v) { # 'i' takes each value of 'v' in turn (it is not an index)
  if (i > max_val) {
    max_val <- i # Found a larger value, keep it
  }
}
max_val

[1] 42


# If by argument is omitted, it defaults to 1
s <- seq(25, 44)
s

 [1] 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44


# seq_len(length(<object>)) is equivalent to seq(1, length(<object>)) for non-empty objects
seq_len(length(s))

 [1]  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19 20


seq_along(s)

 [1]  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19 20


# The sequence that you are supplying to seq_along() doesn't have to be numeric
seq_along(letters[1:20])

 [1]  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19 20


# vector() function is useful for initializing empty vectors of known type and length
s2 <- vector(mode = "double", length = length(s)) # Preallocate the result
for (i in seq_len(length(s))) {
    s2[i] <- s[i] * 2
}

s2

 [1] 50 52 54 56 58 60 62 64 66 68 70 72 74 76 78 80 82 84 86 88


s3 <- vector(mode = "double", length = length(s))
for (i in seq_along(s)) {
    s3[i] <- s[i] * 3
}

s3

 [1]  75  78  81  84  87  90  93  96  99 102 105 108 111 114 117 120 123 126 129
[20] 132


# break terminates the whole loop at the first even number,
# so only the values before it are printed
for (i in seq(1,6)) {
  if (i %% 2 == 0) {
    break
  }
  print(i)
}

[1] 1


# next skips the rest of the current iteration for even numbers,
# so only the odd values are printed
for (i in seq(1,6)) {
  if (i %% 2 == 0) {
    next
  }
  print(i)
}

[1] 1
[1] 3
[1] 5


# The condition of while (TRUE) never becomes FALSE,
# so the explicit break is the only way out of the loop
i <- 1
while (TRUE) {
  i <- i + 1
  if (i > 10) { # Exit condition
    break
  }
}

i

[1] 11


# repeat has no condition at all: the body runs until break is reached
i <- 1
repeat {
  i <- i + 1
  if (i > 10) { # Exit condition
    break
  }
}

i

[1] 11


foo <- function(arg) {
  # <function_body>
}


# Check whether a number is positive
# num: a number (a single value, as it is used as an `if` condition)
# Returns TRUE if 'num' is greater than 0 and FALSE otherwise,
# using an explicit return() in each branch
is_positive <- function(num) {
  if (num > 0) {
    return(TRUE)
  } else {
    return(FALSE)
  }
}


body(is_positive)

{
    if (num > 0) {
        return(TRUE)
    }
    else {
        return(FALSE)
    }
}


formals(is_positive)

$num


environment(is_positive)

<environment: R_GlobalEnv>


# Check whether a number is positive
# The result is first stored in the local variable 'res'
# and then handed back with a single explicit return() at the end
is_positive <- function(num) {
  if (num > 0) {
    res <- TRUE
  } else {
    res <- FALSE
  }
  return(res)
}


res_1 <- is_positive(5)
res_2 <- is_positive(-7)


print(res_1)
print(res_2)

[1] TRUE
[1] FALSE


# Check whether a number is positive
# Implicit return: there is no return() call, the function returns
# the value of its last evaluated expression, here 'res'
is_positive <- function(num) {
  if (num > 0) {
    res <- TRUE
  } else {
    res <- FALSE
  }
  res
}


res_1 <- is_positive(5)
res_2 <- is_positive(-7)


print(res_1)
print(res_2)

[1] TRUE
[1] FALSE


# While this function provides the same functionality as the two versions above,
# it is an example of bad programming style: the return value is very unintuitive.
# Nothing is returned explicitly; the function hands back the value of its
# last evaluated expression, which here is the assignment inside if/else
is_positive <- function(num) {
  if (num > 0) {
    res <- TRUE
  } else {
    res <- FALSE
  }
}


res_1 <- is_positive(5)
res_2 <- is_positive(-7)


print(res_1)
print(res_2)

[1] TRUE
[1] FALSE


# Format a date as a dash-separated string
# day, month, year: components of the date
# reverse: if TRUE (default) the order is year-month-day,
#          any other value gives day-month-year
# Returns a character string, e.g. "2021-10-4"
format_date <- function(day, month, year, reverse = TRUE) {
  d <- as.character(day)
  m <- as.character(month)
  y <- as.character(year)
  if (isTRUE(reverse)) {
    paste(y, m, d, sep = "-")
  } else {
    paste(d, m, y, sep = "-")
  }
}


format_date(4, 10, 2021)

[1] "2021-10-4"


format_date(y = 2021, m = 10, d = 4) # Technically correct, but rather unintuitive

[1] "2021-10-4"


format_date(y = 2021, m = 10, d = 4, FALSE) # Technically correct, but rather unintuitive

[1] "4-10-2021"


format_date(day = 4, month = 10, year = 2021, FALSE)

[1] "4-10-2021"


# Describe the sign and parity of a number
# num: a number (a single value, as it is used in `if` conditions)
# Returns "zero", or "positive"/"negative" followed by "even"/"odd"
which_integer <- function(num) {
  # Helper defined inside the function body
  even_or_odd <- function(num) {
    if (num %% 2 == 0) "even" else "odd"
  }
  parity <- even_or_odd(num)
  if (num > 0) {
    return(paste0("positive ", parity))
  }
  if (num < 0) {
    return(paste0("negative ", parity))
  }
  "zero"
}


which_integer(-43)

[1] "negative odd"


even_or_odd(-43)

Error in even_or_odd(-43): could not find function "even_or_odd"
Traceback:


x <- 42
# is equivalent to:
# Binding R object '42', double vector of length 1, to name 'x' in the global environment
assign("x", 42, envir = .GlobalEnv)
x

[1] 42


x <- 5 # 'x' in the global environment
foo <- function() {
  x <- 12 # Creates a separate, local 'x' inside the function
  return(x)
}
y <- foo()
print(y)
print(x) # The global 'x' was not modified by the call

[1] 12
[1] 5


`+`(3, 2) # Equivalent to: 3 + 2

[1] 5


`<-`(x, c(10, 12, 14)) # x <- c(10, 12, 14)
x

[1] 10 12 14


`[`(x, 3) # x[3]

[1] 14


`>`(x, 10) # x > 10

[1] FALSE  TRUE  TRUE


# add_five() takes no arguments and returns an anonymous function,
# which in turn adds 5 to its argument
add_five <- function() {
  return(function(x) x + 5)
}
af <- add_five() # 'af' now holds the returned function


af # 'af' is just a function, which is yet to be invoked (called)

function(x) x + 5
<environment: 0x55baf8cccac0>


af(10) # Here we call a function and supply 10 as an argument

[1] 15


# Due to vectorized functions in R this example is obvious overkill (seq(10) ^ 2 would do just fine),
# but it shows a general approach for when we need to apply a non-vectorized function
sapply(seq(10), function(x) x ^ 2)

 [1]   1   4   9  16  25  36  49  64  81 100


# Applies a supplied function 'f' to 10 random draws
# from the normal distribution with mean 0 and sd 1
# f: a function that accepts a numeric vector
# Returns whatever 'f' returns for that vector
functional <- function(f) { f(rnorm(10)) }


functional(mean)

[1] 0.3186378


functional(median)

[1] -0.2481884


functional(sum)

[1] 1.492055


l <- list(a = 1:2, b = 3:4, c = 5:6, d = 7:8, e = 9:10)


# Apply sum() to each element of list 'l'
lapply(l, sum)

$a
[1] 3

$b
[1] 7

$c
[1] 11

$d
[1] 15

$e
[1] 19


# We can exploit the fact that basic operators are function calls
# Here, the subsetting operator `[` with argument 2 is applied to each element,
# which gives us the second element within each element of the list
lapply(l, `[`, 2)

$a
[1] 2

$b
[1] 4

$c
[1] 6

$d
[1] 8

$e
[1] 10


m <- matrix(1:12, nrow = 3, ncol = 4)
m

     [,1] [,2] [,3] [,4]
[1,] 1    4    7    10  
[2,] 2    5    8    11  
[3,] 3    6    9    12


# Sum up rows (can also be achieved with rowSums() function)
apply(m, 1, sum)

[1] 22 26 30


# Calculate averages across columns (also available in colMeans())
apply(m, 2, mean)

[1]  2  5  8 11


# Find maximum value in each column
apply(m, 2, max)

[1]  3  6  9 12


means <- -2:2
sds <- 1:5


# Generate one draw from a normal distribution where
# each mean is an element of vector 'means'
# and each standard deviation is an element of vector 'sds'
#
# rnorm(n, mean, sd) takes 3 arguments: n, mean, sd

mapply(rnorm, 1, means, sds)

[1] -0.7043966 -2.9181125  0.7705752  0.8115289  4.9755344


# Simplification of output
# (an attempt to collapse it into fewer dimensions)
# makes it hard to predict the object returned
# by apply() functions that simplify by default (e.g. SIMPLIFY = TRUE in mapply())

mapply(rnorm, 5, means, sds)

     [,1]      [,2]       [,3]        [,4]       [,5]      
[1,] -3.058834 -1.0853410 -0.08222913 -0.6397508  1.8098831
[2,] -2.759082 -3.6308276 -1.53727082  1.4870609 -0.4620664
[3,] -1.633935 -0.1775828 -3.99636499  2.7069711  4.1554896
[4,] -1.241012 -1.8139769 -0.35165313  5.2904383 11.1715264
[5,] -1.227846 -1.5496606  2.82421174  5.9838118  4.9411164


# Package 'Matrix' is part of the standard R library and doesn't have to be installed separately
library("Matrix")


# While it is possible to just use function sparseVector() after loading the library,
# it is good practice to state explicitly which package the object is coming from.
sv <- Matrix::sparseVector(x = c(1, 2, 3), i = c(3, 6, 9), length = 10)

sv

sparse vector (nnz/length = 3/10) of class "dsparseVector"
 [1] . . 1 . . 2 . . 3 .

Function	Description	Input Object	Output Object	Simplified
`apply()`	Apply a given function to margins (rows/columns) of input object	matrix/array/data.frame	vector/matrix/array/list	Yes
`lapply()`	Apply a given function to each element of input object	vector/list	list	No
`sapply()`	Same as `lapply()`, but output is simplified	vector/list	vector/matrix	Yes
`vapply()`	Same as `sapply()`, but data type of output is specified	vector/list	vector/matrix/array	Yes
`mapply()`	Multivariate version of `sapply()`, takes multiple objects as input	vectors/lists	vector/matrix	Yes

Week 3: Control Flow and Functions¶

Introduction to Computer Programming for Data Analysis I¶

Tom Paskhalis¶

11 May 2022¶

Overview¶

Algorithm flowchart¶

Algorithm flowchart (R)¶

Calculate median¶

Control flow in R¶

Branching programs¶

Conditional statements¶

Conditional statements: if¶

Conditional statements: if - else¶

Conditional statements: if - else if - else¶

Example of longer conditional statement¶

Optimising conditional statements¶

Nesting conditional statements¶

ifelse() function¶

Iteration (looping)¶

Iteration: while¶

Iteration: for¶

Iteration with conditional statements¶

Generating sequences for iteration¶

Generating sequences for iteration examples¶

Generating sequences for iteration examples continued¶

Iteration: break and next¶

Infinite loop¶

Infinite loops¶

Iteration: repeat¶

Decomposition and abstraction¶

Decomposition and abstraction¶

Functions¶

Functions in R¶

Function components¶

Function components example¶

Function call¶

Function call example¶

Implicit return example¶

Implicit return example continued¶

Function arguments¶

Function arguments example¶

Nested functions¶

R environment basics¶

R environment example¶

Every operation is a function call¶

Examples of operators as function calls¶

Anonymous functions¶

Functionals¶

Functional example¶

Summary of common apply() functions¶

lapply() function¶

lapply() examples¶

apply() function¶

apply() examples¶

mapply() function¶

mapply() examples¶

Packages¶

Package loading example¶

Next¶

Conditional statements: `if`¶

Conditional statements: `if - else`¶

Conditional statements: `if - else if - else`¶

`ifelse()` function¶

Iteration: `while`¶

Iteration: `for`¶

Iteration: `break` and `next`¶

Iteration: `repeat`¶

Summary of common `apply()` functions¶

`lapply()` function¶

`lapply()` examples¶

`apply()` function¶

`apply()` examples¶

`mapply()` function¶

`mapply()` examples¶