We’ve already shown that in functional programming we prefer to use recursive functions over imperative loops with mutable state, and we’ve demonstrated the power of recursion in a few examples. However, as simple as the examples are, it would simply be too tedious to write a fully-blown recursive function every single time we want to have some repetition in our code.
A very common reason to repeatedly evaluate the same code against different values happens whenever we need to process sequential data such as collections, lists, arrays, lines of text. Imagine that we have an array of numbers, and we need to perform the same calculation, e.g. to double the value, on all elements and capture the results.
An iterative solution would look like this:
let double = function(x){
return x * 2;
}
let processAllIterative = function(fn, coll) {
let results = []
for (let i = 0; i < coll.length; i++) {
results[i] = fn(coll[i])
}
return results;
}
processAllIterative(double, [1, 0, 3, 5, 7])
//=> [2, 0, 6, 10, 14]
And a recursive solution:
let processAllRecursive = function(fn, coll) {
if(coll.length == 0){
return [];
}
if(coll.length == 1){
return [fn(coll[0])]
}
return [fn(coll[0]), ...processAllRecursive(fn, coll.slice(1))];
}
processAllRecursive(double, [1, 0, 3, 5, 7])
//=> [2, 0, 6, 10, 14]
Notice how, whether we used iteration or recursion, we were able to come up with a reusable higher order function that we can now use to apply any kind of function on any kind of array of data. Let’s say we want to capitalize all words in a word list:
let capitalize = function(word){
return word.toUpperCase()
}
let wordList = ["apple", "banana", "pear"]
processAllIterative(capitalize, wordList)
//=> ["APPLE", "BANANA", "PEAR"]
processAllRecursive(capitalize, wordList)
//=> ["APPLE", "BANANA", "PEAR"]
Or, that we wanted to count all the letters in each of these words:
let countLetters = function(word){
return word.length;
}
processAllIterative(countLetters, wordList)
//=> [5, 6, 4]
processAllRecursive(countLetters, wordList)
//=> [5, 6, 4]
The point we’re reaching to in this exercise is that in some cases we can transparently use a recursive (or even a plain old iterative) algorithm without having to explicitly write a recursive function ourselves.
Instead, we get to rely on a higher order function to do the boring generic things like recursing (or looping) through the collection and we supply the specific part like the transformation function as a function as object parameter.
In this example, we wrote the higher order recursive functions processAllIterative
and processAllRecursive
ourselves. We did that primarily for illustration purposes, however. The best thing about processing sequential
data is that it is such a common problem to solve. So much that every respectable programming language has troves of
off-the-shelf functions that cover most situations that we may encounter.
In fact, when we wrote processAllIterative
and processAllRecursive
we sort of reinvented the wheel, because
this function is commonly known as map
and it is already available in JavaScript and many other languages.
In this chapter, we’ll explore it along with the other most representative sequence transformation functions:
map
- takes a sequence and returns another sequence of the same lengthreduce
- takes a sequence and typically returns a scalar or an otherwise aggregated valuefilter
- takes a sequence and returns another sequence which is either shorter or of the same length- sequence generators like
range
,repeat
oriterate
And when we’re done with them, we’ll show how we can compose all these individually useful functions into very powerful pipelines using function composition and threading.
So, let’s get started!
Map
Map is a function that receives a transformation function and an input sequence and returns the output sequence with all the results of the transformation function applied to elements of the input sequence, in the same order. Map always returns an output sequence of the same length as the input sequence.
In JavaScript, map
is implemented as a method of array object. That is to say that we invoke it on the array
object and then pass the function as the parameter:
wordList.map(capitalize)
//=> ["APPLE", "BANANA", "PEAR"]
wordList.map(countLetters)
//=> [5, 6, 4]
The function being passed to map
is expected to have up to three parameters:
map(function(element, index, array){ /* ... */ })
- element - the current element
- index - index of the current element in the array
- array - reference to the whole array
Typically, we only need the element value, but sometimes having access to its position in the array can be useful, e.g. let’s say that we have a list of chapters in a book, much like the one you are reading right now, and let’s say we want to format their title names to start with their ordinal number:
let chapters = ["Intro", "Basic", "Advanced", "Summary"];
let formatTitle = function(chapterName, index){
return (index + 1) + ". " + chapterName; //don't forget - index is zero-based!
}
chapters.map(formatTitle)
//=> ["1. Intro", "2. Basic", "3. Advanced", "4. Summary"]
And why would we ever need the third parameter, the reference to the whole array? Let’s say we want to format the chapter numbers to include the total number of chapters:
let formatTitle = function(item, index, array){
return (index + 1) + "/" + array.length + " " + item;
}
chapters.map(formatTitle)
//=> ["1/4 Intro", "2/4 Basic", "3/4 Advanced", "4/4 Summary"]
Now that we’ve seen JavaScript support for map
, let’s see how the equivalent function looks like in Clojure:
(def word-list ["apple" "banana" "pear"])
(map #(.toUpperCase %) word-list)
;;=> ("APPLE" "BANANA" "PEAR")
(map count word-list)
;;=> (5 6 4)
Full function documentation string:
clojure.core/map
([f] [f coll] [f c1 c2] [f c1 c2 c3] [f c1 c2 c3 & colls])
Returns a lazy sequence consisting of the result of applying f to
the set of first items of each coll, followed by applying f to the
set of second items in each coll, until any one of the colls is
exhausted. Any remaining items in other colls are ignored. Function
f should accept number-of-colls arguments. Returns a transducer when
no collection is provided.
So far it looks similar. How about having access to element index? In Clojure we do that with a separate
function called map-indexed
:
(defn format-title [index item]
(str (inc index) ". " item))
(map-indexed format-title word-list)
;;=> ("1. Intro", "2. Basic", "3. Advanced", "4. Summary")
And the docstring:
([f] [f coll])
Returns a lazy sequence consisting of the result of applying f to 0
and the first item of coll, followed by applying f to 1 and the second
item in coll, etc, until coll is exhausted. Thus function f should
accept 2 arguments, index and item. Returns a stateful transducer when
no collection is provided.
Note that the expected order of index
and item
parameters is reverse between JavaScript and Clojure.
Another notable difference is that Clojure does not let you access the whole data structure in the item processing
function.
One thing Clojure map
can do that it JavaScript counterpart cannot is to process multiple sequences at once!
(map + [1 2 3] [10 20 30])
;;=> (11 22 33)
What happens in this case is that the passed function is expected to have as many parameters as we have sequences and it is being called for each pair of values one by one, constructing the output sequence from the results:
(+ 1 10)
(+ 2 20)
(+ 3 30)
The sequences don’t even have to match in length - as soon as the shortest sequence is fully consumed map
will
call it a day and the output will effectively have the length of the shortest input sequence:
(map + [1 2 3] [10])
;;=> (11)
Here the +
function evaluated just once, and then map
ran out of elements in the second sequence:
(+ 1 10)
Which means that we can even use infinite sequences. As long as at least one sequence in map is finite, we’ll get our result:
(map + [1 2 3] (repeat 10))
;;=> (11 12 13)
Function repeat
is returns an infinite lazy sequence that simply repeats the parameter it recieved,
so (repeat 10)
will just keep repeating 10
. Here map
will run out elements with the first sequence,
so it will only do the addition three times:
(+ 1 10)
(+ 2 10)
(+ 3 10)
Map is a very useful higher order function which we can use whenever we need to transform every element of a sequential data structure using the same function. But, what if we had to use a sequence to calculate a single piece of aggregated data? E.g. to calculate a sum of all the numbers in it? There’s a function for that as well - reduce.
Reduce
Let’s say we have this array of numbers:
let numbers = [1, 4, 3, 5, 6, 3];
How do we calculate its sum recursively?
- We start by saying that the initial sum is 0 - that’s the accumulator value in our recursion
- Then we calculate the sum of the accumulator and the first element of the collection: 0 + 1 = 3
- Now we recursively repeat the same thing with this result as our new accumulator and the rest of the numbers, until we run out of them.
Or in code:
let sum = function(numbers, acc = 0){
if(numbers.length == 0){
return 0;
}
if(numbers.length == 1){
return numbers[0]
}
return acc + sum(numbers.splice(1))
}
sum(numbers)
//=> 22
If we remember our example from the chapter on recursion, we can see that recursive function calculating the maximum value in an array is quite similar, especially if we refactor it a bit:
let maxOfTwo = function(a, b){
if(a > b){
return a;
}
return b;
}
let max = function (numbers, acc) {
if (numbers.length == 0) {
return null;
}
if (numbers.length == 1) {
return numbers[0];
}
if (acc === undefined) {
acc = numbers[0];
numbers = numbers.splice()
}
return maxOfTwo(acc, max(numbers.splice(1)))
}
In both cases we have:
- an accumulator parameter whose initial value we can either
- set explicitly like we set it to 0 in
sum
, or - default it to the first element of the array, like we did in
max
- set explicitly like we set it to 0 in
- an exit clause when the array is empty
- an exit clause when the array has exactly one element
- a call to the aggregation function passing two parameters: the accumulator and the recursive call on the rest of the array.
In JavaScript reduce
function is implemented as a method of Array
object:
reduce(function(previousValue, currentValue, currentIndex, array) { /* ... */ }, initialValue)
It expects two parameters:
- the aggregator function, which itself needs to expect some parameters:
previousValue
- the first value being aggregated, typically passed down as the accumulator or picked as the first element in the array.currentValue
- the second value being aggregated, typically the first element of the rest of the arraycurrentIndex
- just like withmap
, we can optionally use the element position in the arrayarray
- just like withmap
, we can optionally use the reference to the whole array
initialValue
- the initial value of the accumulator, if omitted the first element of the array will be used
To be able to use this with our example, we first need to write an aggregator function which satisfies these conditions:
let add = function(a, b){
return a + b;
}
numbers.reduce(add, 0)
//=> 22
//note that we could have omitted the initialValue - it would have worked just as well
numbers.reduce(add)
//however, it is a good practice to set it anyway, in case there's a chance that we might run reduce
//on an empty array:
[].reduce(add)
//=> Uncaught TypeError: Reduce of empty array with no initial value
[].reduce(add, 0)
//=> 0
Can we do the same thing for max
?
numbers.reduce(maxOfTwo)
//=> 6
And how does reduce
look like in Clojure?
(reduce + 0 [1 4 3 5 6 3])
;;=> 22
(reduce + [1 4 3 5 6 3])
;;=> 22
And the docstring:
clojure.core/reduce
([f coll] [f val coll])
f should be a function of 2 arguments. If val is not supplied,
returns the result of applying f to the first 2 items in coll, then
applying f to that result and the 3rd item, etc. If coll contains no
items, f must accept no arguments as well, and reduce returns the
result of calling f with no arguments. If coll has only 1 item, it
is returned and f is not called. If val is supplied, returns the
result of applying f to val and the first item in coll, then
applying f to that result and the 2nd item, etc. If coll contains no
items, returns val and f is not called.
So, we get to use another powerful recursive algorithm without having to write a recursive function! Sounds like a sure win - let’s see what other algorithms we can reuse.
Filter
Sometimes we have a sequence and want to filter out some elements based on some criteria.
In JavaScript, we can use array method filter
to do so.
filter(function(element, index, array){ /* ... */ })
E.g. let’s say that we have an array of numbers and we want to have an array containing only the even elements:
let numbers = [2, 11, 7, 3, 6, 7, 8]
let isEven = function(element){
return (element % 2) === 0;
}
numbers.filter(isEven)
//=> [2, 6, 8]
We call the criteria function a predicate, which is really just a fancy word for a function that returns a boolean value.
Consistently with map
and reduce
array methods, we optionally have access to each element’s index and even the
whole array in the predicate function. So, if we wanted to, we could also filter only the even-indexed elements:
let isEvenIndexed = function(element, index){
return (index % 2) === 0;
}
numbers.filter(isEvenIndexed)
//=> [2, 7, 6, 8]
In Clojure, we can use equivalent filter
function:
(filter even? [2 11 7 3 6 7 8])
;;=> [2 6 8]
The fact that there’s a built-in function even?
in Clojure makes this example even easier!
Notice how predicate even?
ends with question mark? Clojure code convention states that predicate function name
should end with a ?
which is a valid character to appear in a symbol name.
Sequence generators
Now we’ll explore several functions that generate sequential data structures from simple scalars. Since support for these is a bit better in Clojure, we’ll use that language first this time.
We already used one such function when we were playing with map
, actually. Remember repeat
?
clojure.core/repeat
([x] [n x])
Returns a lazy (infinite!, or length n if supplied) sequence of xs.
We can use repeat
to create an arbitrarily large or even infinite sequence that just keeps repeating the same value:
(repeat 5 "a")
;;=> ("a" "a" "a" "a" "a")
By supplying the first parameter, we ensured that we’d only get a five elements long sequence. If we omit it, we get an infinitely long one:
;;don't evaluate - it will kill your REPL
(repeat "a")
;;wrap infinite sequences with take when you evaluate them
;;you'll get a preview of what's in it and your REPL will live to tell the tale
(take 5 (repeat "a"))
;;=> ("a" "a" "a" "a" "a")
Now, JavaScript arrays are not lazy data structures, which, among other things, means that they cannot be infinite in size. As a consequence, the JavaScript equivalent only supports fixed length:
Array(5).fill("a")
//=> ["a", "a", "a", "a", "a"]
What actually happens here is that Array(5)
creates an empty five elements long array and then fill("a")
fills all the array elements with the same given value.
Another useful Clojure function is range
.
clojure.core/range
([] [end] [start end] [start end step])
Returns a lazy seq of nums from start (inclusive) to end
(exclusive), by step, where start defaults to 0, step to 1, and end to
infinity. When step is equal to 0, returns an infinite sequence of
start. When start is equal to end, returns empty list.
We can use it to quickly generate numerical sequences:
;;without any parameters, it returns an infinite sequence from 0 and on
(take 5 (range))
;;=> (0 1 2 3 4)
;;with one parameter, it returns a finite sequence from 0 to specified end, exclusive
(range 5)
;;=> (0 1 2 3 4)
;;with two parameters, it returns a finite sequence from start to end, exclusive
(range 3 5)
;;=> (3 4 5)
;;with three parameters, it returns a finite sequence from start to end, with a custom increment
(range 0 5 2)
;;=> (0 2 4)
;;increment may be a negative number, in which case start should be larger than end
(range 5 0 -1)
;;=> (5 4 3 2 1)
We don’t have a built-in range
function, but we can easily write one:
let range = function(start, end, step = 1){
if((step > 0 && start >= end) ||
(step < 0 && start <= end)){
return [];
}
return [start, ...range(start + step, end, step)]
}
range(3, 5)
//=> [3, 4, 5]
range(0, 5, 2)
//=> [0, 2, 4]
range(5, 0, -1)
//=> [5, 4, 3, 2, 1]
The third sequence generation function we’ll explore is iterate
. Contrary to its name, it is a recursive function
that starts with a single value, applies a function to it, then applies a function to the result, then applies it
to the new result and so on. The final result is a sequence that starts with the initial value and has all the
results in the order of their calculation.
clojure.core/iterate
([f x])
Returns a lazy sequence of x, (f x), (f (f x)) etc. f must be free of side-effects
Let’s try a few examples. Note that the result is an infinite lazy sequence, so we need to limit the number of items we want to evaluate
(defn square [x]
(* x x))
(take 5 (iterate square 2))
;;=> (2 4 16 256 65536)
Interestingly, range
can also be calculated with iterate
:
(take 5 (iterate inc 0))
;;=> (0 1 2 3 4)
Since JavaScript arrays cannot be lazy and infinite, we’ll need to constrain the size in the JavaScript implementation:
let iterate = function(fn, value, length, acc = [value]){
if(length === acc.length){
return acc;
}
let current = fn(value);
return iterate(fn, current, length, [...acc, current]);
}
let square = function(x){
return x * x;
}
iterate(square, 2, 5)
//=> [2, 4, 16, 256, 65536]
let inc = function(x){
return x + 1;
}
iterate(inc, 0, 5)
//=> [0, 1, 2, 3, 4]
Composite functions and pipelines
We explored a several important functions that work with sequential data structures:
map
reduce
filter
repeat
range
iterate
This is not by any means an exhaustive list of all such functions, even if it includes some of the more well known such functions.
Now, that we have a bunch of puzzle pieces, what do we do to assemble the big picture? Let’s say that we had a
slightly more complex problem to solve - write a function that calculates the sum of squares of all numbers
smaller than number
that have digit
as their penultimate digit. We express this problem in terms of operations we
just learned:
- We can start by getting all the numbers smaller than 100 - that’s
range
- Then we can
filter
the ones that have 7 as the penultimate digit, e.g. 71, 175, etc. - Finally, we can sum them all up with
reduce
In JavaScript, we would do something like this:
function partial(f, ...fixedParams){
return function(){
return f(...fixedParams, ...arguments)
}
}
let square = function(x){
return x * x;
}
let isPenultimateDigit = function(digit,number){
return Math.trunc(number / 10) % 10 === digit
}
let add = function(a, b){
return a + b;
}
let calculate = function(digit, number) {
let initial = range(0, number);
let squares = initial.map(square);
let eligible = squares.filter(partial(isPenultimateDigit, digit));
return eligible.reduce(add, 0)
}
calculate(2, 10)
//=> 25
And in Clojure:
(defn square [x]
(* x x))
(defn penultimate-digit? [digit number]
(= digit (mod (int (/ number 10)) 10)))
(defn calculate [digit number]
(reduce + (filter (partial penultimate-digit? digit) (map square (range number)))))
(calculate 2 10)
;;=> 25
It does the job, but looks a bit messy. Let us make it more readable by giving names to the intermediary results:
(defn calculate [digit number]
(let [initial (range number)
squares (map square initial)
eligible (filter (partial penultimate-digit? digit) squares)]
(reduce + eligible)))
(calculate 2 10)
;;=> 25
See how easily we combined all the operations into a whole. We even got to use partial
from the previous
chapters to reconcile the fact that penultimate-digit?
expects two parameters and filter
only passes one.
We can push things even further and use a higher order functions to compose the functions that perform all
the individual pieces of computation into one big function. In Clojure, we do that with comp
, which is short
for composition.
clojure.core/comp
([] [f] [f g] [f g & fs])
Takes a set of functions and returns a fn that is the composition
of those fns. The returned fn takes a variable number of args,
applies the rightmost of fns to the args, the next
fn (right-to-left) to the result, etc.
In our example, we’d get something like this:
(defn create-calculate [digit number]
(comp #(reduce + %)
#(filter (partial penultimate-digit? digit) %)
#(map square %)
#(range number)))
(def calculate
(create-calculate 2 10))
(calculate)
;;=> 25
It’s a step in the right direction, but we see some drawbacks as well:
- a bit counterintuitively, the functions listed in
comp
are evaluated in right-to-left order (or here, more specifically, upside-down) - we need every function to take exactly one argument and it needs to match the shape of the output argument of the function before it. This means that we have to capture any parameters which are used in arbitrary steps of the overall calculation in a closure and create a function with concrete parameter values.
In Clojure, we have another powerful built-in tool - threading macros:
->
- thread-first macro->>
- thread-last macro
Specifically for this example, we’ll use the thread-last macro:
(defn calculate [digit number]
(->> (range number)
(map square)
(filter (partial penultimate-digit? digit))
(reduce +)))
(calculate 2 10)
;;=> 25
Clojure macros aren’t regular functions. They are evaluated at compile time and they reshape the passed code into
something else. We can inspect what our expression gets reshaped into by using macroexpand
:
(macroexpand '(->> (range number)
(map square)
(filter (partial penultimate-digit? digit))
(reduce +))
;;=> (reduce + (filter (partial penultimate-digit? digit) (map square (range number))))
Which is… the very first thing we tried! So, threading macros are really just a fancy syntax to make deeply nested function calls readable.
We don’t have the equivalents of comp
or ->>
built-in with JavaScript, but that’s not a problem at all - we
can implement them ourselves:
let comp = function(current, ...rest){
if(rest.length === 0){
return current;
}
return function(x){
return current(comp(...rest)(x))
}
}
let threadFirst = function(initial, ...forms){
let [current, ...rest] = forms;
let [fn, ...params] = current;
return forms.reduce(function(acc, current){
if(Array.isArray(current)) {
let [fn, ...params] = current;
fn = fn.bind(acc);
return fn(acc, ...params);
}
current = current.bind(acc);
return current(acc);
}, initial);
}
let threadLast = function(initial, ...forms){
let [current, ...rest] = forms;
let [fn, ...params] = current;
return forms.reduce(function(acc, current){
if(Array.isArray(current)) {
let [fn, ...params] = current;
fn = fn.bind(acc);
return fn(...params, acc);
}
current = current.bind(acc);
return current(acc);
}, initial);
}
And our comp
example will look very much like its Clojure equivalent, with the same drawbacks:
let createCalculate = function(digit, number){
return comp((array) => array.reduce(add, 0),
(array) => array.filter(partial(isPenultimateDigit, digit)),
(array) => array.map(square),
() => range(0, number))
}
let calculate = createCalculate(2, 10);
calculate()
//=> 25
We also had to wrap our comp
call with a closure just to capture digit
and number
parameters and the order
of function evaluation is also right-to-left and upside-down.
Now let’s try our luck with threading:
//we need array methods as standalone functions
const map = Array.prototype.map;
const filter = Array.prototype.filter;
const reduce = Array.prototype.reduce;
//they will get invoked on the right array object, because threadLast binds its functions to treat the
//parameter passed down to them as `this`, thus making object methods also threadable
let calculate = function(digit, number) {
return threadLast(range(0, number),
[map, square],
[filter, partial(isPenultimateDigit, digit)],
[reduce, add, 0])
}
calculate(2, 10)
//=> 25
With this example we conclude the chapter on sequential data transformation. We’ve learned about a bunch of interesting and useful higher order functions that we can use to manipulate sequences and then we learned about a few useful ways to put them all together into composite functions and data processing pipeline of sorts.
It looks like we’ve got our stuff together when it comes to this thing called functional programming. What could possibly remain to keep making trouble? If it only weren’t for those pesky meddling side-effects!