ResearchCodingClub · LiamPattinson · Feb 14, 2026 · Feb 14, 2026 · Feb 14, 2026
diff --git a/config.yaml b/config.yaml
@@ -65,7 +65,7 @@ episodes:
 - 03-interacting-with-tests.Rmd
 - 04-unit-tests-best-practices.Rmd
 - 05-testing-exceptions.Rmd
-- 06-testing-data-structures.Rmd
+- 06-floating-point-data.Rmd
 - 07-fixtures.Rmd
 - 08-parametrization.Rmd
 - 09-testing-output-files.Rmd

diff --git a/episodes/04-unit-tests-best-practices.Rmd b/episodes/04-unit-tests-best-practices.Rmd
@@ -4,7 +4,7 @@ teaching: 10
 exercises: 2
 ---
 
-:::::::::::::::::::::::::::::::::::::: questions 
+:::::::::::::::::::::::::::::::::::::: questions
 
 - What to do about complex functions & tests?
 - What are some testing best practices for testing?
@@ -40,7 +40,7 @@ def process_data(data: list, maximum_value: float):
     for i in range(len(data_negative_removed)):
         if data_negative_removed[i] <= maximum_value:
             data_maximum_removed.append(data_negative_removed[i])
-    
+
     # Calculate the mean
     mean = sum(data_maximum_removed) / len(data_maximum_removed)
 
@@ -63,9 +63,17 @@ def test_process_data():
 
 ```
 
-This test is very complex and hard to debug if it fails. Imagine if the calculation of the mean broke - the test would fail but it would not tell us what part of the function was broken, requiring us to 
+This test is hard to debug if it fails. Imagine if the calculation of the mean broke - the test would fail but it would not tell us what part of the function was broken, requiring us to
 check each function manually to find the bug. Not very efficient!
 
+:::::::::::::::::::::::::::: callout
+
+Asserting that the standard deviation is equal to 16 decimal
+places is also quite error prone. We'll see in a later lesson
+how to improve this test.
+
+::::::::::::::::::::::::::::::::::::
+
 ## Unit Testing
 
 The process of unit testing is a fundamental part of software development. It is where you test individual units or components of a software instead of multiple things at once.
@@ -156,10 +164,10 @@ This makes your tests easier to read and understand for both yourself and others
 def test_calculate_mean():
     # Arrange
     data = [1, 2, 3, 4, 5]
-    
+
     # Act
     mean = calculate_mean(data)
-    
+
     # Assert
     assert mean == 3
 ```
@@ -190,10 +198,10 @@ Here is an example of the TDD process:
 def test_calculate_mean():
     # Arrange
     data = [1, 2, 3, 4, 5]
-    
+
     # Act
     mean = calculate_mean(data)
-    
+
     # Assert
     assert mean == 3.5
 ```
@@ -244,7 +252,7 @@ Random seeds work by setting the initial state of the random number generator.
 This means that if you set the seed to the same value, you will get the same sequence of random numbers each time you run the function.
 
 
-::::::::::::::::::::::::::::::::::::: challenge 
+::::::::::::::::::::::::::::::::::::: challenge
 
 ## Challenge: Write your own unit tests
 
@@ -258,35 +266,35 @@ Take this complex function, break it down and write unit tests for it.
 import random
 
 def randomly_sample_and_filter_participants(
-    participants: list, 
-    sample_size: int, 
-    min_age: int, 
-    max_age: int, 
-    min_height: int, 
+    participants: list,
+    sample_size: int,
+    min_age: int,
+    max_age: int,
+    min_height: int,
     max_height: int
 ):
     """Participants is a list of tuples, containing the age and height of each participant
     participants = [
-                      {age: 25, height: 180}, 
-                      {age: 30, height: 170}, 
-                      {age: 35, height: 160}, 
+                      {age: 25, height: 180},
+                      {age: 30, height: 170},
+                      {age: 35, height: 160},
     ]
     """
-    
+
     # Get the indexes to sample
     indexes = random.sample(range(len(participants)), sample_size)
 
     # Get the sampled participants
     sampled_participants = []
     for i in indexes:
         sampled_participants.append(participants[i])
-    
+
     # Remove participants that are outside the age range
     sampled_participants_age_filtered = []
     for participant in sampled_participants:
         if participant['age'] >= min_age and participant['age'] <= max_age:
             sampled_participants_age_filtered.append(participant)
-    
+
     # Remove participants that are outside the height range
     sampled_participants_height_filtered = []
     for participant in sampled_participants_age_filtered:
@@ -299,15 +307,15 @@ def randomly_sample_and_filter_participants(
 - Create a new file called `test_stats.py` in the `statistics` directory
 - Write unit tests for the `randomly_sample_and_filter_participants` function in `test_stats.py`
 
-:::::::::::::::::::::::: solution 
+:::::::::::::::::::::::: solution
 
 The function can be broken down into smaller functions, each of which can be tested separately:
 
 ```python
 import random
 
 def sample_participants(
-    participants: list, 
+    participants: list,
     sample_size: int
 ):
     indexes = random.sample(range(len(participants)), sample_size)
@@ -317,8 +325,8 @@ def sample_participants(
     return sampled_participants
 
 def filter_participants_by_age(
-    participants: list, 
-    min_age: int, 
+    participants: list,
+    min_age: int,
     max_age: int
 ):
     filtered_participants = []
@@ -328,8 +336,8 @@ def filter_participants_by_age(
     return filtered_participants
 
 def filter_participants_by_height(
-    participants: list, 
-    min_height: int, 
+    participants: list,
+    min_height: int,
     max_height: int
 ):
     filtered_participants = []
@@ -339,11 +347,11 @@ def filter_participants_by_height(
     return filtered_participants
 
 def randomly_sample_and_filter_participants(
-    participants: list, 
-    sample_size: int, 
-    min_age: int, 
-    max_age: int, 
-    min_height: int, 
+    participants: list,
+    sample_size: int,
+    min_age: int,
+    max_age: int,
+    min_height: int,
     max_height: int
 ):
     sampled_participants = sample_participants(participants, sample_size)
@@ -447,7 +455,7 @@ When time is limited, it's often better to only write tests for the most critica
 
 You should discuss with your team how much of the code you think should be tested, and what the most critical parts of the code are in order to prioritize your time.
 
-::::::::::::::::::::::::::::::::::::: keypoints 
+::::::::::::::::::::::::::::::::::::: keypoints
 
 - Complex functions can be broken down into smaller, testable units.
 - Testing each unit separately is called unit testing.