File size: 556 Bytes
b72652e
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
import os
import sys

# Fix for age slider showing extreme values from bad Transfermarkt DB records.
# The players.csv uses `height_in_cm` instead of a true `Age` column.
# The run_pipeline.py was randomly assigning age from `height_in_cm`.
# This fix ensures Age comes from `date_of_birth` if available.

print("This is a notes file about the age bug found through QA testing.")
print("The `Age` column in the merged df was populated from `height_in_cm` as a fallback.")
print("Fix: derive Age from `date_of_birth` column in players.csv during merging.")