From 71ee535e60e005270fd66cc594ea0290c3157faf Mon Sep 17 00:00:00 2001
From: Pieter Van Trappen <vtpieter@gmail.com>
Date: Wed, 6 May 2020 15:40:10 +0200
Subject: [PATCH] changed fillna for first lines from zeroes to backfill, as
 done last year; probably best for the model not to have large unrealistic
 jumps in data values

---
 src/preprocessing/preprocess_features.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/preprocessing/preprocess_features.py b/src/preprocessing/preprocess_features.py
index cba33a33..ff1d01c1 100755
--- a/src/preprocessing/preprocess_features.py
+++ b/src/preprocessing/preprocess_features.py
@@ -46,8 +46,8 @@ if __name__ == "__main__":
             missing_values.append(col)
     print('Forward-filling columns {}'.format(missing_values))
     features = features.fillna(method='ffill')
-    # additional fill with zeros as a dirty fix for first rows missing values
-    features.fillna(value=0, inplace=True)
+    # additional backfill as a dirty fix for remaining first rows missing values
+    features = features.fillna(method='bfill')
     print('Forward-filled {} columns'.format(len(missing_values)))
     print('\nNot filled columns are {}'.format(
         [c for c in features.columns.values.tolist() if not c in missing_values]))
-- 
GitLab