From 209657c50bc18257429c00e4d5f69afbce609fe5 Mon Sep 17 00:00:00 2001
From: Pieter Van Trappen <vtpieter@gmail.com>
Date: Thu, 23 Apr 2020 23:09:01 +0200
Subject: [PATCH] first changes to make it work; now fails on missing
 logbook_test.csv

---
 README2020.md                  | 15 ++++++++++-----
 src/scripts/grid_search_gmm.py | 12 ++++++++----
 2 files changed, 18 insertions(+), 9 deletions(-)

diff --git a/README2020.md b/README2020.md
index 72d3ddc8..b4c46339 100644
--- a/README2020.md
+++ b/README2020.md
@@ -1,7 +1,12 @@
-- pull ML_step
+# Pipeline instructions 
 
-- grid_search_gmm.py en grid_search_iforest.py zouden beiden moeten werken en output produceren in de data-cern subfolder onder oftewel gmm_results of iforest_results
+* grid_search_gmm.py en grid_search_iforest.py zouden beide moeten werken en output produceren in de data-cern subfolder, onder ofwel gmm_results ofwel iforest_results
+* grid_search_gmm.py gebruikt parameters '-b 1' (zonder aanhalingstekens). grid_search_iforest.py gebruikt er geen.
+* voor de webapp run wsgi_lbds.py in de webapp folder
 
-- grid_search_gmm.py gerbuikt parameters '-b 1' (zonder string haakjes). grid_search_iforest.py gebruikt er geen.
-
-- voor de webapp run wsgi_lbds.py in de webapp folder
+run as follows:
+```
+pipenv shell
+cd src/scripts
+./grid_search_gmm.py
+```
diff --git a/src/scripts/grid_search_gmm.py b/src/scripts/grid_search_gmm.py
index c87ad9aa..56250e15 100755
--- a/src/scripts/grid_search_gmm.py
+++ b/src/scripts/grid_search_gmm.py
@@ -2,6 +2,7 @@
 
 import os
 import sys
+sys.path.append(os.path.join(os.path.dirname(__file__), '..'))
 
 from pipeline.grid_search import grid_search
 from preprocessing import builder
@@ -66,10 +67,13 @@ if __name__ == '__main__':
         fno = "res"
 
         df = pd.read_csv("../../data-cern/features.csv")
-        state_mode = pd.read_json("../../data-cern/seg.json",
-                                  lines=True)
-        state_mode = state_mode.set_index('acqStamp').sort_index()
-        state_mode.index = pd.to_datetime(state_mode.index).round('s')
+        try:
+            fn = "../../data-cern/seg.json"
+            state_mode = pd.read_json(fn, lines=True)
+            state_mode = state_mode.set_index('acqStamp').sort_index()
+            state_mode.index = pd.to_datetime(state_mode.index).round('s')
+        except:
+            print("ERROR - missing {}, continuing anyway".format(fn))
         df = df.set_index('acqStamp').sort_index()
         df.index = pd.to_datetime(df.index)
         labels = pd.DataFrame()
-- 
GitLab