Noticed anomalies in the data, so corrected them manually with an additional Python script.

2023-12-28 21:22:53 -05:00
parent b5421232ea
commit b7410c37fb
6 changed files with 64159 additions and 0 deletions
--- a/data_repair.py
+++ b/data_repair.py
@@ -0,0 +1,21 @@
+import pandas as pd
+
+# Source export and destination for the repaired entries of statistic id 30.
+file_path = './input/modified/statistics-export-id-30.csv'
+output_file_path = './output/repaired_id_30.txt'
+
+# Load the export and keep only the three columns that end up in the output.
+df = pd.read_csv(file_path)[['start_ts', 'sum', 'state']]
+
+# 'start_ts' is parsed as epoch seconds (unit='s').
+df['start_ts'] = pd.to_datetime(df['start_ts'], unit='s')
+
+# Emit one three-line "start / state / sum" entry per CSV row.
+with open(output_file_path, 'w') as out:
+    for _, rec in df.iterrows():
+        out.write(
+            f"    - start: \"{rec['start_ts']}+00:00\"\n"
+            f"      state: {rec['state']}\n"
+            f"      sum: {rec['sum']}\n"
+        )
+print(f"Data saved to: {output_file_path}")
--- a/input/modified/statistics-export-id-30.csv
+++ b/input/modified/statistics-export-id-30.csv
--- a/input/modified/statistics-export-id-31.csv
+++ b/input/modified/statistics-export-id-31.csv
--- a/input/modified/statistics-export.csv
+++ b/input/modified/statistics-export.csv
--- a/output/repaired_id_30.txt
+++ b/output/repaired_id_30.txt
--- a/output/repaired_id_31.txt
+++ b/output/repaired_id_31.txt