Noticed anomalies in the data, so manually corrected them with an additional Python script.

2023-12-28 21:22:53 -05:00
parent b5421232ea
commit b7410c37fb
6 changed files with 64159 additions and 0 deletions
--- a/data_repair.py
+++ b/data_repair.py
@@ -0,0 +1,21 @@
 # Convert a manually corrected statistics CSV export into a text file of
 # indented "start / state / sum" entries, one entry per CSV row.
 import os
 import pandas as pd
 file_path = './input/modified/statistics-export-id-30.csv'
 output_file_path = './output/repaired_id_30.txt'
 df = pd.read_csv(file_path)
 # Keep only the columns that are written out; the order here is the order
 # the row tuples are unpacked in below.
 df = df[['start_ts', 'sum', 'state']]
 # 'start_ts' is parsed as seconds since the Unix epoch (unit='s').
 df['start_ts'] = pd.to_datetime(df['start_ts'], unit='s')
 # Make sure the target directory exists so a fresh checkout does not fail
 # with FileNotFoundError when opening the output file.
 os.makedirs(os.path.dirname(output_file_path) or '.', exist_ok=True)
 # Explicit encoding keeps the output identical regardless of platform locale.
 with open(output_file_path, 'w', encoding='utf-8') as f:
     # itertuples avoids building a Series per row (as iterrows does) and a
     # single writelines call batches the writes.
     # The parsed timestamps are timezone-naive; the "+00:00" suffix labels
     # them as UTC in the output text.
     f.writelines(
         f"    - start: \"{start}+00:00\"\n"
         f"      state: {state}\n"
         f"      sum: {total}\n"
         for start, total, state in df.itertuples(index=False, name=None)
     )
 print(f"Data saved to: {output_file_path}")
--- a/input/modified/statistics-export-id-30.csv
+++ b/input/modified/statistics-export-id-30.csv
--- a/input/modified/statistics-export-id-31.csv
+++ b/input/modified/statistics-export-id-31.csv
--- a/input/modified/statistics-export.csv
+++ b/input/modified/statistics-export.csv
--- a/output/repaired_id_30.txt
+++ b/output/repaired_id_30.txt
--- a/output/repaired_id_31.txt
+++ b/output/repaired_id_31.txt