fix: Standardized tavg availability filename and updated precipitation data filtering logic.
Browse files
global.R
CHANGED
|
@@ -15,7 +15,7 @@ source("utils/generateLabel.R", local = T)
|
|
| 15 |
|
| 16 |
# Read the metadata and availability data
|
| 17 |
tavg_meta <- read.csv("www/data/tabs/tavg_meta.csv")
|
| 18 |
-
tavg_avail <- read.csv("www/data/tabs/tavg_vaialability.csv")
|
| 19 |
|
| 20 |
# Merge the metadata and availability data on 'ID'
|
| 21 |
stations_data <- merge(tavg_meta, tavg_avail, by = "ID")
|
|
|
|
| 15 |
|
| 16 |
# Read the metadata and availability data
|
| 17 |
tavg_meta <- read.csv("www/data/tabs/tavg_meta.csv")
|
| 18 |
+
tavg_avail <- read.csv("www/data/tabs/tavg_availability.csv")
|
| 19 |
|
| 20 |
# Merge the metadata and availability data on 'ID'
|
| 21 |
stations_data <- merge(tavg_meta, tavg_avail, by = "ID")
|
misc/Python/ghcnm_read_prec.py
CHANGED
|
@@ -125,7 +125,8 @@ for i, file in enumerate(csv_files):
|
|
| 125 |
# 4. Skip this file if any 'precip_mm' value is greater than 2000
|
| 126 |
if (df['precip_mm'] > 2000).any():
|
| 127 |
#continue
|
| 128 |
-
|
|
|
|
| 129 |
|
| 130 |
# 5. Append cleaned and filtered dataframe
|
| 131 |
dataframes.append(df)
|
|
@@ -137,7 +138,7 @@ combined_df.to_parquet('www/data/tabs/prec_long.parquet', engine='pyarrow', inde
|
|
| 137 |
|
| 138 |
|
| 139 |
|
| 140 |
-
|
| 141 |
|
| 142 |
combined_df.describe()
|
| 143 |
|
|
|
|
| 125 |
# 4. Skip this file if any 'precip_mm' value is greater than 2000
|
| 126 |
if (df['precip_mm'] > 2000).any():
|
| 127 |
#continue
|
| 128 |
+
print(f"Skipping {file} due to extreme precipitation value (> 2000mm)")
|
| 129 |
+
continue
|
| 130 |
|
| 131 |
# 5. Append cleaned and filtered dataframe
|
| 132 |
dataframes.append(df)
|
|
|
|
| 138 |
|
| 139 |
|
| 140 |
|
| 141 |
+
|
| 142 |
|
| 143 |
combined_df.describe()
|
| 144 |
|
misc/Python/ghcnm_read_tavg.py
CHANGED
|
@@ -110,7 +110,7 @@ station_summary = long_format_data.groupby('ID')['YEAR'].agg(first_year='min', l
|
|
| 110 |
print(station_summary)
|
| 111 |
|
| 112 |
|
| 113 |
-
station_summary.to_csv("www/data/tabs/tavg_vaialability.csv", index=False)
|
| 114 |
|
| 115 |
|
| 116 |
### read text file
|
|
|
|
| 110 |
print(station_summary)
|
| 111 |
|
| 112 |
|
| 113 |
+
station_summary.to_csv("www/data/tabs/tavg_availability.csv", index=False)
|
| 114 |
|
| 115 |
|
| 116 |
### read text file
|
www/data/tabs/{tavg_vaialability.csv → tavg_availability.csv}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26e585ce08c48911e59b22f2ceec9eb6994a21b5a2d56eac3df275b9c879ac22
|
| 3 |
+
size 611360
|
www/data/tabs/tavg_long.parquet
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:899fd5826cdb0d597a405a0922011dac853f837f08776bc77fdf049ed1f05ede
|
| 3 |
+
size 29958269
|
www/data/tabs/tavg_meta.csv
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2726a073d64963e8e8410830ab59e5990554a3780183c3d5b41a1a1c93a62ad8
|
| 3 |
+
size 1296342
|