mirror of
https://github.com/PlaneQuery/OpenAirframes.git
synced 2026-06-08 06:03:55 +02:00
fix date parsing
This commit is contained in:
@@ -104,18 +104,16 @@ def download_and_merge_base_release(compressed_df: pl.DataFrame) -> tuple[pl.Dat
|
|||||||
base_df = pl.read_csv(base_path)
|
base_df = pl.read_csv(base_path)
|
||||||
print(f"Base release has {len(base_df)} records")
|
print(f"Base release has {len(base_df)} records")
|
||||||
|
|
||||||
|
# Parse time column as datetime
|
||||||
|
base_df = base_df.with_columns(
|
||||||
|
pl.col('time').str.to_datetime(time_unit='ms', time_zone='UTC')
|
||||||
|
)
|
||||||
|
|
||||||
# Extract earliest date from base release
|
# Extract earliest date from base release
|
||||||
earliest_date = None
|
earliest_timestamp = base_df['time'].min()
|
||||||
if 'time' in base_df.columns and len(base_df) > 0:
|
earliest_dt = datetime.fromisoformat(str(earliest_timestamp).replace('Z', '+00:00'))
|
||||||
try:
|
earliest_date = earliest_dt.strftime('%Y-%m-%d')
|
||||||
earliest_timestamp = base_df['time'].min()
|
print(f"Earliest date in base release: {earliest_date}")
|
||||||
if earliest_timestamp:
|
|
||||||
# Parse timestamp and extract date
|
|
||||||
earliest_dt = datetime.fromisoformat(str(earliest_timestamp).replace('Z', '+00:00'))
|
|
||||||
earliest_date = earliest_dt.strftime('%Y-%m-%d')
|
|
||||||
print(f"Earliest date in base release: {earliest_date}")
|
|
||||||
except Exception as e:
|
|
||||||
print(f"Could not extract earliest date from base release: {e}")
|
|
||||||
|
|
||||||
# Ensure columns match
|
# Ensure columns match
|
||||||
base_cols = set(base_df.columns)
|
base_cols = set(base_df.columns)
|
||||||
|
|||||||
Reference in New Issue
Block a user