|
|
@@ -281,6 +281,11 @@ def follow_up_handle():
|
|
|
if idx_to_rm_2:
|
|
|
df_keep_info.loc[idx_to_rm_2, "keep_flag"] = -1
|
|
|
|
|
|
+ # 将 df_to_add 添加到 df_keep_info 之后
|
|
|
+ add_rows = len(df_to_add) if "df_to_add" in locals() else 0
|
|
|
+ if add_rows:
|
|
|
+ df_keep_info = pd.concat([df_keep_info, df_to_add], ignore_index=True)
|
|
|
+
|
|
|
# 将长时间没更新的航班标记为-1
|
|
|
dt_update_hour = pd.to_datetime(df_keep_info["update_hour"], errors="coerce")
|
|
|
dt_crawl_date = pd.to_datetime(df_keep_info["crawl_date"], errors="coerce")
|
|
|
@@ -288,11 +293,6 @@ def follow_up_handle():
|
|
|
if mask_abnormal_time.any():
|
|
|
df_keep_info.loc[mask_abnormal_time.fillna(False), "keep_flag"] = -1
|
|
|
|
|
|
- # 将 df_to_add 添加到 df_keep_info 之后
|
|
|
- add_rows = len(df_to_add) if "df_to_add" in locals() else 0
|
|
|
- if add_rows:
|
|
|
- df_keep_info = pd.concat([df_keep_info, df_to_add], ignore_index=True)
|
|
|
-
|
|
|
df_keep_info_snapshot = df_keep_info.copy()
|
|
|
df_keep_info_snapshot.to_csv(keep_info_snapshot_path, index=False, encoding="utf-8-sig")
|
|
|
print(
|