Bläddra i källkod

调整数据处理底层

node04 3 veckor sedan
förälder
incheckning
dd13bf2b51
1 ändrad fil med 2 tillägg och 2 borttagningar
  1. +2 -2
      data_preprocess.py

+ 2 - 2
data_preprocess.py

@@ -855,7 +855,7 @@ def preprocess_data_simple(df_input, is_train=False):
         df_input = df_input[~((df_input['is_filled'] == 1) & (_tail_filled == 1))]
     
     # 价格变化最小量阈值
-    price_change_amount_threshold = 5
+    price_change_amount_threshold = 1
     df_input['_raw_price_diff'] = df_input.groupby(['gid', 'baggage'], group_keys=False)['adult_total_price'].diff()
 
     # 计算价格变化量
@@ -1457,7 +1457,7 @@ def predict_data_simple(df_input, group_route_str, output_dir, predict_dir=".",
     # 要展示在预测表里的字段
     order_cols = ['city_pair', 'flight_day', 'flight_number_1', 'flight_number_2', 'from_time', 
                   'baggage', 'seats_remaining', 'currency',
-                  'adult_total_price', 'days_to_departure', 'hours_until_departure', 'price_change_percent', 'price_duration_hours', 
+                  'adult_total_price', 'days_to_departure', 'hours_until_departure', 'price_change_percent', 'price_change_amount', 'price_duration_hours', 
                   'update_hour', 'crawl_date',
                   'valid_begin_hour', 'valid_end_hour',
                   'simple_will_price_drop', 'simple_drop_in_hours', 'simple_drop_in_hours_prob', 'simple_drop_in_hours_dist',