Untitled

From Scanty Kangaroo, 2 Months ago, written in Plain Text, viewed 36 times.
URL http://codebin.org/view/6b1e04a3 Embed
Download Paste or View Raw
  # Columns pulled from df_train / df_test as model inputs.
features = [
    'lead_time',
    'arrival_date_month',
    'stays_in_weekend_nights',
    'adults',
    'has_children',
    'has_babies',
    'meal',
    'country',
    'distribution_channel',
    'is_repeated_guest',
    'previous_cancellations',
    'previous_bookings_not_canceled',
    'reserved_room_type',
    'booking_changes',
    'days_in_waiting_list',
    'customer_type',
    'need_car_parking_space',
    'total_of_special_requests',
    'total_nights',
]

# NOTE(review): this list is not read by the encoding steps below, which pick
# columns by dtype instead; presumably it is consumed elsewhere -- confirm.
cat_features = [
    'arrival_date_month',
    'stays_in_weekend_nights',
    'meal',
    'country',
    'distribution_channel',
    'is_repeated_guest',
    'previous_cancellations',
    'previous_bookings_not_canceled',
    'reserved_room_type',
    'booking_changes',
    'customer_type',
    'need_car_parking_space',
    'total_of_special_requests',
    'total_nights',
]

# Presumably the label column; it is not used in this section.
target = 'is_canceled'

# Only feature columns stored with dtype 'object' are one-hot encoded.
categorical_columns = (
    df_train[features]
    .select_dtypes(include='object')
    .columns
    .to_list()
)

# The encoder learns its categories from the training frame only.
# Per the scikit-learn docs, handle_unknown='ignore' encodes categories that
# were not seen during fit as all zeros instead of raising.
encoder = OneHotEncoder(handle_unknown='ignore')
encoder.fit(df_train[categorical_columns])


def _one_hot_frame(frame):
    """Return the dense one-hot encoding of ``frame``'s categorical columns.

    Uses the already-fitted module-level ``encoder``; the resulting columns
    are labelled with ``encoder.get_feature_names_out()``.
    """
    dense = encoder.transform(frame[categorical_columns]).toarray()
    return pd.DataFrame(dense, columns=encoder.get_feature_names_out())


def _join_numeric_and_encoded(frame, encoded):
    """Place ``frame``'s non-object feature columns next to ``encoded``.

    Both parts get a fresh 0..n-1 index first so that the column-wise concat
    pairs rows by position rather than by the original row labels.
    """
    numeric_part = (
        frame[features]
        .select_dtypes(exclude='object')
        .reset_index(drop=True)
    )
    return pd.concat([numeric_part, encoded.reset_index(drop=True)], axis=1)


df_train_categorical = _one_hot_frame(df_train)
df_test_categorical = _one_hot_frame(df_test)

# Final design matrices: numeric features followed by the one-hot columns.
df_for_learn = _join_numeric_and_encoded(df_train, df_train_categorical)
df_for_test = _join_numeric_and_encoded(df_test, df_test_categorical)

Reply to "Untitled"

Here you can reply to the paste above