# Descriptor for the "news" tabular dataset: split locations, split sizes,
# column counts and missing-value summary.
name: "news"
# Relative paths to the train and test CSV splits.
train_path: "./dataset/tabsyn/news/train.csv"
test_path: "./dataset/tabsyn/news/test.csv"
# NOTE(review): this is the quoted string "None", not a YAML null. Presumably
# the loader compares against this string to mean "no holdout split" - confirm
# before replacing it with null or removing the key.
holdout_path: "None"
# Row counts per split. The holdout count is 0, in line with the "None"
# holdout path above.
n_rows_train: 35679
n_rows_test: 3965
n_rows_holdout: 0
# Column counts. n_cols equals n_categorical_cols + n_numerical_cols
# (2 + 46 = 48), which also matches the lengths of the categorical_columns
# and numerical_columns lists in this file.
n_cols: 48
n_categorical_cols: 2
n_numerical_cols: 46
# Missing-value summary: no missing values are recorded for any split.
has_missing_values: False
missing_element_ratio: 0.0
n_rows_missing_train: 0
n_rows_missing_test: 0
n_rows_missing_holdout: 0
# Single entry: the empty string.
# NOTE(review): presumably the list of cell values the loader treats as
# missing - confirm against the consumer.
missing_values:
  - ''
# Names of the two categorical columns. Unlike the numerical_columns entries,
# these are bare names: no leading space and no "!!<type>" suffix.
categorical_columns:
  - "data_channel"
  - "weekday"
# The 46 numerical columns. Each entry has the form "<name>!!<type>", where
# <type> is either int or float in this list.
# NOTE(review): presumably the loader splits each entry on "!!" to recover the
# column name and its dtype - confirm against the consumer.
# Every name starts with a leading space that is part of the quoted string.
# NOTE(review): presumably this mirrors the CSV header exactly; do not trim
# the whitespace without checking the data files.
numerical_columns:
  - " timedelta!!int"
  - " n_tokens_title!!int"
  - " n_tokens_content!!int"
  - " n_unique_tokens!!float"
  - " n_non_stop_words!!int"
  - " n_non_stop_unique_tokens!!float"
  - " num_hrefs!!int"
  - " num_self_hrefs!!int"
  - " num_imgs!!int"
  - " num_videos!!int"
  - " average_token_length!!float"
  - " num_keywords!!int"
  - " kw_min_min!!int"
  - " kw_max_min!!int"
  - " kw_avg_min!!float"
  - " kw_min_max!!int"
  - " kw_max_max!!int"
  - " kw_avg_max!!float"
  - " kw_min_avg!!float"
  - " kw_max_avg!!float"
  - " kw_avg_avg!!float"
  - " self_reference_min_shares!!int"
  - " self_reference_max_shares!!int"
  # NOTE(review): spelled with a double "s" ("sharess"), unlike the two
  # entries above. Presumably this matches the CSV header - verify before
  # "correcting" it.
  - " self_reference_avg_sharess!!float"
  - " LDA_00!!float"
  - " LDA_01!!float"
  - " LDA_02!!float"
  - " LDA_03!!float"
  - " LDA_04!!float"
  - " global_subjectivity!!float"
  - " global_sentiment_polarity!!float"
  - " global_rate_positive_words!!float"
  - " global_rate_negative_words!!float"
  - " rate_positive_words!!float"
  - " rate_negative_words!!float"
  - " avg_positive_polarity!!float"
  - " min_positive_polarity!!float"
  - " max_positive_polarity!!float"
  - " avg_negative_polarity!!float"
  - " min_negative_polarity!!float"
  - " max_negative_polarity!!float"
  - " title_subjectivity!!float"
  - " title_sentiment_polarity!!float"
  - " abs_title_subjectivity!!float"
  - " abs_title_sentiment_polarity!!float"
  - " shares!!int"
# Name of the target column. The value keeps the leading space and omits the
# "!!<type>" suffix; it corresponds to the numerical_columns entry
# " shares!!int".
target_column: " shares"