global:
  problem_type: regression

steps:
  data:
    extract:
      filepath: data/regression_train.csv
      features:
        - bedrooms
        - bathrooms
        - sqft_living
        - sqft_lot
        - floors
        - waterfront
        - view
        - condition
        - grade
        - sqft_above
        - sqft_basement
        - yr_built
        - yr_renovated
        - zipcode
        - lat
        - long
        - sqft_living15
        - sqft_lot15
      target: price

    transform:
      normalize:
        features:
          module: sklearn.preprocessing.StandardScaler
          params:
            with_std: True
          columns:
            - sqft_living
            - sqft_lot
            - sqft_above
            - sqft_basement
            - sqft_living15
            - sqft_lot15
        target:
          module: sklearn.preprocessing.StandardScaler
          params:
            with_std: True
          columns:
            - price

  model:
    transform:
      fit:
        estimator:
          module: sklearn.ensemble.RandomForestRegressor
          params:
            n_estimators: 100
            random_state: 4
        cross_validation:
          module: sklearn.model_selection.KFold
          params:
            n_splits: 3
            random_state: 4
            shuffle: True
        metrics: mean_absolute_percentage_error

    load:
      filepath: honcaml_models/sklearn_regression.sav
