{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "b0fdabf1",
   "metadata": {},
   "outputs": [],
   "source": [
    "evaulate.sirus <- function(dataset_name, file_name, attributes, target, feature_map=list, cr=\"r\"){\n",
    "  train_data <- read.csv(file = file_name)\n",
    "  set.seed(seed=0)\n",
    "  for (k in names(feature_map)){\n",
    "      train_data[train_data==k]<-feature_map[k]\n",
    "  }\n",
    "  \n",
    "  train_data <- type.convert(train_data, as.is=TRUE)\n",
    "  train_data <- na.omit(train_data)\n",
    "  # print(str(train_data))\n",
    "  y<-train_data[, target]\n",
    "  \n",
    "  for (col in colnames(train_data)){\n",
    "    if (!is.element(col, attributes)){\n",
    "      train_data[col]<-NULL\n",
    "    }\n",
    "  }\n",
    "  require(sirus)\n",
    "  for (i in 1:11){\n",
    "    sirus.m <- sirus.fit(train_data, y, num.rule = i, discrete.limit = 10,\n",
    "                         num.trees = 10000)\n",
    "    \n",
    "    predictions <- sirus.predict(sirus.m, train_data)\n",
    "    print(sirus.print(sirus.m))\n",
    "    if (cr==\"c\"){\n",
    "      risk<-(sum(log2(1+exp(-y*predictions)))/nrow(train_data))\n",
    "    }else if (cr==\"r\"){\n",
    "      risk<-(sum((y-predictions)**2)/nrow(train_data))\n",
    "    }\n",
    "    print(risk)\n",
    "  }\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "5b3e33f6",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Loading required package: sirus\n",
      "\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "     Weights         Rules                                             \n",
      "[1,] \"Intercept = 0\" \"Mean of output y = 6.59 - Sample size n = 35\"    \n",
      "[2,] \"1\"             \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"\n",
      "[1] 0.1960121\n",
      "     Weights            Rules                                             \n",
      "[1,] \"Intercept = 0.79\" \"Mean of output y = 6.59 - Sample size n = 35\"    \n",
      "[2,] \"0.88\"             \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"\n",
      "[1] 0.2009454\n",
      "     Weights             Rules                                             \n",
      "[1,] \"Intercept = 0.461\" \"Mean of output y = 6.59 - Sample size n = 35\"    \n",
      "[2,] \"0.532\"             \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"\n",
      "[3,] \"0.398\"             \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"\n",
      "[1] 0.1916693\n",
      "     Weights             \n",
      "[1,] \"Intercept = -0.278\"\n",
      "[2,] \"0.556\"             \n",
      "[3,] \"0.407\"             \n",
      "[4,] \"0.0797\"            \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP >= 12800 & GDP < 37000 then 6.03 (n=13) else 6.92 (n=22)\"\n",
      "[1] 0.1870657\n",
      "     Weights            \n",
      "[1,] \"Intercept = -1.55\"\n",
      "[2,] \"0.442\"            \n",
      "[3,] \"0.391\"            \n",
      "[4,] \"0.242\"            \n",
      "[5,] \"0.161\"            \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP >= 17000 & GDP < 37000 then 5.97 (n=10) else 6.84 (n=25)\"\n",
      "[5,] \"if GDP < 12800 then 5.85 (n=4) else 6.69 (n=31)\"                \n",
      "[1] 0.1806127\n",
      "     Weights             \n",
      "[1,] \"Intercept = -0.961\"\n",
      "[2,] \"0.494\"             \n",
      "[3,] \"0.433\"             \n",
      "[4,] \"0.218\"             \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP >= 17000 & GDP < 37000 then 5.97 (n=10) else 6.84 (n=25)\"\n",
      "[1] 0.1812207\n",
      "     Weights             \n",
      "[1,] \"Intercept = -0.961\"\n",
      "[2,] \"0.494\"             \n",
      "[3,] \"0.433\"             \n",
      "[4,] \"0.218\"             \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP >= 17000 & GDP < 37000 then 5.97 (n=10) else 6.84 (n=25)\"\n",
      "[1] 0.1812207\n",
      "     Weights            \n",
      "[1,] \"Intercept = -1.14\"\n",
      "[2,] \"0.463\"            \n",
      "[3,] \"0.423\"            \n",
      "[4,] \"0.211\"            \n",
      "[5,] \"0.0748\"           \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP >= 17000 & GDP < 37000 then 5.97 (n=10) else 6.84 (n=25)\"\n",
      "[5,] \"if GDP >= 37000 & GDP < 54300 then 7.15 (n=14) else 6.22 (n=21)\"\n",
      "[1] 0.182141\n",
      "     Weights             \n",
      "[1,] \"Intercept = -0.489\"\n",
      "[2,] \"0.52\"              \n",
      "[3,] \"0.396\"             \n",
      "[4,] \"0.0698\"            \n",
      "[5,] \"0.0883\"            \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP >= 12800 & GDP < 37000 then 6.03 (n=13) else 6.92 (n=22)\"\n",
      "[5,] \"if GDP >= 37000 & GDP < 54300 then 7.15 (n=14) else 6.22 (n=21)\"\n",
      "[1] 0.1879205\n",
      "     Weights             \n",
      "[1,] \"Intercept = -0.489\"\n",
      "[2,] \"0.52\"              \n",
      "[3,] \"0.396\"             \n",
      "[4,] \"0.0698\"            \n",
      "[5,] \"0.0883\"            \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP >= 12800 & GDP < 37000 then 6.03 (n=13) else 6.92 (n=22)\"\n",
      "[5,] \"if GDP >= 37000 & GDP < 54300 then 7.15 (n=14) else 6.22 (n=21)\"\n",
      "[1] 0.1879205\n",
      "     Weights            \n",
      "[1,] \"Intercept = -1.79\"\n",
      "[2,] \"0.405\"            \n",
      "[3,] \"0.374\"            \n",
      "[4,] \"0.155\"            \n",
      "[5,] \"0.229\"            \n",
      "[6,] \"0.11\"             \n",
      "     Rules                                                            \n",
      "[1,] \"Mean of output y = 6.59 - Sample size n = 35\"                   \n",
      "[2,] \"if GDP < 37000 then 5.99 (n=17) else 7.16 (n=18)\"               \n",
      "[3,] \"if GDP < 28800 then 5.91 (n=14) else 7.04 (n=21)\"               \n",
      "[4,] \"if GDP < 12800 then 5.85 (n=4) else 6.69 (n=31)\"                \n",
      "[5,] \"if GDP >= 17000 & GDP < 37000 then 5.97 (n=10) else 6.84 (n=25)\"\n",
      "[6,] \"if GDP >= 37000 & GDP < 54300 then 7.15 (n=14) else 6.22 (n=21)\"\n",
      "[1] 0.1820535\n"
     ]
    }
   ],
   "source": [
    "evaulate.sirus(\"gdp\", \"./datasets/gdp_vs_satisfaction/GDP_vs_Satisfaction.csv\",list(\"GDP\"),\n",
    "               \"Satisfaction\", list())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "76440604",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"\n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"   \n",
      "[1] 0.8602651\n",
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"\n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"   \n",
      "[3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"\n",
      "[1] 0.8687004\n",
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"           \n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"              \n",
      "[3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"           \n",
      "[4] \"if Pclass >= 3 & Sex < 1 then 0.461 (n=102) else 0.395 (n=610)\"\n",
      "[1] 0.8763768\n",
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"          \n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"             \n",
      "[3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"          \n",
      "[4] \"if Pclass < 3 & Sex < 1 then 0.943 (n=157) else 0.252 (n=555)\"\n",
      "[5] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"           \n",
      "[1] 0.8698572\n",
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"          \n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"             \n",
      "[3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"          \n",
      "[4] \"if Pclass < 3 & Sex < 1 then 0.943 (n=157) else 0.252 (n=555)\"\n",
      "[5] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"           \n",
      "[6] \"if Fare < 15.6 then 0.258 (n=356) else 0.551 (n=356)\"         \n",
      "[1] 0.8721196\n",
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"          \n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"             \n",
      "[3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"          \n",
      "[4] \"if Pclass < 3 & Sex < 1 then 0.943 (n=157) else 0.252 (n=555)\"\n",
      "[5] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"           \n",
      "[6] \"if Fare < 15.6 then 0.258 (n=356) else 0.551 (n=356)\"         \n",
      "[7] \"if Embarked < 2 then 0.363 (n=554) else 0.551 (n=158)\"        \n",
      "[1] 0.8749142\n",
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"           \n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"              \n",
      "[3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"           \n",
      "[4] \"if Pclass >= 3 & Sex < 1 then 0.461 (n=102) else 0.395 (n=610)\"\n",
      "[5] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"            \n",
      "[6] \"if Fare < 15.6 then 0.258 (n=356) else 0.551 (n=356)\"          \n",
      "[7] \"if Embarked < 2 then 0.363 (n=554) else 0.551 (n=158)\"         \n",
      "[8] \"if Sex >= 1 & Age >= 14 then 0.173 (n=416) else 0.73 (n=296)\"  \n",
      "[1] 0.8776973\n",
      "[1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"           \n",
      "[2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"              \n",
      "[3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"           \n",
      "[4] \"if Pclass >= 3 & Sex < 1 then 0.461 (n=102) else 0.395 (n=610)\"\n",
      "[5] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"            \n",
      "[6] \"if Fare < 15.6 then 0.258 (n=356) else 0.551 (n=356)\"          \n",
      "[7] \"if Embarked < 2 then 0.363 (n=554) else 0.551 (n=158)\"         \n",
      "[8] \"if Sex >= 1 & Age >= 14 then 0.173 (n=416) else 0.73 (n=296)\"  \n",
      "[9] \"if Pclass < 2 & Sex >= 1 then 0.396 (n=101) else 0.406 (n=611)\"\n",
      "[1] 0.8796178\n",
      " [1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"           \n",
      " [2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"              \n",
      " [3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"           \n",
      " [4] \"if Pclass >= 3 & Sex < 1 then 0.461 (n=102) else 0.395 (n=610)\"\n",
      " [5] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"            \n",
      " [6] \"if Fare < 15.6 then 0.258 (n=356) else 0.551 (n=356)\"          \n",
      " [7] \"if Embarked < 2 then 0.363 (n=554) else 0.551 (n=158)\"         \n",
      " [8] \"if Sex >= 1 & Age >= 14 then 0.173 (n=416) else 0.73 (n=296)\"  \n",
      " [9] \"if Pclass < 2 & Sex >= 1 then 0.396 (n=101) else 0.406 (n=611)\"\n",
      "[10] \"if Sex < 1 & Fare < 46.9 then 0.67 (n=182) else 0.313 (n=530)\" \n",
      "[1] 0.8797198\n",
      " [1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"            \n",
      " [2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"               \n",
      " [3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"            \n",
      " [4] \"if Pclass < 3 & Sex < 1 then 0.943 (n=157) else 0.252 (n=555)\"  \n",
      " [5] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"             \n",
      " [6] \"if Fare < 15.6 then 0.258 (n=356) else 0.551 (n=356)\"           \n",
      " [7] \"if Embarked < 2 then 0.363 (n=554) else 0.551 (n=158)\"          \n",
      " [8] \"if Sex >= 1 & Age >= 14 then 0.173 (n=416) else 0.73 (n=296)\"   \n",
      " [9] \"if Pclass >= 2 & Sex >= 1 then 0.151 (n=352) else 0.653 (n=360)\"\n",
      "[10] \"if Sex < 1 & Fare < 46.9 then 0.67 (n=182) else 0.313 (n=530)\"  \n",
      "[11] \"if Sex >= 1 & Fare < 15.6 then 0.128 (n=265) else 0.568 (n=447)\"\n",
      "[1] 0.8713187\n",
      " [1] \"Proportion of class 1 = 0.404 - Sample size n = 712\"             \n",
      " [2] \"if Sex < 1 then 0.753 (n=259) else 0.205 (n=453)\"                \n",
      " [3] \"if Pclass < 3 then 0.569 (n=357) else 0.239 (n=355)\"             \n",
      " [4] \"if Pclass < 3 & Sex < 1 then 0.943 (n=157) else 0.252 (n=555)\"   \n",
      " [5] \"if Fare < 15.6 then 0.258 (n=356) else 0.551 (n=356)\"            \n",
      " [6] \"if Parch < 1 then 0.355 (n=519) else 0.539 (n=193)\"              \n",
      " [7] \"if Sex >= 1 & Age >= 14 then 0.173 (n=416) else 0.73 (n=296)\"    \n",
      " [8] \"if Embarked < 2 then 0.363 (n=554) else 0.551 (n=158)\"           \n",
      " [9] \"if Pclass >= 2 & Sex >= 1 then 0.151 (n=352) else 0.653 (n=360)\" \n",
      "[10] \"if Sex < 1 & Fare < 46.9 then 0.67 (n=182) else 0.313 (n=530)\"   \n",
      "[11] \"if Sex >= 1 & Fare < 15.6 then 0.128 (n=265) else 0.568 (n=447)\" \n",
      "[12] \"if Pclass < 3 & Parch >= 1 then 0.735 (n=102) else 0.349 (n=610)\"\n",
      "[1] 0.872407\n"
     ]
    }
   ],
   "source": [
    "evaulate.sirus(\"titanic\", \"./datasets/titanic/train.csv\",\n",
    "               c('Pclass', 'Sex', 'Age', 'SibSp', 'Parch', 'Fare', 'Embarked'),\n",
    "               \"Survived\", c('male'= 1, 'female'=0, 'S'=1, 'C'=2, 'Q'=3), \"c\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "003f3da9",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "     Weights         Rules                                             \n",
      "[1,] \"Intercept = 0\" \"Mean of output y = 32400 - Sample size n = 1379\" \n",
      "[2,] \"1\"             \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"\n",
      "[1] 865203162\n",
      "     Weights              Rules                                               \n",
      "[1,] \"Intercept = -28100\" \"Mean of output y = 32400 - Sample size n = 1379\"   \n",
      "[2,] \"0.994\"              \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"  \n",
      "[3,] \"0.872\"              \"if race < 2 then 33400 (n=1147) else 27900 (n=232)\"\n",
      "[1] 861021784\n",
      "     Weights             \n",
      "[1,] \"Intercept = -31700\"\n",
      "[2,] \"0.808\"             \n",
      "[3,] \"0.834\"             \n",
      "[4,] \"0.334\"             \n",
      "     Rules                                                   \n",
      "[1,] \"Mean of output y = 32400 - Sample size n = 1379\"       \n",
      "[2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"      \n",
      "[3,] \"if race < 2 then 33400 (n=1147) else 27900 (n=232)\"    \n",
      "[4,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"\n",
      "[1] 856418054\n",
      "     Weights             \n",
      "[1,] \"Intercept = -64200\"\n",
      "[2,] \"0.847\"             \n",
      "[3,] \"0.616\"             \n",
      "[4,] \"0.371\"             \n",
      "[5,] \"1.14\"              \n",
      "     Rules                                                   \n",
      "[1,] \"Mean of output y = 32400 - Sample size n = 1379\"       \n",
      "[2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"      \n",
      "[3,] \"if race < 2 then 33400 (n=1147) else 27900 (n=232)\"    \n",
      "[4,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"\n",
      "[5,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"    \n",
      "[1] 804759433\n",
      "     Weights             \n",
      "[1,] \"Intercept = -87600\"\n",
      "[2,] \"0.838\"             \n",
      "[3,] \"0.627\"             \n",
      "[4,] \"0.312\"             \n",
      "[5,] \"1.06\"              \n",
      "[6,] \"0.865\"             \n",
      "     Rules                                                   \n",
      "[1,] \"Mean of output y = 32400 - Sample size n = 1379\"       \n",
      "[2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"      \n",
      "[3,] \"if race < 2 then 33400 (n=1147) else 27900 (n=232)\"    \n",
      "[4,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"\n",
      "[5,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"    \n",
      "[6,] \"if ed < 17 then 29200 (n=1229) else 58800 (n=150)\"     \n",
      "[1] 741163912\n",
      "     Weights             \n",
      "[1,] \"Intercept = -66000\"\n",
      "[2,] \"0.332\"             \n",
      "[3,] \"0.283\"             \n",
      "[4,] \"1.01\"              \n",
      "[5,] \"0.843\"             \n",
      "[6,] \"0.566\"             \n",
      "     Rules                                                         \n",
      "[1,] \"Mean of output y = 32400 - Sample size n = 1379\"             \n",
      "[2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"            \n",
      "[3,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"      \n",
      "[4,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"          \n",
      "[5,] \"if ed < 17 then 29200 (n=1229) else 58800 (n=150)\"           \n",
      "[6,] \"if sex >= 1 & race < 2 then 49000 (n=432) else 24900 (n=947)\"\n",
      "[1] 733317944\n",
      "     Weights             \n",
      "[1,] \"Intercept = -69900\"\n",
      "[2,] \"0.346\"             \n",
      "[3,] \"0.289\"             \n",
      "[4,] \"0.719\"             \n",
      "[5,] \"0.815\"             \n",
      "[6,] \"0.546\"             \n",
      "[7,] \"0.439\"             \n",
      "     Rules                                                         \n",
      "[1,] \"Mean of output y = 32400 - Sample size n = 1379\"             \n",
      "[2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"            \n",
      "[3,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"      \n",
      "[4,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"          \n",
      "[5,] \"if ed < 17 then 29200 (n=1229) else 58800 (n=150)\"           \n",
      "[6,] \"if sex >= 1 & race < 2 then 49000 (n=432) else 24900 (n=947)\"\n",
      "[7,] \"if age < 27 then 13300 (n=122) else 34300 (n=1257)\"          \n",
      "[1] 729817696\n",
      "     Weights              \n",
      "[1,] \"Intercept = -504000\"\n",
      "[2,] \"0.947\"              \n",
      "[3,] \"0.27\"               \n",
      "[4,] \"0.868\"              \n",
      "[5,] \"0.589\"              \n",
      "[6,] \"12.9\"               \n",
      "[7,] \"0.326\"              \n",
      "[8,] \"0.651\"              \n",
      "     Rules                                                          \n",
      "[1,] \"Mean of output y = 32400 - Sample size n = 1379\"              \n",
      "[2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"             \n",
      "[3,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"       \n",
      "[4,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"           \n",
      "[5,] \"if ed < 17 then 29200 (n=1229) else 58800 (n=150)\"            \n",
      "[6,] \"if sex >= 1 & race >= 2 then 31500 (n=88) else 32500 (n=1291)\"\n",
      "[7,] \"if age < 27 then 13300 (n=122) else 34300 (n=1257)\"           \n",
      "[8,] \"if ed < 14 then 24500 (n=784) else 42900 (n=595)\"             \n",
      "[1] 700171147\n",
      "      Weights              \n",
      " [1,] \"Intercept = -540000\"\n",
      " [2,] \"0.483\"              \n",
      " [3,] \"0.272\"              \n",
      " [4,] \"1.3\"                \n",
      " [5,] \"0.585\"              \n",
      " [6,] \"13.1\"               \n",
      " [7,] \"0.317\"              \n",
      " [8,] \"0.64\"               \n",
      " [9,] \"0.91\"               \n",
      "      Rules                                                          \n",
      " [1,] \"Mean of output y = 32400 - Sample size n = 1379\"              \n",
      " [2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"             \n",
      " [3,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"       \n",
      " [4,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"           \n",
      " [5,] \"if ed < 17 then 29200 (n=1229) else 58800 (n=150)\"            \n",
      " [6,] \"if sex >= 1 & race >= 2 then 31500 (n=88) else 32500 (n=1291)\"\n",
      " [7,] \"if age < 27 then 13300 (n=122) else 34300 (n=1257)\"           \n",
      " [8,] \"if ed < 14 then 24500 (n=784) else 42900 (n=595)\"             \n",
      " [9,] \"if sex < 1 & age >= 31 then 26000 (n=731) else 39800 (n=648)\" \n",
      "[1] 694404688\n",
      "      Weights              \n",
      " [1,] \"Intercept = -508000\"\n",
      " [2,] \"0.466\"              \n",
      " [3,] \"0.279\"              \n",
      " [4,] \"1.31\"               \n",
      " [5,] \"0.531\"              \n",
      " [6,] \"12.2\"               \n",
      " [7,] \"0.574\"              \n",
      " [8,] \"0.31\"               \n",
      " [9,] \"0.917\"              \n",
      "[10,] \"0.134\"              \n",
      "      Rules                                                          \n",
      " [1,] \"Mean of output y = 32400 - Sample size n = 1379\"              \n",
      " [2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"             \n",
      " [3,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"       \n",
      " [4,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"           \n",
      " [5,] \"if ed < 17 then 29200 (n=1229) else 58800 (n=150)\"            \n",
      " [6,] \"if sex >= 1 & race >= 2 then 31500 (n=88) else 32500 (n=1291)\"\n",
      " [7,] \"if ed < 14 then 24500 (n=784) else 42900 (n=595)\"             \n",
      " [8,] \"if age < 27 then 13300 (n=122) else 34300 (n=1257)\"           \n",
      " [9,] \"if sex < 1 & age >= 31 then 26000 (n=731) else 39800 (n=648)\" \n",
      "[10,] \"if ed < 16 then 27200 (n=1042) else 48600 (n=337)\"            \n",
      "[1] 693827375\n",
      "      Weights              \n",
      " [1,] \"Intercept = -358000\"\n",
      " [2,] \"0.417\"              \n",
      " [3,] \"0.00898\"            \n",
      " [4,] \"1.32\"               \n",
      " [5,] \"0.53\"               \n",
      " [6,] \"7.53\"               \n",
      " [7,] \"0.57\"               \n",
      " [8,] \"0.304\"              \n",
      " [9,] \"0.93\"               \n",
      "[10,] \"0.135\"              \n",
      "[11,] \"0.292\"              \n",
      "      Rules                                                                \n",
      " [1,] \"Mean of output y = 32400 - Sample size n = 1379\"                    \n",
      " [2,] \"if sex < 1 then 24200 (n=859) else 46000 (n=520)\"                   \n",
      " [3,] \"if height < 68.5 then 26700 (n=965) else 45900 (n=414)\"             \n",
      " [4,] \"if age < 31 then 19300 (n=246) else 35300 (n=1133)\"                 \n",
      " [5,] \"if ed < 17 then 29200 (n=1229) else 58800 (n=150)\"                  \n",
      " [6,] \"if sex >= 1 & race >= 2 then 31500 (n=88) else 32500 (n=1291)\"      \n",
      " [7,] \"if ed < 14 then 24500 (n=784) else 42900 (n=595)\"                   \n",
      " [8,] \"if age < 27 then 13300 (n=122) else 34300 (n=1257)\"                 \n",
      " [9,] \"if sex < 1 & age >= 31 then 26000 (n=731) else 39800 (n=648)\"       \n",
      "[10,] \"if ed < 16 then 27200 (n=1042) else 48600 (n=337)\"                  \n",
      "[11,] \"if height >= 68.5 & race < 2 then 48400 (n=355) else 26900 (n=1024)\"\n",
      "[1] 694089772\n"
     ]
    }
   ],
   "source": [
    "evaulate.sirus('wage', './datasets/wages_demographics/wages.csv',\n",
    "                 c('height', 'sex', 'race', 'ed', 'age'),  'earn',\n",
    "                 c('male'=1, 'female'=0, 'white'=1, 'black'=2, 'hispanic'=3, 'other'=4))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3a627a77",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "R",
   "language": "R",
   "name": "ir"
  },
  "language_info": {
   "codemirror_mode": "r",
   "file_extension": ".r",
   "mimetype": "text/x-r-source",
   "name": "R",
   "pygments_lexer": "r",
   "version": "4.2.2"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
