Setup

User Defined Parameters

# Toggle for final-report rendering; read by the chunk-option setup below.
# Spelled out as TRUE because `T` is an ordinary variable that can be reassigned.
final_report <- TRUE

Toolset

# Default chunk options: echo code and show messages and warnings.
knitr::opts_chunk$set(echo = TRUE, message = TRUE, warning = TRUE)

# When rendering the final report, hide messages and warnings (code is still
# echoed). TRUE/FALSE are used instead of T/F, which can be reassigned.
if (final_report) {
  knitr::opts_chunk$set(message = FALSE, warning = FALSE)
}
library(dplyr)
library(readr)
library(DT)
library(data.table)
library(ggplot2)

Problem Analysis & My Goal

Problem Analysis

My Goal

Data Ingestion

# Load only the first 1000 rows of the input as a sample.
# NOTE(review): the file path is an empty string here — it looks like a
# template placeholder; fill in the real path before running.
raw_data <- readr::read_csv(
  file = "",
  n_max = 1000
)

# Show the first and last rows of the sample.
head(raw_data)
tail(raw_data)

Data Cleaning

# DT::datatable(head(dataset, 500)) # limited to a sample due to poor hardware

Data Transformation


Data Exploration

Exploration

Hypothesis 1

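# # Compute Decision Tree Model
# # (uses rpart() and rpart.plot(); the rpart and rpart.plot packages are not
# # loaded in the Toolset section, so load them before enabling this chunk)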
# model_dt <- rpart(koi_disposition ~ ., feats, maxdepth = 4)
# 
# # Plot tree
# rpart.plot(model_dt,
#            type = 4,
#            extra = 101,
#            under = TRUE,
#            branch = 0,
#            varlen = 0,
#            faclen = 0,
#            main = "Decision Tree | CONFIRMED versus FALSE POSITIVE",
#            box.col = c("yellow", "palegreen2")[model_dt$frame$yval])

Conclusion

Next Steps

Comments



rebordao/myrutils documentation built on May 27, 2019, 4:01 a.m.