#
# This is a Shiny web application. You can run the application by clicking
# the 'Run App' button above.
#
# Find out more about building applications with Shiny here:
#
# http://shiny.rstudio.com/
#
library(shinythemes)
library(shiny)
library(DT)
library(data.table)
library(ggplot2)
library(shinycssloaders)
library(h2o)
# Defining Non Changing Variables
data <- fread("2020.10.01.csv")
data_na_removed <- na.omit(data)
# Encoding the Label Column
# 1 - Benign 2 - Malicious 3 - Outlier
data_encoded <- data_na_removed
data_encoded$label <- factor(data_na_removed$label,
levels = c("benign", "malicious", "outlier"),
labels = c(1, 2, 3))
data_encoded$label = as.numeric(data_encoded$label)
# Define Default Values
pch = 16
features <- c("Average Input","Incoming Bytes","Outgoing Bytes",
"Destination IP", "Destination Port", "Entropy",
"Inbound Packets", "Outbound Packets", "Protocol",
"Source IP", "Source Port", "Start Time (s)",
"End Time (s)", "Total Entropy", "Type", "Duration")
feature_variables <- c("avg_ipt", "bytes_in", "bytes_out", "dest_ip",
"dest_port", "entropy", "num_pkts_out", "num_pkts_in",
"proto", "src_ip", "src_port", "time_end", "time_start",
"total_entropy", "label", "duration")
# Define Elementary Functions
get_color <- function(a = 1) {
return(alpha("#e95420", a))
}
# Load the models
model.dl <- h2o.loadModel(dl_model)
model.drf <- h2o.loadModel(drf_model)
model.gbm <- h2o.loadModel(gbm_model)
model.nb <- h2o.loadModel(nb_model)
# Define UI for application
ui <- fluidPage(
theme = shinytheme("united"),
# Application title
titlePanel("A Comprehensive Approach To Analysis and Detection of Emerging
Threats due to Network Intrusion"),
navbarPage(
"Network Intrusion Detection Demo",
tabPanel(
icon("home"),
p("Through this application, it is intended to develop a demo of a",
strong("Network Intrusion Detection System"),
"using different Machine Learning Techniques using the
LUFlow Network Intrusion Detection Data Set. This page is intended
to display the information about the dataset."
,style="text-align:justify;color:black;
background-color:lavender;padding:15px;border-radius:10px"),
br(),
p("The data used in this application are publicly available on the",
em("LUFlow Network Intrusion Detection Data Set"), "Kaggle page.
The Data Set contains telemetry cap- tured using Cisco’s Joy tool.
This tool records multiple measurements asso- ciated with flows.
Features are engineered from these measurements, which are also
outlined below",style="text-align:justify;color:black;
background-color:papayawhip;padding:15px;border-radius:10px"),
hr(),
tags$style(".fa-database {color:#e95420}"),
h3(p(icon("database",lib = "font-awesome"),
em("Dataset Exploration "),
style="color:black;text-align:center")),
fluidRow(column(DT::dataTableOutput("renderData"),
width = 12)),
hr(),
p(em("Developed by"), br("Kumar Priyansh, Ritu Dimri,
Sandeep Perumalla, Hemanth Katikala"),
style="text-align:center; font-family: times")
),
tabPanel(
"Data Visualization",
p("This part allows you to visualize features via different types of
plots. You can select whatever features you want to plot and hit
the \"Plot Graph\" button. Please keep in mind that all plots",
strong("might not be useful"),
"and you need to select which plots you want to visualize. If you
want to save an image of the currently visualized plot, please
right click on the plot and click on the relevant",
strong("save image"),
"option."
,style="text-align:justify;color:black;
background-color:lavender;padding:15px;border-radius:10px"),
sidebarLayout(
sidebarPanel(
selectInput(
"plotType",
p("Type of plot:"),
choices = c(Histogram = "hist",
"Scatter Plot" = "scatter",
"Mosaic Plot" = "mosaic")
),
# Only show this panel if the plot type is a histogram
conditionalPanel(
condition = "input.plotType == 'hist'",
selectInput(
"plotVariable",
p("Feature to visualize:"),
choices = features
),
selectInput(
"plotVariant",
p("Plot variant:"),
choices = c("Normal", "Log 10 Scale")
)
),
# Only show this panel if the plot type is a scatter plot
conditionalPanel(
condition = "input.plotType == 'scatter'",
selectInput(
"plotVariable1",
p("First feature to visualize:"),
choices = features
),
uiOutput("secondSelection")
),
# Single Mosiac Plot for now
conditionalPanel(
condition = "input.plotType == 'mosaic'",
selectInput(
"mosaicVariable",
p("Select features to visualize:"),
choices = c("Labels vs Protocols" = "labproto")
)
),
actionButton("plot", "Plot Graph",
width = "100%", icon = icon("chart-line"),
class = "btn btn-primary")
),
mainPanel(
withSpinner(
plotOutput("selectedFeatureVariableForVisualization"),
type = 6, color = "#e95420"
)
)
)
),
tabPanel(
"Predictions",
sidebarLayout(
sidebarPanel(
selectInput(
"modelType",
p("Choose a model to predict:"),
choices = c("Deep Learning" = "dl",
"Distributed Random Forest" = "drf",
"Gradient Boosting Machine" = "gbm",
"Naive Bayes" = "nb")
),
numericInput("npin", "Number of inbound packets:",
10, min = 0),
numericInput("npob", "Number of outbound packets:",
10, min = 0),
numericInput("nbin", "Number of bytes in:",
2000, min = 0),
numericInput("nbob", "Number of bytes out:",
10000, min = 0),
numericInput("dprt", "Destination port (1024 - 49151):",
5234, min = 1024, max = 49151),
numericInput("tepy", "Total entropy:",
18000, min = 0),
actionButton("predictButton", "Predict",
width = "100%", icon = icon("think-peaks"),
class = "btn btn-primary")
),
mainPanel(
tags$label(h3('Status/Output')),
verbatimTextOutput('contents'),
fluidRow(
column(
width = 6,
p(strong("Prediction Legend"), br(), br(), em("1"),
" - Benign", br(), em("2"), " - Malicious",
br(), em("3"), " - Outlier",
style="text-align:justify;color:black;
background-color:lavender;padding:15px;border-radius:10px"),
),
column(
width = 6,
p(strong("Probabilty Legend"), br(), br(), em("p1"),
" - Probability of being a Benign Connection",
br(), em("p2"), " - Probability of being a
Malicious Connection", br(), em("p3"), " -
Probability of being an Outlier Connection",
style="text-align:justify;color:black;
background-color:papayawhip;padding:15px;border-radius:10px"),
)
),
tableOutput('tabledata'), # Prediction results table
fluidRow(
column(
width = 6,
withSpinner(
plotOutput("varImpPlot"),
type = 6, color = "#e95420"
)
),
column(
width = 6,
withSpinner(
plotOutput("lcPlot"),
type = 6, color = "#e95420"
)
)
)
)
)
),
tabPanel(
"Model Metrics",
sidebarLayout(
sidebarPanel(
selectInput(
"metricModelType",
p("Choose a model to show metrics:"),
choices = c("Deep Learning" = "dl",
"Distributed Random Forest" = "drf",
"Gradient Boosting Machine" = "gbm",
"Naive Bayes" = "nb"),
),
actionButton("metricsButton", "Show Metrics",
width = "100%", icon = icon("tachometer-alt"),
class = "btn btn-primary")
),
mainPanel(
verbatimTextOutput('metrics')
)
)
),
tabPanel(
"Model Summary",
sidebarLayout(
sidebarPanel(
selectInput(
"summaryModelType",
p("Choose a model to show metrics:"),
choices = c("Deep Learning" = "dl",
"Distributed Random Forest" = "drf",
"Gradient Boosting Machine" = "gbm",
"Naive Bayes" = "nb"),
),
actionButton("summaryButton", "Show Information",
width = "100%", icon = icon("clipboard"),
class = "btn btn-primary")
),
mainPanel(
verbatimTextOutput('summary')
)
)
)
)
)
# Define server logic
server <- function(input, output) {
output$renderData <- DT::renderDataTable(
DT::datatable({
data_na_removed
},
options = list(
initComplete = JS(
"function(settings, json) {",
"$(this.api().table().header()).css({'background-color':
'moccasin', 'color': '1c1b1b'});",
"}"),
columnDefs=list(list(className='dt-center',targets="_all"))),
style = 'bootstrap',
class = 'cell-border stripe',
rownames = FALSE,
colnames = features)
)
datasetInput <- reactive({
modelType <- input$modelType
req(input$npin)
req(input$npob)
req(input$nbin)
req(input$nbob)
req(input$dprt)
req(input$tepy)
df <- data.frame(
Name = c("num_pkts_in", "bytes_in", "num_pkts_out", "bytes_out",
"dest_port", "total_entropy"),
Value = as.character(c(input$npin, input$nbin, input$npob,
input$nbob, input$dprt, input$tepy)),
stringsAsFactors = FALSE)
labels <- 0
df <- rbind(df, labels)
input <- transpose(df)
write.table(input,"input.csv", sep=",", quote = FALSE,
row.names = FALSE, col.names = FALSE)
test <- read.csv(paste("input", ".csv", sep=""), header = TRUE)
if (modelType == "dl") {
predict(model.dl, as.h2o(test))
} else if (modelType == "drf") {
predict(model.drf, as.h2o(test))
} else if (modelType == "gbm") {
predict(model.gbm, as.h2o(test))
} else if (modelType == "nb") {
predict(model.nb, as.h2o(test))
}
})
output$varImpPlot <- renderPlot({
modelType <- input$modelType
if (modelType == "dl") {
h2o.varimp_plot(model.dl)
} else if (modelType == "drf") {
h2o.varimp_plot(model.drf)
} else if (modelType == "gbm") {
h2o.varimp_plot(model.gbm)
}
})
output$lcPlot <- renderPlot({
modelType <- input$modelType
if (modelType == "dl") {
h2o.learning_curve_plot(model.dl)
} else if (modelType == "drf") {
h2o.learning_curve_plot(model.drf)
} else if (modelType == "gbm") {
h2o.learning_curve_plot(model.gbm)
}
})
output$metrics <- renderPrint({
input$metricsButton
isolate({
modelType <- input$metricModelType
if (modelType == "dl") {
h2o.performance(model.dl)
} else if (modelType == "drf") {
h2o.performance(model.drf)
} else if (modelType == "gbm") {
h2o.performance(model.gbm)
} else {
h2o.performance(model.nb)
}
})
})
output$summary <- renderPrint({
input$summaryButton
isolate({
modelType <- input$summaryModelType
if (modelType == "dl") {
summary(model.dl)
} else if (modelType == "drf") {
summary(model.drf)
} else if (modelType == "gbm") {
summary(model.gbm)
} else {
summary(model.nb)
}
})
})
# Status/Output Text Box
output$contents <- renderPrint({
if (input$predictButton>0) {
isolate("Calculation complete.")
} else {
return("Server is ready for calculation.")
}
})
# Prediction results table
output$tabledata <- renderTable({
if (input$predictButton>0) {
isolate(datasetInput())
}
})
output$secondSelection <- renderUI({
selectedFeature <- input$plotVariable1
selectInput(
"plotVariable2",
p("Second feature to visualize:"),
choices = features[!features %in% selectedFeature]
)
})
output$selectedFeatureVariableForVisualization <- renderPlot({
input$plot
isolate({
plotType <- input$plotType
if (plotType == 'hist') {
selectedFeature <- input$plotVariable
plotVariant <- input$plotVariant
positionInFeatureArray <- which(features == selectedFeature)
selectedFeatureVariable <- feature_variables[positionInFeatureArray]
if (plotVariant == "Normal") {
hist(data_encoded[[selectedFeatureVariable]],
main = paste("Histogram Plot of", selectedFeature, sep = " ", collapse = NULL),
ylab = "Frequency", xlab = selectedFeature,
col = get_color(), pch = pch)
} else {
nonZeroSelectedFeature = data_encoded[data_encoded[[selectedFeatureVariable]] > 0]
hist(log(nonZeroSelectedFeature[[selectedFeatureVariable]]),
main = paste("Log 10 Base Histogram Plot of", selectedFeature, sep = " ", collapse = NULL),
ylab = "Frequency", xlab = selectedFeature,
col = get_color(), pch = pch)
}
} else if (plotType == 'scatter') {
firstFeature <- feature_variables[which(features ==
input$plotVariable1)]
secondFeature <- feature_variables[which(features ==
input$plotVariable2)]
try(plot(data_encoded[[firstFeature]], data_encoded[[secondFeature]],
main = paste("Scatter Plot of", input$plotVariable1,
"vs", input$plotVariable2, sep = " ", collapse = NULL),
ylab = input$plotVariable2, xlab = input$plotVariable1,
col = get_color(0.02),
pch = 16,), silent = TRUE)
} else {
selectedFeatures <- input$mosaicVariable
if (selectedFeatures == 'labproto') {
proto_label_mosaic <- table(data_encoded$proto, data_encoded$label)
mosaicplot(~ factor(proto)+factor(label, labels=c("benign","malicious","outlier")),
data = data_encoded,xlab = "Protocol", ylab = "Category",
main= "Mosaic plot of Protocol vs Category",shade = TRUE)
}
}
})
})
}
# Run the application
shinyApp(ui = ui, server = server)