Ad2Play - Evaluation

Files

data/digital_twins.json structures both the Siemens and Cisco digital twins.
data/pattern.json defines relevant matching terms.
data/csaf.json stores the converted CSAF documents.
data/cacao.json holds the generated CACAO playbooks.
evaluation.csv provides the summary for the evaluation.

Imports

import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
from pywaffle import Waffle
import plotly.express as px
import matplotlib.patches as mpatches

from matplotlib import rc

User Definitions

# Global seaborn font scaling for every plot drawn afterwards
sns.set(font_scale=1.4)

# Per-source totals; each is later passed as the population size of that
# source's confusion matrix, and their sum is used for the overall matrix.
sentences_siemens = 220
sentences_cisa = 705
sentences_cisco = 136
sentences = sum((sentences_siemens, sentences_cisa, sentences_cisco))

def plot_confusion_matrix(source, df_tasks, sentences):
    """Plot, save and show the confusion matrix for one advisory source.

    Args:
        source: Value of the ``source`` column selecting the rows to evaluate.
        df_tasks: DataFrame providing the columns ``source``,
            ``useless_steps``, ``actions_missing``, ``detected_actions``,
            ``matched_wrong_pattern`` and ``nlp_error``.
        sentences: Population size; the true negatives are whatever remains
            after subtracting TP, FP and FN from it.

    The figure is written to ``./charts/confusion_matrix_<source>.pdf`` and
    then displayed with ``plt.show()``.
    """
    # Filter the rows of this source once instead of rebuilding the boolean
    # mask for every column.
    rows = df_tasks.loc[df_tasks['source'] == source]

    fp = rows['useless_steps'].sum()
    fn = rows['actions_missing'].sum()
    # Detected actions that were useless, matched the wrong pattern or came
    # from an NLP error do not count as true positives.
    tp = (rows['detected_actions'].sum() - fp
          - rows['matched_wrong_pattern'].sum() - rows['nlp_error'].sum())
    tn = sentences - fp - fn - tp

    # All four metrics are expressed in percent.
    accuracy = (tp + tn) / (tp + fn + tn + fp) * 100
    precision = tp / (tp + fp) * 100
    recall = tp / (tp + fn) * 100
    f1_score = (2 * precision * recall) / (precision + recall)

    # Rows are predicted classes, columns are actual classes.
    ax = sns.heatmap([[tp, fp], [fn, tn]], cbar=False, annot=True, cmap='binary', fmt='.4g', alpha=0.7)

    stats = "\n\nAccuracy = {:0.2f}%        Precision = {:0.2f}%\nRecall = {:0.2f}%             F1 Score = {:0.2f}%".format(
        accuracy, precision, recall, f1_score)
    ax.text(0.0, 2.5, stats, fontsize=17)
    ax.set_xlabel('Actual Actions\n', fontdict=dict(weight='bold'))
    ax.set_ylabel('Predicted Actions\n', fontdict=dict(weight='bold'))

    # The first four texts on the axes are the heatmap annotations in
    # row-major order; tag each with the cell it represents. The stats text
    # added above comes after them and is left untouched by zip().
    for cell_text, tag in zip(ax.texts, ("(TP)", "(FP)", "(FN)", "(TN)")):
        cell_text.set_text(cell_text.get_text() + "\n" + tag)

    # Tick labels: the order must match the matrix layout [[TP, FP], [FN, TN]]
    ax.xaxis.set_ticklabels(['Positive', 'Negative'])
    ax.yaxis.set_ticklabels(['Positive', 'Negative'])
    ax.xaxis.set_label_position('top')
    ax.xaxis.tick_top()
    ax.yaxis.set_label_position('left')
    ax.yaxis.tick_left()

    plt.savefig(f'./charts/confusion_matrix_{source}.pdf', dpi=200, bbox_inches="tight")
    plt.show()

Import CSV

# Load the semicolon-separated evaluation summary
df_tasks = pd.read_csv("evaluation.csv", sep=";")
# Preview the first rows (shown as the cell output)
df_tasks.head()

	task_id	csaf_id	playbook_id	twin	source	manual	detected_actions	actual_actions	actions_missing	missing_actions	...	update_step	access_action_step	system_action_step	traffic_action_step
0	62c3f0af99cf253386589061	62c3f0af99cf253386588bb0	62c44b404466fa24127b09c9	Ad2Play:Mock_Siemens	Siemens ProductCERT	False	5	5	0	NaN	...	3	0	1	1
1	62c3f0af99cf253386588bae	62c3f0af99cf253386588945	62c44b404466fa24127b0858	Ad2Play:Mock_Siemens	Siemens ProductCERT	False	2	2	0	NaN	...	2	0	0	0
2	62c3f0af99cf253386588943	62c3f0af99cf253386588527	62c44b404466fa24127b079d	Ad2Play:Mock_Siemens	Siemens ProductCERT	False	3	3	0	NaN	...	1	0	1	1
3	62c3f0af99cf253386588525	62c3f0af99cf253386588485	62c44b3f4466fa24127b0652	Ad2Play:Mock_Siemens	Siemens ProductCERT	False	4	4	0	NaN	...	2	0	2	0
4	62c3f0af99cf253386588483	62c3f0af99cf2533865882e7	62c44b3f4466fa24127b05f6	Ad2Play:Mock_Siemens	Siemens ProductCERT	False	5	8	3	Update to V4.8 HF6; Deactivate the webserver ...	...	4	1	0	0

5 rows × 25 columns

CERT Quality

Advisories and Actions by CERT

# Render figure text through LaTeX
rc('text', usetex=True)

# One boolean row mask per advisory source
from_siemens = df_tasks['source'] == "Siemens ProductCERT"
from_cisa = df_tasks['source'] == "CISA ICS CERT"
from_cisco = df_tasks['source'] == "Cisco Security Advisory"

# Sum of detected actions per source
siemens_actions = df_tasks.loc[from_siemens, 'detected_actions'].sum()
cisa_actions = df_tasks.loc[from_cisa, 'detected_actions'].sum()
cisco_actions = df_tasks.loc[from_cisco, 'detected_actions'].sum()

# Number of rows (advisories) per source
siemens_advisories = df_tasks.loc[from_siemens, 'source'].count()
cisa_advisories = df_tasks.loc[from_cisa, 'source'].count()
cisco_advisories = df_tasks.loc[from_cisco, 'source'].count()

# Pie-chart inputs, ordered Siemens, CISA, Cisco
advisories = [siemens_advisories, cisa_advisories, cisco_advisories]
actions = [siemens_actions, cisa_actions, cisco_actions]

# Legend labels and wedge colours, in the same order as the lists above
mylabels = ["Siemens ProductCERT", "CISA ICS CERT", "Cisco CERT"]
mycolors = ["#555555", "#BBBBBB", "#beb9db"]

# Define autopct format for pie charts
def autopct_format(values):
    """Build an ``autopct`` callback that labels pie wedges with absolute counts.

    Args:
        values: Iterable of the numbers that are plotted in the pie chart.

    Returns:
        A function that maps a wedge percentage to the corresponding absolute
        value, rounded to the nearest integer and formatted as a decimal
        string.
    """
    # Sum once up front: the total is the same for every wedge, and a
    # one-shot iterable would otherwise be exhausted after the first label.
    total = sum(values)

    def my_format(pct):
        val = int(round(pct * total / 100.0))
        return f'{val:d}'
    return my_format

# Two stacked axes: advisories on top, actions below
fig, axs = plt.subplots(2, figsize=(4,7))

# Draw both pies; wedges are labelled with absolute counts, not percentages
for pie_ax, pie_values, pie_title in zip(
    axs,
    (advisories, actions),
    (r"\textbf{Advisories}", r"\textbf{Actions}"),
):
    pie_ax.pie(pie_values, autopct=autopct_format(pie_values), pctdistance=1.15, colors=mycolors)
    pie_ax.set_title(pie_title)

# Legend positioned in figure coordinates, with a fully transparent frame
legend = plt.legend(mylabels, bbox_to_anchor=(0.9, 0.1), fontsize=17,
                    bbox_transform=plt.gcf().transFigure, frameon=False)
legend_frame = legend.get_frame()
legend_frame.set_alpha(None)
legend_frame.set_facecolor((0, 0, 0, 0))

# Display first, then persist the same figure object as a PDF
plt.show()

fig.savefig('./charts/actions.pdf', dpi=200, bbox_inches="tight")

Categorization of Actions

import matplotlib.pyplot as plt
from pywaffle import Waffle

# Map every legend category to the step-count column it is summed from
step_columns = {
    "Update": "update_step",
    "Investigation": "investigation_step",
    "Locating": "locating_step",
    "Data-Operation": "data_operation_step",
    "Isolation": "isolation_step",
    "Privileges": "access_action_step",
    "System": "system_action_step",
    "Configuration": "set_entity_step",
    "Network": "traffic_action_step",
    "Observation": "observe_behavior_step",
}
data = {category: df_tasks[column].sum() for category, column in step_columns.items()}

# Largest category first
data = dict(sorted(data.items(), key=lambda item: item[1], reverse=True))

# Waffle layout and one colour per category
nRows = 15
colors = ["#BBBBBB", "#7eb0d5",  "#8bd3c7", "#bd7ebe", "#ffb55a", "#555555", "#beb9db", "#fdcce5",  "#888888","#b2e061"]

# Grand total across all categories
total = sum(data.values())

# Legend entries carry each category's share of the total; an exact zero is
# printed without decimals, everything else with one decimal place.
legend_labels = []
for category, count in data.items():
    share = (count / total) * 100
    label = f"{category} ({share:.1f}%)" if share != 0 else f"{category} ({share:.0f}%)"
    legend_labels.append(label)

# Create the Waffle chart with modified legend labels.
# `values=data` supplies one entry per category and `colors` one colour per
# entry; the legend is placed below the chart in five columns with a
# transparent frame and bold text.
fig = plt.figure(
    FigureClass=Waffle,
    rows=nRows,
    colors=colors,
    figsize=(16, 17),
    values=data,
    legend={
        "loc": "upper left",
        "bbox_to_anchor": (0, -0.05),
        "ncol": 5,
        "framealpha": 0,
        "labels": legend_labels,
        "prop": {"weight": "bold"},
    },
)

# Show the chart
plt.show()

# Save the chart to a file
# NOTE(review): TeX rendering is switched off only here, after the figure has
# already been created and shown with the earlier rc('text', usetex=True)
# still active, while the legend labels contain '%'. Whether this late switch
# affects the saved PDF presumably depends on the matplotlib version - confirm
# the ordering is intentional.
plt.rc("text", usetex=False)
fig.savefig("./charts/action_types.pdf", dpi=200, bbox_inches="tight")

Playbook Quality

Confusion Matrix for Siemens ProductCERT

# Evaluate the Siemens ProductCERT rows against the Siemens sentence count
plot_confusion_matrix("Siemens ProductCERT", df_tasks, sentences_siemens)

Confusion Matrix for Cisco Security Advisory

# Evaluate the Cisco rows against the Cisco sentence count. Passing the
# Siemens count here would distort the true negatives and the accuracy.
plot_confusion_matrix('Cisco Security Advisory', df_tasks, sentences_cisco)

Confusion Matrix for CISA ICS CERT

# Evaluate the CISA ICS CERT rows against the CISA sentence count
plot_confusion_matrix("CISA ICS CERT", df_tasks, sentences_cisa)

Confusion Matrix CERT Summary

# Confusion matrix over all sources combined.
# Calculate the values for true positive (tp), false positive (fp),
# false negative (fn), and true negative (tn).
fp = df_tasks['useless_steps'].sum()
fn = df_tasks['actions_missing'].sum()
# Detected actions that were useless, matched the wrong pattern or came from
# an NLP error do not count as true positives.
tp = df_tasks['detected_actions'].sum() - fp - df_tasks['matched_wrong_pattern'].sum() - df_tasks['nlp_error'].sum()
tn = sentences - fp - fn - tp

# Calculate the accuracy, precision, recall, and f1 score (all in percent)
total = tp + fn + tn + fp
accuracy = (tp + tn) / total * 100
precision = tp / (tp + fp) * 100
recall = tp / (tp + fn) * 100
f1_score = (2 * precision * recall) / (precision + recall)

# Create a heatmap of the confusion matrix (rows: predicted, columns: actual)
confusion_matrix = [[tp, fp], [fn, tn]]
ax = sns.heatmap(confusion_matrix, cbar=False, annot=True, cmap='binary', fmt='.4g', alpha=0.7)

# Add text to the heatmap with the accuracy, precision, recall, and f1 score
stats = "\n\nAccuracy = {:0.2f}%        Precision = {:0.2f}%\nRecall = {:0.2f}%             F1 Score = {:0.2f}%".format(
    accuracy, precision, recall, f1_score)
ax.text(0.0, 2.5, stats, fontsize=17)

# Set the x and y labels and tick labels; the tick order must match the
# matrix layout [[TP, FP], [FN, TN]]
ax.set_xlabel('Actual Actions\n', fontdict=dict(weight='bold'))
ax.set_ylabel('Predicted Actions\n', fontdict=dict(weight='bold'))
ax.xaxis.set_ticklabels(['Positive', 'Negative'])
ax.yaxis.set_ticklabels(['Positive', 'Negative'])
ax.xaxis.set_label_position('top')
ax.xaxis.tick_top()
ax.yaxis.set_label_position('left')
ax.yaxis.tick_left()

# Add labels to the cells of the heatmap: the first four texts on the axes
# are the annotations in row-major order; the stats text follows them and is
# left untouched by zip().
for cell_text, tag in zip(ax.texts, ("(TP)", "(FP)", "(FN)", "(TN)")):
    cell_text.set_text(cell_text.get_text() + "\n" + tag)

# Save the plot as a PDF file
plt.savefig('./charts/confusion_matrix_total.pdf', dpi=200, bbox_inches="tight")

Name		Name	Last commit message	Last commit date
Latest commit History 7 Commits
charts		charts
data		data
resources		resources
.gitignore		.gitignore
README.md		README.md
evaluation.csv		evaluation.csv
evaluation.ipynb		evaluation.ipynb

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Repository files navigation

Ad2Play - Evaluation

Files

Imports

User Definitions

Import CSV

CERT Quality

Advisories and Actions by CERT

Categorization of Actions

Playbook Quality

Confusion Matrix for Siemens ProductCERT

Confusion Matrix for Cisco Security Advisory

Confusion Matrix for CISA ICS CERT

Confusion Matrix CERT Summary

About

Uh oh!

Releases

Packages

Languages

kabulkurniawan/evaluation

Folders and files

Latest commit

History

Repository files navigation

Ad2Play - Evaluation

Files

Imports

User Definitions

Import CSV

CERT Quality

Advisories and Actions by CERT

Categorization of Actions

Playbook Quality

Confusion Matrix for Siemens ProductCERT

Confusion Matrix for Cisco Security Advisory

Confusion Matrix for CISA ICS CERT

Confusion Matrix CERT Summary

About

Resources

Uh oh!

Stars

Watchers

Forks

Releases

Packages 0

Languages

Packages