{ "cells": [ { "cell_type": "code", "execution_count": 28, "metadata": { "collapsed": true }, "outputs": [], "source": [ "import pandas as pd\n", "import json\n", "from sklearn.decomposition import PCA\n", "from sklearn.cluster import KMeans\n", "import pandas as pd\n", "import numpy as np\n", "from sklearn.preprocessing import StandardScaler\n", "from sklearn import preprocessing\n", "import matplotlib.pyplot as plt" ] }, { "cell_type": "code", "execution_count": 29, "outputs": [], "source": [ "data = pd.read_json(r'../..//data/SIR_train_set.json')\n", "CVE_ID = data[\"CVE_ID\"]" ], "metadata": { "collapsed": false } }, { "cell_type": "code", "execution_count": 30, "outputs": [ { "data": { "text/plain": " baseScore impactScore exploitabilityScore severity\n0 7.5 3.6 3.9 HIGH\n1 9.8 5.9 3.9 CRITICAL\n2 7.5 3.6 3.9 HIGH\n3 8.1 5.9 2.2 HIGH\n4 8.8 5.9 2.8 HIGH\n... ... ... ... ...\n5619 7.5 3.6 3.9 HIGH\n5620 6.1 2.7 2.8 MEDIUM\n5621 6.5 3.6 2.8 MEDIUM\n5622 6.5 3.6 2.8 MEDIUM\n5623 5.4 2.7 2.3 MEDIUM\n\n[5624 rows x 4 columns]", "text/html": "
| \n | baseScore | \nimpactScore | \nexploitabilityScore | \nseverity | \n
|---|---|---|---|---|
| 0 | \n7.5 | \n3.6 | \n3.9 | \nHIGH | \n
| 1 | \n9.8 | \n5.9 | \n3.9 | \nCRITICAL | \n
| 2 | \n7.5 | \n3.6 | \n3.9 | \nHIGH | \n
| 3 | \n8.1 | \n5.9 | \n2.2 | \nHIGH | \n
| 4 | \n8.8 | \n5.9 | \n2.8 | \nHIGH | \n
| ... | \n... | \n... | \n... | \n... | \n
| 5619 | \n7.5 | \n3.6 | \n3.9 | \nHIGH | \n
| 5620 | \n6.1 | \n2.7 | \n2.8 | \nMEDIUM | \n
| 5621 | \n6.5 | \n3.6 | \n2.8 | \nMEDIUM | \n
| 5622 | \n6.5 | \n3.6 | \n2.8 | \nMEDIUM | \n
| 5623 | \n5.4 | \n2.7 | \n2.3 | \nMEDIUM | \n
5624 rows × 4 columns
\n| \n | AV | \nAC | \nPR | \nUI | \nS | \nC | \nI | \nA | \n
|---|---|---|---|---|---|---|---|---|
| 0 | \nN | \nL | \nN | \nN | \nU | \nH | \nN | \nN | \n
| 1 | \nN | \nL | \nN | \nN | \nU | \nH | \nH | \nH | \n
| 2 | \nN | \nL | \nN | \nN | \nU | \nH | \nN | \nN | \n
| 3 | \nN | \nH | \nN | \nN | \nU | \nH | \nH | \nH | \n
| 4 | \nN | \nL | \nN | \nR | \nU | \nH | \nH | \nH | \n
| ... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
| 5619 | \nN | \nL | \nN | \nN | \nU | \nN | \nN | \nH | \n
| 5620 | \nN | \nL | \nN | \nR | \nC | \nL | \nL | \nN | \n
| 5621 | \nN | \nL | \nN | \nR | \nU | \nN | \nH | \nN | \n
| 5622 | \nN | \nL | \nN | \nR | \nU | \nN | \nH | \nN | \n
| 5623 | \nN | \nL | \nL | \nR | \nC | \nL | \nL | \nN | \n
5624 rows × 8 columns
\n| \n | AV | \nAC | \nPR | \nUI | \nS | \nC | \nI | \nA | \n
|---|---|---|---|---|---|---|---|---|
| 0 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.447963 | \n0.447963 | \n
| 1 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n
| 2 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.447963 | \n0.447963 | \n
| 3 | \n0.202517 | \n0.447308 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n
| 4 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n
| ... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
| 5619 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.447963 | \n0.447963 | \n0.246931 | \n
| 5620 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.156062 | \n0.305106 | \n0.305106 | \n0.447963 | \n
| 5621 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.447963 | \n0.246931 | \n0.447963 | \n
| 5622 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.447963 | \n0.246931 | \n0.447963 | \n
| 5623 | \n0.202517 | \n0.552692 | \n0.305106 | \n0.452224 | \n0.156062 | \n0.305106 | \n0.305106 | \n0.447963 | \n
5624 rows × 8 columns
\n| \n | AV | \nAC | \nPR | \nUI | \nS | \nC | \nI | \nA | \nbaseScore | \nimpactScore | \nexploitabilityScore | \nseverity | \n
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.447963 | \n0.447963 | \n7.5 | \n3.6 | \n3.9 | \nHIGH | \n
| 1 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n9.8 | \n5.9 | \n3.9 | \nCRITICAL | \n
| 2 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.447963 | \n0.447963 | \n7.5 | \n3.6 | \n3.9 | \nHIGH | \n
| 3 | \n0.202517 | \n0.447308 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n8.1 | \n5.9 | \n2.2 | \nHIGH | \n
| 4 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n8.8 | \n5.9 | \n2.8 | \nHIGH | \n
| ... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
| 5619 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.447963 | \n0.447963 | \n0.246931 | \n7.5 | \n3.6 | \n3.9 | \nHIGH | \n
| 5620 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.156062 | \n0.305106 | \n0.305106 | \n0.447963 | \n6.1 | \n2.7 | \n2.8 | \nMEDIUM | \n
| 5621 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.447963 | \n0.246931 | \n0.447963 | \n6.5 | \n3.6 | \n2.8 | \nMEDIUM | \n
| 5622 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.447963 | \n0.246931 | \n0.447963 | \n6.5 | \n3.6 | \n2.8 | \nMEDIUM | \n
| 5623 | \n0.202517 | \n0.552692 | \n0.305106 | \n0.452224 | \n0.156062 | \n0.305106 | \n0.305106 | \n0.447963 | \n5.4 | \n2.7 | \n2.3 | \nMEDIUM | \n
5624 rows × 12 columns
\n| \n | AV | \nAC | \nPR | \nUI | \nS | \nC | \nI | \nA | \nbaseScore | \nimpactScore | \nexploitabilityScore | \nseverity | \n
|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.447963 | \n0.447963 | \n7.5 | \n3.6 | \n3.9 | \n0.149507 | \n
| 1 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n9.8 | \n5.9 | \n3.9 | \n0.290885 | \n
| 2 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.447963 | \n0.447963 | \n7.5 | \n3.6 | \n3.9 | \n0.149507 | \n
| 3 | \n0.202517 | \n0.447308 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n8.1 | \n5.9 | \n2.2 | \n0.149507 | \n
| 4 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.246931 | \n0.246931 | \n0.246931 | \n8.8 | \n5.9 | \n2.8 | \n0.149507 | \n
| ... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n... | \n
| 5619 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.547776 | \n0.843938 | \n0.447963 | \n0.447963 | \n0.246931 | \n7.5 | \n3.6 | \n3.9 | \n0.149507 | \n
| 5620 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.156062 | \n0.305106 | \n0.305106 | \n0.447963 | \n6.1 | \n2.7 | \n2.8 | \n0.374878 | \n
| 5621 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.447963 | \n0.246931 | \n0.447963 | \n6.5 | \n3.6 | \n2.8 | \n0.374878 | \n
| 5622 | \n0.202517 | \n0.552692 | \n0.447963 | \n0.452224 | \n0.843938 | \n0.447963 | \n0.246931 | \n0.447963 | \n6.5 | \n3.6 | \n2.8 | \n0.374878 | \n
| 5623 | \n0.202517 | \n0.552692 | \n0.305106 | \n0.452224 | \n0.156062 | \n0.305106 | \n0.305106 | \n0.447963 | \n5.4 | \n2.7 | \n2.3 | \n0.374878 | \n
5624 rows × 12 columns
\n| \n | 0 | \n1 | \n2 | \n
|---|---|---|---|
| 0 | \n0.013773 | \n1.328624 | \n0.647031 | \n
| 1 | \n1.539486 | \n0.577848 | \n-0.185040 | \n
| 2 | \n0.013773 | \n1.328624 | \n0.647031 | \n
| 3 | \n0.763329 | \n-1.328923 | \n0.107140 | \n
| 4 | \n1.074067 | \n-0.631252 | \n-0.089019 | \n
| 5 | \n1.073885 | \n-0.633773 | \n-0.097836 | \n
| 6 | \n0.616217 | \n-1.754719 | \n0.053234 | \n
| 7 | \n0.013862 | \n1.327285 | \n0.635674 | \n
| 8 | \n-0.889005 | \n0.561839 | \n-1.746661 | \n
| 9 | \n1.073885 | \n-0.633773 | \n-0.097836 | \n