diff --git a/code/notebooks/03_feature_extraction.ipynb b/code/notebooks/03_feature_extraction.ipynb
index b21cbb2..c32d240 100644
--- a/code/notebooks/03_feature_extraction.ipynb
+++ b/code/notebooks/03_feature_extraction.ipynb
@@ -302,7 +302,7 @@
},
{
"cell_type": "code",
- "execution_count": 4,
+ "execution_count": 5,
"metadata": {},
"outputs": [],
"source": [
@@ -325,12 +325,25 @@
},
{
"cell_type": "code",
- "execution_count": 5,
+ "execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"# Define a function to extract numbers from a filename that later used as labels features\n",
"def extract_numbers(filename):\n",
+ " '''\n",
+ " Extract numbers from a filename\n",
+ "\n",
+ " Parameters\n",
+ " ----------\n",
+ " filename : str\n",
+ " The filename to extract numbers from\n",
+ "\n",
+ " Returns\n",
+ " -------\n",
+ " list\n",
+ " A list of extracted numbers: [damage_number, test_number, sensor_number]\n",
+ " '''\n",
" # Find all occurrences of one or more digits in the filename\n",
" numbers = re.findall(r'\\d+', filename)\n",
" # Convert the list of number strings to integers\n",
@@ -372,7 +385,7 @@
"metadata": {},
"outputs": [],
"source": [
- "data_dir = \"../../data/raw\"\n",
+ "data_dir = \"../../data/QUGS/raw\"\n",
"# Extract features\n",
"df1 = build_features(data_dir, sensor=1)\n",
"df2 = build_features(data_dir, sensor=2)"
@@ -411,145 +424,17 @@
" \n",
" \n",
" | \n",
- " Mean | \n",
- " Max | \n",
- " Peak (Pm) | \n",
- " Peak-to-Peak (Pk) | \n",
- " RMS | \n",
- " Variance | \n",
- " Standard Deviation | \n",
- " Power | \n",
- " Crest Factor | \n",
- " Form Factor | \n",
- " Pulse Indicator | \n",
- " Margin | \n",
- " Kurtosis | \n",
- " Skewness | \n",
- " label | \n",
- " filename | \n",
"
\n",
" \n",
"
\n",
- " \n",
- " | 0 | \n",
- " -0.075377 | \n",
- " 1.466510 | \n",
- " 2.254903 | \n",
- " 3.721414 | \n",
- " 1.037986 | \n",
- " 1.071734 | \n",
- " 1.091245 | \n",
- " 1.077416 | \n",
- " 2.172382 | \n",
- " -13.770555 | \n",
- " -29.914909 | \n",
- " 2.764892 | \n",
- " 2.817839 | \n",
- " -0.649122 | \n",
- " 1 | \n",
- " D1_TEST01_1.csv | \n",
- "
\n",
- " \n",
- " | 1 | \n",
- " -0.227331 | \n",
- " 1.307743 | \n",
- " 1.575323 | \n",
- " 2.883067 | \n",
- " 0.953077 | \n",
- " 0.856677 | \n",
- " 0.975635 | \n",
- " 0.908357 | \n",
- " 1.652881 | \n",
- " -4.192466 | \n",
- " -6.929646 | \n",
- " 1.821195 | \n",
- " 1.915737 | \n",
- " 0.260070 | \n",
- " 1 | \n",
- " D1_TEST02_1.csv | \n",
- "
\n",
- " \n",
- " | 2 | \n",
- " 0.009247 | \n",
- " 1.139160 | \n",
- " 1.476295 | \n",
- " 2.615455 | \n",
- " 0.906951 | \n",
- " 0.822475 | \n",
- " 0.955961 | \n",
- " 0.822560 | \n",
- " 1.627755 | \n",
- " 98.077724 | \n",
- " 159.646548 | \n",
- " 1.868548 | \n",
- " 1.763273 | \n",
- " -0.503998 | \n",
- " 1 | \n",
- " D1_TEST03_1.csv | \n",
- "
\n",
- " \n",
- " | 3 | \n",
- " 0.050242 | \n",
- " 2.637336 | \n",
- " 2.637336 | \n",
- " 4.445498 | \n",
- " 1.135680 | \n",
- " 1.287244 | \n",
- " 1.195939 | \n",
- " 1.289768 | \n",
- " 2.322254 | \n",
- " 22.604275 | \n",
- " 52.492866 | \n",
- " 3.417678 | \n",
- " 3.644127 | \n",
- " 0.696925 | \n",
- " 1 | \n",
- " D1_TEST04_1.csv | \n",
- "
\n",
- " \n",
- " | 4 | \n",
- " -0.063636 | \n",
- " 1.814052 | \n",
- " 1.814052 | \n",
- " 3.213308 | \n",
- " 0.919439 | \n",
- " 0.841319 | \n",
- " 0.966850 | \n",
- " 0.845369 | \n",
- " 1.972998 | \n",
- " -14.448310 | \n",
- " -28.506483 | \n",
- " 2.255246 | \n",
- " 2.633599 | \n",
- " 0.716632 | \n",
- " 1 | \n",
- " D1_TEST05_1.csv | \n",
- "
\n",
" \n",
"\n",
""
],
"text/plain": [
- " Mean Max Peak (Pm) Peak-to-Peak (Pk) RMS Variance \\\n",
- "0 -0.075377 1.466510 2.254903 3.721414 1.037986 1.071734 \n",
- "1 -0.227331 1.307743 1.575323 2.883067 0.953077 0.856677 \n",
- "2 0.009247 1.139160 1.476295 2.615455 0.906951 0.822475 \n",
- "3 0.050242 2.637336 2.637336 4.445498 1.135680 1.287244 \n",
- "4 -0.063636 1.814052 1.814052 3.213308 0.919439 0.841319 \n",
- "\n",
- " Standard Deviation Power Crest Factor Form Factor Pulse Indicator \\\n",
- "0 1.091245 1.077416 2.172382 -13.770555 -29.914909 \n",
- "1 0.975635 0.908357 1.652881 -4.192466 -6.929646 \n",
- "2 0.955961 0.822560 1.627755 98.077724 159.646548 \n",
- "3 1.195939 1.289768 2.322254 22.604275 52.492866 \n",
- "4 0.966850 0.845369 1.972998 -14.448310 -28.506483 \n",
- "\n",
- " Margin Kurtosis Skewness label filename \n",
- "0 2.764892 2.817839 -0.649122 1 D1_TEST01_1.csv \n",
- "1 1.821195 1.915737 0.260070 1 D1_TEST02_1.csv \n",
- "2 1.868548 1.763273 -0.503998 1 D1_TEST03_1.csv \n",
- "3 3.417678 3.644127 0.696925 1 D1_TEST04_1.csv \n",
- "4 2.255246 2.633599 0.716632 1 D1_TEST05_1.csv "
+ "Empty DataFrame\n",
+ "Columns: []\n",
+ "Index: []"
]
},
"execution_count": 7,