From 0306f28a68c5abf47027ad9c4d5e3b70177daa5f Mon Sep 17 00:00:00 2001 From: nuluh Date: Tue, 3 Sep 2024 11:09:47 +0700 Subject: [PATCH] docs(notebooks): add `extract_numbers` docstring --- code/notebooks/03_feature_extraction.ipynb | 153 +++------------------ 1 file changed, 19 insertions(+), 134 deletions(-) diff --git a/code/notebooks/03_feature_extraction.ipynb b/code/notebooks/03_feature_extraction.ipynb index b21cbb2..c32d240 100644 --- a/code/notebooks/03_feature_extraction.ipynb +++ b/code/notebooks/03_feature_extraction.ipynb @@ -302,7 +302,7 @@ }, { "cell_type": "code", - "execution_count": 4, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -325,12 +325,25 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "# Define a function to extract numbers from a filename that later used as labels features\n", "def extract_numbers(filename):\n", + " '''\n", + " Extract numbers from a filename\n", + "\n", + " Parameters\n", + " ----------\n", + " filename : str\n", + " The filename to extract numbers from\n", + "\n", + " Returns\n", + " -------\n", + " list\n", + " A list of extracted numbers: [damage_number, test_number, sensor_number]\n", + " '''\n", " # Find all occurrences of one or more digits in the filename\n", " numbers = re.findall(r'\\d+', filename)\n", " # Convert the list of number strings to integers\n", @@ -372,7 +385,7 @@ "metadata": {}, "outputs": [], "source": [ - "data_dir = \"../../data/raw\"\n", + "data_dir = \"../../data/QUGS/raw\"\n", "# Extract features\n", "df1 = build_features(data_dir, sensor=1)\n", "df2 = build_features(data_dir, sensor=2)" @@ -411,145 +424,17 @@ " \n", " \n", " \n", - " Mean\n", - " Max\n", - " Peak (Pm)\n", - " Peak-to-Peak (Pk)\n", - " RMS\n", - " Variance\n", - " Standard Deviation\n", - " Power\n", - " Crest Factor\n", - " Form Factor\n", - " Pulse Indicator\n", - " Margin\n", - " Kurtosis\n", - " Skewness\n", - " label\n", - " filename\n", " \n", " \n", " \n", - " \n", - " 0\n", - " -0.075377\n", - " 1.466510\n", - " 2.254903\n", - " 3.721414\n", - " 1.037986\n", - " 1.071734\n", - " 1.091245\n", - " 1.077416\n", - " 2.172382\n", - " -13.770555\n", - " -29.914909\n", - " 2.764892\n", - " 2.817839\n", - " -0.649122\n", - " 1\n", - " D1_TEST01_1.csv\n", - " \n", - " \n", - " 1\n", - " -0.227331\n", - " 1.307743\n", - " 1.575323\n", - " 2.883067\n", - " 0.953077\n", - " 0.856677\n", - " 0.975635\n", - " 0.908357\n", - " 1.652881\n", - " -4.192466\n", - " -6.929646\n", - " 1.821195\n", - " 1.915737\n", - " 0.260070\n", - " 1\n", - " D1_TEST02_1.csv\n", - " \n", - " \n", - " 2\n", - " 0.009247\n", - " 1.139160\n", - " 1.476295\n", - " 2.615455\n", - " 0.906951\n", - " 0.822475\n", - " 0.955961\n", - " 0.822560\n", - " 1.627755\n", - " 98.077724\n", - " 159.646548\n", - " 1.868548\n", - " 1.763273\n", - " -0.503998\n", - " 1\n", - " D1_TEST03_1.csv\n", - " \n", - " \n", - " 3\n", - " 0.050242\n", - " 2.637336\n", - " 2.637336\n", - " 4.445498\n", - " 1.135680\n", - " 1.287244\n", - " 1.195939\n", - " 1.289768\n", - " 2.322254\n", - " 22.604275\n", - " 52.492866\n", - " 3.417678\n", - " 3.644127\n", - " 0.696925\n", - " 1\n", - " D1_TEST04_1.csv\n", - " \n", - " \n", - " 4\n", - " -0.063636\n", - " 1.814052\n", - " 1.814052\n", - " 3.213308\n", - " 0.919439\n", - " 0.841319\n", - " 0.966850\n", - " 0.845369\n", - " 1.972998\n", - " -14.448310\n", - " -28.506483\n", - " 2.255246\n", - " 2.633599\n", - " 0.716632\n", - " 1\n", - " D1_TEST05_1.csv\n", - " \n", " \n", "\n", "" ], "text/plain": [ - " Mean Max Peak (Pm) Peak-to-Peak (Pk) RMS Variance \\\n", - "0 -0.075377 1.466510 2.254903 3.721414 1.037986 1.071734 \n", - "1 -0.227331 1.307743 1.575323 2.883067 0.953077 0.856677 \n", - "2 0.009247 1.139160 1.476295 2.615455 0.906951 0.822475 \n", - "3 0.050242 2.637336 2.637336 4.445498 1.135680 1.287244 \n", - "4 -0.063636 1.814052 1.814052 3.213308 0.919439 0.841319 \n", - "\n", - " Standard Deviation Power Crest Factor Form Factor Pulse Indicator \\\n", - "0 1.091245 1.077416 2.172382 -13.770555 -29.914909 \n", - "1 0.975635 0.908357 1.652881 -4.192466 -6.929646 \n", - "2 0.955961 0.822560 1.627755 98.077724 159.646548 \n", - "3 1.195939 1.289768 2.322254 22.604275 52.492866 \n", - "4 0.966850 0.845369 1.972998 -14.448310 -28.506483 \n", - "\n", - " Margin Kurtosis Skewness label filename \n", - "0 2.764892 2.817839 -0.649122 1 D1_TEST01_1.csv \n", - "1 1.821195 1.915737 0.260070 1 D1_TEST02_1.csv \n", - "2 1.868548 1.763273 -0.503998 1 D1_TEST03_1.csv \n", - "3 3.417678 3.644127 0.696925 1 D1_TEST04_1.csv \n", - "4 2.255246 2.633599 0.716632 1 D1_TEST05_1.csv " + "Empty DataFrame\n", + "Columns: []\n", + "Index: []" ] }, "execution_count": 7,