Resolve issue #21: use raw-string regex patterns in clean_text_round1 to fix the invalid-escape-sequence SyntaxWarning

Ahtisham-1214 · Ahtisham-1214 · commit fd672fc28de3 · 2025-10-10T09:55:08.000+05:00
diff --git a/1-Data-Cleaning.ipynb b/1-Data-Cleaning.ipynb
@@ -132,11 +132,23 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "metadata": {
     "collapsed": true
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "ename": "NameError",
+     "evalue": "name 'comedians' is not defined",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[1;31mNameError\u001b[0m                                 Traceback (most recent call last)",
+      "Cell \u001b[1;32mIn[1], line 3\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[38;5;66;03m# Load pickled files\u001b[39;00m\n\u001b[0;32m      2\u001b[0m data \u001b[38;5;241m=\u001b[39m {}\n\u001b[1;32m----> 3\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m i, c \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28menumerate\u001b[39m(\u001b[43mcomedians\u001b[49m):\n\u001b[0;32m      4\u001b[0m     \u001b[38;5;28;01mwith\u001b[39;00m \u001b[38;5;28mopen\u001b[39m(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mtranscripts/\u001b[39m\u001b[38;5;124m\"\u001b[39m \u001b[38;5;241m+\u001b[39m c \u001b[38;5;241m+\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m.txt\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mrb\u001b[39m\u001b[38;5;124m\"\u001b[39m) \u001b[38;5;28;01mas\u001b[39;00m file:\n\u001b[0;32m      5\u001b[0m         data[c] \u001b[38;5;241m=\u001b[39m pickle\u001b[38;5;241m.\u001b[39mload(file)\n",
+      "\u001b[1;31mNameError\u001b[0m: name 'comedians' is not defined"
+     ]
+    }
+   ],
    "source": [
     "# Load pickled files\n",
     "data = {}\n",
@@ -284,9 +296,9 @@
     "def clean_text_round1(text):\n",
     "    '''Make text lowercase, remove text in square brackets, remove punctuation and remove words containing numbers.'''\n",
     "    text = text.lower()\n",
-    "    text = re.sub('\\[.*?\\]', '', text)\n",
-    "    text = re.sub('[%s]' % re.escape(string.punctuation), '', text)\n",
-    "    text = re.sub('\\w*\\d\\w*', '', text)\n",
+    "    text = re.sub(r'\\[.*?\\]', '', text)\n",
+    "    text = re.sub(r'[%s]' % re.escape(string.punctuation), '', text)\n",
+    "    text = re.sub(r'\\w*\\d\\w*', '', text)\n",
     "    return text\n",
     "\n",
     "round1 = lambda x: clean_text_round1(x)"
@@ -508,7 +520,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.6.2"
+   "version": "3.12.2"
   },
   "toc": {
    "nav_menu": {},