 36 |  36 |   {
 37 |  37 |   "cell_type": "code",
 38 |  38 |   "execution_count": null,
 39 |     | - "outputs": [],
 40 |     | - "source": [
 41 |     | - "katib_python_sdk = \"kubeflow-katib\""
 42 |     | - ],
    |  39 | + "id": "1fedadf1",
 43 |  40 |   "metadata": {
 44 |  41 |   "collapsed": false,
    |  42 | + "editable": true,
    |  43 | + "jupyter": {
    |  44 | + "outputs_hidden": false
    |  45 | + },
 45 |  46 |   "pycharm": {
 46 |  47 |   "name": "#%%\n"
 47 |     | - }
 48 |     | - }
 49 |     | - },
 50 |     | - {
 51 |     | - "cell_type": "code",
 52 |     | - "execution_count": null,
    |  48 | + },
    |  49 | + "slideshow": {
    |  50 | + "slide_type": ""
    |  51 | + },
    |  52 | + "tags": [
    |  53 | + "parameters"
    |  54 | + ]
    |  55 | + },
 53 |  56 |   "outputs": [],
 54 |  57 |   "source": [
 55 |     | - "!pip install {katib_python_sdk}\n",
 56 |     | - "!pip install tensorflow\n",
 57 |     | - "!pip install kubeflow-training"
 58 |     | - ],
 59 |     | - "metadata": {
 60 |     | - "collapsed": false,
 61 |     | - "pycharm": {
 62 |     | - "name": "#%%\n"
 63 |     | - }
 64 |     | - }
    |  58 | + "katib_python_sdk = \"kubeflow-katib\"\n",
    |  59 | + "namespace = \"default\" "
    |  60 | + ]
 65 |  61 |   },
 66 |  62 |   {
 67 |  63 |   "cell_type": "code",
 68 |  64 |   "execution_count": null,
 69 |     | - "id": "5de885ca-e96a-4d59-9e78-75f6fc6f5ce7",
    |  65 | + "id": "518cfe2d",
 70 |  66 |   "metadata": {
 71 |     | - "editable": true,
    |  67 | + "collapsed": false,
    |  68 | + "jupyter": {
    |  69 | + "outputs_hidden": false
    |  70 | + },
 72 |  71 |   "pycharm": {
 73 |  72 |   "name": "#%%\n"
 74 |     | - },
 75 |     | - "slideshow": {
 76 |     | - "slide_type": ""
 77 |     | - },
 78 |     | - "tags": []
    |  73 | + }
 79 |  74 |   },
 80 |  75 |   "outputs": [],
 81 |  76 |   "source": [
  …
 87 |  82 |   {
 88 |  83 |   "cell_type": "code",
 89 |  84 |   "execution_count": null,
 90 |     | - "id": "15ea90f2-ad99-4bf4-ae07-cc35bcbe6884",
    |  85 | + "id": "7211d9e4",
 91 |  86 |   "metadata": {
    |  87 | + "collapsed": false,
 92 |  88 |   "editable": true,
    |  89 | + "jupyter": {
    |  90 | + "outputs_hidden": false
    |  91 | + },
 93 |  92 |   "pycharm": {
 94 |  93 |   "name": "#%%\n"
 95 |  94 |   },
 96 |  95 |   "slideshow": {
 97 |  96 |   "slide_type": ""
 98 |  97 |   },
 99 |     | - "tags": [
100 |     | - "parameters"
101 |     | - ]
    |  98 | + "tags": []
102 |  99 |   },
103 | 100 |   "outputs": [],
104 | 101 |   "source": [
105 |     | - "# Experiment namespace\n",
106 |     | - "namespace = \"default\" "
    | 102 | + "!pip install {katib_python_sdk}\n",
    | 103 | + "!pip install tensorflow\n",
    | 104 | + "!pip install kubeflow-training"
107 | 105 |   ]
108 | 106 |   },
109 | 107 |   {
110 | 108 |   "cell_type": "markdown",
111 |     | - "id": "881aae2f-d08e-4439-bef9-1684ff87556d",
112 |     | - "metadata": {
113 |     | - "pycharm": {
114 |     | - "name": "#%% md\n"
115 |     | - },
116 |     | - "tags": []
117 |     | - },
118 | 109 |   "source": [
119 | 110 |   "## Create Train Script for CNN Model\n",
120 | 111 |   "\n",
121 | 112 |   "This is simple **Convolutional Neural Network (CNN)** model for recognizing hand-written digits using [MNIST Dataset](http://yann.lecun.com/exdb/mnist/). "
122 |     | - ]
123 |     | - },
124 |     | - {
125 |     | - "cell_type": "code",
126 |     | - "execution_count": 1,
127 |     | - "id": "98a77484-cee4-4d77-bd76-915c469a242b",
    | 113 | + ],
128 | 114 |   "metadata": {
129 |     | - "editable": true,
130 |     | - "execution": {
131 |     | - "iopub.execute_input": "2022-09-12T18:46:59.051290Z",
132 |     | - "iopub.status.busy": "2022-09-12T18:46:59.050544Z",
133 |     | - "iopub.status.idle": "2022-09-12T18:46:59.249456Z",
134 |     | - "shell.execute_reply": "2022-09-12T18:46:59.248292Z",
135 |     | - "shell.execute_reply.started": "2022-09-12T18:46:59.051211Z"
136 |     | - },
    | 115 | + "collapsed": false,
137 | 116 |   "pycharm": {
138 |     | - "name": "#%%\n"
139 |     | - },
140 |     | - "slideshow": {
141 |     | - "slide_type": ""
142 |     | - },
143 |     | - "tags": []
144 |     | - },
145 |     | - "outputs": [],
146 |     | - "source": [
147 |     | - "def train_mnist_model(parameters):\n",
148 |     | - "    import tensorflow as tf\n",
149 |     | - "    import numpy as np\n",
150 |     | - "    import logging\n",
151 |     | - "\n",
152 |     | - "    logging.basicConfig(\n",
153 |     | - "        format=\"%(asctime)s %(levelname)-8s %(message)s\",\n",
154 |     | - "        datefmt=\"%Y-%m-%dT%H:%M:%SZ\",\n",
155 |     | - "        level=logging.INFO,\n",
156 |     | - "    )\n",
157 |     | - "    logging.info(\"--------------------------------------------------------------------------------------\")\n",
158 |     | - "    logging.info(f\"Input Parameters: {parameters}\")\n",
159 |     | - "    logging.info(\"--------------------------------------------------------------------------------------\\n\\n\")\n",
160 |     | - "\n",
161 |     | - "\n",
162 |     | - "    # Get HyperParameters from the input params dict.\n",
163 |     | - "    lr = float(parameters[\"lr\"])\n",
164 |     | - "    num_epoch = int(parameters[\"num_epoch\"])\n",
165 |     | - "\n",
166 |     | - "    # Set dist parameters and strategy.\n",
167 |     | - "    is_dist = parameters[\"is_dist\"]\n",
168 |     | - "    num_workers = parameters[\"num_workers\"]\n",
169 |     | - "    batch_size_per_worker = 64\n",
170 |     | - "    batch_size_global = batch_size_per_worker * num_workers\n",
171 |     | - "    strategy = tf.distribute.MultiWorkerMirroredStrategy(\n",
172 |     | - "        communication_options=tf.distribute.experimental.CommunicationOptions(\n",
173 |     | - "            implementation=tf.distribute.experimental.CollectiveCommunication.RING\n",
174 |     | - "        )\n",
175 |     | - "    )\n",
176 |     | - "\n",
177 |     | - "    # Callback class for logging training.\n",
178 |     | - "    # Katib parses metrics in this format: <metric-name>=<metric-value>.\n",
179 |     | - "    class CustomCallback(tf.keras.callbacks.Callback):\n",
180 |     | - "        def on_epoch_end(self, epoch, logs=None):\n",
181 |     | - "            logging.info(\n",
182 |     | - "                \"Epoch {}/{}. accuracy={:.4f} - loss={:.4f}\".format(\n",
183 |     | - "                    epoch+1, num_epoch, logs[\"accuracy\"], logs[\"loss\"]\n",
184 |     | - "                )\n",
185 |     | - "            )\n",
186 |     | - "\n",
187 |     | - "    # Prepare MNIST Dataset.\n",
188 |     | - "    def mnist_dataset(batch_size):\n",
189 |     | - "        (x_train, y_train), _ = tf.keras.datasets.mnist.load_data()\n",
190 |     | - "        x_train = x_train / np.float32(255)\n",
191 |     | - "        y_train = y_train.astype(np.int64)\n",
192 |     | - "        train_dataset = (\n",
193 |     | - "            tf.data.Dataset.from_tensor_slices((x_train, y_train))\n",
194 |     | - "            .shuffle(60000)\n",
195 |     | - "            .repeat()\n",
196 |     | - "            .batch(batch_size)\n",
197 |     | - "        )\n",
198 |     | - "        return train_dataset\n",
199 |     | - "\n",
200 |     | - "    # Build and compile CNN Model.\n",
201 |     | - "    def build_and_compile_cnn_model():\n",
202 |     | - "        model = tf.keras.Sequential(\n",
203 |     | - "            [\n",
204 |     | - "                tf.keras.layers.InputLayer(input_shape=(28, 28)),\n",
205 |     | - "                tf.keras.layers.Reshape(target_shape=(28, 28, 1)),\n",
206 |     | - "                tf.keras.layers.Conv2D(32, 3, activation=\"relu\"),\n",
207 |     | - "                tf.keras.layers.Flatten(),\n",
208 |     | - "                tf.keras.layers.Dense(128, activation=\"relu\"),\n",
209 |     | - "                tf.keras.layers.Dense(10),\n",
210 |     | - "            ]\n",
211 |     | - "        )\n",
212 |     | - "        model.compile(\n",
213 |     | - "            loss=tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True),\n",
214 |     | - "            optimizer=tf.keras.optimizers.SGD(learning_rate=lr),\n",
215 |     | - "            metrics=[\"accuracy\"],\n",
216 |     | - "        )\n",
217 |     | - "        return model\n",
218 |     | - "    \n",
219 |     | - "    # Download Dataset.\n",
220 |     | - "    dataset = mnist_dataset(batch_size_global)\n",
221 |     | - "\n",
222 |     | - "    # For dist strategy we should build model under scope().\n",
223 |     | - "    if is_dist:\n",
224 |     | - "        logging.info(\"Running Distributed Training\")\n",
225 |     | - "        logging.info(\"--------------------------------------------------------------------------------------\\n\\n\")\n",
226 |     | - "        with strategy.scope():\n",
227 |     | - "            model = build_and_compile_cnn_model()\n",
228 |     | - "    else:\n",
229 |     | - "        logging.info(\"Running Single Worker Training\")\n",
230 |     | - "        logging.info(\"--------------------------------------------------------------------------------------\\n\\n\")\n",
231 |     | - "        model = build_and_compile_cnn_model()\n",
232 |     | - "    \n",
233 |     | - "    # Start Training.\n",
234 |     | - "    model.fit(\n",
235 |     | - "        dataset,\n",
236 |     | - "        epochs=num_epoch,\n",
237 |     | - "        steps_per_epoch=70,\n",
238 |     | - "        callbacks=[CustomCallback()],\n",
239 |     | - "        verbose=0,\n",
240 |     | - "    )"
241 |     | - ]
    | 117 | + "name": "#%% md\n"
    | 118 | + }
    | 119 | + }
242 | 120 |   },
243 | 121 |   {
244 | 122 |   "cell_type": "markdown",