example edit + changes .py instances to inputs

daniels290813 · daniels290813 · commit 9e7ce2bf2ec7 · 2021-10-14T06:11:31.000Z
diff --git a/churn_server/churn_server.ipynb b/churn_server/churn_server.ipynb
@@ -15,9 +15,21 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "<a id=\"deploy\"></a>\n",
-    "### Deploy our serving class using as a serverless function\n",
-    "in the following section we create a new model serving function which wraps our class , and specify model and other resources."
+    "In the following section we create a new model serving function which wraps our class, and specify the model and other resources.\n",
+    "Deploying the serving function will provide us with an HTTP endpoint that can handle requests in real time.\n",
+    "This function is part of the [customer-churn-prediction demo](https://github.com/mlrun/demos/tree/master/customer-churn-prediction).<br>\n",
+    "To see how the model is trained or how the data-set is generated, check out the `coxph_trainer` and `xgb_trainer` functions from the function marketplace repository."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### **Steps**\n",
+    "1. [Setup function parameters](#Setup-function-parameters)\n",
+    "2. [Importing the function](#Importing-the-function)\n",
+    "3. [Testing the function locally](#Testing-the-function-locally)\n",
+    "4. [Testing the function remotely](#Testing-the-function-remotely)"
    ]
   },
   {
@@ -26,91 +38,124 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import mlrun\n",
-    "import pandas as pd\n",
-    "import os"
+    "import warnings\n",
+    "warnings.filterwarnings(\"ignore\")"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": 2,
    "metadata": {},
+   "outputs": [],
+   "source": [
+    "# The following packages are required, make sure they are installed\n",
+    "# !pip install xgboost==1.3.1"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### **Setup function parameters**"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Setting up models path\n",
+    "xgb_model_path = 'https://s3.wasabisys.com/iguazio/models/function-marketplace-models/churn_server/xgb_model.pkl'"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### **Importing the function**"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "> 2021-10-12 07:29:57,497 [info] loaded project function-marketplace from MLRun DB\n"
+      "> 2021-10-14 06:10:16,104 [info] loaded project function-marketplace from MLRun DB\n"
      ]
     },
     {
      "data": {
       "text/plain": [
-       "('function-marketplace', 'v3io:///projects/{{run.project}}/artifacts')"
+       "<mlrun.serving.states.TaskStep at 0x7f8f2306ca90>"
       ]
      },
-     "execution_count": 2,
+     "execution_count": 4,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
-    "# setting environment \n",
-    "mlrun.set_environment(project='function-marketplace')"
+    "import mlrun\n",
+    "mlrun.set_environment(project='function-marketplace')\n",
+    "\n",
+    "# Importing the function from the hub\n",
+    "fn = mlrun.import_function(\"hub://churn_server:development\")\n",
+    "fn.apply(mlrun.auto_mount())\n",
+    "\n",
+    "# Manually specifying needed packages \n",
+    "fn.spec.build.commands = ['pip install lifelines==0.22.8', 'pip install xgboost==1.3.1']\n",
+    "\n",
+    "# Adding the model \n",
+    "fn.add_model(key='xgb_model', model_path=xgb_model_path ,class_name='ChurnModel')"
    ]
   },
   {
-   "cell_type": "code",
-   "execution_count": 3,
+   "cell_type": "markdown",
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "File ‘/User/functions/churn_server/models/xgb_model.pkl’ already there; not retrieving.\n",
-      "\n"
-     ]
-    }
-   ],
    "source": [
-    "# Stored artifacts path (S3)\n",
-    "data_path = 'https://s3.wasabisys.com/iguazio/data/churn/test_set.csv'\n",
-    "model_url = 'https://s3.wasabisys.com/iguazio/models/churn/xgb_model.pkl'\n",
-    "model_path = os.getcwd() + '/models'\n",
+    "### **Testing the function locally**"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "> Note that this function is a serving function, hence it does not need to be run, but rather deployed.<br>\n",
     "\n",
-    "# Downloading the model\n",
-    "! wget -nc -P {model_path} {model_url}"
+    "In order to test locally without deploying to a server, mlrun provides a mocking API that simulates the action."
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 5,
    "metadata": {},
    "outputs": [
     {
-     "data": {
-      "text/plain": [
-       "<mlrun.serving.states.TaskStep at 0x7f559bdabb90>"
-      ]
-     },
-     "execution_count": 4,
-     "metadata": {},
-     "output_type": "execute_result"
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "> 2021-10-14 06:10:19,145 [info] model xgb_model was loaded\n",
+      "> 2021-10-14 06:10:19,145 [info] Initializing endpoint records\n",
+      "> 2021-10-14 06:10:19,164 [info] Loaded ['xgb_model']\n"
+     ]
     }
    ],
    "source": [
-    "# importing the function from the function marketplace\n",
-    "fn = mlrun.import_function(\"hub://churn_server\").apply(mlrun.auto_mount())\n",
-    "fn.spec.build.commands = ['pip install lifelines==0.22.8', 'pip install xgboost==1.3.1']\n",
+    "# When mocking, the class has to be present\n",
+    "from churn_server import *\n",
     "\n",
-    "# Adding the model \n",
-    "fn.add_model(key='xgb_model', model_path=model_path ,class_name='ChurnModel')"
+    "# Mocking function\n",
+    "server = fn.to_mock_server()"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [
     {
@@ -315,106 +360,94 @@
        "[5 rows x 23 columns]"
       ]
      },
-     "execution_count": 5,
+     "execution_count": 6,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
+    "import pandas as pd\n",
+    "\n",
+    "# Declaring the test set path\n",
+    "test_set_path = \"https://s3.wasabisys.com/iguazio/data/function-marketplace-data/churn_server/test_set.csv\"\n",
+    "\n",
     "# Getting the data\n",
-    "x_test = pd.read_csv(data_path)\n",
+    "x_test = pd.read_csv(test_set_path)\n",
     "y_test = x_test['labels']\n",
     "x_test.drop(['labels'],axis=1,inplace=True)\n",
     "x_test.head()"
    ]
   },
   {
-   "cell_type": "markdown",
+   "cell_type": "code",
+   "execution_count": 12,
    "metadata": {},
+   "outputs": [],
    "source": [
-    "### **Testing the model locally**"
+    "# KFServing protocol event\n",
+    "event_data = {\"inputs\": x_test.values.tolist()}"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 13,
    "metadata": {},
    "outputs": [],
    "source": [
-    "# an old version of lifelines and xgboost is required when running locally, uncomment to install\n",
-    "# !pip install lifelines==0.22.8\n",
-    "# !pip install xgboost==1.3.1"
+    "response = server.test(path='/v2/models/xgb_model/predict',body=event_data)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 14,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "> 2021-10-12 07:30:00,756 [info] model xgb_model was loaded\n",
-      "> 2021-10-12 07:30:00,757 [info] Initializing endpoint records\n",
-      "> 2021-10-12 07:30:00,768 [info] Loaded ['xgb_model']\n",
-      "model's accuracy : 0.7913907284768212\n"
+      "When mocking to server, returned dict has the following fields : id, model_name, outputs\n"
      ]
     }
    ],
    "source": [
-    "# importing the class (a must when using mock_to_server)\n",
-    "from churn_server import *\n",
-    "\n",
-    "server = fn.to_mock_server()\n",
-    "response = server.test(\"/v2/models/xgb_model/predict\",body={'inputs' : x_test.values.tolist()})\n",
-    "\n",
-    "# Calculating model's accuracy\n",
-    "accuracy = sum(1 for x,y in zip(response['outputs'],y_test) if x == y) / len(y_test)\n",
-    "print(f\"model's accuracy : {accuracy}\")"
+    "print(f'When mocking to server, returned dict has the following fields : {\", \".join([x for x in response.keys()])}')"
    ]
   },
   {
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "### **Deploying and testing our model server using HTTP request**"
+    "### **Testing the function remotely**"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 10,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "> 2021-10-12 07:33:32,143 [info] Starting remote function deploy\n",
-      "2021-10-12 07:33:32  (info) Deploying function\n",
-      "2021-10-12 07:33:32  (info) Building\n",
-      "2021-10-12 07:33:32  (info) Staging files and preparing base images\n",
-      "2021-10-12 07:33:32  (info) Building processor image\n",
-      "2021-10-12 07:33:33  (info) Build complete\n",
-      "2021-10-12 07:33:41  (info) Function deploy complete\n",
-      "> 2021-10-12 07:33:42,050 [info] successfully deployed function: {'internal_invocation_urls': ['nuclio-default-churn-server.default-tenant.svc.cluster.local:8080'], 'external_invocation_urls': ['default-tenant.app.app-lab-eks-testing.iguazio-cd1.com:31334']}\n"
+      "> 2021-10-14 06:10:20,163 [info] Starting remote function deploy\n",
+      "2021-10-14 06:10:20  (info) Deploying function\n",
+      "2021-10-14 06:10:20  (info) Building\n",
+      "2021-10-14 06:10:20  (info) Staging files and preparing base images\n",
+      "2021-10-14 06:10:20  (info) Building processor image\n",
+      "2021-10-14 06:10:21  (info) Build complete\n",
+      "2021-10-14 06:10:29  (info) Function deploy complete\n",
+      "> 2021-10-14 06:10:30,408 [info] successfully deployed function: {'internal_invocation_urls': ['nuclio-function-marketplace-churn-server.default-tenant.svc.cluster.local:8080'], 'external_invocation_urls': ['default-tenant.app.dev39.lab.iguazeng.com:31984']}\n"
      ]
     }
    ],
    "source": [
     "address = fn.deploy()"
    ]
   },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We invoke our model serving function using test data, the data vector is specified in the `inputs` attribute."
-   ]
-  },
   {
    "cell_type": "code",
-   "execution_count": 19,
+   "execution_count": 11,
    "metadata": {},
    "outputs": [
     {
@@ -429,10 +462,7 @@
     "import json\n",
     "import requests\n",
     "\n",
-    "# KFServing protocol event\n",
-    "event_data = {\"inputs\": x_test.values.tolist()}\n",
-    "\n",
-    "# sending data in a json format\n",
+    "# using requests to predict\n",
     "response = requests.put(address + \"/v2/models/xgb_model/predict\", json=json.dumps(event_data))\n",
     "\n",
     "# returned data is a string \n",
@@ -445,7 +475,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "**[back to top](#top)**"
+    "[Back to the top](#Churn-Server)"
    ]
   }
  ],
diff --git a/churn_server/churn_server.py b/churn_server/churn_server.py
@@ -23,7 +23,7 @@ def load(self):
 
     def predict(self, body):
         try:
-            feats = np.asarray(body["instances"], dtype=np.float32).reshape(-1, 23)
+            feats = np.asarray(body["inputs"], dtype=np.float32).reshape(-1, 23)
             result = self.model.predict(feats, validate_features=False)
             return result.tolist()
         except Exception as e: