diff --git a/doc/ipython-notebooks/clustering/KMeans.ipynb b/doc/ipython-notebooks/clustering/KMeans.ipynb index bd480e391f8..cf49d3ccc70 100644 --- a/doc/ipython-notebooks/clustering/KMeans.ipynb +++ b/doc/ipython-notebooks/clustering/KMeans.ipynb @@ -59,13 +59,14 @@ "from numpy import concatenate, array\n", "from numpy.random import randn\n", "\n", - "num=200\n", + "num = 200\n", "d1 = concatenate((randn(1,num),10.*randn(1,num)),0)\n", "d2 = concatenate((randn(1,num),10.*randn(1,num)),0)+array([[10.],[0.]])\n", "d3 = concatenate((randn(1,num),10.*randn(1,num)),0)+array([[0.],[100.]])\n", "d4 = concatenate((randn(1,num),10.*randn(1,num)),0)+array([[10.],[100.]])\n", "\n", - "rectangle = concatenate((d1,d2,d3,d4),1)" + "rectangle = concatenate((d1,d2,d3,d4),1)\n", + "totalPoints = 800 " ], "language": "python", "metadata": {}, @@ -189,18 +190,21 @@ "cell_type": "code", "collapsed": false, "input": [ - "figure,axis = pyplot.subplots(1,1)\n", - "for i in xrange(800):\n", - " if (result[i]==0.0):\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='green', markersize=3)\n", - " else:\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='blue', markersize=3)\n", - " axis.plot(centers[0,0], centers[1,0], 'x', color='green', markersize=10)\n", - " axis.plot(centers[0,1], centers[1,1], 'x', color='blue', markersize=10)\n", - "axis.set_xlim(-5,15)\n", - "axis.set_ylim(-50,150)\n", - "axis.set_title('KMeans Results')\n", - "pyplot.show()" + "def plotResult(title = 'KMeans Plot'):\n", + " figure,axis = pyplot.subplots(1,1)\n", + " for i in xrange(totalPoints):\n", + " if (result[i]==0.0):\n", + " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='green', markersize=3)\n", + " else:\n", + " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='blue', markersize=3)\n", + " axis.plot(centers[0,0], centers[1,0], 'x', color='green', markersize=10)\n", + " axis.plot(centers[0,1], centers[1,1], 'x', color='blue', markersize=10)\n", + " axis.set_xlim(-5,15)\n", + " axis.set_ylim(-50,150)\n", + " axis.set_title(title)\n", + " pyplot.show()\n", + " \n", + "plotResult('KMeans Results')" ], "language": "python", "metadata": {}, @@ -277,18 +281,8 @@ "# Labels for data points\n", "result = kmeans.apply()\n", "\n", - "figure,axis = pyplot.subplots(1,1)\n", - "for i in xrange(800):\n", - " if (result[i]==0.0):\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='green', markersize=3)\n", - " else:\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='blue', markersize=3)\n", - " axis.plot(centers[0,0], centers[1,0], 'x', color='green', markersize=10)\n", - " axis.plot(centers[0,1], centers[1,1], 'x', color='blue', markersize=10)\n", - "axis.set_xlim(-5,15)\n", - "axis.set_ylim(-50,150)\n", - "axis.set_title('Hand initialized KMeans Results 1')\n", - "pyplot.show()" + "# plot the results\n", + "plotResult('Hand initialized KMeans Results 1')" ], "language": "python", "metadata": {}, @@ -334,18 +328,8 @@ "# Labels for data points\n", "result = kmeans.apply()\n", "\n", - "figure,axis = pyplot.subplots(1,1)\n", - "for i in xrange(800):\n", - " if (result[i]==0.0):\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='green', markersize=3)\n", - " else:\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='blue', markersize=3)\n", - " axis.plot(centers[0,0], centers[1,0], 'x', color='green', markersize=10)\n", - " axis.plot(centers[0,1], centers[1,1], 'x', color='blue', markersize=10)\n", - "axis.set_xlim(-5,15)\n", - "axis.set_ylim(-50,150)\n", - "axis.set_title('Hand initialized KMeans Results 2')\n", - "pyplot.show()" + "# plot the results\n", + "plotResult('Hand initialized KMeans Results 2')" ], "language": "python", "metadata": {}, @@ -415,18 +399,8 @@ "# Labels for data points\n", "result = kmeans.apply()\n", "\n", - "figure,axis = pyplot.subplots(1,1)\n", - "for i in xrange(800):\n", - " if (result[i]==0.0):\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='green', markersize=3)\n", - " else:\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='blue', markersize=3)\n", - " axis.plot(centers[0,0], centers[1,0], 'x', color='green', markersize=10)\n", - " axis.plot(centers[0,1], centers[1,1], 'x', color='blue', markersize=10)\n", - "axis.set_xlim(-5,15)\n", - "axis.set_ylim(-50,150)\n", - "axis.set_title('KMeans with KMeans++ Results')\n", - "pyplot.show()" + "# plot the results\n", + "plotResult('KMeans with KMeans++ Results')" ], "language": "python", "metadata": {}, @@ -555,18 +529,8 @@ "# Labels for data points\n", "result = kmeans.apply()\n", "\n", - "figure,axis = pyplot.subplots(1,1)\n", - "for i in xrange(800):\n", - " if (result[i]==0.0):\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='green', markersize=3)\n", - " else:\n", - " axis.plot(rectangle[0,i], rectangle[1,i], 'o', color='blue', markersize=3)\n", - " axis.plot(centers[0,0], centers[1,0], 'x', color='green', markersize=10)\n", - " axis.plot(centers[0,1], centers[1,1], 'x', color='blue', markersize=10)\n", - "axis.set_xlim(-5,15)\n", - "axis.set_ylim(-50,150)\n", - "axis.set_title('Mini-batch KMeans Results')\n", - "pyplot.show()" + "# plot the results\n", + "plotResult('Mini-batch KMeans Results')" ], "language": "python", "metadata": {},