diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index 8fd4a67..4eea785 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -26,13 +26,13 @@ If you're wishing for a feature that doesn't exist yet in MXFusion, there are pr If you're thinking about adding code to MXFusion, here are some guidelines to get you started. -* If the change is a major feature, create a [design proposal](design_proposal/design_proposal_guidelines) in the design_proposals folder and post it as a PR, optionally with a prototype implementation of your proposed changes. This is to get community feedback on the changes and document the design reasoning of MXFusion for future reference. +* If the change is a major feature, create a [design proposal](docs/design_proposals/design_proposal_guidelines.md) in the design_proposals folder and post it as a PR, optionally with a prototype implementation of your proposed changes. This is to get community feedback on the changes and document the design reasoning of MXFusion for future reference. * Keep pull requests small, preferably one feature per pull request. This lowers the bar to entry for a reviewer, and keeps feedback focused for each feature. Some major areas where we appreciate contributions: * [Adding new Distributions/Functions/Modules](examples/notebooks/writing_a_new_distribution.ipynb) -* [Adding new Inference Algorithms](design_documents/inference) +* [Adding new Inference Algorithms](docs/design_documents/inference.md) * Example notebooks showing how to build/train a particular model. If you're still not sure where to begin, have a look at our [issues](issues TODO) page for open work. @@ -73,7 +73,7 @@ Before submitting the pull request, please go through this checklist to make the * Do all public functions have docstrings including examples? If you added a new module, did you add it to the Sphinx docstring in the ```__init__.py``` file of the module's folder? * Is the code style correct (PEP8)? * Is the commit message formatted correctly? 
-* If this is a large addition, is there a tutorial or more extensive module-level description? Did you discuss the addition in a [design proposal](design_proposals/design_proposal_guidelines)? Is there an issue related to the change? If so, please link the issue or design doc. +* If this is a large addition, is there a tutorial or more extensive module-level description? Did you discuss the addition in a [design proposal](docs/design_proposals/design_proposal_guidelines.md)? Is there an issue related to the change? If so, please link the issue or design doc. ## Setting up a development environment diff --git a/examples/notebooks/gp_regression.ipynb b/examples/notebooks/gp_regression.ipynb index b306327..107148a 100644 --- a/examples/notebooks/gp_regression.ipynb +++ b/examples/notebooks/gp_regression.ipynb @@ -6,7 +6,7 @@ "source": [ "# Gaussian Process Regression\n", "\n", - "**Zhenwen Dai (2018-11-2)**" + "**Zhenwen Dai (2019-05-29)**" ] }, { @@ -68,7 +68,7 @@ "outputs": [ { "data": { - "image/png": "\n", + "image/png": 
"iVBORw0KGgoAAAANSUhEUgAAAYYAAAD8CAYAAABzTgP2AAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDIuMi4yLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvhp/UCwAAGoRJREFUeJzt3X2QVfWd5/H3R0SIzygdRQFhssRSQVG7caqymm1Fw4xToImLuEnEmhgm7LqTrSlBHaeBhZhSTK0ZN1lKTFQyw0SRjLFTMymj0o6morEbhxHBMeJzpzW2+DBEwIB+9497Gu653U0/nNt9nz6vqlv3nnN+597vbej76fM75/5+igjMzMy6HFTqAszMrLw4GMzMLMXBYGZmKQ4GMzNLcTCYmVmKg8HMzFIcDGZmluJgMDOzFAeDmZmlHFzqAgZj7NixMWnSpFKXYWZWUTZu3PhORNT11a4ig2HSpEm0tbWVugwzs4oi6bX+tHNXkpmZpTgYzMwsxcFgZmYpRTnHIOku4M+AtyNiag/bBfwt8KfATuCqiHgm2TYf+Juk6bciYs1gatizZw/t7e3s3r17MLvbAIwePZrx48czcuTIUpdiZkOgWCef7wG+B/yol+1/AkxJbucAq4BzJB0DLAXqgQA2SmqOiPcGWkB7eztHHHEEkyZNIpdDNhQigu3bt9Pe3s7kyZNLXY6ZDYGidCVFxOPAuwdoMgf4UeQ8BRwtaRzwBeDhiHg3CYOHgVmDqWH37t0ce+yxDoUhJoljjz3WR2ZWXlauhJaW9LqWltx6G7DhOsdwIvBG3nJ7sq639YPiUBge/jlbyRUGQUMDXHIJ/MVf5JZbWmDu3Nx6G7DhCoaePkniAOu7P4G0QFKbpLbOzs6iFmdmFaahIffBnx8OEtx7LyxZktu2bh00Npauxgo2XMHQDkzIWx4PdBxgfTcRsToi6iOivq6uzy/uldyyZcv4zne+c8A2P/3pT9m6deuQ1tHR0cFll13WZ7tvf/vbQ1qHWVE1NuY++OfO3R8EDzwA3/wmrFgBCxc6FDIYrmBoBq5Uzh8DH0TEm8BDwEWSxkgaA1yUrBtaZdIfORzBcMIJJ7B+/fo+2zkYbMgM1e9bY2MuALqCAGDVKmhqyt0Xvqb1W1GCQdKPgSeBkyW1S/qapG9I+kbS5J+Bl4FtwJ3AfweIiHeBFUBrcluerBtahYehReqPvOmmmzj55JOZOXMmL7zwwr71d955Jw0NDZxxxhl86UtfYufOnfzqV7+iubmZRYsWMX36dF566aUe2xVatmwZX/3qVzn//POZMmUKd955J5C7WmjRokVMnTqVadOmcd999wHw6quvMnVq7grie+65hy9+8YvMmjWLKVOmsHjxYgCuv/56du3axfTp0/nyl7/Mhx9+yMUXX8wZZ5zB1KlT9z2X2aAM0e8bLS37g+D223PnGNatg+XL9x9NOBwGJyIq7nb22WdHoa1bt3Zbd0AbNkSMHRvR1JS737BhYPsXaGtri6lTp8aHH34YH3zwQXzmM5+JW2+9NSIi3nnnnX3tbrzxxrj99tsjImL+/Plx//3379vWW7t8S5cujdNPPz127twZnZ2dMX78+Pjtb38b69evj5kzZ8bevXvjrbfeigkTJkRHR0e88sorcdppp0VExN133x2TJ0+O999/P3bt2hUTJ06M119/PSIiDjvssH2vsX79+rj66qv3Lb///vvd6hjwz9tqW5F/3/Y9X9fzLFgQcdRR6efdsCHilluyvU6VAdqiH5+xtfvN58LD0Iz9kU888QSXXnophx56KEceeSSzZ8/et+25557j3HPPZdq0aaxdu5YtW7b0+Bz9bTdnzhw+9alPMXbsWBobG3n66af55S9/yRVXXMGIESM47rjj+PznP09ra2u3fS+44AKOOuooRo8ezamnnsprr3UfU2vatGk88sgjXHfddTzxxBMcddRRg/ypmCWK/PtGa2v65PI
dd+TOMeT/n29shOSo2AamdoMh/zC0SP2RvV3GedVVV/G9732PzZs3s3Tp0l6/A9DfdoWvI4ncHwN9GzVq1L7HI0aMYO/evd3afPazn2Xjxo1MmzaNG264geXLl/fruc16Vezft8WLu4eLg6BoajMYuvo4i9gfed555/HAAw+wa9cuduzYwc9+9rN923bs2MG4cePYs2cPa9eu3bf+iCOOYMeOHX22K/Tggw+ye/dutm/fzmOPPUZDQwPnnXce9913Hx9//DGdnZ08/vjjzJgxo9/1jxw5kj179gC5K5kOPfRQvvKVr3DttdfyzDPPDORHYZY2BL9vNrQqcj6GzAoPQ7sufWttHfQh7llnncXll1/O9OnTOemkkzj33HP3bVuxYgXnnHMOJ510EtOmTdsXBvPmzePrX/86t99+O+vXr++1XaEZM2Zw8cUX8/rrr9PU1MQJJ5zApZdeypNPPskZZ5yBJFauXMnxxx/Pq6++2q/6FyxYwOmnn85ZZ53FlVdeyaJFizjooIMYOXIkq1atGtTPxAwYkt83G1rqbxdEOamvr4/CiXqef/55TjnllBJVNHyWLVvG4YcfzrXXXlvSOmrl521WTSRtjIj6vtrVZleSmZn1qja7kirYsmXLSl2CmVW5qjpiqMRusUrkn7NZdauaYBg9ejTbt2/3h9YQi2Q+htGjR5e6FDMbIlXTlTR+/Hja29vxyKtDr2sGNzOrTlUTDCNHjvSMYmZmRVA1XUlmZlYcDgYzM0txMJhZbSqTeVnKkYPBzGrTQOeJqKEgcTCYWU4NffABPU8PeqB5oodqwqEy5GAws5wa+uDbZyDzRAw0SCqYg8HMcmrog2+fgc4TUewJh8qUg8HM9quRDz5gcPNEDMEEX+XIwWBm+9XIBx9w4HkielJDEw4VZT4GSbOAvwVGAD+IiJsLtt8GdP3pcSjw6Yg4Otn2MbA52fZ6RMymDz3Nx2BmGeV/8DU2dl+udStX5s635P8sWlpyQVIhU4r2dz6GzMEgaQTwG+BCoB1oBa6IiK29tP+fwJkR8efJ8u8j4vCBvKaDwWwIVMEHnx1Yf4OhGGMlzQC2RcTLyQvfC8wBegwG4ApgaRFe18yKqacP/8ZGHy3UoGKcYzgReCNvuT1Z142kk4DJwIa81aMltUl6StIlRajHzMwyKMYRg3pY11v/1DxgfUR8nLduYkR0SPojYIOkzRHxUrcXkRYACwAmTpyYtWYzM+tFMY4Y2oEJecvjgY5e2s4Dfpy/IiI6kvuXgceAM3vaMSJWR0R9RNTX1dVlrdnMzHpRjGBoBaZImizpEHIf/s2FjSSdDIwBnsxbN0bSqOTxWOBz9H5uwszMhkHmrqSI2CvpGuAhcper3hURWyQtB9oioiskrgDujfRlUKcAd0j6hFxI3dzb1UxmZjY8ivI9huHmy1XNzAauv5er+pvPZmaW4mAwM8uqyoYsdzCYmWVVZUOWF+N7DGZmtS1/yPKFC3MDEFbwGFM+YjAzK4YqGrLcwWBmVgxVNGS5g8HMLKuBzNVQASeqHQxmZlkNZNKfCjhR7S+4mZkNt64wGOYT1f6Cm5lZuSrzE9UOBrNqUwF92DWvzE9UOxjMqk0F9GHXtIGcqC4RB4NZtcn/stWSJfs/hMqsu6JmDeREdYn45LNZtVqyJNeH3dSU+8vUap5PPpvVsjLvw7by5mAwqzYV0Idt5c3BYFZtKqAP28qbzzGYmdUIn2MwM7NBcTCYmVlKUYJB0ixJL0jaJun6HrZfJalT0qbkdnXetvmSXkxu84tRj5mZDV7mGdwkjQC+D1wItAOtkpojYmtB0/si4pqCfY8BlgL1QAAbk33fy1qXmZkNTjGOGGYA2yLi5Yj4A3AvMKef+34BeDgi3k3C4GFgVhFqMjOzQSpGMJwIvJG33J6sK/QlSc9KWi9pwgD3NTOzYVKMYFAP6wqvgf0ZMCkiTgceAdYMYN9cQ2mBpDZJbZ2dnYMu1qwiecRUG0bFCIZ
2YELe8nigI79BRGyPiI+SxTuBs/u7b95zrI6I+oior6urK0LZZhXEI6bWrhL8UVCMYGgFpkiaLOkQYB7QnN9A0ri8xdnA88njh4CLJI2RNAa4KFlnZvk8YmrtKsEfBZmvSoqIvZKuIfeBPgK4KyK2SFoOtEVEM/CXkmYDe4F3gauSfd+VtIJcuAAsj4h3s9ZkVpXyZ/1qanIo1Ir8PwqGaSpQD4lhVilKNE+wlYkiDKPuITHMqolHTK1twzyMuoPBrBJ4xNTaVYI/CtyVZGZWzlauzJ1ozu82bGnJ/VGwePGAnqq/XUkOBjOzGuFzDGZmNigOBjMzS3EwmJlZioPBzMxSHAxm5cSD5VkZcDCYlRMPlmdlIPNYSWZWRCUYF8eskI8YzMpN/mB5Cxc6FGzYORjMys0wj4tjVsjBYFZOPFielQEHg1k58WB5VgY8VpKZWY3wWElmZjYoDgYzM0txMJiZWYqDwczMUooSDJJmSXpB0jZJ1/ew/a8kbZX0rKRHJZ2Ut+1jSZuSW3Mx6jEzs8HLPCSGpBHA94ELgXagVVJzRGzNa/avQH1E7JS0EFgJXJ5s2xUR07PWYWZmxVGMI4YZwLaIeDki/gDcC8zJbxARLRGxM1l8ChhfhNc1M7MhUIxgOBF4I2+5PVnXm68BP89bHi2pTdJTki4pQj1mZpZBMYJBPazr8Vtzkr4C1AO35q2emHzh4r8B35X0mV72XZAESFtnZ2fWms3Ki+dhsDJSjGBoBybkLY8HOgobSZoJ3AjMjoiPutZHREdy/zLwGHBmTy8SEasjoj4i6uvq6opQtlkZ8TwMVkaKEQytwBRJkyUdAswDUlcXSToTuINcKLydt36MpFHJ47HA54D8k9ZmtSF/HoYlS/YPpOcht60EMl+VFBF7JV0DPASMAO6KiC2SlgNtEdFMruvocOB+SQCvR8Rs4BTgDkmfkAupmwuuZjKrHfnzMDQ1ORSsZDyInlm56Oo+8sxtNkQ8iJ5ZJfE8DFZGHAxm5cDzMFgZcTCYDbeeLk1taOgeAo2NsHjx8NVllnAwmA03X5pqZS7zVUlmNkD5l6b6RLOVIR8xmJVC/qWpCxc6FKysOBjMSqGlJXek0NSUu/fVR1ZGHAxmw82XplqZczCYDTdfmmplzt98NjOrEf7ms5mZDYqDwczMUhwMZmaW4mAwM7MUB4OZmaU4GMzMLMXBYGZmKQ4GMzNLcTCYmVmKg8HMzFKKEgySZkl6QdI2Sdf3sH2UpPuS7b+WNClv2w3J+hckfaEY9ZiZ2eBlDgZJI4DvA38CnApcIenUgmZfA96LiP8E3Abckux7KjAPOA2YBfy/5PnMzKxEinHEMAPYFhEvR8QfgHuBOQVt5gBrksfrgQskKVl/b0R8FBGvANuS5zMzsxIpRjCcCLyRt9yerOuxTUTsBT4Aju3nvmZmNoyKEQzqYV3hWN69tenPvrknkBZIapPU1tnZOcASzcysv4oRDO3AhLzl8UBHb20kHQwcBbzbz30BiIjVEVEfEfV1dXVFKNvMzHpSjGBoBaZImizpEHInk5sL2jQD85PHlwEbIjdDUDMwL7lqaTIwBXi6CDWZmdkgHZz1CSJir6RrgIeAEcBdEbFF0nKgLSKagR8CfydpG7kjhXnJvlskrQO2AnuB/xERH2etyczMBs9Te5qZ1QhP7WlmZoPiYDAzsxQHg5mZpTgYzMwsxcFgZmYpDgYzM0txMJiZWYqDwczMUhwMZmaW4mAwM7MUB4OZmaU4GMzMLMXBYGZmKQ4GMzNLcTCYmVmKg8HMzFIcDGZmluJgMDOzFAeDmZmlOBjMzCwlUzBIOkbSw5JeTO7H9NBmuqQnJW2R9Kyky/O23SPpFUmbktv0LPWYmVl2WY8YrgcejYgpwKPJcqGdwJURcRowC/iupKPzti+KiOnJbVPGeszMLKOswTAHWJM8XgNcUtggIn4TES8mjzuAt4G6jK9rZmZDJGswHBcRbwIk958+UGNJM4B
DgJfyVt+UdDHdJmlUxnrMzCyjg/tqIOkR4PgeNt04kBeSNA74O2B+RHySrL4BeItcWKwGrgOW97L/AmABwMSJEwfy0mZmNgB9BkNEzOxtm6TfSRoXEW8mH/xv99LuSOCfgL+JiKfynvvN5OFHku4Grj1AHavJhQf19fXRV91mZjY4WbuSmoH5yeP5wIOFDSQdAjwA/Cgi7i/YNi65F7nzE89lrMfMzDLKGgw3AxdKehG4MFlGUr2kHyRt5gLnAVf1cFnqWkmbgc3AWOBbGevp2cqV0NKSXtfSkltvZmYpfXYlHUhEbAcu6GF9G3B18vjvgb/vZf/zs7x+vzU0wNy5sG4dNDbmQqFr2czMUmrjm8+NjbkQmDsXlixJh4TVNh9NmnVTG8EAuRBYuBBWrMjdOxQM9h9NdoVD19FkQ0Np6zIrodoJhpYWWLUKmppy94V/JVpt8tGkWTe1EQz55xSWL9//QeBwMPDRpFmB2giG1tb0X4FdfyW2tpa2LisPPpo0S1FE5X1XrL6+Ptra2kpdhlWD/KPJwivWfORgVUbSxoio76tdbRwxmPXGR5Nm3fiIwcysRviIwczMBsXBYGZmKQ4GMzNLcTCYmVmKg8HMzFIcDGZmluJgMDOzFAeDmZmlOBjMzCzFwWBmZikOBjMzS3EwmJlZSqZgkHSMpIclvZjcj+ml3ceSNiW35rz1kyX9Otn/PkmHZKnHzMyyy3rEcD3waERMAR5NlnuyKyKmJ7fZeetvAW5L9n8P+FrGeszMLKOswTAHWJM8XgNc0t8dJQk4H1g/mP3NzGxoZA2G4yLiTYDk/tO9tBstqU3SU5K6PvyPBd6PiL3JcjtwYsZ6zMwso4P7aiDpEeD4HjbdOIDXmRgRHZL+CNggaTPwHz2063XWIEkLgAUAEydOHMBLF8HKldDQkJ7qsaUlN8vX4sXDW4uZ2RDr84ghImZGxNQebg8Cv5M0DiC5f7uX5+hI7l8GHgPOBN4BjpbUFU7jgY4D1LE6Iuojor6urm4Ab7EIGhpy8wB3TRLfNS9wQ8Pw1mFmNgyydiU1A/OTx/OBBwsbSBojaVTyeCzwOWBr5OYUbQEuO9D+ZaFrHuC5c2HJEk8Wb2ZVLWsw3AxcKOlF4MJkGUn1kn6QtDkFaJP0b+SC4OaI2Jpsuw74K0nbyJ1z+GHGeoZOYyMsXAgrVuTuHQpmVqWU+8O9stTX10dbW9vwvmhX99HChbBqlY8YzKziSNoYEfV9tfM3n/ujKxTWrYPly/d3K3Wdc7DKsHJl93+zlpbcejPbx8HQH62t6SOErnMOra2lrcsGxhcRmPWLu5KstrhL0GqYu5KGg7smKo8vIjDrk4MhC3dNVJ6WltyRQlNT7t7nicy6cTBk4e83VBZfRGDWLw6GrNw1UTl8EYFZv/jkc1Y+mWlmFcInn4eDuybMrAo5GLJw14SZVSF3JZmZ1Qh3JZmZ2aA4GMzMLMXBYGZmKQ4GMzNLcTCYmVmKg8HMzFIcDFaZPLKt2ZBxMFhl8si2ZkPm4FIXYDYo+SPbepwqs6LKdMQg6RhJD0t6Mbkf00ObRkmb8m67JV2SbLtH0it526ZnqcdqjEe2NRsSWbuSrgcejYgpwKPJckpEtETE9IiYDpwP7AR+kddkUdf2iNiUsR6rJZ50x2xIZA2GOcCa5PEa4JI+2l8G/DwidmZ8Xat1HtnWbMhkDYbjIuJNgOT+0320nwf8uGDdTZKelXSbpFEZ67Fa4ZFtzYZMn6OrSnoEOL6HTTcCayLi6Ly270VEt/MMybZxwLPACRGxJ2/dW8AhwGrgpYhY3sv+C4AFABMnTjz7tdde6+OtmZlZvv6OrtrnVUkRMfMAL/I7SeMi4s3kQ/7tAzzVXOCBrlBInvvN5OFHku4Grj1AHavJhQf19fWVN1a4mVmFyNqV1AzMTx7PBx48QNsrKOhGSsIESSJ3fuK5jPWYmVlGWYPhZuBCSS8CFybLSKqX9IOuRpImAROAfynYf62
kzcBmYCzwrYz1mJlZRpm+4BYR24ELeljfBlydt/wqcGIP7c7P8vpmZlZ8HhLDzMxSKnLOZ0mdQF+XJY0F3hmGcoZTNb4n8PuqNNX4vqrxPUH393VSRNT1tVNFBkN/SGrrz2VZlaQa3xP4fVWaanxf1fieYPDvy11JZmaW4mAwM7OUag6G1aUuYAhU43sCv69KU43vqxrfEwzyfVXtOQYzMxucaj5iMDOzQajaYJC0Ihm1dZOkX0g6odQ1FYOkWyX9e/LeHpB0dN97lT9J/1XSFkmfSKroq0MkzZL0gqRtkrrNUVKpJN0l6W1JVTN0jaQJklokPZ/8//tmqWsqBkmjJT0t6d+S9/W/B7R/tXYlSToyIv4jefyXwKkR8Y0Sl5WZpIuADRGxV9ItABFxXYnLykzSKcAnwB3Atcm35yuOpBHAb8gNEdMOtAJXRMTWkhZWBJLOA34P/Cgippa6nmJIxmsbFxHPSDoC2AhcUun/Xsn4c4dFxO8ljQR+CXwzIp7qz/5Ve8TQFQqJw4CqSMCI+EVE7E0WnwLGl7KeYomI5yPihVLXUQQzgG0R8XJE/AG4l9yEVhUvIh4H3i11HcUUEW9GxDPJ4x3A8/QwfE+liZzfJ4sjk1u/PwOrNhgAJN0k6Q3gy8CSUtczBP4c+Hmpi7CUE4E38pbbqYIPmlqQDPZ5JvDr0lZSHJJGSNpEbjqEhyOi3++rooNB0iOSnuvhNgcgIm6MiAnAWuCa0lbbf329r6TNjcBecu+tIvTnfVUB9bCuKo5Wq5mkw4GfAP+roLehYkXExxExnVyvwgxJ/e7+yzS6aqkdaBKhAv8A/BOwdAjLKZq+3pek+cCfARdEBZ0kGsC/VyVrJzfEfJfxQEeJarF+SPrgfwKsjYh/LHU9xRYR70t6DJhFP+e8qegjhgORNCVvcTbw76WqpZgkzQKuA2ZHxM5S12PdtAJTJE2WdAi5ec6bS1yT9SI5SftD4PmI+D+lrqdYJNV1XbEo6VPATAbwGVjNVyX9BDiZ3JUurwHfiIjflraq7CRtA0YB25NVT1XJ1VaXAv8XqAPeBzZFxBdKW9XgSPpT4LvACOCuiLipxCUVhaQfA/+F3IidvwOWRsQPS1pURpL+M/AEucnCPklW/3VE/HPpqspO0unAGnL/Bw8C1kXE8n7vX63BYGZmg1O1XUlmZjY4DgYzM0txMJiZWYqDwczMUhwMZmaW4mAwM7MUB4OZmaU4GMzMLOX/A/xoEVK9w+cWAAAAAElFTkSuQmCC\n", "text/plain": [ "
" ] @@ -159,16 +159,16 @@ "name": "stdout", "output_type": "stream", "text": [ - "Iteration 11 loss: -13.523289192527265\n", - "Iteration 21 loss: -16.077990179961076\n", - "Iteration 31 loss: -16.784414553096843\n", - "Iteration 41 loss: -16.820970924702017\n", - "Iteration 51 loss: -16.859865329532193\n", - "Iteration 61 loss: -16.895666914166453\n", - "Iteration 71 loss: -16.899409131167452\n", - "Iteration 81 loss: -16.901728290347176\n", - "Iteration 91 loss: -16.903122097339737\n", - "Iteration 100 loss: -16.903135093930537" + "Iteration 10 loss: -13.09287954321266\t\t\t\t\n", + "Iteration 20 loss: -15.971970034359586\t\t\t\t\n", + "Iteration 30 loss: -16.725359053995163\t\t\t\t\n", + "Iteration 40 loss: -16.835084442759314\t\t\t\t\n", + "Iteration 50 loss: -16.850332113428053\t\t\t\t\n", + "Iteration 60 loss: -16.893812683762203\t\t\t\t\n", + "Iteration 70 loss: -16.900137667771077\t\t\t\t\n", + "Iteration 80 loss: -16.901158761459012\t\t\t\t\n", + "Iteration 90 loss: -16.903085976668137\t\t\t\t\n", + "Iteration 100 loss: -16.903135093930537\t\t\t\t\n" ] } ], @@ -303,7 +303,7 @@ "outputs": [ { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -386,7 +386,7 @@ "outputs": [ { "data": { - "image/png": "\n", + "image/png": "\n", "text/plain": [ "
" ] @@ -408,7 +408,149 @@ "source": [ "## Gaussian process with a mean function\n", "\n", - "TBA" + "In the previous example, we created a GP regression model without a mean function (the mean of the GP is zero). It is very easy to extend a GP model with a mean function. First, we create a mean function in MXNet (a neural network). For simplicity, we create a 1D linear function as the mean function." + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "metadata": {}, + "outputs": [], + "source": [ + "mean_func = mx.gluon.nn.Dense(1, in_units=1, flatten=False)\n", + "mean_func.initialize(mx.init.Xavier(magnitude=3))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We create the GP regression model in a similar way as above. The differences are:\n", + "1. We create a wrapper of the mean function in the model definition ```m.mean_func```.\n", + "2. We evaluate the mean function with the input of our GP model, which results in the mean of the GP.\n", + "3. We pass the resulting mean into the mean argument of the GP module." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [], + "source": [ + "m = Model()\n", + "m.N = Variable()\n", + "m.X = Variable(shape=(m.N, 1))\n", + "m.mean_func = MXFusionGluonFunction(mean_func, num_outputs=1, broadcastable=True)\n", + "m.mean = m.mean_func(m.X)\n", + "m.noise_var = Variable(shape=(1,), transformation=PositiveTransformation(), initial_value=0.01)\n", + "m.kernel = RBF(input_dim=1, variance=1, lengthscale=1)\n", + "m.Y = GPRegression.define_variable(X=m.X, kernel=m.kernel, noise_var=m.noise_var, mean=m.mean, shape=(m.N, 1))" + ] + }, + { + "cell_type": "code", + "execution_count": 24, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Iteration 10 loss: -6.288699675985622\t\t\t\t\n", + "Iteration 20 loss: -13.938366520031717\t\t\t\t\n", + "Iteration 30 loss: -16.238146742572965\t\t\t\t\n", + "Iteration 40 loss: -16.214515784955303\t\t\t\t\n", + "Iteration 50 loss: -16.302410205174386\t\t\t\t\n", + "Iteration 60 loss: -16.423765889507315\t\t\t\t\n", + "Iteration 70 loss: -16.512277794947106\t\t\t\t\n", + "Iteration 80 loss: -16.5757306621185\t\t\t\t\t\t\n", + "Iteration 90 loss: -16.6410597628529\t\t\t\t\t\t\n", + "Iteration 100 loss: -16.702913078848557\t\t\t\t\n" + ] + } + ], + "source": [ + "import mxnet as mx\n", + "from mxfusion.inference import GradBasedInference, MAP\n", + "\n", + "infr = GradBasedInference(inference_algorithm=MAP(model=m, observed=[m.X, m.Y]))\n", + "infr.run(X=mx.nd.array(X, dtype='float64'), Y=mx.nd.array(Y, dtype='float64'), \n", + " max_iter=100, learning_rate=0.05, verbose=True)" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "metadata": {}, + "outputs": [], + "source": [ + "from mxfusion.inference import TransferInference, ModulePredictionAlgorithm\n", + "infr_pred = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y]), \n", + " infr_params=infr.params)" + ] + }, + { + 
"cell_type": "code", + "execution_count": 26, + "metadata": {}, + "outputs": [], + "source": [ + "xt = np.linspace(-5,5,100)[:, None]\n", + "res = infr_pred.run(X=mx.nd.array(xt, dtype='float64'))[0]\n", + "f_mean, f_var = res[0].asnumpy()[0], res[1].asnumpy()[0]" + ] + }, + { + "cell_type": "code", + "execution_count": 27, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "plot(xt, f_mean[:,0], 'b-', label='mean')\n", + "plot(xt, f_mean[:,0]-2*np.sqrt(f_var), 'b--', label='2 x std')\n", + "plot(xt, f_mean[:,0]+2*np.sqrt(f_var), 'b--')\n", + "plot(X, Y, 'rx', label='data points')\n", + "ylabel('F')\n", + "xlabel('X')\n", + "_=legend()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The effect of the mean function is not noticeable, because there is no linear trend in our data. We can print the values of the estimated parameters of the linear mean function." + ] + }, + { + "cell_type": "code", + "execution_count": 36, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The weight is 0.021969 and the bias is 0.079038.\n" + ] + } + ], + "source": [ + "print(\"The weight is %f and the bias is %f.\" %(infr.params[m.mean_func.parameters['dense1_weight']].asnumpy(), \n", + " infr.params[m.mean_func.parameters['dense1_bias']].asscalar()))" ] }, { @@ -417,7 +559,26 @@ "source": [ "## Variational sparse Gaussian process regression\n", "\n", - "TBA" + "In MXFusion, we also have variational sparse GP implemented as a module. A sparse GP model can be created in a similar way as the plain GP model. 
" + ] + }, + { + "cell_type": "code", + "execution_count": 39, + "metadata": {}, + "outputs": [], + "source": [ + "from mxfusion import Model, Variable\n", + "from mxfusion.components.variables import PositiveTransformation\n", + "from mxfusion.components.distributions.gp.kernels import RBF\n", + "from mxfusion.modules.gp_modules import SparseGPRegression\n", + "\n", + "m = Model()\n", + "m.N = Variable()\n", + "m.X = Variable(shape=(m.N, 1))\n", + "m.noise_var = Variable(shape=(1,), transformation=PositiveTransformation(), initial_value=0.01)\n", + "m.kernel = RBF(input_dim=1, variance=1, lengthscale=1)\n", + "m.Y = SparseGPRegression.define_variable(X=m.X, kernel=m.kernel, noise_var=m.noise_var, shape=(m.N, 1), num_inducing=50)" ] } ], @@ -437,7 +598,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.6" + "version": "3.6.0" } }, "nbformat": 4, diff --git a/examples/notebooks/pilco.ipynb b/examples/notebooks/pilco.ipynb new file mode 100644 index 0000000..db09fa9 --- /dev/null +++ b/examples/notebooks/pilco.ipynb @@ -0,0 +1,51119 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# PILCO: A Model-based Policy Search" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Obtaining file:///Users/erimeiss/workspace/mxfusion\n", + "Requirement already satisfied: networkx>=2.1 in /Users/erimeiss/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages (from MXFusion==0.3.0) (2.1)\n", + "Requirement already satisfied: numpy>=1.7 in /Users/erimeiss/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages (from MXFusion==0.3.0) (1.16.3)\n", + "Requirement already satisfied: decorator>=4.1.0 in /Users/erimeiss/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages (from networkx>=2.1->MXFusion==0.3.0) (4.3.0)\n", + "Installing collected packages: MXFusion\n", + " Found 
existing installation: MXFusion 0.3.0\n", + " Uninstalling MXFusion-0.3.0:\n", + " Successfully uninstalled MXFusion-0.3.0\n", + " Running setup.py develop for MXFusion\n", + "Successfully installed MXFusion\n" + ] + } + ], + "source": [ + "!pip install -e ../.." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Common reinforcement learning methods suffer from data inefficiency, which can be an issue in real-world applications where gathering sufficiently large amounts of data poses economic issues and may be impossible. Deisenroth & Rasmussen (2011) propose a model-based policy search method known as PILCO in part to address this issue. PILCO uses a Gaussian process (GP) for learning the dynamics of the environment and optimizes a parametric policy function using the learned dynamics model.\n", + "\n", + "In this notebook, we demonstrate a straightforward implementation of PILCO. This implementation follows the idea of PILCO and has a few enhancements compared to the published implementation. The enhancements are listed as follows: \n", + "\n", + "- **Use Monte Carlo integration instead of moment estimation.** We approximate the expected reward using Monte Carlo integration instead of the proposed moment estimation approach. This removes the bias in the expected reward computation and enables a wide range of choices of kernels and policy functions. In the original work, only RBF and linear kernels and only linear and RBF network policies can be used.\n", + "- **Use automatic differentiation.** Thanks to automatic differentiation, no gradient derivation is needed.\n", + "- **A unified interface for Gaussian processes.** MXFusion provides a unified interface for GP modules. This allows us to easily switch among plain GP, variational sparse GP and stochastic variational GP implementations." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Preparation" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "This notebook depends on MXNet, MXFusion and Open AI Gym. These packages can be installed into your Python environment by running the following commands.\n", + "```bash\n", + "pip install mxnet mxfusion gym\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Set the global configuration." + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "os.environ['MXNET_ENGINE_TYPE'] = 'NaiveEngine'\n", + "from mxfusion.common import config\n", + "config.DEFAULT_DTYPE = 'float64'\n", + "%matplotlib inline" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Example: Pendulum\n", + "\n", + "\n", + "We use the inverted pendulum swingup problem as an example. We use the [Pendulum-v0](https://gym.openai.com/envs/Pendulum-v0/) environment in Open AI Gym. The task is to swing the pendulum up and balance it at the inverted position. This is a classical control problem and is known to be unsolvable with a linear controller.\n", + "\n", + "To solve this problem with PILCO, we need three components:\n", + "\n", + "- Execute a policy in a real environment (an Open AI Gym simulator in this example) and collect data.\n", + "- Fit a GP model as the model for the dynamics of the environment.\n", + "- Optimize the policy given the dynamics model learned from all the data that have been collected so far.\n", + "\n", + "The overall PILCO algorithm is to iterate the above three steps until a policy that can solve the problem is found." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Execute the Environment \n", + "\n", + "The Pendulum-v0 environment can be loaded easily." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [], + "source": [ + "import gym\n", + "env = gym.make('Pendulum-v0')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The state of the pendulum environment is a 3D vector. The first two dimensions are the 2D location of the end point of the pendulum. The third dimension encodes the angular speed of the pendulum. The action space is a 1D vector in [-2, 2]." + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We write a helper function for executing the environment with a given policy." + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from matplotlib import animation\n", + "\n", + "def run_one_episode(env, policy, initial_state=None, max_steps=200, verbose=False, render=False):\n", + " \"\"\"\n", + " Drives an episode of the OpenAI gym environment using the policy to decide next actions.\n", + " \"\"\"\n", + " observation = env.reset()\n", + " if initial_state is not None:\n", + " env.env.state = initial_state\n", + " observation = env.env._get_obs()\n", + " env._max_episode_steps = max_steps\n", + " step_idx = 0\n", + " done = False\n", + " total_reward = 0\n", + " frames = []\n", + " all_actions = []\n", + " all_observations = [observation]\n", + " while not done:\n", + " if render:\n", + " frames.append(env.render(mode = 'rgb_array'))\n", + " if verbose:\n", + " print(observation)\n", + " action = policy(observation)\n", + " observation, reward, done, info = env.step(action)\n", + " all_observations.append(observation)\n", + " all_actions.append(action)\n", + " total_reward += reward\n", + " step_idx += 1\n", + " if done or step_idx>=max_steps-1:\n", + " print(\"Episode finished after {} timesteps because {}\".format(step_idx+1, \"'done' reached\" if done else \"Max timesteps reached\"))\n", + " 
break\n", + " if render:\n", + " fig = plt.figure()\n", + " ax = fig.gca()\n", + " fig.tight_layout()\n", + " patch = ax.imshow(frames[0])\n", + " ax.axis('off')\n", + " def animate(i):\n", + " patch.set_data(frames[i])\n", + " anim = animation.FuncAnimation(plt.gcf(), animate, frames = len(frames), interval=20)\n", + " return total_reward, np.array(all_observations, dtype=np.float64,), np.array(all_actions, dtype=np.float64), anim\n", + " else:\n", + " return total_reward, np.array(all_observations, dtype=np.float64,), np.array(all_actions, dtype=np.float64)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Let's first apply a random policy and see how the environment reacts. The random policy uniformly samples in the space of action." + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "def random_policy(state):\n", + " return env.action_space.sample()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The animation is generated with the following commands:\n", + "```python\n", + "anim = run_one_episode(env, random_policy, max_steps=500, render=True, verbose=False)[-1]\n", + "\n", + "with open('animation_random_policy.html', 'w') as f:\n", + " f.write(anim.to_jshtml())\n", + "```" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + " Once \n", + " Loop \n", + " Reflect \n", + "
\n", + "
\n", + "\n", + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from IPython.display import HTML\n", + "\n", + "HTML(filename=\"pilco/animation_random_policy.html\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Fit the Dynamics Model\n", + "\n", + "The dynamics model of pendulum can be written as\n", + "$$p(y_{t+1}|y_t, a_t)$$\n", + "where $y_t$ is the state vector at the time $t$ and $a_t$ is the action taken at the time $t$. PILCO uses a Gaussian process to model the above dynamics.\n", + "\n", + "Given a sequence of states and actions, we break it into pairs of inputs and outputs for the above GP model. The helper function below is written to do so." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "def prepare_data(state_list, action_list, win_in):\n", + " \"\"\"\n", + " Prepares a list of states and a list of actions as inputs to the Gaussian Process for training.\n", + " \"\"\"\n", + " \n", + " X_list = []\n", + " Y_list = []\n", + " \n", + " for state_array, action_array in zip(state_list, action_list):\n", + " # the state and action array shape should be aligned.\n", + " assert state_array.shape[0]-1 == action_array.shape[0]\n", + " \n", + " for i in range(state_array.shape[0]-win_in):\n", + " Y_list.append(state_array[i+win_in:i+win_in+1])\n", + " X_list.append(np.hstack([state_array[i:i+win_in].flatten(), action_array[i:i+win_in].flatten()]))\n", + " X = np.vstack(X_list)\n", + " Y = np.vstack(Y_list)\n", + " return X, Y" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "In this example, we do a maximum likelihood estimate for the model hyper-parameters. In MXFusion, the Gaussian process regression model is available as a module, which includes a dedicated inference algorithm." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "import mxnet as mx\n", + "from mxfusion import Model, Variable\n", + "from mxfusion.components.variables import PositiveTransformation\n", + "from mxfusion.components.distributions.gp.kernels import RBF\n", + "from mxfusion.modules.gp_modules import GPRegression\n", + "from mxfusion.inference import GradBasedInference, MAP\n", + "\n", + "def fit_model(state_list, action_list, win_in, verbose=True):\n", + " \"\"\"\n", + " Fits a Gaussian Process model to the state / action pairs passed in. \n", + " This creates a model of the environment which is used during\n", + " policy optimization instead of querying the environment directly.\n", + " \n", + " See mxfusion.gp_modules for additional types of GP models to fit,\n", + " including Sparse GP and Stochastic Varitional Inference Sparse GP.\n", + " \"\"\"\n", + " X, Y = prepare_data(state_list, action_list, win_in)\n", + "\n", + " m = Model()\n", + " m.N = Variable()\n", + " m.X = Variable(shape=(m.N, X.shape[-1]))\n", + " m.noise_var = Variable(shape=(1,), transformation=PositiveTransformation(),\n", + " initial_value=0.01)\n", + " m.kernel = RBF(input_dim=X.shape[-1], variance=1, lengthscale=1, ARD=True)\n", + " m.Y = GPRegression.define_variable(\n", + " X=m.X, kernel=m.kernel, noise_var=m.noise_var,\n", + " shape=(m.N, Y.shape[-1]))\n", + " m.Y.factor.gp_log_pdf.jitter = 1e-6\n", + "\n", + " infr = GradBasedInference(\n", + " inference_algorithm=MAP(model=m, observed=[m.X, m.Y]))\n", + " infr.run(X=mx.nd.array(X, dtype='float64'),\n", + " Y=mx.nd.array(Y, dtype='float64'),\n", + " max_iter=1000, learning_rate=0.1, verbose=verbose)\n", + " return m, infr, X, Y" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Policy Optimization\n", + "\n", + "PILCO computes the expected reward of a policy given the dynamics model. First, we need to define the parametric form of the policy. 
In this example, we use a neural network with one hidden layer. As the action space is [-2, 2], we apply a tanh transformation and multiply the outcome by two. This ensures that the returned actions stay within the range." + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [], + "source": [ + "from mxnet.gluon import HybridBlock\n", + "from mxnet.gluon.nn import Dense\n", + "\n", + "class NNController(HybridBlock):\n", + " def __init__(self, prefix=None, params=None):\n", + " super(NNController, self).__init__(prefix=prefix, params=params)\n", + " self.dense1 = Dense(100, in_units=len(env.observation_space.high), dtype='float64', activation='relu')\n", + " self.dense2 = Dense(1, in_units=100, dtype='float64', activation='tanh')\n", + " def hybrid_forward(self, F, x):\n", + " out = self.dense2(self.dense1(x))*2\n", + " return out \n", + " \n", + "policy = NNController()\n", + "policy.collect_params().initialize(mx.initializer.Xavier(magnitude=1))" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To compute the expected reward, we also need to define a reward function. This reward function is defined by us according to the task. The main component is the height of the pendulum. We also penalize the force and the angular momentum. 
" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "class CostFunction(mx.gluon.HybridBlock):\n", + " \"\"\"\n", + " The goal is to get the pendulum upright and stable as quickly as possible.\n", + " Taken from the code for Pendulum.\n", + " \"\"\"\n", + " def hybrid_forward(self, F, state, action):\n", + " \"\"\"\n", + " :param state: [np.cos(theta), np.sin(theta), ~ momentum(theta)]\n", + " a -> 0 when pendulum is upright, largest when pendulum is hanging down completely.\n", + " b -> penalty for taking action\n", + " c -> penalty for pendulum momentum\n", + " \"\"\"\n", + " a_scale = 2.\n", + " b_scale = .001\n", + " c_scale = .1\n", + " a = F.sum(a_scale * (state[:,:,0:1] -1) ** 2, axis=-1)\n", + " b = F.sum(b_scale * action ** 2, axis=-1)\n", + " c = F.sum(c_scale * state[:,:,2:3] ** 2, axis=-1)\n", + " return (a + c + b)\n", + " \n", + "cost = CostFunction()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The expected reward function can be written as\n", + "$$R = \\mathbb{E}_{p(y_T, \\ldots, y_0)}\\left(\\sum_{t=0}^T r(y_t)\\right)$$\n", + "where $r(\\cdot)$ is the reward function. $p(y_T, \\ldots, y_0)$ is the joint distribution when applying the policy to the dynamics model:\n", + "$$p(y_T, \\ldots, y_0) = p(y_0) \\prod_{t=1}^T p(y_t|y_{t-1}, a_{t-1}),$$\n", + "where $a_{t-1} = \\pi(y_{t-1})$ is the action taken at the time $t-1$, which is the outcome of the policy $\\pi(\\cdot)$.\n", + "\n", + "The expected reward function is implemented as follows." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "from mxfusion.inference.inference_alg import SamplingAlgorithm\n", + "\n", + "class PILCOAlgorithm(SamplingAlgorithm):\n", + "\n", + " def compute(self, F, variables):\n", + " \n", + " s_0 = self.initial_state_generator(self.num_samples)\n", + " a_0 = self.policy(s_0)\n", + " a_t_plus_1 = a_0\n", + " x_t = F.expand_dims(F.concat(s_0, a_0, dim=1), axis=1)\n", + " cost = 0\n", + " for t in range(self.n_time_steps):\n", + " variables[self.model.X] = x_t\n", + " res = self.model.Y.factor.predict(F, variables, targets=[self.model.Y], num_samples=self.num_samples)[0]\n", + " s_t_plus_1 = res[0]\n", + "\n", + " cost = cost + self.cost_function(s_t_plus_1, a_t_plus_1)\n", + "\n", + " a_t_plus_1 = mx.nd.expand_dims(self.policy(s_t_plus_1), axis=2)\n", + " x_t = mx.nd.concat(s_t_plus_1, a_t_plus_1, dim=2)\n", + " total_cost = F.sum(cost)\n", + " return total_cost, total_cost" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We optimize the policy with respect to the expected reward by using a gradient optimizer." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "from mxfusion.inference import GradTransferInference\n", + "from mxfusion.inference.pilco_alg import PILCOAlgorithm\n", + "\n", + "def optimize_policy(policy, cost_func, model, infr, model_data_X, model_data_Y,\n", + " initial_state_generator, num_grad_steps,\n", + " learning_rate=1e-2, num_time_steps=100, \n", + " num_samples=10, verbose=True):\n", + " \"\"\"\n", + " Takes as primary inputs a policy, cost function, and trained model.\n", + " Optimizes the policy for num_grad_steps number of iterations.\n", + " \"\"\"\n", + " mb_alg = PILCOAlgorithm(\n", + " model=model, observed=[model.X, model.Y], cost_function=cost_func,\n", + " policy=policy, n_time_steps=num_time_steps,\n", + " initial_state_generator=initial_state_generator,\n", + " num_samples=num_samples)\n", + "\n", + " infr_pred = GradTransferInference(\n", + " mb_alg, infr_params=infr.params, train_params=policy.collect_params())\n", + " infr_pred.run(\n", + " max_iter=num_grad_steps,\n", + " X=mx.nd.array(model_data_X, dtype='float64'),\n", + " Y=mx.nd.array(model_data_Y, dtype='float64'),\n", + " verbose=verbose, learning_rate=learning_rate)\n", + " return policy" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## The Loop\n", + "\n", + "We need to define a function that provides random initial states." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "def initial_state_generator(num_initial_states):\n", + " \"\"\"\n", + " Starts from valid states by drawing theta and momentum\n", + " then computing np.cos(theta) and np.sin(theta) for state[0:2].s\n", + " \"\"\"\n", + " return mx.nd.array(\n", + " [env.observation_space.sample() for i in range(num_initial_states)],\n", + " dtype='float64')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The loop of PILCO iterates the above three steps." + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Episode finished after 100 timesteps because Max timesteps reached\n", + "\r", + "Iteration 1 loss: 183.19438945442164\t\t\t\t\r", + "Iteration 2 loss: 151.71942134183473\t\t\t\t\r", + "Iteration 3 loss: 120.76437985446427\t\t\t\t\r", + "Iteration 4 loss: 90.37715754239662\t\t\t\t\r", + "Iteration 5 loss: 60.62170569881482\t\t\t\t\r", + "Iteration 6 loss: 31.623024274306943\t\t\t\t\r", + "Iteration 7 loss: 3.431141954762154\t\t\t\t\r", + "Iteration 8 loss: -23.92777780034288\t\t\t\t\r", + "Iteration 9 loss: -50.42669502898963\t\t\t\t\r", + "Iteration 10 loss: -76.06646934620255\t\t\t\t\r", + "Iteration 11 loss: -100.8759268163551\t\t\t\t\r", + "Iteration 12 loss: -124.88561342741707\t\t\t\t\r", + "Iteration 13 loss: -148.12378769295128\t\t\t\t\r", + "Iteration 14 loss: -170.62435583550786\t\t\t\t\r", + "Iteration 15 loss: -192.42864381636554\t\t\t\t\r", + "Iteration 16 loss: -213.5807400140273\t\t\t\t\r", + "Iteration 17 loss: -234.12273086863553\t\t\t\t\r", + "Iteration 18 loss: -254.09447432916545\t\t\t\t\r", + "Iteration 19 loss: -273.5358786562007\t\t\t\t\r", + "Iteration 20 loss: -292.48731266753873\t\t\t\t\r", + "Iteration 21 loss: -310.98755147007927\t\t\t\t\r", + "Iteration 22 loss: -329.0718006155711\t\t\t\t" + ] + }, + { + 
"name": "stderr", + "output_type": "stream", + "text": [ + "/Users/erimeiss/workspace/mxfusion/mxfusion/inference/inference_parameters.py:71: UserWarning: InferenceParameters has already been initialized. The existing one will be overwritten.\n", + " warnings.warn(\"InferenceParameters has already been initialized. The existing one will be overwritten.\")\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Iteration 100 loss: -1145.489716701466\t\t\t\t\n", + "Iteration 200 loss: -1285.3929126768035\t\t\t\t\n", + "Iteration 300 loss: -1331.7954137173099\t\t\t\t\n", + "Iteration 400 loss: -1357.6716807213334\t\t\t\t\n", + "Iteration 500 loss: -1374.5650793437253\t\t\t\t\n", + "Iteration 600 loss: -1386.6350141511623\t\t\t\t\n", + "Iteration 700 loss: -1395.7585508375987\t\t\t\t\n", + "Iteration 800 loss: -1402.93562993511\t\t\t\t\t\t\n", + "Iteration 900 loss: -1408.7594436983916\t\t\t\t\n", + "Iteration 1000 loss: -1413.6055169247031\t\t\t\t\n", + "Iteration 59 loss: 5544930.409976534\t\t\t\t\t" + ] + }, + { + "ename": "KeyboardInterrupt", + "evalue": "", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 28\u001b[0m \u001b[0minitial_state_generator\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnum_grad_steps\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnum_grad_steps\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 29\u001b[0m \u001b[0mnum_samples\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mlearning_rate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mlearning_rate\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 30\u001b[0;31m num_time_steps=num_time_steps)\n\u001b[0m", + "\u001b[0;32m\u001b[0m in 
\u001b[0;36moptimize_policy\u001b[0;34m(policy, cost_func, model, infr, model_data_X, model_data_Y, initial_state_generator, num_grad_steps, learning_rate, num_time_steps, num_samples, verbose)\u001b[0m\n\u001b[1;32m 22\u001b[0m \u001b[0mX\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel_data_X\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'float64'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 23\u001b[0m \u001b[0mY\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel_data_Y\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'float64'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 24\u001b[0;31m verbose=verbose, learning_rate=learning_rate)\n\u001b[0m\u001b[1;32m 25\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mpolicy\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/grad_based_inference.py\u001b[0m in \u001b[0;36mrun\u001b[0;34m(self, optimizer, learning_rate, max_iter, verbose, **kwargs)\u001b[0m\n\u001b[1;32m 102\u001b[0m \u001b[0minfr_executor\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0minfr\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mparam_dict\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mparams\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mparam_dict\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 103\u001b[0m \u001b[0mctx\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmxnet_context\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0moptimizer\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0moptimizer\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 104\u001b[0;31m learning_rate=learning_rate, max_iter=max_iter, verbose=verbose)\n\u001b[0m\u001b[1;32m 105\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 106\u001b[0m \u001b[0;32mclass\u001b[0m \u001b[0mGradTransferInference\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mGradBasedInference\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/batch_loop.py\u001b[0m in \u001b[0;36mrun\u001b[0;34m(self, infr_executor, data, param_dict, ctx, optimizer, learning_rate, max_iter, n_prints, verbose)\u001b[0m\n\u001b[1;32m 51\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmax_iter\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 52\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mautograd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrecord\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 53\u001b[0;31m \u001b[0mloss\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mloss_for_gradient\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0minfr_executor\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mzeros\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mctx\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mctx\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 54\u001b[0m 
\u001b[0mloss_for_gradient\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbackward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 55\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/gluon/block.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, *args)\u001b[0m\n\u001b[1;32m 538\u001b[0m \u001b[0mhook\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 539\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 540\u001b[0;31m \u001b[0mout\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mforward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 541\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 542\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mhook\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_forward_hooks\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mvalues\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/gluon/block.py\u001b[0m in \u001b[0;36mforward\u001b[0;34m(self, x, *args)\u001b[0m\n\u001b[1;32m 915\u001b[0m \u001b[0mparams\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m{\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mctx\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mj\u001b[0m \u001b[0;32min\u001b[0m 
\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_reg_params\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 916\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 917\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mhybrid_forward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mndarray\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mx\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mparams\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 918\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 919\u001b[0m \u001b[0;32massert\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mx\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mSymbol\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;31m \u001b[0m\u001b[0;31m\\\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/inference_alg.py\u001b[0m in \u001b[0;36mhybrid_forward\u001b[0;34m(self, F, x, *args, **kw)\u001b[0m\n\u001b[1;32m 81\u001b[0m \u001b[0madd_sample_dimension_to_arrays\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkw\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mout\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 82\u001b[0m \u001b[0madd_sample_dimension_to_arrays\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_constants\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mout\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 83\u001b[0;31m \u001b[0mobj\u001b[0m \u001b[0;34m=\u001b[0m 
\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_infr_method\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcompute\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 84\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mautograd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpause\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 85\u001b[0m \u001b[0;31m# An inference algorithm may directly set the value of a parameter instead of computing its gradient.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/pilco_alg.py\u001b[0m in \u001b[0;36mcompute\u001b[0;34m(self, F, variables)\u001b[0m\n\u001b[1;32m 82\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mt\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mn_time_steps\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 83\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mX\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mx_t\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 84\u001b[0;31m \u001b[0mres\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mY\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfactor\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpredict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mtargets\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mY\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnum_samples\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 85\u001b[0m \u001b[0ms_t_plus_1\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mres\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 86\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/modules/module.py\u001b[0m in \u001b[0;36mpredict\u001b[0;34m(self, F, variables, num_samples, targets)\u001b[0m\n\u001b[1;32m 362\u001b[0m \u001b[0malg\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnum_samples\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnum_samples\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 363\u001b[0m \u001b[0malg\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtarget_variables\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtargets\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 364\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0malg\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcompute\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 365\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 366\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0m_get_algorithm_for_target_conditional_pair\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0malgorithms\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtargets\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mexact_match\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mFalse\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/modules/gp_modules/gp_regression.py\u001b[0m in \u001b[0;36mcompute\u001b[0;34m(self, F, variables)\u001b[0m\n\u001b[1;32m 167\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 168\u001b[0m X, noise_var, X_cond, L, LinvY, kern_params = arrays_as_samples(\n\u001b[0;32m--> 169\u001b[0;31m F, [X, noise_var, X_cond, L, LinvY, kern_params])\n\u001b[0m\u001b[1;32m 170\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 171\u001b[0m \u001b[0mKxt\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mkern\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mK\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX_cond\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkern_params\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/components/variables/runtime_variable.py\u001b[0m in \u001b[0;36marrays_as_samples\u001b[0;34m(F, arrays)\u001b[0m\n\u001b[1;32m 114\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmax\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 115\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 116\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m 
\u001b[0;32min\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m}\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0ma\u001b[0m \u001b[0;32min\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 117\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 118\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/components/variables/runtime_variable.py\u001b[0m in \u001b[0;36m\u001b[0;34m(.0)\u001b[0m\n\u001b[1;32m 114\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmax\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 115\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 116\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m 
\u001b[0ma\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m}\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0ma\u001b[0m \u001b[0;32min\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 117\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 118\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/components/variables/runtime_variable.py\u001b[0m in \u001b[0;36mas_samples\u001b[0;34m(F, array, num_samples)\u001b[0m\n\u001b[1;32m 97\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0marray\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 98\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 99\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mF\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbroadcast_axis\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0msize\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 100\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 101\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/ndarray/register.py\u001b[0m in \u001b[0;36mbroadcast_axis\u001b[0;34m(data, axis, size, out, name, 
**kwargs)\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/_ctypes/ndarray.py\u001b[0m in \u001b[0;36m_imperative_invoke\u001b[0;34m(handle, ndargs, keys, vals, out)\u001b[0m\n\u001b[1;32m 90\u001b[0m \u001b[0mc_str_array\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkeys\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 91\u001b[0m \u001b[0mc_str_array\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mstr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ms\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0ms\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mvals\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 92\u001b[0;31m ctypes.byref(out_stypes)))\n\u001b[0m\u001b[1;32m 93\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 94\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0moriginal_output\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mKeyboardInterrupt\u001b[0m: " + ] + } + ], + "source": [ + "num_episode = 20 # how many model fit + policy optimization episodes to run\n", + "num_samples = 100 # how many sample trajectories the policy optimization loop uses\n", + "num_grad_steps = 1000 # how many gradient steps the optimizer takes per episode\n", + "num_time_steps = 100 # how far to roll out each sample trajectory\n", + "learning_rate = 1e-3 # learning rate for the policy optimization\n", + "\n", + "all_states = []\n", + "all_actions = []\n", + "\n", + "for i_ep in range(num_episode):\n", + " # Run an episode and collect data.\n", + " if i_ep == 0:\n", + " policy_func = lambda x: env.action_space.sample()\n", + " else:\n", + " policy_func = lambda x: policy(mx.nd.expand_dims(mx.nd.array(x, dtype='float64'), axis=0)).asnumpy()[0]\n", + " total_reward, states, actions = run_one_episode(\n", + " 
env, policy_func, max_steps=num_time_steps)\n", + " all_states.append(states)\n", + " all_actions.append(actions)\n", + "\n", + " # Fit a model.\n", + " model, infr, model_data_X, model_data_Y = fit_model(\n", + " all_states, all_actions, win_in=1, verbose=True)\n", + "\n", + " # Optimize the policy.\n", + " policy = optimize_policy(\n", + " policy, cost, model, infr, model_data_X, model_data_Y,\n", + " initial_state_generator, num_grad_steps=num_grad_steps,\n", + " num_samples=num_samples, learning_rate=learning_rate,\n", + " num_time_steps=num_time_steps)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Policy after the first episode (random exploration):" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + " Once \n", + " Loop \n", + " Reflect \n", + "
\n", + "
\n", + "\n", + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 15, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "HTML(filename=\"pilco/animation_policy_iter_0.html\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Policy after the 5th episode:" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + " Once \n", + " Loop \n", + " Reflect \n", + "
\n", + "
\n", + "\n", + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "HTML(filename=\"pilco/animation_policy_iter_4.html\")" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Reference\n", + "\n", + "M. P. Deisenroth, C. E. Rasmussen. 2011. \"PILCO: A Model-Based and Data-Efficient Approach to Policy Search\". _in\n", + "Proceedings of the 28th International Conference on Machine Learning._ [http://mlg.eng.cam.ac.uk/pub/pdf/DeiRas11.pdf](http://mlg.eng.cam.ac.uk/pub/pdf/DeiRas11.pdf)\n" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.0" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/notebooks/pilco/animation_policy_iter_0.html b/examples/notebooks/pilco/animation_policy_iter_0.html new file mode 100644 index 0000000..95b984d --- /dev/null +++ b/examples/notebooks/pilco/animation_policy_iter_0.html @@ -0,0 +1,18186 @@ + + + + +
+ +
+ +
+ + + + + + + + + +
+ Once + Loop + Reflect +
+
+ + + diff --git a/examples/notebooks/pilco/animation_policy_iter_4.html b/examples/notebooks/pilco/animation_policy_iter_4.html new file mode 100644 index 0000000..bffd3bf --- /dev/null +++ b/examples/notebooks/pilco/animation_policy_iter_4.html @@ -0,0 +1,14098 @@ + + + + +
+ +
+ +
+ + + + + + + + + +
+ Once + Loop + Reflect +
+
+ + + diff --git a/examples/notebooks/pilco/animation_random_policy.html b/examples/notebooks/pilco/animation_random_policy.html new file mode 100644 index 0000000..850177e --- /dev/null +++ b/examples/notebooks/pilco/animation_random_policy.html @@ -0,0 +1,18111 @@ + + + + +
+ +
+ +
+ + + + + + + + + +
+ Once + Loop + Reflect +
+
+ + + diff --git a/examples/notebooks/pilco_neurips2018_mloss_slides.ipynb b/examples/notebooks/pilco_neurips2018_mloss_slides.ipynb new file mode 100644 index 0000000..8dc7fdc --- /dev/null +++ b/examples/notebooks/pilco_neurips2018_mloss_slides.ipynb @@ -0,0 +1,51558 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Obtaining file:///Users/erimeiss/workspace/mxfusion\n", + "Requirement already satisfied: networkx>=2.1 in /Users/erimeiss/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages (from MXFusion==0.3.0) (2.1)\n", + "Requirement already satisfied: numpy>=1.7 in /Users/erimeiss/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages (from MXFusion==0.3.0) (1.16.3)\n", + "Requirement already satisfied: decorator>=4.1.0 in /Users/erimeiss/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages (from networkx>=2.1->MXFusion==0.3.0) (4.3.0)\n", + "Installing collected packages: MXFusion\n", + " Found existing installation: MXFusion 0.3.0\n", + " Uninstalling MXFusion-0.3.0:\n", + " Successfully uninstalled MXFusion-0.3.0\n", + " Running setup.py develop for MXFusion\n", + "Successfully installed MXFusion\n" + ] + } + ], + "source": [ + "!pip install -e ../../" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# MXFusion\n", + "## A Deep Modular Probabilistic Programming Library\n", + "\n", + "**Eric Meissner**\n", + "Zhenwen Dai\n", + "\n", + "@Amazon - Cambridge, UK" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# Why another one?\n", + "\n", + "Existing libraries had either:\n", + "- Probabilistic modelling with rich, flexible models and universal inference or\n", + "- Specialized, efficient inference over a subset of models\n", + "\n", + "**We needed both**" + ] + }, + { + 
"cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# Key Requirements\n", + "- Integration with deep learning\n", + "- Flexibility\n", + "- Scalability\n", + "- Specialized inference and models support\n" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "- Bayesian Deep Learning methods\n", + "- Rapid prototyping and software re-use\n", + "- GPUs, specialized inference methods" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "Modularity\n", + " - Specialized Inference\n", + " - Composability (tinkerability)\n", + " - Better leveraging of expert expertise\n", + "\n", + "Specialized inference methods + models, without requiring users to reimplement or understand them every time.\n", + "Leverage expert knowledge. Efficient inference, flexible framework. \n", + "Existing frameworks either did one or the other: flexible, or efficient." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# What does it look like?\n", + "\n", + "**Modelling**\n", + "\n", + "**Inference**" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "## Modelling \n", + "\n", + "### Directed Factor Graphs\n", + "* Variable\n", + "* Function\n", + "* Distribution\n", + "\n", + "### Example\n", + "\n", + "```python\n", + "m = Model()\n", + "m.mu = Variable()\n", + "m.s = Variable(transformation=PositiveTransformation())\n", + "m.Y = Normal.define_variable(mean=m.mu, variance=m.s)\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "* 3 primary components in modeling\n", + " * Variable\n", + " * Distribution\n", + " * Function \n", + "* 2 primary methods for models \n", + " * log_pdf\n", + " * draw_samples" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "## Inference\n", + "\n", + "### Two Classes\n", + "\n", + "* Variational Inference\n", + "* MCMC Sampling (*soon*)\n", + "\n", + "Built on MXNet Gluon (imperative code, not static graph)\n", + "\n", + "### Example\n", + "\n", + "```\n", + "infr = GradBasedInference(inference_algorithm=MAP(model=m, observed=[m.Y]))\n", + "infr.run(Y=data)\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "Primarily variational inference right now\n", + "\n", + "MCMC method coming soon\n", + "\n", + "```python\n", + "infr = GradBasedInference(inference_algorithm=MAP(model=m, observed=[m.Y]))\n", + "infr.run(Y=data)\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "## Modules\n", + " - Model + Inference together form building blocks.\n", + 
" - Just doing modular modeling with universal inference doesn't really scale, need specialized inference methods for specialized modelling objects like non-parametrics." + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "# PILCO: A Model-based Policy Search\n", + "Common reinforcement learning methods suffer from data inefficiency, which can be an issue in real world applications where gathering sufficiently large amounts of data poses economic issues and may be impossible. Deisenroth & Rasmussen (2011) propose a model-based policy search method known as PILCO in part to address this issue. PILCO uses a Gaussian process (GP) for learning the dynamics of the environment and optimizes a parametric policy function using the learned dynamics model.\n", + "\n", + "In this notebook, we demonstrate a straight-forward implementation of PILCO. This implementation follows the main idea of PILCO and has a few enhancements in addition to the published implementation. The enhancements are as follows: \n", + "- **Use Monte Carlo integration instead of moment estimation.** We approximate the expected reward using Monte Carlo integration instead of the proposed moment estimation approach. This removes the bias in the expected reward computation and enables a wide range of choices of kernels and policy functions. In the original work, only RBF and linear kernels and only linear and RBF network policies can be used.\n", + "- **Use automatic differentiation.** Thanks to automatic differentiation, no gradient derivation is needed.\n", + "- **A unified interface of Gaussian process.** MXFusion provides a unified interface of GP modules. This allows us to easily switch among plain GP, variational sparse GP and stochastic variational GP implementations." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# PILCO: A Model-based Policy Search\n", + "PILCO [1] is a model-based data-efficient algorithm that solves the RL problem by the following two step iterative process:\n", + "1. Fit a Gaussian Process that models the state dynamics, using calls to a simulator \n", + "2. Optimize a parametric policy using our GP instead of calling the simulator.\n", + "\n", + "## Enhancements MXFusion Brings\n", + "* Use Monte Carlo integration instead of moment estimation\n", + "* Use automatic differentiation\n", + "* A flexible interface for Gaussian processes, trivial to switch to sparse or stochastic variational \n", + "\n", + "[1] Deisenroth & Rasmussen (2011)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "## Preparation" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "This notebook depends on MXNet, MXFusion and Open AI Gym. These packages can be installed into your Python environment by running the following commands.\n", + "```bash\n", + "pip install mxnet mxfusion gym\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "Set the global configuration." + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "import os\n", + "os.environ['MXNET_ENGINE_TYPE'] = 'NaiveEngine'\n", + "from mxfusion.common import config\n", + "config.DEFAULT_DTYPE = 'float64'\n", + "%matplotlib inline" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "## Example: Pendulum\n", + "\n", + "\n", + "We use the inverted pendulum swingup problem as an example. 
We use the [Pendulum-v0](https://gym.openai.com/envs/Pendulum-v0/) environment in Open AI Gym. The task is to swing the pendulum up and balance it at the inverted position. This is a classical control problem and is known to be unsolvable with a linear controller.\n", + "\n", + "To solve this problem with PILCO, it needs three components:\n", + "\n", + "- Execute a policy in a real environment (an Open AI Gym simulator in this example) and collect data.\n", + "- Fit a GP model as the model for the dynamics of the environment.\n", + "- Optimize the policy given the dynamics model learned from all the data that have been collected so far.\n", + "\n", + "The overall PILCO algorithm is to iterate the above three steps until a policy that can solve the problem is found." + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "## Execute the Environment \n", + "\n", + "The Pendulum-v0 environment can be loaded easily." + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "import gym\n", + "env = gym.make('Pendulum-v0')" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "The state of the pendulum environment is a 3D vector. The first two dimensions are the 2D location of the end point of the pendulum. The third dimension encodes the angular speed of the pendulum. The action space is a 1D vector in [-2, 2]." + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "We write a helper function for executing the environment with a given policy." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "import numpy as np\n", + "import matplotlib.pyplot as plt\n", + "from matplotlib import animation\n", + "\n", + "def run_one_episode(env, policy, initial_state=None, max_steps=200, verbose=False, render=False):\n", + " \"\"\"\n", + " Drives an episode of the OpenAI gym environment using the policy to decide next actions.\n", + " \"\"\"\n", + " observation = env.reset()\n", + " if initial_state is not None:\n", + " env.env.state = initial_state\n", + " observation = env.env._get_obs()\n", + " env._max_episode_steps = max_steps\n", + " step_idx = 0\n", + " done = False\n", + " total_reward = 0\n", + " frames = []\n", + " all_actions = []\n", + " all_observations = [observation]\n", + " while not done:\n", + " if render:\n", + " frames.append(env.render(mode = 'rgb_array'))\n", + " if verbose:\n", + " print(observation)\n", + " action = policy(observation)\n", + " observation, reward, done, info = env.step(action)\n", + " all_observations.append(observation)\n", + " all_actions.append(action)\n", + " total_reward += reward\n", + " step_idx += 1\n", + " if done or step_idx>=max_steps-1:\n", + " print(\"Episode finished after {} timesteps because {}\".format(step_idx+1, \"'done' reached\" if done else \"Max timesteps reached\"))\n", + " break\n", + " if render:\n", + " fig = plt.figure()\n", + " ax = fig.gca()\n", + " fig.tight_layout()\n", + " patch = ax.imshow(frames[0])\n", + " ax.axis('off')\n", + " def animate(i):\n", + " patch.set_data(frames[i])\n", + " anim = animation.FuncAnimation(plt.gcf(), animate, frames = len(frames), interval=20)\n", + " return total_reward, np.array(all_observations, dtype=np.float64,), np.array(all_actions, dtype=np.float64), anim\n", + " else:\n", + " return total_reward, np.array(all_observations, dtype=np.float64,), np.array(all_actions, dtype=np.float64)" + ] + }, + { + 
"cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "Let's first apply a random policy and see how the environment reacts. The random policy uniformly samples in the space of action." + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "def random_policy(state):\n", + " return env.action_space.sample()" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "The animation is generated with the following commands:\n", + "```python\n", + "anim = run_one_episode(env, random_policy, max_steps=500, render=True, verbose=False)[-1]\n", + "\n", + "with open('animation_random_policy.html', 'w') as f:\n", + " f.write(anim.to_jshtml())\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# Pendulum" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "slideshow": { + "slide_type": "fragment" + } + }, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + " Once \n", + " Loop \n", + " Reflect \n", + "
\n", + "
\n", + "\n", + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "from IPython.display import HTML\n", + "\n", + "HTML(filename=\"pilco/animation_random_policy.html\")" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "## Fit the Dynamics Model\n", + "\n", + "The dynamics model of pendulum can be written as\n", + "$$p(y_{t+1}|y_t, a_t)$$\n", + "where $y_t$ is the state vector at the time $t$ and $a_t$ is the action taken at the time $t$. \n", + "\n", + "PILCO uses a Gaussian process to model the above dynamics." + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "def prepare_data(state_list, action_list, win_in):\n", + " \"\"\"\n", + " Prepares a list of states and a list of actions as inputs to the Gaussian Process for training.\n", + " \"\"\"\n", + " \n", + " X_list = []\n", + " Y_list = []\n", + " \n", + " for state_array, action_array in zip(state_list, action_list):\n", + " # the state and action array shape should be aligned.\n", + " assert state_array.shape[0]-1 == action_array.shape[0]\n", + " \n", + " for i in range(state_array.shape[0]-win_in):\n", + " Y_list.append(state_array[i+win_in:i+win_in+1])\n", + " X_list.append(np.hstack([state_array[i:i+win_in].flatten(), action_array[i:i+win_in].flatten()]))\n", + " X = np.vstack(X_list)\n", + " Y = np.vstack(Y_list)\n", + " return X, Y" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "In this example, we do a maximum likelihood estimate for the model hyper-parameters. In MXFusion, Gaussian process regression model is available as a module, which includes a dediated inference algorithm." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "import mxnet as mx\n", + "from mxfusion import Model, Variable\n", + "from mxfusion.components.variables import PositiveTransformation\n", + "from mxfusion.components.distributions.gp.kernels import RBF\n", + "from mxfusion.modules.gp_modules import GPRegression\n", + "from mxfusion.inference import GradBasedInference, MAP" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# Define and fit the model" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": { + "slideshow": { + "slide_type": "fragment" + } + }, + "outputs": [], + "source": [ + "def fit_model(state_list, action_list, win_in, verbose=True):\n", + " \"\"\"\n", + " Fits a Gaussian Process model to the state / action pairs passed in. \n", + " This creates a model of the environment which is used during\n", + " policy optimization instead of querying the environment directly.\n", + " \n", + " See mxfusion.gp_modules for additional types of GP models to fit,\n", + " including Sparse GP and Stochastic Varitional Inference Sparse GP.\n", + " \"\"\"\n", + " X, Y = prepare_data(state_list, action_list, win_in)\n", + "\n", + " m = Model()\n", + " m.N = Variable()\n", + " m.X = Variable(shape=(m.N, X.shape[-1]))\n", + " m.noise_var = Variable(shape=(1,), transformation=PositiveTransformation(),\n", + " initial_value=0.01)\n", + " m.kernel = RBF(input_dim=X.shape[-1], variance=1, lengthscale=1, ARD=True)\n", + " m.Y = GPRegression.define_variable(\n", + " X=m.X, kernel=m.kernel, noise_var=m.noise_var,\n", + " shape=(m.N, Y.shape[-1]))\n", + " m.Y.factor.gp_log_pdf.jitter = 1e-6\n", + "\n", + " infr = GradBasedInference(\n", + " inference_algorithm=MAP(model=m, observed=[m.X, m.Y]))\n", + " infr.run(X=mx.nd.array(X, dtype='float64'),\n", + " Y=mx.nd.array(Y, 
dtype='float64'),\n", + " max_iter=1000, learning_rate=0.1, verbose=verbose)\n", + " return m, infr, X, Y" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "notes" + } + }, + "source": [ + "### Policy Optimization\n", + "\n", + "PILCO computes the expected reward of a policy given the dynamics model. First, we need to define the parametric form of the policy. In this example, we use a neural network with one hidden layer. As the action space is [-2, 2], we apply a tanh transformation and multiply the outcome by two. This ensures the returned actions stay within the range." + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# Policy\n", + "\n", + "We define a neural network with one hidden layer and an output constrained between [-2,2] for the policy." + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "slideshow": { + "slide_type": "fragment" + } + }, + "outputs": [], + "source": [ + "from mxnet.gluon import HybridBlock\n", + "from mxnet.gluon.nn import Dense\n", + "\n", + "class NNController(HybridBlock):\n", + " def __init__(self, prefix=None, params=None):\n", + " super(NNController, self).__init__(prefix=prefix, params=params)\n", + " self.dense1 = Dense(100, in_units=len(env.observation_space.high), dtype='float64', activation='relu')\n", + " self.dense2 = Dense(1, in_units=100, dtype='float64', activation='tanh')\n", + " def hybrid_forward(self, F, x):\n", + " out = self.dense2(self.dense1(x))*2\n", + " return out \n", + " \n", + "policy = NNController()\n", + "policy.collect_params().initialize(mx.initializer.Xavier(magnitude=1))" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "To compute the expected reward, we also need to define a reward function. This reward function is defined by us according to the task. 
The main component is the height of the pendulum. We also penalize the force and the angular momentum. " + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "class CostFunction(mx.gluon.HybridBlock):\n", + " \"\"\"\n", + " The goal is to get the pendulum upright and stable as quickly as possible.\n", + " Taken from the code for Pendulum.\n", + " \"\"\"\n", + " def hybrid_forward(self, F, state, action):\n", + " \"\"\"\n", + " :param state: [np.cos(theta), np.sin(theta), ~ momentum(theta)]\n", + " a -> 0 when pendulum is upright, largest when pendulum is hanging down completely.\n", + " b -> penalty for taking action\n", + " c -> penalty for pendulum momentum\n", + " \"\"\"\n", + " a_scale = 2.\n", + " b_scale = .001\n", + " c_scale = .1\n", + " a = F.sum(a_scale * (state[:,:,0:1] -1) ** 2, axis=-1)\n", + " b = F.sum(b_scale * action ** 2, axis=-1)\n", + " c = F.sum(c_scale * state[:,:,2:3] ** 2, axis=-1)\n", + " return (a + c + b)\n", + " \n", + "cost = CostFunction()" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "The expected reward function can be written as\n", + "$$R = \\mathbb{E}_{p(y_T, \\ldots, y_0)}\\left(\\sum_{t=0}^T r(y_t)\\right)$$\n", + "where $r(\\cdot)$ is the reward function. $p(y_T, \\ldots, y_0)$ is the joint distribution when applying the policy to the dynamics model:\n", + "$$p(y_T, \\ldots, y_0) = p(y_0) \\prod_{t=1}^T p(y_t|y_{t-1}, a_{t-1}),$$\n", + "where $a_{t-1} = \\pi(y_{t-1})$ is the action taken at the time $t-1$, which is the outcome of the policy $\\pi(\\cdot)$.\n", + "\n", + "The expected reward function is implemented as follows." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "# Obtaining the policy gradients" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "from mxfusion.inference.inference_alg import SamplingAlgorithm\n", + "\n", + "class PILCOAlgorithm(SamplingAlgorithm):\n", + "\n", + " def compute(self, F, variables):\n", + " s_0 = self.initial_state_generator(self.num_samples)\n", + " a_0 = self.policy(s_0)\n", + " a_t_plus_1 = a_0\n", + " x_t = F.expand_dims(F.concat(s_0, a_0, dim=1), axis=1)\n", + " cost = 0\n", + " for t in range(self.n_time_steps):\n", + " variables[self.model.X] = x_t\n", + " res = self.model.Y.factor.predict(F, variables, targets=[self.model.Y], num_samples=self.num_samples)[0]\n", + " s_t_plus_1 = res[0]\n", + "\n", + " cost = cost + self.cost_function(s_t_plus_1, a_t_plus_1)\n", + "\n", + " a_t_plus_1 = mx.nd.expand_dims(self.policy(s_t_plus_1), axis=2)\n", + " x_t = mx.nd.concat(s_t_plus_1, a_t_plus_1, dim=2)\n", + " total_cost = F.sum(cost)\n", + " return total_cost, total_cost" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "We optimize the policy with respect to the expected reward by using a gradient optimizer." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "from mxfusion.inference import GradTransferInference\n", + "from mxfusion.inference.pilco_alg import PILCOAlgorithm\n", + "\n", + "def optimize_policy(policy, cost_func, model, infr, model_data_X, model_data_Y,\n", + " initial_state_generator, num_grad_steps,\n", + " learning_rate=1e-2, num_time_steps=100, \n", + " num_samples=10, verbose=True):\n", + " \"\"\"\n", + " Takes as primary inputs a policy, cost function, and trained model.\n", + " Optimizes the policy for num_grad_steps number of iterations.\n", + " \"\"\"\n", + " mb_alg = PILCOAlgorithm(\n", + " model=model, observed=[model.X, model.Y], cost_function=cost_func,\n", + " policy=policy, n_time_steps=num_time_steps,\n", + " initial_state_generator=initial_state_generator,\n", + " num_samples=num_samples)\n", + "\n", + " infr_pred = GradTransferInference(\n", + " mb_alg, infr_params=infr.params, train_params=policy.collect_params())\n", + " infr_pred.run(\n", + " max_iter=num_grad_steps,\n", + " X=mx.nd.array(model_data_X, dtype='float64'),\n", + " Y=mx.nd.array(model_data_Y, dtype='float64'),\n", + " verbose=verbose, learning_rate=learning_rate)\n", + " return policy" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "source": [ + "## The Loop\n", + "\n", + "We need to define a function that provides random initial states." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "def initial_state_generator(num_initial_states):\n", + " \"\"\"\n", + " Starts from valid states by drawing theta and momentum\n", + " then computing np.cos(theta) and np.sin(theta) for state[0:2].s\n", + " \"\"\"\n", + " return mx.nd.array(\n", + " [env.observation_space.sample() for i in range(num_initial_states)],\n", + " dtype='float64')" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# The Loop" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": { + "slideshow": { + "slide_type": "skip" + } + }, + "outputs": [], + "source": [ + "num_episode = 20 # how many model fit + policy optimization episodes to run\n", + "num_samples = 100 # how many sample trajectories the policy optimization loop uses\n", + "num_grad_steps = 1000 # how many gradient steps the optimizer takes per episode\n", + "num_time_steps = 100 # how far to roll out each sample trajectory\n", + "learning_rate = 1e-3 # learning rate for the policy optimization\n", + "\n", + "all_states = []\n", + "all_actions = []" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": { + "slideshow": { + "slide_type": "fragment" + } + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Episode finished after 100 timesteps because Max timesteps reached\n", + "\r", + "Iteration 1 loss: -147.44275894783664\t\t\t\t\r", + "Iteration 2 loss: -175.90537081675882\t\t\t\t\r", + "Iteration 3 loss: -203.08783994173928\t\t\t\t\r", + "Iteration 4 loss: -228.99512346183315\t\t\t\t\r", + "Iteration 5 loss: -253.65195491239757\t\t\t\t\r", + "Iteration 6 loss: -277.0934209762746\t\t\t\t\r", + "Iteration 7 loss: -299.3600581570322\t\t\t\t\r", + "Iteration 8 loss: -320.49807202924745\t\t\t\t\r", + "Iteration 9 loss: 
-340.56099060736454\t\t\t\t\r", + "Iteration 10 loss: -359.61034033457696\t\t\t\t\r", + "Iteration 11 loss: -377.71565978816744\t\t\t\t\r", + "Iteration 12 loss: -394.9550799167229\t\t\t\t\r", + "Iteration 13 loss: -411.41695470306104\t\t\t\t\r", + "Iteration 14 loss: -427.20182567104433\t\t\t\t\r", + "Iteration 15 loss: -442.42316993901187\t\t\t\t\r", + "Iteration 16 loss: -457.20516453335017\t\t\t\t\r", + "Iteration 17 loss: -471.67636880459304\t\t\t\t\r", + "Iteration 18 loss: -485.9597423546608\t\t\t\t\r", + "Iteration 19 loss: -500.16127762489947\t\t\t\t\r", + "Iteration 20 loss: -514.360528573828\t\t\t\t\r", + "Iteration 21 loss: -528.6057260995374\t\t\t\t\r", + "Iteration 22 loss: -542.9143027944718\t\t\t\t\r", + "Iteration 23 loss: -557.2778368461522\t\t\t\t\r", + "Iteration 24 loss: -571.6694615828881\t\t\t\t" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/erimeiss/workspace/mxfusion/mxfusion/inference/inference_parameters.py:71: UserWarning: InferenceParameters has already been initialized. The existing one will be overwritten.\n", + " warnings.warn(\"InferenceParameters has already been initialized. 
The existing one will be overwritten.\")\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Iteration 100 loss: -1365.1946754085056\t\t\t\t\n", + "Iteration 200 loss: -1469.3300788900378\t\t\t\t\n", + "Iteration 300 loss: -1491.5593095277768\t\t\t\t\n", + "Iteration 400 loss: -1503.8953879089897\t\t\t\t\n", + "Iteration 500 loss: -1512.5250343137307\t\t\t\t\n", + "Iteration 600 loss: -1519.2204316627003\t\t\t\t\n", + "Iteration 700 loss: -1524.6930473364855\t\t\t\t\n", + "Iteration 800 loss: -1529.294080558935\t\t\t\t\t\n", + "Iteration 900 loss: -1533.229205462882\t\t\t\t\t\n", + "Iteration 1000 loss: -1536.6377727466997\t\t\t\t\n", + "Iteration 2 loss: 7108711.122901848\t\t\t\t" + ] + }, + { + "ename": "KeyboardInterrupt", + "evalue": "", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 19\u001b[0m \u001b[0minitial_state_generator\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnum_grad_steps\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnum_grad_steps\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 20\u001b[0m \u001b[0mnum_samples\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mlearning_rate\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mlearning_rate\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 21\u001b[0;31m num_time_steps=num_time_steps)\n\u001b[0m", + "\u001b[0;32m\u001b[0m in \u001b[0;36moptimize_policy\u001b[0;34m(policy, cost_func, model, infr, model_data_X, model_data_Y, initial_state_generator, num_grad_steps, learning_rate, num_time_steps, num_samples, verbose)\u001b[0m\n\u001b[1;32m 22\u001b[0m 
\u001b[0mX\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel_data_X\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'float64'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 23\u001b[0m \u001b[0mY\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmodel_data_Y\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m'float64'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 24\u001b[0;31m verbose=verbose, learning_rate=learning_rate)\n\u001b[0m\u001b[1;32m 25\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mpolicy\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/grad_based_inference.py\u001b[0m in \u001b[0;36mrun\u001b[0;34m(self, optimizer, learning_rate, max_iter, verbose, **kwargs)\u001b[0m\n\u001b[1;32m 102\u001b[0m \u001b[0minfr_executor\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0minfr\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdata\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mparam_dict\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mparams\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mparam_dict\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 103\u001b[0m \u001b[0mctx\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmxnet_context\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0moptimizer\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0moptimizer\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 104\u001b[0;31m learning_rate=learning_rate, max_iter=max_iter, 
verbose=verbose)\n\u001b[0m\u001b[1;32m 105\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 106\u001b[0m \u001b[0;32mclass\u001b[0m \u001b[0mGradTransferInference\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mGradBasedInference\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/batch_loop.py\u001b[0m in \u001b[0;36mrun\u001b[0;34m(self, infr_executor, data, param_dict, ctx, optimizer, learning_rate, max_iter, n_prints, verbose)\u001b[0m\n\u001b[1;32m 51\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmax_iter\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 52\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mautograd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrecord\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 53\u001b[0;31m \u001b[0mloss\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mloss_for_gradient\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0minfr_executor\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mzeros\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mctx\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mctx\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 54\u001b[0m \u001b[0mloss_for_gradient\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbackward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 55\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/gluon/block.py\u001b[0m in 
\u001b[0;36m__call__\u001b[0;34m(self, *args)\u001b[0m\n\u001b[1;32m 538\u001b[0m \u001b[0mhook\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 539\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 540\u001b[0;31m \u001b[0mout\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mforward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 541\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 542\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mhook\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_forward_hooks\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mvalues\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/gluon/block.py\u001b[0m in \u001b[0;36mforward\u001b[0;34m(self, x, *args)\u001b[0m\n\u001b[1;32m 915\u001b[0m \u001b[0mparams\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m{\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdata\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mctx\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mj\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_reg_params\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 916\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 917\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mhybrid_forward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mndarray\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mx\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mparams\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 918\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 919\u001b[0m \u001b[0;32massert\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mx\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mSymbol\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;31m \u001b[0m\u001b[0;31m\\\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/inference_alg.py\u001b[0m in \u001b[0;36mhybrid_forward\u001b[0;34m(self, F, x, *args, **kw)\u001b[0m\n\u001b[1;32m 81\u001b[0m \u001b[0madd_sample_dimension_to_arrays\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkw\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mout\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 82\u001b[0m \u001b[0madd_sample_dimension_to_arrays\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_constants\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mout\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 83\u001b[0;31m \u001b[0mobj\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_infr_method\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcompute\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 84\u001b[0m \u001b[0;32mwith\u001b[0m 
\u001b[0mautograd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpause\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 85\u001b[0m \u001b[0;31m# An inference algorithm may directly set the value of a parameter instead of computing its gradient.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/inference/pilco_alg.py\u001b[0m in \u001b[0;36mcompute\u001b[0;34m(self, F, variables)\u001b[0m\n\u001b[1;32m 82\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mt\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mn_time_steps\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 83\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mX\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mx_t\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 84\u001b[0;31m \u001b[0mres\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mY\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfactor\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpredict\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtargets\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmodel\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mY\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnum_samples\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 85\u001b[0m 
\u001b[0ms_t_plus_1\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mres\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 86\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/modules/module.py\u001b[0m in \u001b[0;36mpredict\u001b[0;34m(self, F, variables, num_samples, targets)\u001b[0m\n\u001b[1;32m 362\u001b[0m \u001b[0malg\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnum_samples\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnum_samples\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 363\u001b[0m \u001b[0malg\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtarget_variables\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtargets\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 364\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0malg\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcompute\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 365\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 366\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0m_get_algorithm_for_target_conditional_pair\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0malgorithms\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mtargets\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mvariables\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mexact_match\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mFalse\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/modules/gp_modules/gp_regression.py\u001b[0m in \u001b[0;36mcompute\u001b[0;34m(self, F, variables)\u001b[0m\n\u001b[1;32m 167\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 168\u001b[0m X, noise_var, X_cond, L, LinvY, kern_params = arrays_as_samples(\n\u001b[0;32m--> 169\u001b[0;31m F, [X, noise_var, X_cond, L, LinvY, kern_params])\n\u001b[0m\u001b[1;32m 
170\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 171\u001b[0m \u001b[0mKxt\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mkern\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mK\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX_cond\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mX\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkern_params\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/components/variables/runtime_variable.py\u001b[0m in \u001b[0;36marrays_as_samples\u001b[0;34m(F, arrays)\u001b[0m\n\u001b[1;32m 114\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmax\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 115\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 116\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m}\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0ma\u001b[0m 
\u001b[0;32min\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 117\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 118\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/components/variables/runtime_variable.py\u001b[0m in \u001b[0;36m\u001b[0;34m(.0)\u001b[0m\n\u001b[1;32m 114\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mmax\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 115\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mmax_num_samples\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 116\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0mk\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mk\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mitems\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m}\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdict\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0mas_samples\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mmax_num_samples\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0ma\u001b[0m \u001b[0;32min\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 117\u001b[0m 
\u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 118\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0marrays\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/workspace/mxfusion/mxfusion/components/variables/runtime_variable.py\u001b[0m in \u001b[0;36mas_samples\u001b[0;34m(F, array, num_samples)\u001b[0m\n\u001b[1;32m 97\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0marray\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 98\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 99\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mF\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbroadcast_axis\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0marray\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0msize\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mnum_samples\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 100\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 101\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/ndarray/register.py\u001b[0m in \u001b[0;36mbroadcast_axis\u001b[0;34m(data, axis, size, out, name, **kwargs)\u001b[0m\n", + "\u001b[0;32m~/.pyenv/versions/anaconda3-5.3.1/lib/python3.7/site-packages/mxnet/_ctypes/ndarray.py\u001b[0m in \u001b[0;36m_imperative_invoke\u001b[0;34m(handle, ndargs, keys, vals, out)\u001b[0m\n\u001b[1;32m 90\u001b[0m \u001b[0mc_str_array\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkeys\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 91\u001b[0m \u001b[0mc_str_array\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mstr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ms\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0ms\u001b[0m \u001b[0;32min\u001b[0m 
\u001b[0mvals\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 92\u001b[0;31m ctypes.byref(out_stypes)))\n\u001b[0m\u001b[1;32m 93\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 94\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0moriginal_output\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mKeyboardInterrupt\u001b[0m: " + ] + } + ], + "source": [ + "for i_ep in range(num_episode):\n", + " # Run an episode and collect data.\n", + " if i_ep == 0:\n", + " policy_func = lambda x: env.action_space.sample()\n", + " else:\n", + " policy_func = lambda x: policy(mx.nd.expand_dims(mx.nd.array(x, dtype='float64'), axis=0)).asnumpy()[0]\n", + " total_reward, states, actions = run_one_episode(\n", + " env, policy_func, max_steps=num_time_steps)\n", + " all_states.append(states)\n", + " all_actions.append(actions)\n", + "\n", + " # Fit a model.\n", + " model, infr, model_data_X, model_data_Y = fit_model(\n", + " all_states, all_actions, win_in=1, verbose=True)\n", + "\n", + " # Optimize the policy.\n", + " policy = optimize_policy(\n", + " policy, cost, model, infr, model_data_X, model_data_Y,\n", + " initial_state_generator, num_grad_steps=num_grad_steps,\n", + " num_samples=num_samples, learning_rate=learning_rate,\n", + " num_time_steps=num_time_steps)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "Policy after the first episode (random exploration):" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": { + "slideshow": { + "slide_type": "fragment" + } + }, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + " Once \n", + " Loop \n", + " Reflect \n", + "
\n", + "
\n", + "\n", + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 17, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "HTML(filename=\"pilco/animation_policy_iter_0.html\")" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "Policy after the 5th episode:" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": { + "slideshow": { + "slide_type": "fragment" + } + }, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + "\n", + "\n", + "\n", + "
\n", + " \n", + "
\n", + " \n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
\n", + " Once \n", + " Loop \n", + " Reflect \n", + "
\n", + "
\n", + "\n", + "\n", + "\n" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "HTML(filename=\"pilco/animation_policy_iter_4.html\")" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "slide" + } + }, + "source": [ + "# Conclusion\n", + "\n", + "* Modular probabilistic programming library\n", + "* Flexibly pair specialized models/inference algorithms with a wide range of probabilistic models\n", + "\n", + "## Join us!\n", + "\n", + "[github.com/amzn/mxfusion](https://github.com/amzn/mxfusion)" + ] + }, + { + "cell_type": "markdown", + "metadata": { + "slideshow": { + "slide_type": "fragment" + } + }, + "source": [ + "## Reference\n", + "\n", + "M. P. Deisenroth, C. E. Rasmussen. 2011. \"PILCO: A Model-Based and Data-Efficient Approach to Policy Search\". _in\n", + "Proceedings of the 28th International Conference on Machine Learning._ [http://mlg.eng.cam.ac.uk/pub/pdf/DeiRas11.pdf](http://mlg.eng.cam.ac.uk/pub/pdf/DeiRas11.pdf)\n" + ] + } + ], + "metadata": { + "celltoolbar": "Slideshow", + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.0" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/notebooks/svgp_regression.ipynb b/examples/notebooks/svgp_regression.ipynb new file mode 100644 index 0000000..46f51c1 --- /dev/null +++ b/examples/notebooks/svgp_regression.ipynb @@ -0,0 +1,383 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Stochastic Variational Gaussian Process Regression\n", + "\n", + "**Zhenwen Dai (2019-05-29)**" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## 
Introduction\n", + "\n", + "Gaussian process (GP) is computationally expensive. A popular approach to scale up GP regression on large data is to use stochastic variational inference with mini-batch training (Hensman et al., 2013). SVGP regression with Gaussian noise has been implemented as a module in MXFusion." + ] + }, + { + "cell_type": "code", + "execution_count": 32, + "metadata": {}, + "outputs": [], + "source": [ + "import warnings\n", + "warnings.filterwarnings('ignore')\n", + "import os\n", + "os.environ['MXNET_ENGINE_TYPE'] = 'NaiveEngine'" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Toy data\n", + "\n", + "We generate some synthetic data for our regression example. The data set is generated from a sine function with some additive Gaussian noise. " + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n", + "%matplotlib inline\n", + "from pylab import *\n", + "\n", + "np.random.seed(0)\n", + "X = np.random.uniform(-3.,3.,(1000,1))\n", + "Y = np.sin(X) + np.random.randn(1000,1)*0.05" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The generated data are visualized as follows:" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "plot(X, Y, 'rx', label='data points')\n", + "_=legend()" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [], + "source": [ + "from mxfusion.common import config\n", + "config.DEFAULT_DTYPE = 'float64'" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The SVGP regression model is created as follows. Two SVGP specific parameters are ```num_inducing``` which specifies the number of inducing points used in the variational sparse GP approximation and ```svgp_log_pdf.jitter``` which is the jitter term in the log pdf calculation for numerical robustness. " + ] + }, + { + "cell_type": "code", + "execution_count": 33, + "metadata": {}, + "outputs": [], + "source": [ + "from mxfusion import Model, Variable\n", + "from mxfusion.components.variables import PositiveTransformation\n", + "from mxfusion.components.distributions.gp.kernels import RBF\n", + "from mxfusion.modules.gp_modules import SVGPRegression\n", + "\n", + "m = Model()\n", + "m.N = Variable()\n", + "m.X = Variable(shape=(m.N, 1))\n", + "m.noise_var = Variable(shape=(1,), transformation=PositiveTransformation(), initial_value=0.01)\n", + "m.kernel = RBF(input_dim=1, variance=1, lengthscale=1)\n", + "m.Y = SVGPRegression.define_variable(X=m.X, kernel=m.kernel, noise_var=m.noise_var, shape=(m.N, 1), num_inducing=20)\n", + "m.Y.factor.svgp_log_pdf.jitter = 1e-6" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "Inference is done by creating the inference instance from the ```GradBasedInference``` class, in which we use a ```MAP``` inference algorithm as there are no latent variables outside the SVGPRegression module. 
Additionally, we specify ```grad_loop``` to be ```MinibatchInferenceLoop``` in which we set the mini-batch size and the scaling factor for mini-batch training.\n", + "\n", + "Then, training is triggered by calling the ```run``` method." + ] + }, + { + "cell_type": "code", + "execution_count": 38, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "epoch 1 Iteration 100 loss: 933115.0603707978\t\t\tepoch-loss: 10413624.614005275 \n", + "epoch 2 Iteration 100 loss: 524948.7079326594\t\t\tepoch-loss: 686034.5295730559 \n", + "epoch 3 Iteration 100 loss: 345602.4022749258\t\t\tepoch-loss: 427065.8343717841 \n", + "epoch 4 Iteration 100 loss: 277011.3760208657\t\t\tepoch-loss: 297071.493696023 \n", + "epoch 5 Iteration 100 loss: 183347.13021907964\t\t\tepoch-loss: 219808.0871498559 \n", + "epoch 6 Iteration 100 loss: 143763.11007552472\t\t\tepoch-loss: 169486.20729875282 \n", + "epoch 7 Iteration 100 loss: 132031.47695326462\t\t\tepoch-loss: 134765.1471133905 \n", + "epoch 8 Iteration 100 loss: 95632.60561449913\t\t\tepoch-loss: 109798.66321648406 \n", + "epoch 9 Iteration 100 loss: 73957.6220462552\t\t\tepoch-loss: 91257.8705670977 \n", + "epoch 10 Iteration 100 loss: 64840.07207031624\t\t\tepoch-loss: 77084.06942481917 \n", + "epoch 11 Iteration 100 loss: 60780.27278575914\t\t\tepoch-loss: 65962.38163622493 \n", + "epoch 12 Iteration 100 loss: 48546.66342698521\t\t\tepoch-loss: 57037.39009905885 \n", + "epoch 13 Iteration 100 loss: 42676.907263579335\t\t\tepoch-loss: 49725.50869601666 \n", + "epoch 14 Iteration 100 loss: 43266.74759690139\t\t\tepoch-loss: 43635.70855486856 \n", + "epoch 15 Iteration 100 loss: 33139.32033870425\t\t\tepoch-loss: 38501.415430223606 \n", + "epoch 16 Iteration 100 loss: 35129.68003531527\t\t\tepoch-loss: 34139.30892930683 \n", + "epoch 17 Iteration 100 loss: 33309.08869286892\t\t\tepoch-loss: 30414.713307491817 \n", + "epoch 18 Iteration 100 loss: 31058.180286752693\t\t\tepoch-loss: 
27222.957705478882 \n", + "epoch 19 Iteration 100 loss: 22781.668494776342\t\t\tepoch-loss: 24466.753696665117 \n", + "epoch 20 Iteration 100 loss: 16921.53875526696\t\t\tepoch-loss: 22063.866203795988 \n", + "epoch 21 Iteration 100 loss: 16866.27172281184\t\t\tepoch-loss: 19959.435781693166 \n", + "epoch 22 Iteration 100 loss: 18001.39866328793\t\t\tepoch-loss: 18093.70564938978 \n", + "epoch 23 Iteration 100 loss: 19268.435700542395\t\t\tepoch-loss: 16435.61461383947 \n", + "epoch 24 Iteration 100 loss: 13586.70681551015\t\t\tepoch-loss: 14947.197437326102 \n", + "epoch 25 Iteration 100 loss: 11842.634017398044\t\t\tepoch-loss: 13605.954880888436 \n", + "epoch 26 Iteration 100 loss: 12304.581180033452\t\t\tepoch-loss: 12393.880316263208 \n", + "epoch 27 Iteration 100 loss: 12712.095456995734\t\t\tepoch-loss: 11293.27810727986 \n", + "epoch 28 Iteration 100 loss: 12662.540317512301\t\t\tepoch-loss: 10292.698091923068 \n", + "epoch 29 Iteration 100 loss: 9789.253683769626\t\t\tepoch-loss: 9379.934609293405 \n", + "epoch 30 Iteration 100 loss: 10336.484081253366\t\t\tepoch-loss: 8542.778732654882 \n", + "epoch 31 Iteration 100 loss: 8427.615871046397\t\t\tepoch-loss: 7780.101399774407 \n", + "epoch 32 Iteration 100 loss: 6243.338653452632\t\t\tepoch-loss: 7083.3906599663305 \n", + "epoch 33 Iteration 100 loss: 5633.910939630758\t\t\tepoch-loss: 6442.360608787293 \n", + "epoch 34 Iteration 100 loss: 6128.494674105952\t\t\tepoch-loss: 5856.924952855579 \n", + "epoch 35 Iteration 100 loss: 5561.132651568278\t\t\tepoch-loss: 5319.662670742758 \n", + "epoch 36 Iteration 100 loss: 5007.633559342303\t\t\tepoch-loss: 4827.494923733251 \n", + "epoch 37 Iteration 100 loss: 4570.798941667555\t\t\tepoch-loss: 4375.152951451802 \n", + "epoch 38 Iteration 100 loss: 3427.8776815125993\t\t\tepoch-loss: 3958.746627662967 \n", + "epoch 39 Iteration 100 loss: 3145.271868648371\t\t\tepoch-loss: 3574.2727718396727 \n", + "epoch 40 Iteration 100 loss: 3252.388844355417\t\t\tepoch-loss: 
3216.389789008766 \n", + "epoch 41 Iteration 100 loss: 2682.992323506939\t\t\tepoch-loss: 2880.8040627817663 \n", + "epoch 42 Iteration 100 loss: 2776.54316335849\t\t\tepoch-loss: 2563.2893900928902 \n", + "epoch 43 Iteration 100 loss: 2052.181117489573\t\t\tepoch-loss: 2259.124250598867 \n", + "epoch 44 Iteration 100 loss: 1789.3450917418618\t\t\tepoch-loss: 1963.4009524512699 \n", + "epoch 45 Iteration 100 loss: 1637.0460616480382\t\t\tepoch-loss: 1683.301052960261 \n", + "epoch 46 Iteration 100 loss: 1250.3190196168575\t\t\tepoch-loss: 1421.08925599032 \n", + "epoch 47 Iteration 100 loss: 1056.4280170128945\t\t\tepoch-loss: 1181.4882875552755 \n", + "epoch 48 Iteration 100 loss: 934.1323712121834\t\t\tepoch-loss: 972.8920812023131 \n", + "epoch 49 Iteration 100 loss: 743.6854774208032\t\t\tepoch-loss: 794.3919410633861 \n", + "epoch 50 Iteration 100 loss: 592.0162492873271\t\t\tepoch-loss: 643.6129305537779 \n", + "epoch 1 Iteration 100 loss: -617.7115390031664\t\t\tepoch-loss: 122.02590714978953 \n", + "epoch 2 Iteration 100 loss: -1042.9322804366407\t\t\tepoch-loss: -861.8691127743712 \n", + "epoch 3 Iteration 100 loss: -1246.1061590298375\t\t\tepoch-loss: -1142.8551043268158 \n", + "epoch 4 Iteration 100 loss: -1422.4364206976472\t\t\tepoch-loss: -1248.3343954963652 \n", + "epoch 5 Iteration 100 loss: -1364.319275718058\t\t\tepoch-loss: -1319.0632400945233 \n", + "epoch 6 Iteration 100 loss: -1138.6014678286117\t\t\tepoch-loss: -1375.485088640635 \n", + "epoch 7 Iteration 100 loss: -1468.2449906521865\t\t\tepoch-loss: -1415.3387799226973 \n", + "epoch 8 Iteration 100 loss: -1331.0742440765116\t\t\tepoch-loss: -1398.7259993571608 \n", + "epoch 9 Iteration 100 loss: -1023.1218294411456\t\t\tepoch-loss: -1406.2506096944428 \n", + "epoch 10 Iteration 100 loss: -1491.0721525479291\t\t\tepoch-loss: -1425.3786072098467 \n", + "epoch 11 Iteration 100 loss: -1487.9902441406107\t\t\tepoch-loss: -1385.4821177117121 \n", + "epoch 12 Iteration 100 loss: 
-963.575720938497\t\t\tepoch-loss: -1148.7904243974 \n", + "epoch 13 Iteration 100 loss: -1496.8723348964538\t\t\tepoch-loss: -1248.4710558849933 \n", + "epoch 14 Iteration 100 loss: -1189.2469453417261\t\t\tepoch-loss: -1302.58240646708 \n", + "epoch 15 Iteration 100 loss: -1354.0129933002445\t\t\tepoch-loss: -1422.9290660653176 \n", + "epoch 16 Iteration 100 loss: -1375.0688655561046\t\t\tepoch-loss: -1296.0532055882159 \n", + "epoch 17 Iteration 100 loss: -1601.7368685439442\t\t\tepoch-loss: -1432.8777691683824 \n", + "epoch 18 Iteration 100 loss: -1140.428056593764\t\t\tepoch-loss: -1443.8657069101057 \n", + "epoch 19 Iteration 100 loss: -1396.6869254783921\t\t\tepoch-loss: -1421.0467725977735 \n", + "epoch 20 Iteration 100 loss: -1313.511818206805\t\t\tepoch-loss: -1411.19388568273 \n", + "epoch 21 Iteration 100 loss: -1508.1672406497062\t\t\tepoch-loss: -1427.8889874691674 \n", + "epoch 22 Iteration 100 loss: -1249.1642813846483\t\t\tepoch-loss: -1379.492333117903 \n", + "epoch 23 Iteration 100 loss: -1214.1394062603918\t\t\tepoch-loss: -1356.5797617962307 \n", + "epoch 24 Iteration 100 loss: -1554.6263005956837\t\t\tepoch-loss: -1358.5256191991677 \n", + "epoch 25 Iteration 100 loss: -1419.5889498936215\t\t\tepoch-loss: -1405.5467914984783 \n", + "epoch 26 Iteration 100 loss: -1262.3682620336267\t\t\tepoch-loss: -1409.6484860247688 \n", + "epoch 27 Iteration 100 loss: -1327.4752015434606\t\t\tepoch-loss: -1368.1521038967614 \n", + "epoch 28 Iteration 100 loss: -1256.4414309051297\t\t\tepoch-loss: -1351.3528504368003 \n", + "epoch 29 Iteration 100 loss: -1178.4788588168844\t\t\tepoch-loss: -1413.816013007459 \n", + "epoch 30 Iteration 100 loss: -1605.1239164704423\t\t\tepoch-loss: -1426.6550440932342 \n", + "epoch 31 Iteration 100 loss: -1617.1795697144926\t\t\tepoch-loss: -1356.5267725452202 \n", + "epoch 32 Iteration 100 loss: -1590.7237287842681\t\t\tepoch-loss: -1425.2884165221458 \n", + "epoch 33 Iteration 100 loss: -1594.3448025229204\t\t\tepoch-loss: 
-1420.5483351285052 \n", + "epoch 34 Iteration 100 loss: -1576.9397677615486\t\t\tepoch-loss: -1430.2946033617723 \n", + "epoch 35 Iteration 100 loss: -1303.3497394593587\t\t\tepoch-loss: -1380.3330104443605 \n", + "epoch 36 Iteration 100 loss: -1478.0145396344049\t\t\tepoch-loss: -1399.0665992260174 \n", + "epoch 37 Iteration 100 loss: -1555.4119456067176\t\t\tepoch-loss: -1360.9939473244767 \n", + "epoch 38 Iteration 100 loss: -1553.031887368961\t\t\tepoch-loss: -1419.1421503464217 \n", + "epoch 39 Iteration 100 loss: -1427.3431059260865\t\t\tepoch-loss: -1415.0248356293594 \n", + "epoch 40 Iteration 100 loss: -1137.8470272897798\t\t\tepoch-loss: -1398.6618957762776 \n", + "epoch 41 Iteration 100 loss: -1551.999240061582\t\t\tepoch-loss: -1402.3061839927834 \n", + "epoch 42 Iteration 100 loss: -1458.4434735943848\t\t\tepoch-loss: -1425.2654433536431 \n", + "epoch 43 Iteration 100 loss: -1585.6542548185487\t\t\tepoch-loss: -1384.815978968837 \n", + "epoch 44 Iteration 100 loss: -1410.7384899311965\t\t\tepoch-loss: -1400.3690408109871 \n", + "epoch 45 Iteration 100 loss: -1343.7557878846794\t\t\tepoch-loss: -1402.4205821010662 \n", + "epoch 46 Iteration 100 loss: -1309.0681838828461\t\t\tepoch-loss: -1412.2783526889364 \n", + "epoch 47 Iteration 100 loss: -1125.0585501913108\t\t\tepoch-loss: -1391.0496208478644 \n", + "epoch 48 Iteration 100 loss: -1470.087468755146\t\t\tepoch-loss: -1390.1175558545679 \n", + "epoch 49 Iteration 100 loss: -1572.597159674086\t\t\tepoch-loss: -1389.4460105298315 \n", + "epoch 50 Iteration 100 loss: -1113.9894360784558\t\t\tepoch-loss: -1403.3841449208112 \n" + ] + } + ], + "source": [ + "import mxnet as mx\n", + "from mxfusion.inference import GradBasedInference, MAP, MinibatchInferenceLoop\n", + "\n", + "infr = GradBasedInference(inference_algorithm=MAP(model=m, observed=[m.X, m.Y]), \n", + " grad_loop=MinibatchInferenceLoop(batch_size=10, rv_scaling={m.Y: 1000/10}))\n", + "infr.initialize(X=(1000,1), Y=(1000,1))\n", + 
"infr.params[m.Y.factor.inducing_inputs] = mx.nd.array(np.random.randn(20, 1), dtype='float64')\n", + "infr.run(X=mx.nd.array(X, dtype='float64'), Y=mx.nd.array(Y, dtype='float64'), \n", + " max_iter=50, learning_rate=0.1, verbose=True)\n", + "infr.run(X=mx.nd.array(X, dtype='float64'), Y=mx.nd.array(Y, dtype='float64'), \n", + " max_iter=50, learning_rate=0.01, verbose=True)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The learned kernel parameters are as follows:" + ] + }, + { + "cell_type": "code", + "execution_count": 44, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "The estimated variance of the RBF kernel is 0.220715.\n", + "The estimated length scale of the RBF kernel is 0.498507.\n", + "The estimated variance of the Gaussian likelihood is 0.003107.\n" + ] + } + ], + "source": [ + "print('The estimated variance of the RBF kernel is %f.' % infr.params[m.kernel.variance].asscalar())\n", + "print('The estimated length scale of the RBF kernel is %f.' % infr.params[m.kernel.lengthscale].asscalar())\n", + "print('The estimated variance of the Gaussian likelihood is %f.' % infr.params[m.noise_var].asscalar())" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Prediction\n", + "\n", + "The prediction of a SVGP model can be done by creating a ```TransferInference``` instance." + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "metadata": {}, + "outputs": [], + "source": [ + "from mxfusion.inference import TransferInference, ModulePredictionAlgorithm\n", + "infr_pred = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y]), \n", + " infr_params=infr.params)\n", + "m.Y.factor.svgp_predict.jitter = 1e-6" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To visualize the fitted model, we make predictions on 100 points evenly spanned from -5 to 5. 
We estimate the mean and variance of the noise-free output $F$." + ] + }, + { + "cell_type": "code", + "execution_count": 46, + "metadata": {}, + "outputs": [], + "source": [ + "xt = np.linspace(-5,5,100)[:, None]\n", + "res = infr_pred.run(X=mx.nd.array(xt, dtype='float64'))[0]\n", + "f_mean, f_var = res[0].asnumpy()[0], res[1].asnumpy()[0]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The resulting figure is shown as follows:" + ] + }, + { + "cell_type": "code", + "execution_count": 47, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], + "source": [ + "plot(xt, f_mean[:,0], 'b-', label='mean')\n", + "plot(xt, f_mean[:,0]-2*np.sqrt(f_var[:, 0]), 'b--', label='2 x std')\n", + "plot(xt, f_mean[:,0]+2*np.sqrt(f_var[:, 0]), 'b--')\n", + "plot(X, Y, 'rx', label='data points')\n", + "ylabel('F')\n", + "xlabel('X')\n", + "_=legend()" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.6.0" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/examples/notebooks/variational_auto_encoder.ipynb b/examples/notebooks/variational_auto_encoder.ipynb index 1736b67..3e0efdc 100644 --- a/examples/notebooks/variational_auto_encoder.ipynb +++ b/examples/notebooks/variational_auto_encoder.ipynb @@ -6,28 +6,25 @@ "source": [ "# Variational Auto-Encoder (VAE)\n", "\n", - "### Zhenwen Dai (2018-8-21)" + "### Zhenwen Dai (2019-05-29)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "```\n", - "# Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved.\n", - "#\n", - "# Licensed under the Apache License, Version 2.0 (the \"License\").\n", - "# You may not use this file except in compliance with the License.\n", - "# A copy of the License is located at\n", - "#\n", - "# http://www.apache.org/licenses/LICENSE-2.0\n", - "#\n", - "# or in the \"license\" file accompanying this file. This file is distributed\n", - "# on an \"AS IS\" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either\n", - "# express or implied. 
See the License for the specific language governing\n", - "# permissions and limitations under the License.\n", - "# ==============================================================================\n", - "```" + "Variational auto-encoder (VAE) is a latent variable model that uses a latent variable to generate data represented in vector form. Consider a latent variable $x$ and an observed variable $y$. The plain VAE is defined as\n", + "\\begin{align}\n", + "p(x) =& \\mathcal{N}(0, I) \\\\\n", + "p(y|x) =& \\mathcal{N}(f(x), \\sigma^2I)\n", + "\\end{align}\n", + "where $f$ is the deep neural network (DNN), often referred to as the decoder network.\n", + "\n", + "The variational posterior of VAE is defined as \n", + "\\begin{align}\n", + "q(x) = \\mathcal{N}\\left(g_{\\mu}(y), \\sigma^2_x I\\right)\n", + "\\end{align}\n", + "where $g_{\\mu}$ is the encoder network that generates the mean of the variational posterior of $x$. For simplicity, we assume that all the data points share the same variance in the variational posterior. This can be extended by generating the variance also from the encoder network." ] }, { @@ -80,7 +77,9 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Model Defintion" + "## Model Definition\n", + "\n", + "We first define the encoder and decoder DNNs with MXNet Gluon blocks. Both DNNs have two hidden layers with tanh non-linearity." 
] }, { @@ -101,11 +100,10 @@ "H = 50\n", "encoder = nn.HybridSequential(prefix='encoder_')\n", "with encoder.name_scope():\n", - " encoder.add(nn.Dense(H, activation=\"tanh\"))\n", - " encoder.add(nn.Dense(H, activation=\"tanh\"))\n", - " encoder.add(nn.Dense(Q, flatten=True))\n", - "encoder.initialize(mx.init.Xavier(magnitude=3))\n", - "_=encoder(mx.nd.array(np.random.rand(5,D)))" + " encoder.add(nn.Dense(H, in_units=D, activation=\"tanh\", flatten=False))\n", + " encoder.add(nn.Dense(H, in_units=H, activation=\"tanh\", flatten=False))\n", + " encoder.add(nn.Dense(Q, in_units=H, flatten=False))\n", + "encoder.initialize(mx.init.Xavier(magnitude=3))" ] }, { @@ -117,20 +115,17 @@ "H = 50\n", "decoder = nn.HybridSequential(prefix='decoder_')\n", "with decoder.name_scope():\n", - " decoder.add(nn.Dense(H, activation=\"tanh\"))\n", - " decoder.add(nn.Dense(H, activation=\"tanh\"))\n", - " decoder.add(nn.Dense(D, flatten=True))\n", - "decoder.initialize(mx.init.Xavier(magnitude=3))\n", - "_=decoder(mx.nd.array(np.random.rand(5,Q)))" + " decoder.add(nn.Dense(H, in_units=Q, activation=\"tanh\", flatten=False))\n", + " decoder.add(nn.Dense(H, in_units=H, activation=\"tanh\", flatten=False))\n", + " decoder.add(nn.Dense(D, in_units=H, flatten=False))\n", + "decoder.initialize(mx.init.Xavier(magnitude=3))" ] }, { - "cell_type": "code", - "execution_count": 7, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "from mxfusion.components.variables.var_trans import PositiveTransformation" + "Then, we define the model of VAE in MXFusion. Note that for simplicity in implementation, we use scalar normal distributions defined for individual entries of a Matrix instead of multivariate normal distributions with diagonal covariance matrices." 
] }, { @@ -142,23 +137,42 @@ "name": "stdout", "output_type": "stream", "text": [ - "x ~ Normal(mean=Variable(e909c), variance=Variable(e90bf))\n", - "f = GluonFunctionEvaluation(decoder_input_0=x, decoder_dense0_weight=Variable(0f71b), decoder_dense0_bias=Variable(aee54), decoder_dense1_weight=Variable(8db61), decoder_dense1_bias=Variable(7c56e), decoder_dense2_weight=Variable(85b99), decoder_dense2_bias=Variable(21241))\n", - "y ~ Normal(mean=f, variance=noise_var)\n" + "Model (37a04)\n", + "Variable (b92c2) = BroadcastToOperator(data=Variable noise_var (a50d4))\n", + "Variable (39c2c) = BroadcastToOperator(data=Variable (e1aad))\n", + "Variable (b7150) = BroadcastToOperator(data=Variable (a57d4))\n", + "Variable x (53056) ~ Normal(mean=Variable (b7150), variance=Variable (39c2c))\n", + "Variable f (ad606) = GluonFunctionEvaluation(decoder_input_0=Variable x (53056), decoder_dense0_weight=Variable (b9b70), decoder_dense0_bias=Variable (d95aa), decoder_dense1_weight=Variable (73dc2), decoder_dense1_bias=Variable (b85dd), decoder_dense2_weight=Variable (7a61c), decoder_dense2_bias=Variable (eba91))\n", + "Variable y (23bca) ~ Normal(mean=Variable f (ad606), variance=Variable (b92c2))\n" ] } ], "source": [ - "m = mf.models.Model()\n", - "m.N = mf.components.Variable()\n", - "m.decoder = mf.components.functions.MXFusionGluonFunction(decoder, num_outputs=1,broadcastable=False)\n", - "m.x = mf.components.distributions.Normal.define_variable(mean=mx.nd.array([0]), variance=mx.nd.array([1]), shape=(m.N, Q))\n", + "from mxfusion.components.variables.var_trans import PositiveTransformation\n", + "from mxfusion import Variable, Model, Posterior\n", + "from mxfusion.components.functions import MXFusionGluonFunction\n", + "from mxfusion.components.distributions import Normal\n", + "from mxfusion.components.functions.operators import broadcast_to\n", + "\n", + "m = Model()\n", + "m.N = Variable()\n", + "m.decoder = MXFusionGluonFunction(decoder, 
num_outputs=1,broadcastable=True)\n", + "m.x = Normal.define_variable(mean=broadcast_to(mx.nd.array([0]), (m.N, Q)),\n", + " variance=broadcast_to(mx.nd.array([1]), (m.N, Q)), shape=(m.N, Q))\n", "m.f = m.decoder(m.x)\n", - "m.noise_var = mf.components.Variable(shape=(1,), transformation=PositiveTransformation(), initial_value=mx.nd.array([0.01]))\n", - "m.y = mf.components.distributions.Normal.define_variable(mean=m.f, variance=m.noise_var, shape=(m.N, D))\n", + "m.noise_var = Variable(shape=(1,), transformation=PositiveTransformation(), initial_value=mx.nd.array([0.01]))\n", + "m.y = Normal.define_variable(mean=m.f, variance=broadcast_to(m.noise_var, (m.N, D)), \n", + " shape=(m.N, D))\n", "print(m)" ] }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "We also define the variational posterior following the equation above." + ] + }, { "cell_type": "code", "execution_count": 9, @@ -168,17 +182,19 @@ "name": "stdout", "output_type": "stream", "text": [ - "x_mean = GluonFunctionEvaluation(encoder_input_0=y, encoder_dense0_weight=Variable(9768f), encoder_dense0_bias=Variable(9f1a0), encoder_dense1_weight=Variable(18970), encoder_dense1_bias=Variable(bcff4), encoder_dense2_weight=Variable(3d2a8), encoder_dense2_bias=Variable(95031))\n", - "x ~ Normal(mean=x_mean, variance=x_var)\n" + "Posterior (4ec05)\n", + "Variable x_mean (86d22) = GluonFunctionEvaluation(encoder_input_0=Variable y (23bca), encoder_dense0_weight=Variable (51b3d), encoder_dense0_bias=Variable (c0092), encoder_dense1_weight=Variable (ad9ef), encoder_dense1_bias=Variable (83db0), encoder_dense2_weight=Variable (78b82), encoder_dense2_bias=Variable (b856d))\n", + "Variable (6dc84) = BroadcastToOperator(data=Variable x_var (19d07))\n", + "Variable x (53056) ~ Normal(mean=Variable x_mean (86d22), variance=Variable (6dc84))\n" ] } ], "source": [ - "q = mf.models.Posterior(m)\n", - "q.x_var = mf.components.Variable(shape=(1,), transformation=PositiveTransformation(), 
initial_value=mx.nd.array([1e-6]))\n", - "q.encoder = mf.components.functions.MXFusionGluonFunction(encoder, num_outputs=1, broadcastable=False)\n", + "q = Posterior(m)\n", + "q.x_var = Variable(shape=(1,), transformation=PositiveTransformation(), initial_value=mx.nd.array([1e-6]))\n", + "q.encoder = MXFusionGluonFunction(encoder, num_outputs=1, broadcastable=True)\n", "q.x_mean = q.encoder(q.y)\n", - "q.x.set_prior(mf.components.distributions.Normal(mean=q.x_mean, variance=q.x_var))\n", + "q.x.set_prior(Normal(mean=q.x_mean, variance=broadcast_to(q.x_var, q.x.shape)))\n", "print(q)" ] }, @@ -186,50 +202,52 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Variational Inference" + "## Variational Inference\n", + "\n", + "Variational inference is done via creating an inference object and passing in the stochastic variational inference algorithm." ] }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 11, "metadata": {}, "outputs": [], "source": [ - "from mxfusion.inference import BatchInferenceLoop, StochasticVariationalInference, GradBasedInference" + "from mxfusion.inference import BatchInferenceLoop, StochasticVariationalInference, GradBasedInference\n", + "\n", + "observed = [m.y]\n", + "alg = StochasticVariationalInference(num_samples=3, model=m, posterior=q, observed=observed)\n", + "infr = GradBasedInference(inference_algorithm=alg, grad_loop=BatchInferenceLoop())" ] }, { - "cell_type": "code", - "execution_count": 11, + "cell_type": "markdown", "metadata": {}, - "outputs": [], "source": [ - "observed = [m.y]\n", - "alg = StochasticVariationalInference(num_samples=3, model=m, posterior=q, observed=observed)\n", - "infr = GradBasedInference(inference_algorithm=alg, grad_loop=BatchInferenceLoop())" + "SVI is a gradient-based algorithm. We can run the algorithm by providing the data and specifying the parameters for the gradient optimizer (the default gradient optimizer is Adam)." 
] }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 13, "metadata": { - "scrolled": true + "scrolled": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "Iteration 201 loss: 1715.0395507812525\n", - "Iteration 401 loss: 599.87670898437525\n", - "Iteration 601 loss: 149.24291992187538\n", - "Iteration 801 loss: -44.793395996093755\n", - "Iteration 1001 loss: -202.39929199218755\n", - "Iteration 1201 loss: -314.48220825195315\n", - "Iteration 1401 loss: -301.41076660156255\n", - "Iteration 1601 loss: -585.94531250937585\n", - "Iteration 1801 loss: -702.51806640625525\n", - "Iteration 2000 loss: -775.11627197265625" + "Iteration 200 loss: 1720.556396484375\t\t\t\t\t\n", + "Iteration 400 loss: 601.11962890625\t\t\t\t\t\t\t\n", + "Iteration 600 loss: 168.620849609375\t\t\t\t\t\t\n", + "Iteration 800 loss: -48.67474365234375\t\t\t\t\t\n", + "Iteration 1000 loss: -207.34835815429688\t\t\t\t\n", + "Iteration 1200 loss: -354.17742919921875\t\t\t\t\n", + "Iteration 1400 loss: -356.26409912109375\t\t\t\t\n", + "Iteration 1600 loss: -561.263427734375\t\t\t\t\t\t\n", + "Iteration 1800 loss: -697.8665161132812\t\t\t\t\t\n", + "Iteration 2000 loss: -753.83203125\t\t\t\t8\t\t\t\t\t\n" ] } ], @@ -241,31 +259,37 @@ "cell_type": "markdown", "metadata": {}, "source": [ - "## Plot the training data in the latent space" + "## Plot the training data in the latent space\n", + "\n", + "Finally, we may be interested in visualizing the latent space of our dataset. We can do that by calling the encoder network." 
] }, { "cell_type": "code", - "execution_count": 13, + "execution_count": 17, "metadata": {}, "outputs": [], "source": [ + "from mxfusion.inference import TransferInference\n", + "\n", "q_x_mean = q.encoder.gluon_block(mx.nd.array(Y)).asnumpy()" ] }, { "cell_type": "code", - "execution_count": 14, + "execution_count": 18, "metadata": {}, "outputs": [ { "data": { - "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXYAAAD8CAYAAABjAo9vAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDIuMi4yLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvhp/UCwAAFlBJREFUeJzt3X+I3Hedx/HXeye7nKLUYpMoTbZrq4g/7hjbMVeRcFJ7sXc0EevJ6R1Szjb55wQFj3peQe4EuVNROM6Cl01FD0pFsGpalbZixQjGdLbMmcacR1oakqtkq5dWpYezu/O+PzYTNpvZnV+f7/fzmc/3+YCy3WYy89lJ85rPvL/vz3vM3QUAyMdU7AUAAMIi2AEgMwQ7AGSGYAeAzBDsAJAZgh0AMkOwA0BmCHYAyAzBDgCZ2RLjQa+66iqfm5uL8dAAMLEWFhZ+5e5b+90uSrDPzc2p2WzGeGgAmFhmdnqQ21GKAYDMEOwAkBmCHQAyQ7ADQGbGDnYz+wMzO2Zm/2lmJ8zsn0IsDAAwmhBdMb+XdJO7/87MpiX92My+5+5HA9w3AGBIY+/YfdXvLnw7feEfPpYJmFCtxZYOHT+k1mIr9lIwoiB97GZWk7Qg6bWS7nH3n/a4zQFJByRpdnY2xMMCCKy12NL+R/arvdLWTG1G83vmVd9Wj70sDCnIxVN3X3H3uqQdknaZ2Zt73OaguzfcvbF1a9+DUwAiaJ5rqr3SVkcdLXWW1DzHQcJJFLQrxt2fl/RDSbeEvF8A5Whsb2imNqOa1TQ9Na3G9kbsJWEEY5dizGyrpCV3f97MXiLpZkmfGXtlAEpX31bX/J55Nc811djeoAwzoULU2F8t6asX6uxTkr7u7g8FuF8AEdS31Qn0CTd2sLv7zyS9JcBaAAABcPIUADJDsANAZgh2AMgMwQ4AmSHYASAzBDsAZIZgB4DMEOwAkBmCHavOHJOOfH71K4CJFmRsLybcmWPSV/dJK22pNiPdfljauSv2qgCMiB07pGeOrIa6r6x+feZI7BUBGAPBDmlu9+pO3WqrX+d2x14RgDFQisFq2eX2w6s79bndlGGACUewY9XOXQQ6kAlKMQCQGYIdADJDsANAZgh2AMgMwQ4AmSHYASAzBDsAZIZgB4DMEOwAkBmCHQAyQ7ADQGYIdgDIDMEOAJkh2AEgMwQ7AGRm7GA3s51m9piZnTSzE2b2kRALAwCMJsQHbSxL+pi7P2FmL5e0YGaPuvvPA9w3ENzC6fM6+vSvdeO1r9QN11wZezlAcGMHu7v/UtIvL/z7b83spKSrJRHsSM7C6fP660NH1V7uaGbLlO6780bCHdkJWmM3szlJb5H005D3C4Ry9Olfq73cUcelpeWOjj7969hLqoTWYkuHjh9Sa7EVeymVEOwzT83sZZK+Iemj7v6bHr9+QNIBSZqdnQ31sMBQbrz2lZrZMqWl5Y6mt0zpxmtfGXtJ2WsttrT/kf1qr7Q1U5vR/J551bfVYy8ra0GC3cymtRrq97n7A71u4+4HJR2UpEaj4SEeFxjWDddcqfvuvJEae4ma55pqr7TVUUdLnSU1zzUJ9oKNHexmZpLulXTS3b8w/pK
AYt1wzZUEeoka2xuaqc1oqbOk6alpNbY3Yi8peyF27G+X9EFJx82sW0D7B3f/boD7BjDh6tvqmt8zr+a5phrbG+zWSxCiK+bHkizAWgBkqr6tTqCXiJOnAKKgU6Y4wbpigBRw+Ggy0ClTLIId2eDw0eSgU6ZYlGKQDQ4fTY5up0zNanTKFIAdO7LB4aPJQadMscy9/LNCjUbDm81m6Y+L/FFjR87MbMHd+769YceOrHD4CKDGDgDZIdgBIDMEOwBkhmAHgMwQ7MjawunzuuexU1o4fT72UoDS0BWDbHESFVXFjh3Z4iQqqopgR7a6J1FrJk6iolIoxSBbfAweqopgR9Y4iYoqohQDFISOHMTCjh0oAB05iIkdO1AAOnIQE8EOFICOHMREKQYoAB05iIlgRxhnjknPHJHmdks7d8VeTRLoyEEsBDvGd+aY9NV90kpbqs1Itx8m3IGIqLFjfM8cWQ11X1n9+syR2CsCStdabOnQ8UNqLbZiL4UdOwKY2726U+/u2Od2x14RUKrWYkv7H9mv9kpbM7UZze+Zj/oB3QQ7xrdz12r5JaMaOx+KjWE0zzXVXmmro46WOktqnmsS7MjAzl1ZBLrE4SIMr7G9oZnajJY6S5qemlZjeyPqegh2YJ1eh4vWBzs7eqxV31bX/J55Nc811djeiLpblwIFu5l9WdKtkhbd/c0h7hOJqGAbY/dw0dJy5+LhorVBLokdPS5T31aPHuhdoXbsX5H0RUn/Eej+kIKKtjGuP1wkXRrkt12/o++OHogpSLC7+4/MbC7EfSEhvdoYKxDs0qWHi+557NQlQW7SZTt6ICXU2LEx2hglXV6aue36Hbrt+h3U2JEsc/cwd7S6Y39ooxq7mR2QdECSZmdnbzh9+nSQx0XBKlhj73VhNJWLpamsA3GY2YK79225KW3H7u4HJR2UpEajEebVBMXrhnn3NGnm4b5Rq2MKc19ow8SgGCmAzXUvoP7g06tfzxyLvaJCpTxHPeW1IS1Bgt3M7pf0E0mvN7OzZnZHiPtFAio2ByblOeopr60KBp0Fk8LMmFBdMR8IcT9IUMUuoIaYo15UHZwZ7/EMOgsmlZkxdMVgcxnOgellfRiPGppF18G799UtwxDu5dhsFkxrsXXxxGkqM2MIdvSX0RyYXhZOn9cH5o9ebGe8f//oYTzIOIJx18oF1PJtNAtm/Q79rrfelcTMGIIdlffAE2fVXu5IktrLHT3wxNmRw7LXOIKQin7hQG8bzYJZv0N/of1CEjNjCHZU3vre23F6cYuugxf9woGN9ZoF02snn8LMmGAHlIbRaDS82WyW/rjoo4KHkaQLpZiDP9HSimu6Zrr/wNuS3gVzSCkta2vsRQf6oAeUCPaUlRm0FR341UVYYhIkd/IUQyozaM8ck374z9Ly7yV1KjfwS1K0k6W8oKAIBHuqypqsePEF5EKoa6oS/epl2Sy46XBBUQj2VJV1MOjiC0hHsinp2ndI7/hEpXbrRekX3HS4oCgEe6rKOhi0/gWEUA+mX3DT4VI9ZV1oJdhTVsbBoFFeQCraPTOsfsHNiIBqKXPcAMGO4V5AKtg9M+oFzkGCO4VxwChHmeMGCHYMp2IflzfuBU6CG10bjSUoAsFOWWE4FZv2yAVOhLLRWIIiVDvYK1hWGFtFpj12FXWBk/71aipr3EC1g71iZYW+Bn33kvm0x7WKuMBJ/zqKVu1gr1hZYVO8e9lQvzr5sLtvyjsoWrWDvYiywqTW7Hn3MpD1IT7K7pv+dRSt2sEuhS0rTPKul3cvffUK8VF23/Svo2gE+zD67cYnedc7QRdFY1147BXio+6+aYNEkQj2QQ2yG5/0Xe8g714il5piXnjsFeLsvpEign1Qg+zGU9n1FhW+CZSaYl543CjE2X0jNQT7oAbdjcduBRw2fId5EUig1NTdNbeXOzIzXfnSmVIfnxDHJJiKvYCJ0d2N33R32hdFe4XvRrovAj/49OrXM8c2v+/ui5vVopW
abrjmSn3y1jdpykwrHdenHjqhhdPnS18HkDJ27MOIvRsfxDB1/mF34ImUms6/2FbHXa60+sA5TYpUEOy5GSZ8R7nYm8CLW4p94JwmRUoI9hSNe/Fz0PBNZAc+rBQ7UThNipQQ7Kkpu/Nk2B14IidrU7uImeK7CFQXwZ6aBDpPNpRAu2OqUnwXgeoi2FPTq+6dyC456RedBKT2LgLVFSTYzewWSf8qqSbpkLv/S4j7raT1dW8pnV3ypJ+sjYRuGZRt7GA3s5qkeyT9qaSzkh43s8Pu/vNx77uy1ta9j3w+nV3yhF5sjYluGcQQYse+S9Ipd39akszsa5LeLYlgDyG1XXKR7Y6plJwColsGMYQI9qslnVnz/VlJf7z+RmZ2QNIBSZqdnQ3wsBVRlV1yphdmr3zpjKbMJDndMihNiJEC1uO/+WX/wf2guzfcvbF169YAD1shO3dJuz+WRdBtaJhRCBNi4fR5feqhE1rpuKbM9Mlb33TJbn3h9Hnd89gpRiIguBA79rOSdq75foekZwPc72gyfDtfCamVnALolmFckrvr/Ivti79G7R1FChHsj0t6nZm9RtL/SHq/pL8KcL/Dy/TtfOlivDhmWHK6OIly6fJJlNTeUaSxSzHuvizpw5IelnRS0tfd/cS49zuSDN/Ol27YiY8hZVZyujiJcsrU8UsnUXZDv2ai9o7ggvSxu/t3JX03xH2NJcO386ULcQgp43LYsD3p3UmU63fmnFRFkfI6eZrh2/nSjfvimHE5bJS6+GYzZCb9pGprsaXmuaYa2xuqb6vHXg7WyCvYpSTGyk60cV8cEx07EOL05yh18Vx35q3Flu54+A4tdZY0PTWte991L+GekPyCHeMb58UxwXJYqA6UUSc4TvrOvJfDTx1Wu7Pa5dPutHX4qcMEe0IIdoSVYDksVAdKrrvvUdi64yvrv0dckx/sGV+om1i9dvwR/5xCzkrPcfc9ir3X7dW3Tn3rYilm73V7Yy8Ja5j7ZYdEC9doNLzZbI5/RxlfqCtMjIBN4M+JCYvh9bp4ygXVYpnZgrs3+t1usnfsiV6oS1asgE3gz4mddnj1bfVLwru12NL+R/arvdLWTG1G83vmCfdIQsyKiad7oc5qyVyoG8uZY6tjeos6FBTrAFduf04V01ps6dDxQ2ottja9XfNcU+2VtjrqaKmzpOa5AO/KMZLJ3rEneKFuZGXspmN1rGTy51TFcs4wu/DG9oZmajMX6+6N7X0rBijIZAe7lE/fehnlipgBm8Cf0zjBXNWhXb124RsFe31bXfN75qmxJ2Dygz0XZe2mEwjYGMYN5qoO7eruwtsrbZlMV8xcsent19fdEcdk19hz0t1N33R3dbt7CrzG0CuYh1HVoV31bXXd9da7NGVT6nhHn338s31r7YiPHXtKKrqbllT4NYZxe9mrfDjphfYL6nhnoHJMP7RDlmOygp3DSMWJ/dwWfI0hRDBXtWVynIuia4NcEu2QJZmcYE/gkEu2UnhuS7jGUNVgHteoF0XXd9Tsu27fwBdiMZ7JCfYEDrlkK4XnNrGWyCq2Nm5mmIui3V36s7979pIgdzntkCWZnGBPcGpgNlJ5bhO5xlDV1sYQ1u7St0xt0ZapLVrxFU1PTWvfdfu077p91NhLMDnBntiOLis8t5eoamtjCGv73ld8Re993Xv16pe9+pIgJ9CLNznBLiWzo8sSz+1FIadBVs36C617r9tLkEcw2dMdgYJUscYeqhWxez9XzFyhF9ovUHYJqBrTHYGCVK2DJuRkxu7vo7UxHk6eYmNFT5tEMkJPZmTSY1zs2NFbCr3tKM2wh5D6lW2Y9BgXwY7eUuhtR2mGOYQ0SNmGSY9xEewbyPri2SDjA1LpbUdpBj2ENOgoXyY9xkOw95D1AZVBSyz0tmMDlFnSR7D3kPUBlWFKLPS2owfKLOmjK6aHrGdv8/mjKMign42K4rFj7yHr2duUWDCmXhdPJfrWUzJWsJvZ+yT9o6Q3SNr
l7tk0q2Z9QIUSC8awUY86I3nTMe6O/UlJt0n69wBrATABNrp4utEFVT41qXxBZsWY2Q8l/d2gO3ZmxQCTrdc8GEmXBXjIUQVgVgyAAm00D+bOP7zzktsN2vOOsPp2xZjZ983syR7/vHuYBzKzA2bWNLPmc889N/qKASRhkHkw3bJNzWr0vJeo747d3W8O8UDuflDSQWm1FBPiPgHEM8hBpW7P+4NPPSgXf+3LQikGwEiGOah0+KnDaq+09eBTD1JnL8G47Y7vkfRvkrZK+o6Ztdz9XUFWBiB5g8yDoc5evrGC3d2/KembgdYCIEPMlikfpZiAYk+EjP34QC/MlikfwR5I7ImQsR8f2AwjfMtFsAcSayJkd5f+7PP/l+9ESiSLU6VpIthHtL7s0Z0IubTcKW0i5Npd+pYp05balFZWynt8VBunStNFsI9go7JH2RMh175LWOm4/nLXTl39ipdQY0cp6HZJF8E+go3KLmVPhFz/LuG91+8g0FEaul3SRbCPIEbZpZes58YjeXS7pCvIdMdh5TDdkdZCAGVjumPBsv4gDgATjc88BYDMEOwAkBmCHQAyQ7ADQGYIdgDIDMEOAJkh2AEgMwQ7AGSGYAeAzBDsAJAZgh0AMkOwAwVqLbZ06PghtRZbsZeCCmEIGFAQPmEIsbBjBwrS6xOGgDIQ7EBBup8wVLManzCEUlGKAQqy/hOGJOnQ8UN82hAKR7ADBapvq6u+rU69HaUi2IESbFRv5/NCUQSCHShBt96+1FnS9NS0rpi5gh08CkOwAyVYX2/vtYMn2BHKWMFuZp+TtFdSW9JTkv7G3Z8PsTAgN916e9faHTwdMwjJ3H3032y2R9IP3H3ZzD4jSe7+8X6/r9FoeLNJTy+qrbXYosaOoZjZgrv33QWMtWN390fWfHtU0l+Mc39AlazfwQOhhDyg9CFJ3wt4fwCAEfTdsZvZ9yW9qscv3e3u375wm7slLUu6b5P7OSDpgCTNzs6OtFiUa9hSAaUFIA19g93db97s183sdkm3Snqnb1Kwd/eDkg5KqzX2IdeJkg17oKbf7Qn9wfFcYVzjdsXcIunjkv7E3V8MsySkYNh2vM1uz6nLwfFcIYRxa+xflPRySY+aWcvMvhRgTUjAsAOsNrs9Uw4Hx3OFEMbtinltqIUgLesP1PTbNW52+/WnLunZ3hjPFUIYq499VPSxxxGzdkvdeHA8V9jIoH3sBHtFULsFJt+gwc4HbVQEtVugOgj2iuDTfIDqYLpjRQx7MRTA5CLYK4TZJEA1UIoBgMwQ7ACQGYIdADJDsANAZgh2AMgMwQ4AmYkyUsDMnpN0uuSHvUrSr0p+zJRU/eeXeA6q/vNLk/8cXOPuW/vdKEqwx2BmzUFmLOSq6j+/xHNQ9Z9fqs5zQCkGADJDsANAZqoU7AdjLyCyqv/8Es9B1X9+qSLPQWVq7ABQFVXasQNAJVQq2M3sc2b2X2b2MzP7ppm9IvaaymRm7zOzE2bWMbPsOwO6zOwWM/uFmZ0ys7+PvZ6ymdmXzWzRzJ6MvZZYzGynmT1mZicv/B34SOw1FalSwS7pUUlvdvc/kvTfkj4ReT1le1LSbZJ+FHshZTGzmqR7JP2ZpDdK+oCZvTHuqkr3FUm3xF5EZMuSPubub5B0o6S/zfn/g0oFu7s/4u7LF749KmlHzPWUzd1PuvsvYq+jZLsknXL3p929Lelrkt4deU2lcvcfSfrf2OuIyd1/6e5PXPj330o6KenquKsqTqWCfZ0PSfpe7EWgcFdLOrPm+7PK+C80+jOzOUlvkfTTuCspTnafoGRm35f0qh6/dLe7f/vCbe7W6luz+8pcWxkG+fkrxnr8N1rBKsrMXibpG5I+6u6/ib2eomQX7O5+82a/bma3S7pV0js9w17Pfj9/BZ2VtHPN9zskPRtpLYjIzKa1Gur3ufsDsddTpEqVYszsFkkfl7TP3V+MvR6U4nFJrzOz15jZjKT3SzoceU0omZmZpHslnXT
3L8ReT9EqFeySvijp5ZIeNbOWmX0p9oLKZGbvMbOzkt4m6Ttm9nDsNRXtwsXyD0t6WKsXzL7u7ifirqpcZna/pJ9Ier2ZnTWzO2KvKYK3S/qgpJsu/N1vmdmfx15UUTh5CgCZqdqOHQCyR7ADQGYIdgDIDMEOAJkh2AEgMwQ7AGSGYAeAzBDsAJCZ/wfwkPjuAc1V6gAAAABJRU5ErkJggg==\n", + "image/png": "iVBORw0KGgoAAAANSUhEUgAAAXYAAAD8CAYAAABjAo9vAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDIuMi4yLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvhp/UCwAAFiZJREFUeJzt3X2MXFd5x/Hfs5OdFglkosRrotiOSaAVNKqGZDBGKCoKaQgocUQqJEiFogK2KpUKJKrQNFJf/mobBGolIrXeNYJKKQg1EEwhyosUhJHqOLPRFDuYFyeKazfRrkONASFldnee/jE7Zjye3Zk7c+89d879fiRrM97J3DO7ye+eee5zzjV3FwAgHjOhBwAASBfBDgCRIdgBIDIEOwBEhmAHgMgQ7AAQGYIdACJDsANAZAh2AIjMZSEOeuWVV/quXbtCHBoAptbi4uIr7r512POCBPuuXbvUaDRCHBoAppaZnRrleZRiACAyBDsARIZgB4DIEOwAEBmCHQAiQ7ADQGQmDnYz+20zO2pm/21mz5nZ36UxMAD5ay43tXBsQc3lZuihYAJp9LG/Kulmd/+Vmc1K+r6ZPeruR1J4bQA5aS43te/xfWqttVStVDV/67xqc7XQw8IYJp6xe8ev1h/Orv/hRqrAlGksNdRaa6mttlbaK2ossYhwWqVSYzezipk1JS1LesLdnx7wnP1m1jCzxtmzZ9M4LIAU1bfVVa1UVbGKZmdmVd9WDz0kjMnc05tcm9nrJX1D0p+7+/GNnlev150tBYDiaS431VhqqL6tThmmgMxs0d2HnnFT3SvG3X9uZt+VdJukDYMdQDHV5moEegTS6IrZuj5Tl5m9RtItkn406esCAMaTxoz9KklfNrOKOieKr7n7f6bwugCAMUwc7O7+A0lvS2EsAIAUsPIUACJDsANAZAh2AIgMwQ4AkSHYASAyBDsARIZgB4DIEOwAEBmCHYOdPiod/lznK4CpkuomYIjE6aPSl/dKay2pUpXuOSTt2B16VABGxIwdl3rxcCfUfa3z9cXDoUcEIAGCHZfadVNnpm6VztddN4UeEYAEKMXgUjt2d8ovLx7uhDplGGCqEOwYbMduAh2YUpRiACAyBDsARIZgB4DIEOwAEBmCHQAiQ7ADQGQIdgCIDMEOAJEh2AEgMgQ7AESGYAeAyBDsABAZgh0AIkOwA0BkCHYAiMzEwW5mO8zsKTM7YWbPmdkn0xgYAGA8adxoY1XSp939WTN7naRFM3vC3X+YwmsDmVo8dU5HXviZ9lx7hW685vLQwwFSMXGwu/vLkl5e/+dfmtkJSVdLIthRaIunzumPF46otdpW9bIZPfTxPYQ7opBqjd3Mdkl6m6SnB3xvv5k1zKxx9uzZNA8LjOXICz9Ta7Wttksrq20deeFnoYcEpCK1YDez10p6WNKn3P0X/d939wPuXnf3+tatW9M6LDC2PddeoeplM6qYNHvZjPZce0XoIUWludzUwrEFNZeboYdSOqnczNrMZtUJ9Yfc/etpvCaQtRuvuVwPfXwPNfYMNJeb2vf4PrXWWqpWqpq/dV61uVroYZXGxMFuZibpoKQT7v75yYcE5OfGay4n0DPQWGqotdZSW22ttFfUWGoQ7DlKoxTzLkkfkXSzmTXX/7w/hdcFMKXq2+qqVqqqWEWzM7Oqb6uHHlKppNEV831JlsJYAESiNlfT/K3zaiw1VN9WZ7aes1Rq7ADQrzZXI9ADYUsBRGvx1D
k9+NRJLZ46F3oo6EG3TPaYsSNKLD4qJrpl8sGMHVFi8VExDeqWQfoIdkSJxUfFRLdMPszdcz9ovV73RoMzNbLFBl/F1Fxu0i0zJjNbdPehZ0OCHQCmxKjBTikGACJDsANAZAh2AIgMwQ4AkSHYURqsREVZsPIUpcBKVJQJM3aUAitRUSYEO0qBlagoE0oxKAVug4cyIdhRGtwGD2VBKQYAIkOwAzmh3RJ5oRQD5IB2S+SJGTuQA9otkSeCHdk4fVQ6/LnOV9BuiVxRikH6Th+VvrxXWmtJlap0zyFpx+7QowqKdkvkiWBH+l483Al1X+t8ffFw6YNdot0S+aEUg/TtuqkzU7dK5+uum0KPCMhcc7mphWMLai43Qw+FGTsysGN3p/zy4uFOqDNbR+Say03te3yfWmstVStVzd86H/R+rgQ7srFj99QHOjfDxqgaSw211lpqq62V9ooaSw2CHSga+s6RRH1bXdVKVSvtFc3OzKq+bej9pjNFsGN0p4+WprwyqO98ULAzq4ck1eZqmr91Xo2lhurb6kFn61JKwW5mX5R0u6Rld78+jddEwZSshbHbd76y2r6o77w3yCUxq8cFtbla8EDvSmvG/iVJX5D0bym9HoqmZC2Mg/rO+8szd92wfaRZPZC3VILd3b9nZrvSeC0UVLeFsTtjL0ELY3/feX95xqSBs3ogtNxq7Ga2X9J+Sdq5c2deh0VaaGG8pDxz1w3bddcN26mxo3ByC3Z3PyDpgCTV63XP67jAuPovjG60LQCBjqKhKwajKdnF043aHdkWANOALQUwmkEXTyNW5G12uWFH8YXeXiCtdsevSHq3pCvN7Iykv3H3g2m8NgqiZBdPN2p3DI2FU2E1l5tDe9WLsL1AWl0xH07jdVBgJbt4WtRtdkddOIX0bRbYvYFfhO0FqLFjdBHs/7KZf3/6f/To8Zf1vuuv0t3v2DlRPT2rFalF/SRRBhsFdn/g3/v2e4NvL0CwA+qE+l9945gk6fBPX5Ek3f2O8dpysyyXFPWTRBlstB9Mf+Cfb50Pvr0AwY6LlWg/mF6PHn/5ksfjBjvlkjhttB/MoMAPvb0AwY7fKFlLY6/3XX/VhZl69/G4siyXcPE0rEGBXbQNwCSCvfjymkGfPip99++l1VcltUuxH0yv7uy8t8Y+rizLJXwaKKbQM/R+BHuR5TWDvnCc9VDXTClaGvvd/Y6dEwV6r6wWMnHxFKMg2Issrx0VLxynLdmMdO27pXffV5rZ+jTh4ilGQbAXWV6LgvqPQ6inIquWR7Y1wDAEe5HltSgo6XFK2jmTxKgXObkDU7mMsnI1DQR70eW1KGjU45S4cyaJUS5y0uFSLnluNcAmYEimZJuBjat7kbNi2vAiZ5E3GkP6Bq1czQoz9l6UGIYr2WZg0njlklEuctLhUi4brVzNgrnnf8+Ler3ujUZ2Z6uxUGIYXYlOgFmXS6ixl8ukNXYzW3T3oWcEZuxdJbtZ80CjBnbkm4H1ynpBEB0u5ZLXQiaCvauEJYaL8IllIMolmEYEe1fJ9hu/BJ9YBspqQRAlGGSJYO+VZolh2urQZf/Esom0yyW0OSJrBHtSowT2NJY1puwTS6gZ76DjJh0LG3khawR7EqMG9rSWNZIsUgp4Agg14x10XEmJx0LdHlkj2JMYNbBjLmsU4NNIqBnvRguKko6FjbyQNYI9iVEDO3RZI8sZdQE+jey59gpdVunMeCuV/Ga8G820x5l90+aILBHsSSQJ7FC93kln1ElPAkX5NNJdWJfjAruNZtrMvlE0BHtSRV+ck2RGPU5ZJfSnEXVKIqttl0taa3uuFx8HzbSZfaNoCPbYJJlRj1tWCXxy4+IjsDmCPTZJZtRFKaskVMSLjyw4QpGwCVhR5XkT6yTHmbaFVzlgwRHywiZg0yzPlsIkZZUCtDoWEQuOUDTcaKOIBtW+Tx+VDn+u87VI48JIN9UA8sSMvYj6a9+vuaIYM+UprclnrYg1f5RbKsFuZr
dJ+mdJFUkL7v4PabxuafVfAC3AoqCB46IMcwEtjyiSiYPdzCqSHpT0h5LOSHrGzA65+w8nfe1S6699F2WmnGWrY6QXZumYQd7SmLHvlnTS3V+QJDP7qqQ7JRHsaSnDTDnSC7N0zCCENC6eXi3pdM/jM+t/dxEz229mDTNrnD17NoXDlsyO3dJNn44i7AaK9MLsRhuHAVlKI9htwN9d0hzv7gfcve7u9a1bt6Zw2A0UoXsEyXUvzFolfLkpRXTMIIQ0SjFnJO3oebxd0kspvG5ykX6cz12IWneE5aZubf2vb/89nft1ixo7cpNGsD8j6c1m9kZJ/yvpQ5LuTuF1kytK98g0C3lyLPoGawkMq61zQRVZmjjY3X3VzD4h6TF12h2/6O7PTTyycdBnPbk0To6Rdrck0Vtbf3WlrYefPXPRrfS4oIospdLH7u7fkfSdNF5rIhF+nM/dpCdHymGS1m8GMmNqrXW2F/6PxTP6oxu268ZrLmcLAmQuvi0FYu8eyVr35Hjz/eOFcqTdLVJnpv3gUye1eOrc0OfeeM3l+mB9x4XOgrW133TExHJBtbnc1MKxBTWXm6GHgj5sKYBLTVLrLmA5LI169jjlk7tu2K6Hnz1zyb7xMWxB0Fxu6mOPfUwr7RXNzszq4HsPqjZXCz0srCPYka6ClcPSqmePUz7ZLMCnfQuCQ88fUqvdkiS12i0dev4QwV4g0x/sXKgrno1m/AF+V2nVs8e9a9O0B/hGrG/5Sv9jhDXdwc6FumRCngQD/a7Suo1eDOWTNN1x3R165OQjF0oxd1x3R+ghocd0Bzt966MLfRIM9LtKM5BjnX2PozZX08H3HlRjqaH6trpqczU1l5sXPUY40x3sBbxQV1ihT4IBf1cEcjZqc7ULAd5cbmrf4/vUWmupWqlq/tZ5wj2g6Q72gl2om0jWZZLQJ8GYflclNGw23lhqqLXWUlttrbRX1FhqEOwBTXewS3EsQ8+jTFKEYI3hd1VCo8zG69vqqlaqF2ru9W1D77eMDE1/sMcgrzJJkYM1408sk/ayl3lvl1Fm47W5muZvnafGXhAEexGELpOElvEnlkl72cu+t0t3Nt5aa8lk2lLdMvB5vTV3hDVdWwrEutf6pMv4p13G2xBMerOLst8sozZX071vv1czNqO2t/XAMw+wjUDBTc+MPXS7XtZCl0lC9rhn/Ill0l72tHrhp9n51nm1vT3xxVFaIvMxPcEeul0vZqFPmhlf2J20l53FSeNfHO0Nckm0ROZkeoK97HXoLBXhpJnxJ5ZJe9nL3guf9OJoc7mpbz3/LT1y8hGttldVrVS197q9tETmZHqCvQjterHipIkRjHpxtNse+eraq/L12x+vtFfkcloiczI9wS6Fr0PHipPmRcrc2piGbntkN9RNptmZWe29bq/2XreXGnsOpivYkR1OmpJobUxDbz2+YhXd+aY7tfe6vReCnEDPHsEO9OC2dZPrrcdvqW7R+db50EMqHYId6FH21sa02hG7/y5dMGEQ7NhYCW9iUubWxrR3aGRjsHAIdgwWurc9oLK2NqYdxGwMFg7BXkajzMSL0NuOXCUN4mFlGzYGC4dgL5tRZ+L0tpdOkiAetWzDxmBhEOxlM+pMnN72Uho1iKmfFxvBPkDUC1SSzMTpbccGqJ8Xm7l77get1+veaDRyP+4oSrFApYTdLkjfoBo7uzdmy8wW3X3oWZQZe59SLFBhJo4UdIO7sfSbSRp968VAsPcp+wIVYFT9F1DZvbE4Jgp2M/ugpL+V9BZJu929mPWVBMq8QAVIov8CKrs3FsekM/bjku6S9K8pjKUwyrpABUiif7MvSbr37ffqfOv8JTV2au/5mijY3f2EJJlZOqMBMDW6fe/dG2o8/JOHB9bW096qAMPldjNrM9tvZg0za5w9ezavwwLIUG2upqtee5VW26sX1dZ7Dep5R7aGBruZPWlmxwf8uTPJgdz9gLvX3b2+devW8UcMoFC6JZmKVQbW1n
u/X7GKXvrVS2ouNwONthxS6WM3s+9K+otRL54WuY8dQHLDauiD7oFKSSY5+tgB5GbYVgS1uZoaS41LSjYEezYmqrGb2QfM7Iykd0r6tpk9ls6wAMRmWMkG6WFLgYhEvccNokDb42QoxeQsdKiWYo8bTD228c0HwZ6C0KG6eOqc/unJn8S/xw2AkeTWxx6zQRuH5aV7Uvn+T19R26UZE3vcIHfN5aYWji3QxlgQzNgTGlRyCblxWPek4uqcpd/1piv1qVt+h9k6csPK0uIh2BPYqOQScuOw/pMKoY68cTel4iHYE9hsr/ZQG4exGyVC425KxUOwJ1DUvdrZjRIhJbkJNvJBH3tCodsaAZQXfewZYXYMoOhodwSAyBDsABAZgh0AIkOwA0BkCHYAiAzBDgCRIdgBIDIEOwBEhmAHgMgQ7AAQGYIdyBA3oEAI7BUDZIQbUCAUZuxARgbdgALIA8EOZKR7A4qKVTQ7M6st1S2UZZALSjFARnpvQLGlukUPPPMAZRnkgmAHMlSbq6k2V9PCsYWBZRnuOoQsEOxADvrvC7qluoULq8gMwQ7koP++oIMurBLsSAvBDuSkW5bp6p3B17cNvY0lMLKJgt3MPivpDkktSc9L+hN3/3kaAwNi1j+DZ7aONE06Y39C0n3uvmpm/yjpPkmfmXxYQPz6Z/BAWibqY3f3x919df3hEUnbJx8SAGASaS5Q+qikR1N8PQDAGIaWYszsSUlvGPCt+939m+vPuV/SqqSHNnmd/ZL2S9LOnTvHGizy01xuJqr/Jn0+gOwMDXZ3v2Wz75vZPZJul/Qed/dNXueApAOSVK/XN3wewku6eRWbXaWLkyQmNWlXzG3qXCz9A3f/dTpDQmhJe6yHPZ+gGh0nSaRh0q6YL0j6LUlPmJkkHXH3P514VAiqf5XksB7rzZ5PUCXDwiWkYaJgd/c3pTUQFEfSHuvNnk9QJZP0pAoMwsrTkkhaDknaY73R8wmqZFi4hDTYJtc7M1Ov173R4KYDeQldDqHGDqTDzBbdfejsiBl7CYQuh7DCEsgXd1Aqgf47+VAOAeLGjL0EqNsC5UKwlwTlEKA8KMUAQGQIdgCIDMEOAJEh2AEgMgQ7AESGYAeAyATZUsDMzko6lfuBpSslvRLguEVR9vcv8TMo+/uXpvtncI27bx32pCDBHoqZNUbZZyFWZX//Ej+Dsr9/qRw/A0oxABAZgh0AIlO2YD8QegCBlf39S/wMyv7+pRL8DEpVYweAMijbjB0Aole6YDezz5rZj8zsB2b2DTN7fegx5cnMPmhmz5lZ28yi7gzoZWa3mdmPzeykmf1l6PHkzcy+aGbLZnY89FhCMLMdZvaUmZ1Y/+//k6HHlKXSBbukJyRd7+6/L+knku4LPJ68HZd0l6TvhR5IXsysIulBSe+T9FZJHzazt4YdVe6+JOm20IMIaFXSp939LZL2SPqzmP8bKF2wu/vj7r66/vCIpO0hx5M3dz/h7j8OPY6c7ZZ00t1fcPeWpK9KujPwmHLl7t+T9H+hxxGKu7/s7s+u//MvJZ2QdHXYUWWndMHe56OSHg09CGTuakmnex6fUcT/U2NzZrZL0tskPR12JNmJ8g5KZvakpDcM+Nb97v7N9efcr87Hs4fyHFseRnn/JWMD/o52sBIys9dKeljSp9z9F6HHk5Uog93db9ns+2Z2j6TbJb3HI+z3HPb+S+iMpB09j7dLeinQWBCImc2qE+oPufvXQ48nS6UrxZjZbZI+I2mvu/869HiQi2ckvdnM3mhmVUkfknQo8JiQIzMzSQclnXD3z4ceT9ZKF+ySviDpdZKeMLOmmf1L6AHlycw+YGZnJL1T0rfN7LHQY8ra+sXyT0h6TJ2LZl9z9+fCjipfZvYVSf8l6XfN7IyZfSz0mHL2LkkfkXTz+v/3TTN7f+hBZYWVpwAQmTLO2AEgagQ7AESGYAeAyBDsABAZgh0AIkOwA0BkCHYAiAzBDgCR+X8tA7ZLJcL0Mg
AAAABJRU5ErkJggg==\n", "text/plain": [ "
" ] }, - "metadata": {}, + "metadata": { + "needs_background": "light" + }, "output_type": "display_data" } ], diff --git a/mxfusion/__version__.py b/mxfusion/__version__.py index 8473f95..0a2127a 100644 --- a/mxfusion/__version__.py +++ b/mxfusion/__version__.py @@ -13,4 +13,4 @@ # ============================================================================== -__version__ = '0.3.0' +__version__ = '0.3.1' diff --git a/mxfusion/common/exceptions.py b/mxfusion/common/exceptions.py index 2ea8690..4a082cf 100644 --- a/mxfusion/common/exceptions.py +++ b/mxfusion/common/exceptions.py @@ -16,8 +16,10 @@ class ModelSpecificationError(Exception): pass + class InferenceError(Exception): pass + class SerializationError(Exception): pass diff --git a/mxfusion/components/distributions/bernoulli.py b/mxfusion/components/distributions/bernoulli.py index fa9aa77..d61c0f0 100644 --- a/mxfusion/components/distributions/bernoulli.py +++ b/mxfusion/components/distributions/bernoulli.py @@ -45,7 +45,8 @@ def replicate_self(self, attribute_map=None): """ This functions as a copy constructor for the object. In order to do a copy constructor we first call ``__new__`` on the class which creates a blank object. - We then initialize that object using the methods standard init procedures, and do any extra copying of attributes. + We then initialize that object using the methods standard init procedures, and do any extra copying of + attributes. Replicates this Factor, using new inputs, outputs, and a new uuid. Used during model replication to functionally replicate a factor into a new graph. @@ -85,7 +86,7 @@ def draw_samples_impl(self, prob_true, rv_shape, num_samples=1, F=None): :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). 
:returns: a set samples of the Bernoulli distribution :rtypes: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/beta.py b/mxfusion/components/distributions/beta.py index 760f544..0ba9121 100644 --- a/mxfusion/components/distributions/beta.py +++ b/mxfusion/components/distributions/beta.py @@ -81,7 +81,7 @@ def draw_samples_impl(self, alpha, beta, rv_shape, num_samples=1, F=None): :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the beta distribution. :rtypes: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/categorical.py b/mxfusion/components/distributions/categorical.py index b937ce8..9f56a86 100644 --- a/mxfusion/components/distributions/categorical.py +++ b/mxfusion/components/distributions/categorical.py @@ -51,7 +51,8 @@ def __init__(self, log_prob, num_classes, one_hot_encoding=False, rand_gen=rand_gen, dtype=dtype, ctx=ctx) if axis != -1: - raise NotImplementedError("The Categorical distribution currently only supports the last dimension to be the class label dimension, i.e., axis == -1.") + raise NotImplementedError("The Categorical distribution currently only supports the last dimension to be " + "the class label dimension, i.e., axis == -1.") self.axis = axis self.normalization = normalization self.one_hot_encoding = one_hot_encoding @@ -61,7 +62,8 @@ def replicate_self(self, attribute_map=None): """ This functions as a copy constructor for the object. In order to do a copy constructor we first call ``__new__`` on the class which creates a blank object. - We then initialize that object using the methods standard init procedures, and do any extra copying of attributes. 
+ We then initialize that object using the methods standard init procedures, and do any extra copying of + attributes. Replicates this Factor, using new inputs, outputs, and a new uuid. Used during model replication to functionally replicate a factor into a new graph. @@ -112,7 +114,7 @@ def draw_samples_impl(self, log_prob, rv_shape, num_samples=1, F=None): :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the Categorical distribution :rtypes: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/distribution.py b/mxfusion/components/distributions/distribution.py index 6c3a44b..8914d60 100644 --- a/mxfusion/components/distributions/distribution.py +++ b/mxfusion/components/distributions/distribution.py @@ -93,14 +93,16 @@ def log_cdf(self, F=None, **kwargs): def draw_samples(self, F, variables, num_samples=1, targets=None, always_return_tuple=False): """ - Draw a number of samples from the distribution. All the dependent variables are automatically collected from a dictionary of variables according to the UUIDs of the dependent variables. + Draw a number of samples from the distribution. All the dependent variables are automatically collected from a + dictionary of variables according to the UUIDs of the dependent variables. :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :param variables: the set of variables where the dependent variables are collected from. :type variables: {str(UUID): MXNet NDArray or Symbol} :param num_samples: the number of drawn samples (default: one). - :int num_samples: int - :param always_return_tuple: return the samples in a tuple of shape one. This allows easy programming when there are potentially multiple output variables. 
+ :type num_samples: int + :param always_return_tuple: return the samples in a tuple of shape one. This allows easy programming when there + are potentially multiple output variables. :type always_return_tuple: boolean :returns: a set samples of the distribution. :rtypes: MXNet NDArray or MXNet Symbol or [MXNet NDArray or MXNet Symbol] @@ -122,7 +124,7 @@ def draw_samples_impl(self, rv_shape, num_samples=1, F=None, **kwargs): :param rv_shape: the shape of each sample. :type rv_shape: tuple, [tuple] :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the distribution. :rtypes: MXNet NDArray or MXNet Symbol or [MXNet NDArray or MXNet Symbol] diff --git a/mxfusion/components/distributions/gamma.py b/mxfusion/components/distributions/gamma.py index 414fe9b..66e1ea8 100644 --- a/mxfusion/components/distributions/gamma.py +++ b/mxfusion/components/distributions/gamma.py @@ -63,8 +63,8 @@ def draw_samples_impl(self, alpha, beta, rv_shape, num_samples=1, F=None): Draw samples from the Gamma distribution. :param rv_shape: the shape of each sample. :type rv_shape: tuple - :param nSamples: the number of drawn samples (default: one). - :int nSamples: int + :param num_samples: the number of drawn samples (default: one). + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the Gamma distribution. :rtypes: MXNet NDArray or MXNet Symbol @@ -79,6 +79,10 @@ def define_variable(alpha=0., beta=1., shape=None, rand_gen=None, """ Creates and returns a random variable drawn from a Gamma distribution parameterized with a and b parameters. 
+ :param alpha: alpha parameter of the Gamma random variable (also known as shape) + :type alpha: float + :param beta: beta parameter of the Gamma random variable (also known as rate) + :type beta: float :param shape: the shape of the random variable(s). :type shape: tuple or [tuple] :param rand_gen: the random generator (default: MXNetRandomGenerator). @@ -137,6 +141,10 @@ def log_pdf_impl(self, mean, variance, random_variable, F=None): """ Computes the logarithm of the probability density function (PDF) of the Gamma distribution. + :param mean: mean of the Gamma random variable (alpha / beta) + :type mean: float + :param variance: variance of the Gamma random variable (alpha / beta**2) + :type variance: float :param random_variable: the random variable of the Gamma distribution. :type random_variable: MXNet NDArray or MXNet Symbol :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). @@ -150,14 +158,13 @@ def log_pdf_impl(self, mean, variance, random_variable, F=None): p1 = (alpha - 1.) * F.log(random_variable) return (p1 - beta * random_variable) - (g_alpha - alpha * F.log(beta)) - def draw_samples_impl(self, mean, variance, rv_shape, num_samples=1, - F=None): + def draw_samples_impl(self, mean, variance, rv_shape, num_samples=1, F=None): """ Draw samples from the Gamma distribution. :param rv_shape: the shape of each sample. :type rv_shape: tuple - :param nSamples: the number of drawn samples (default: one). - :int nSamples: int + :param num_samples: the number of drawn samples (default: one). + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the Gamma distribution. 
:rtypes: MXNet NDArray or MXNet Symbol @@ -168,8 +175,7 @@ def draw_samples_impl(self, mean, variance, rv_shape, num_samples=1, ctx=self.ctx) @staticmethod - def define_variable(mean=0., variance=1., shape=None, rand_gen=None, - dtype=None, ctx=None): + def define_variable(mean=0., variance=1., shape=None, rand_gen=None, dtype=None, ctx=None): """ Creates and returns a random variable drawn from a Gamma distribution parameterized with mean and variance. diff --git a/mxfusion/components/distributions/gp/cond_gp.py b/mxfusion/components/distributions/gp/cond_gp.py index da7674d..6176a87 100644 --- a/mxfusion/components/distributions/gp/cond_gp.py +++ b/mxfusion/components/distributions/gp/cond_gp.py @@ -15,11 +15,9 @@ import numpy as np from ....common.config import get_default_MXNet_mode -from ....common.exceptions import InferenceError +from ....common.exceptions import ModelSpecificationError from ...variables.variable import Variable -from ....util.customop import broadcast_to_w_samples from ..distribution import Distribution -from ...variables.runtime_variable import get_num_samples class ConditionalGaussianProcess(Distribution): @@ -46,8 +44,10 @@ class ConditionalGaussianProcess(Distribution): :type Y_cond: Variable :param kernel: the kernel of Gaussian process. :type kernel: Kernel - :param mean_func: the mean function of Gaussian process. - :type mean_func: N/A + :param mean: the mean of Gaussian process. + :type mean: Variable + :param mean_cond: the mean of the conditional output variable under the same mean function. + :type mean_cond: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. @@ -55,23 +55,40 @@ class ConditionalGaussianProcess(Distribution): :param ctx: the mxnet context (default: None/current context). 
:type ctx: None or mxnet.cpu or mxnet.gpu """ - def __init__(self, X, X_cond, Y_cond, kernel, mean_func=None, + def __init__(self, X, X_cond, Y_cond, kernel, mean=None, mean_cond=None, rand_gen=None, dtype=None, ctx=None): + if (mean is None) and (mean_cond is not None): + raise ModelSpecificationError("The argument mean and mean_cond need to be both specified.") inputs = [('X', X), ('X_cond', X_cond), ('Y_cond', Y_cond)] + \ [(k, v) for k, v in kernel.parameters.items()] input_names = [k for k, _ in inputs] + if mean is not None: + inputs.append(('mean', mean)) + input_names.append('mean') + self._has_mean = True + else: + self._has_mean = False + if mean_cond is not None: + inputs.append(('mean_cond', mean_cond)) + input_names.append('mean_cond') + self._has_mean_cond = True + else: + self._has_mean_cond = False output_names = ['random_variable'] super(ConditionalGaussianProcess, self).__init__( inputs=inputs, outputs=None, input_names=input_names, output_names=output_names, rand_gen=rand_gen, dtype=dtype, ctx=ctx) - self.mean_func = mean_func self.kernel = kernel + @property + def has_mean(self): + return self._has_mean + @staticmethod - def define_variable(X, X_cond, Y_cond, kernel, shape=None, mean_func=None, - rand_gen=None, minibatch_ratio=1., dtype=None, - ctx=None): + def define_variable(X, X_cond, Y_cond, kernel, shape=None, mean=None, + mean_cond=None, rand_gen=None, minibatch_ratio=1., + dtype=None, ctx=None): """ Creates and returns a set of random variable drawn from a Gaussian process. @@ -85,8 +102,10 @@ def define_variable(X, X_cond, Y_cond, kernel, shape=None, mean_func=None, :type kernel: Kernel :param shape: the shape of the random variable(s) (the default shape is the same shape as *X* but the last dimension is changed to one.) :type shape: tuple or [tuple] - :param mean_func: the mean function of Gaussian process. - :type mean_func: N/A + :param mean: the mean of Gaussian process. 
+ :type mean: Variable + :param mean_cond: the mean of the conditional output variable under the same mean function. + :type mean_cond: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. @@ -95,15 +114,15 @@ def define_variable(X, X_cond, Y_cond, kernel, shape=None, mean_func=None, :type ctx: None or mxnet.cpu or mxnet.gpu """ gp = ConditionalGaussianProcess( - X=X, X_cond=X_cond, Y_cond=Y_cond, kernel=kernel, - mean_func=mean_func, rand_gen=rand_gen, dtype=dtype, ctx=ctx) + X=X, X_cond=X_cond, Y_cond=Y_cond, kernel=kernel, mean=mean, + mean_cond=mean_cond, rand_gen=rand_gen, dtype=dtype, ctx=ctx) gp.outputs = [('random_variable', Variable(value=gp, shape=X.shape[:-1] + (1,) if shape is None else shape))] return gp.random_variable def log_pdf_impl(self, X, X_cond, Y_cond, random_variable, F=None, - **kernel_params): + **kernel_params): """ Computes the logarithm of the probability density function (PDF) of the conditional Gaussian process. @@ -127,6 +146,12 @@ def log_pdf_impl(self, X, X_cond, Y_cond, random_variable, F=None, :returns: log pdf of the distribution. 
:rtypes: MXNet NDArray or MXNet Symbol """ + if self._has_mean: + mean = kernel_params['mean'] + del kernel_params['mean'] + if self._has_mean_cond: + mean_cond = kernel_params['mean_cond'] + del kernel_params['mean_cond'] D = random_variable.shape[-1] F = get_default_MXNet_mode() if F is None else F K = self.kernel.K(F, X, **kernel_params) @@ -136,9 +161,10 @@ def log_pdf_impl(self, X, X_cond, Y_cond, random_variable, F=None, LccInvKc = F.linalg.trsm(Lcc, Kc) cov = K - F.linalg.syrk(LccInvKc, transpose=True) L = F.linalg.potrf(cov) - if self.mean_func is not None: - random_variable = random_variable - self.mean_func(F, X) - Y_cond = Y_cond - self.mean_func(F, X_cond) + if self._has_mean: + random_variable = random_variable - mean + if self._has_mean_cond: + Y_cond = Y_cond - mean_cond LccInvY = F.linalg.trsm(Lcc, Y_cond) rv_mean = F.linalg.gemm2(LccInvKc, LccInvY, True, False) LinvY = F.sum(F.linalg.trsm(L, random_variable - rv_mean), axis=-1) @@ -161,13 +187,19 @@ def draw_samples_impl(self, X, X_cond, Y_cond, rv_shape, num_samples=1, :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :param **kernel_params: the set of kernel parameters, provided as keyword arguments. :type **kernel_params: {str: MXNet NDArray or MXNet Symbol} :returns: a set samples of the distribution. 
:rtypes: MXNet NDArray or MXNet Symbol """ + if self._has_mean: + mean = kernel_params['mean'] + del kernel_params['mean'] + if self._has_mean_cond: + mean_cond = kernel_params['mean_cond'] + del kernel_params['mean_cond'] F = get_default_MXNet_mode() if F is None else F K = self.kernel.K(F, X, **kernel_params) Kc = self.kernel.K(F, X_cond, X, **kernel_params) @@ -176,19 +208,18 @@ def draw_samples_impl(self, X, X_cond, Y_cond, rv_shape, num_samples=1, LccInvKc = F.linalg.trsm(Lcc, Kc) cov = K - F.linalg.syrk(LccInvKc, transpose=True) L = F.linalg.potrf(cov) - if self.mean_func is not None: - Y_cond = Y_cond - self.mean_func(F, X_cond) + if self._has_mean_cond: + Y_cond = Y_cond - mean_cond LccInvY = F.linalg.trsm(Lcc, Y_cond) rv_mean = F.linalg.gemm2(LccInvKc, LccInvY, True, False) out_shape = (num_samples,) + rv_shape - L = broadcast_to_w_samples(F, L, out_shape[:-1] + out_shape[-2:-1]) die = self._rand_gen.sample_normal( shape=out_shape, dtype=self.dtype, ctx=self.ctx) rv = F.linalg.trmm(L, die) + rv_mean - if self.mean_func is not None: - rv = rv + self.mean_func(F, X) + if self._has_mean: + rv = rv + mean return rv def replicate_self(self, attribute_map=None): @@ -197,7 +228,7 @@ def replicate_self(self, attribute_map=None): """ replicant = super(ConditionalGaussianProcess, self).replicate_self(attribute_map) - replicant.mean_func = self.mean_func.replicate_self(attribute_map) \ - if self.mean_func is not None else None + replicant._has_mean = self._has_mean + replicant._has_mean_cond = self._has_mean_cond replicant.kernel = self.kernel.replicate_self(attribute_map) return replicant diff --git a/mxfusion/components/distributions/gp/gp.py b/mxfusion/components/distributions/gp/gp.py index 7c9ebdd..95c55b3 100644 --- a/mxfusion/components/distributions/gp/gp.py +++ b/mxfusion/components/distributions/gp/gp.py @@ -15,27 +15,25 @@ import numpy as np from ....common.config import get_default_MXNet_mode -from ....common.exceptions import InferenceError from 
...variables import Variable -from ....util.customop import broadcast_to_w_samples from ..distribution import Distribution -from ...variables.runtime_variable import get_num_samples class GaussianProcess(Distribution): """ The Gaussian process distribution. - A Gaussian process consists of a kernel function and a mean function (optional). A collection of GP random variables follows a multi-variate - normal distribution, where the mean is computed from the mean function (zero, if not given) and the covariance matrix is computed from the kernel - function, both of which are computed given a collection of inputs. + A Gaussian process consists of a kernel function and a mean function (optional). A collection of GP random + variables follows a multi-variate normal distribution, where the mean is computed from the mean function + (zero, if not given) and the covariance matrix is computed from the kernel function, both of which are computed + given a collection of inputs. :param X: the input variables on which the random variables are conditioned. :type X: Variable :param kernel: the kernel of Gaussian process. :type kernel: Kernel - :param mean_func: the mean function of Gaussian process. - :type mean_func: N/A + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. @@ -43,21 +41,31 @@ class GaussianProcess(Distribution): :param ctx: the mxnet context (default: None/current context). 
:type ctx: None or mxnet.cpu or mxnet.gpu """ - def __init__(self, X, kernel, mean_func=None, rand_gen=None, dtype=None, + def __init__(self, X, kernel, mean=None, rand_gen=None, dtype=None, ctx=None): inputs = [('X', X)] + [(k, v) for k, v in kernel.parameters.items()] input_names = [k for k, _ in inputs] + if mean is not None: + inputs.append(('mean', mean)) + input_names.append('mean') + self._has_mean = True + else: + self._has_mean = False output_names = ['random_variable'] super(GaussianProcess, self).__init__( inputs=inputs, outputs=None, input_names=input_names, output_names=output_names, rand_gen=rand_gen, dtype=dtype, ctx=ctx) - self.mean_func = mean_func self.kernel = kernel + @property + def has_mean(self): + return self._has_mean + @staticmethod - def define_variable(X, kernel, shape=None, mean_func=None, rand_gen=None, dtype=None, ctx=None): + def define_variable(X, kernel, shape=None, mean=None, rand_gen=None, + dtype=None, ctx=None): """ Creates and returns a set of random variables drawn from a Gaussian process. @@ -65,10 +73,11 @@ def define_variable(X, kernel, shape=None, mean_func=None, rand_gen=None, dtype= :type X: Variable :param kernel: the kernel of Gaussian process. :type kernel: Kernel - :param shape: the shape of the random variable(s) (the default shape is the same shape as *X* but the last dimension is changed to one). + :param shape: the shape of the random variable(s) (the default shape is the same shape as *X* but the last + dimension is changed to one). :type shape: tuple or [tuple] - :param mean_func: the mean function of Gaussian process. - :type mean_func: N/A + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. 
@@ -76,8 +85,8 @@ def define_variable(X, kernel, shape=None, mean_func=None, rand_gen=None, dtype= :param ctx: the mxnet context (default: None/current context). :type ctx: None or mxnet.cpu or mxnet.gpu """ - gp = GaussianProcess(X=X, kernel=kernel, mean_func=mean_func, - rand_gen=rand_gen, dtype=dtype, ctx=ctx) + gp = GaussianProcess(X=X, kernel=kernel, mean=mean, rand_gen=rand_gen, + dtype=dtype, ctx=ctx) gp.outputs = [('random_variable', Variable(value=gp, shape=X.shape[:-1] + (1,) if shape is None else shape))] @@ -92,26 +101,27 @@ def log_pdf_impl(self, X, random_variable, F=None, **kernel_params): :param random_variable: the random_variable of which log-PDF is computed. :type random_variable: MXNet NDArray or MXNet Symbol :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray) - :param **kernel_params: the set of kernel parameters, provided as keyword arguments. - :type **kernel_params: {str: MXNet NDArray or MXNet Symbol} + :param kernel_params: the set of kernel parameters, provided as keyword arguments. + :type kernel_params: {str: MXNet NDArray or MXNet Symbol} :returns: log pdf of the distribution. :rtypes: MXNet NDArray or MXNet Symbol """ + if self._has_mean: + mean = kernel_params['mean'] + del kernel_params['mean'] D = random_variable.shape[-1] F = get_default_MXNet_mode() if F is None else F K = self.kernel.K(F, X, **kernel_params) L = F.linalg.potrf(K) - if self.mean_func is not None: - mean = self.mean_func(F, X) + if self._has_mean: random_variable = random_variable - mean LinvY = F.linalg.trsm(L, random_variable) logdet_l = F.linalg.sumlogdiag(F.abs(L)) return (- logdet_l * D - F.sum(F.sum(F.square(LinvY) + np.log(2. * np.pi), axis=-1), axis=-1) / 2) * self.log_pdf_scaling - def draw_samples_impl(self, X, rv_shape, num_samples=1, F=None, - **kernel_params): + def draw_samples_impl(self, X, rv_shape, num_samples=1, F=None, **kernel_params): """ Draw a number of samples from the Gaussian process. 
@@ -120,25 +130,25 @@ def draw_samples_impl(self, X, rv_shape, num_samples=1, F=None, :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). - :param **kernel_params: the set of kernel parameters, provided as keyword arguments. - :type **kernel_params: {str: MXNet NDArray or MXNet Symbol} + :param kernel_params: the set of kernel parameters, provided as keyword arguments. + :type kernel_params: {str: MXNet NDArray or MXNet Symbol} :returns: a set samples of the distribution. :rtypes: MXNet NDArray or MXNet Symbol """ + if self._has_mean: + mean = kernel_params['mean'] + del kernel_params['mean'] F = get_default_MXNet_mode() if F is None else F K = self.kernel.K(F, X, **kernel_params) L = F.linalg.potrf(K) out_shape = (num_samples,) + rv_shape - L = broadcast_to_w_samples(F, L, out_shape[:-1] + out_shape[-2:-1]) - die = self._rand_gen.sample_normal( shape=out_shape, dtype=self.dtype, ctx=self.ctx) rv = F.linalg.trmm(L, die) - if self.mean_func is not None: - mean = self.mean_func(F, X) + if self._has_mean: rv = rv + mean return rv @@ -147,7 +157,6 @@ def replicate_self(self, attribute_map=None): The copy constructor for a Gaussian process distribution. 
""" replicant = super(GaussianProcess, self).replicate_self(attribute_map) - replicant.mean_func = self.mean_func.replicate_self(attribute_map) \ - if self.mean_func is not None else None + replicant._has_mean = self._has_mean replicant.kernel = self.kernel.replicate_self(attribute_map) return replicant diff --git a/mxfusion/components/distributions/gp/kernels/add_kernel.py b/mxfusion/components/distributions/gp/kernels/add_kernel.py index 30b5114..d6decdd 100644 --- a/mxfusion/components/distributions/gp/kernels/add_kernel.py +++ b/mxfusion/components/distributions/gp/kernels/add_kernel.py @@ -53,7 +53,8 @@ def _compute_K(self, F, X, X2=None, **kernel_params): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param **kernel_params: the set of kernel parameters, provided as keyword arguments. @@ -70,8 +71,8 @@ def _compute_Kdiag(self, F, X, **kernel_params): """ The internal interface for the actual computation for the diagonal of the covariance matrix. - This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name of the kernel has been - removed. The dimensions of *X* has been sliced according to *active_dims*. + This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name of + the kernel has been removed. The dimensions of *X* has been sliced according to *active_dims*. :param F: MXNet computation type . :param X: the first set of inputs to the kernel. 
diff --git a/mxfusion/components/distributions/gp/kernels/kernel.py b/mxfusion/components/distributions/gp/kernels/kernel.py index 25d837c..e5c082e 100644 --- a/mxfusion/components/distributions/gp/kernels/kernel.py +++ b/mxfusion/components/distributions/gp/kernels/kernel.py @@ -24,13 +24,15 @@ class Kernel(MXFusionFunction): """ - The base class for a Gaussian process kernel: a positive definite function which forms of a covariance function (kernel). + The base class for a Gaussian process kernel: a positive definite function which forms of a covariance function + (kernel). :param input_dim: the number of dimensions of the kernel. (The total number of active dimensions). :type input_dim: int :param name: the name of the kernel. The name is also used as the prefix for the kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). + :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers. :type dtype: numpy.float32 or numpy.float64 @@ -60,12 +62,12 @@ def __setattr__(self, name, value): @property def local_parameters(self): """ - The kernel parameters in the current kernel, which does not include kernel parameters that belongs to the sub-kernels of a compositional - kernel. The keys of the returned dictionary are the name of the kernel parameters (without the prefix) and the values are the corresponding - variables. + The kernel parameters in the current kernel, which does not include kernel parameters that belongs to the + sub-kernels of a compositional kernel. The keys of the returned dictionary are the name of the kernel + parameters (without the prefix) and the values are the corresponding variables. 
- :return: a dictionary of local kernel parameters, in which the keys are the name of individual parameters, including the kernel in front, and - the values are the corresponding Variables. + :return: a dictionary of local kernel parameters, in which the keys are the name of individual parameters, + including the kernel in front, and the values are the corresponding Variables. :rtype: {str: Variable} """ return {getattr(self, n) for n in self._parameter_names} @@ -73,11 +75,12 @@ def local_parameters(self): @property def parameters(self): """ - All the kernel parameters including the kernel parameters that belongs to the sub-kernels. The keys of the returned dictionary are the name of - the kernel parameters with a prefix (the name of the kernel plus '_') and the values are the corresponding variables. + All the kernel parameters including the kernel parameters that belongs to the sub-kernels. The keys of the + returned dictionary are the name of the kernel parameters with a prefix (the name of the kernel plus '_') and + the values are the corresponding variables. - :return: a dictionary of all the kernel parameters, in which the keys are the name of individual parameters, including the kernel in front, - and the values are the corresponding Variables. + :return: a dictionary of all the kernel parameters, in which the keys are the name of individual parameters, + including the kernel in front, and the values are the corresponding Variables. :rtype: {str: Variable} """ raise NotImplementedError @@ -100,11 +103,11 @@ def K(self, F, X, X2=None, **kernel_params): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. 
If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol - :param **kernel_params: the set of kernel parameters, provided as keyword arguments. - :type **kernel_params: {str: MXNet NDArray or MXNet Symbol} + :param kernel_params: the set of kernel parameters, provided as keyword arguments. + :type kernel_params: {str: MXNet NDArray or MXNet Symbol} :return: The covariance matrix :rtype: MXNet NDArray or MXNet Symbol """ @@ -129,8 +132,8 @@ def Kdiag(self, F, X, **kernel_params): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param **kernel_params: the set of kernel parameters, provided as keyword arguments. - :type **kernel_params: {str: MXNet NDArray or MXNet Symbol} + :param kernel_params: the set of kernel parameters, provided as keyword arguments. + :type kernel_params: {str: MXNet NDArray or MXNet Symbol} :return: The diagonal of the covariance matrix. :rtype: MXNet NDArray or MXNet Symbol """ @@ -149,6 +152,8 @@ def add(self, other, name='add'): :param other: the other kernel to be added. :type other: Kernel + :param name: The name of the kernel + :type name: str :return: the kernel which is the sum of the current kernel with the specified kernel. :rtype: Kernel """ @@ -170,6 +175,8 @@ def multiply(self, other, name='mul'): :param other: the other kernel to be added. :type other: Kernel + :param name: The name of the kernel + :type name: str :return: the kernel which is the sum of the current kernel with the specified kernel. 
:rtype: Kernel """ @@ -177,8 +184,7 @@ def multiply(self, other, name='mul'): raise ModelSpecificationError( "Only a Gaussian Process Kernel can be multiplied with a Gaussian Process Kernel.") from .multiply_kernel import MultiplyKernel - return MultiplyKernel([self, other], name=name, ctx=self.ctx, - dtype=self.dtype) + return MultiplyKernel([self, other], name=name, ctx=self.ctx, dtype=self.dtype) def __mul__(self, other): """ @@ -190,8 +196,8 @@ def _compute_K(self, F, X, X2=None, **kernel_params): """ The internal interface for the actual covariance matrix computation. - This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name of the kernel has been - removed. The dimensions of *X* and *X2* have been sliced according to *active_dims*. + This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name of + the kernel has been removed. The dimensions of *X* and *X2* have been sliced according to *active_dims*. :param F: MXNet computation type . :param X: the first set of inputs to the kernel. @@ -210,8 +216,8 @@ def _compute_Kdiag(self, F, X, **kernel_params): """ The internal interface for the actual computation for the diagonal of the covariance matrix. - This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name of the kernel has been - removed. The dimensions of *X* has been sliced according to *active_dims*. + This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name of + the kernel has been removed. The dimensions of *X* has been sliced according to *active_dims*. :param F: MXNet computation type . :param X: the first set of inputs to the kernel. 
@@ -225,13 +231,15 @@ def _compute_Kdiag(self, F, X, **kernel_params): def fetch_parameters(self, params): """ - The helper function to fetch the kernel parameters from a set of variables according to the UUIDs of the kernel parameters. It returns a - dictionary of kernel parameters, where the keys are the name of the kernel parameters and the values are the MXNet array at runtime. The - returned dict can be directly passed into *K* and *Kdiag* as *kernel_params*. + The helper function to fetch the kernel parameters from a set of variables according to the UUIDs of the kernel + parameters. It returns a dictionary of kernel parameters, where the keys are the name of the kernel parameters + and the values are the MXNet array at runtime. The returned dict can be directly passed into *K* and *Kdiag* as + *kernel_params*. :param params: the set of parameters where the kernel parameters are fetched from. :type params: {str (UUID): MXNet NDArray or MXNet Symbol} - :return: a dict of the kernel parameters, where the keys are the name of the kernel parameters and the values are the MXNet array at runtime. + :return: a dict of the kernel parameters, where the keys are the name of the kernel parameters and the values + are the MXNet array at runtime. :rtype: {str (kernel name): MXNet NDArray or MXNet Symbol} """ return {n: params[v.uuid] for n, v in self.parameters.items()} @@ -241,10 +249,10 @@ def eval(self, F, X, X2=None, **kernel_params): The method handling the execution of the function. :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray) - :param **input_kws: the dict of inputs to the functions. The key in the + :param input_kws: the dict of inputs to the functions. The key in the dict should match with the name of inputs specified in the inputs of FunctionEvaluation. 
- :type **input_kws: {variable name: MXNet NDArray or MXNet Symbol} + :type input_kws: {variable name: MXNet NDArray or MXNet Symbol} :returns: the return value of the function :rtypes: MXNet NDArray or MXNet Symbol """ @@ -273,7 +281,8 @@ class NativeKernel(Kernel): :type input_dim: int :param name: the name of the kernel. The name is used to access kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). + :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers. :type dtype: numpy.float32 or numpy.float64 @@ -289,11 +298,12 @@ def __init__(self, input_dim, name, active_dims=None, dtype=None, @property def parameters(self): """ - All the kernel parameters including the kernel parameters that belongs to the sub-kernels. The keys of the returned dictionary are the name of - the kernel parameters with a prefix (the name of the kernel plus '_') and the values are the corresponding variables. + All the kernel parameters including the kernel parameters that belong to the sub-kernels. The keys of the + returned dictionary are the name of the kernel parameters with a prefix (the name of the kernel plus '_') + and the values are the corresponding variables. - :return: a dictionary of all the kernel parameters, in which the keys are the name of individual parameters, including the kernel in front, - and the values are the corresponding Variables. + :return: a dictionary of all the kernel parameters, in which the keys are the name of individual parameters, + including the kernel in front, and the values are the corresponding Variables.
:rtype: {str: Variable} """ return {self.name + '_' + n: getattr(self, n) for n in @@ -306,7 +316,8 @@ def parameter_names(self): class CombinationKernel(Kernel): """ - The base class for combination kernels: the covariance matrix is computed by combining the covariance matrix from multiple sub-kernels. + The base class for combination kernels: the covariance matrix is computed by combining the covariance matrix from + multiple sub-kernels. :param sub_kernels: a list of kernels that are combined to compute a covariance matrix. :type sub_kernels: [Kernel] @@ -331,11 +342,12 @@ def __init__(self, sub_kernels, name, dtype=None, ctx=None): @property def parameters(self): """ - All the kernel parameters including the kernel parameters that belongs to the sub-kernels. The keys of the returned dictionary are the name of - the kernel parameters with a prefix (the name of the kernel plus '_') and the values are the corresponding variables. + All the kernel parameters including the kernel parameters that belong to the sub-kernels. The keys of the + returned dictionary are the name of the kernel parameters with a prefix (the name of the kernel plus '_') and + the values are the corresponding variables. - :return: a dictionary of all the kernel parameters, in which the keys are the name of individual parameters, including the kernel in front, - and the values are the corresponding Variables. + :return: a dictionary of all the kernel parameters, in which the keys are the name of individual parameters, + including the kernel in front, and the values are the corresponding Variables. :rtype: {str: Variable} """ p = {} @@ -354,10 +366,8 @@ def replicate_self(self, attribute_map=None): """ The copy constructor for a kernel.
""" - replicant = super(CombinationKernel, self).replicate_self( - attribute_map) - replicant.sub_kernels = [k.replicate_self(attribute_map) for k in - self.sub_kernels] + replicant = super(CombinationKernel, self).replicate_self(attribute_map) + replicant.sub_kernels = [k.replicate_self(attribute_map) for k in self.sub_kernels] for k in replicant.sub_kernels: setattr(replicant, k.name, k) return replicant diff --git a/mxfusion/components/distributions/gp/kernels/linear.py b/mxfusion/components/distributions/gp/kernels/linear.py index c6ec55e..53d371a 100644 --- a/mxfusion/components/distributions/gp/kernels/linear.py +++ b/mxfusion/components/distributions/gp/kernels/linear.py @@ -27,14 +27,15 @@ class Linear(NativeKernel): :param input_dim: the number of dimensions of the kernel. (The total number of active dimensions) . :type input_dim: int - :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided by a lengthscale for individual - dimensions. + :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided + by a lengthscale for individual dimensions. :type ARD: boolean :param variances: the initial value for the variances parameter, which scales the input dimensions. :type variances: float or MXNet NDArray :param name: the name of the kernel. The name is used to access kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). + :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers. :type dtype: numpy.float32 or numpy.float64 @@ -62,13 +63,11 @@ def _compute_K(self, F, X, variances, X2=None): :param F: MXNet computation type . 
:param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param variances: the variances parameter, which scales the input dimensions. :type variances: MXNet NDArray or MXNet Symbol - :param lengthscale: the lengthscale parameter. - :type lengthscale: MXNet NDArray or MXNet Symbol :return: The covariance matrix. :rtype: MXNet NDArray or MXNet Symbol """ @@ -101,8 +100,7 @@ def _compute_Kdiag(self, F, X, variances): :rtype: MXNet NDArray or MXNet Symbol """ X2 = F.square(X) - return F.sum(X2 * F.expand_dims(variances, axis=-2), - axis=-1) + return F.sum(X2 * F.expand_dims(variances, axis=-2), axis=-1) def replicate_self(self, attribute_map=None): """ diff --git a/mxfusion/components/distributions/gp/kernels/matern.py b/mxfusion/components/distributions/gp/kernels/matern.py index 845cbe8..0d277b7 100644 --- a/mxfusion/components/distributions/gp/kernels/matern.py +++ b/mxfusion/components/distributions/gp/kernels/matern.py @@ -27,8 +27,8 @@ class Matern(StationaryKernel): :param input_dim: the number of dimensions of the kernel. (The total number of active dimensions) :type input_dim: int - :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided by a lengthscale for individual - dimensions. + :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided + by a lengthscale for individual dimensions. :type ARD: boolean :param variance: the initial value for the variance parameter (scalar), which scales the whole covariance matrix. 
:type variance: float or MXNet NDArray @@ -36,7 +36,8 @@ class Matern(StationaryKernel): :type lengthscale: float or MXNet NDArray :param name: the name of the kernel. The name is used to access kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). + :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers. :type dtype: numpy.float32 or numpy.float64 @@ -70,8 +71,8 @@ def _compute_K(self, F, X, lengthscale, variance, X2=None): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param variance: the variance parameter (scalar), which scales the whole covariance matrix. :type variance: MXNet NDArray or MXNet Symbol @@ -102,8 +103,8 @@ def _compute_K(self, F, X, lengthscale, variance, X2=None): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. 
:type X2: MXNet NDArray or MXNet Symbol :param variance: the variance parameter (scalar), which scales the whole covariance matrix. :type variance: MXNet NDArray or MXNet Symbol @@ -134,8 +135,8 @@ def _compute_K(self, F, X, lengthscale, variance, X2=None): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param variance: the variance parameter (scalar), which scales the whole covariance matrix. :type variance: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/gp/kernels/multiply_kernel.py b/mxfusion/components/distributions/gp/kernels/multiply_kernel.py index 30fcd15..3769850 100644 --- a/mxfusion/components/distributions/gp/kernels/multiply_kernel.py +++ b/mxfusion/components/distributions/gp/kernels/multiply_kernel.py @@ -53,8 +53,8 @@ def _compute_K(self, F, X, X2=None, **kernel_params): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param **kernel_params: the set of kernel parameters, provided as keyword arguments. 
:type **kernel_params: {str: MXNet NDArray or MXNet Symbol} @@ -70,8 +70,8 @@ def _compute_Kdiag(self, F, X, **kernel_params): """ The internal interface for the actual computation for the diagonal of the covariance matrix. - This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name of the kernel has been - removed. The dimensions of *X* has been sliced according to *active_dims*. + This function takes as an assumption: The prefix in the keys of *kernel_params* that corresponds to the name + of the kernel has been removed. The dimensions of *X* has been sliced according to *active_dims*. :param F: MXNet computation type . :param X: the first set of inputs to the kernel. diff --git a/mxfusion/components/distributions/gp/kernels/rbf.py b/mxfusion/components/distributions/gp/kernels/rbf.py index 46aefe1..2719d70 100644 --- a/mxfusion/components/distributions/gp/kernels/rbf.py +++ b/mxfusion/components/distributions/gp/kernels/rbf.py @@ -25,8 +25,8 @@ class RBF(StationaryKernel): :param input_dim: the number of dimensions of the kernel. (The total number of active dimensions) :type input_dim: int - :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided by a lengthscale for individual - dimensions. + :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided + by a lengthscale for individual dimensions. :type ARD: boolean :param variance: the initial value for the variance parameter (scalar), which scales the whole covariance matrix. :type variance: float or MXNet NDArray @@ -34,7 +34,8 @@ class RBF(StationaryKernel): :type lengthscale: float or MXNet NDArray :param name: the name of the kernel. The name is used to access kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). 
+ :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers. :type dtype: numpy.float32 or numpy.float64 @@ -57,8 +58,8 @@ def _compute_K(self, F, X, lengthscale, variance, X2=None): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param variance: the variance parameter (scalar), which scales the whole covariance matrix. :type variance: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/gp/kernels/static.py b/mxfusion/components/distributions/gp/kernels/static.py index 3782b39..790e0d6 100644 --- a/mxfusion/components/distributions/gp/kernels/static.py +++ b/mxfusion/components/distributions/gp/kernels/static.py @@ -32,7 +32,8 @@ class Bias(NativeKernel): :type variance: float or MXNet NDArray :param name: the name of the kernel. The name is used to access kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). + :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers. 
:type dtype: numpy.float32 or numpy.float64 @@ -59,8 +60,8 @@ def _compute_K(self, F, X, variance, X2=None): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, + this computes a square covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param variance: the variance parameter. :type variance: MXNet NDArray or MXNet Symbol @@ -100,7 +101,8 @@ class White(NativeKernel): :type variance: float or MXNet NDArray :param name: the name of the kernel. The name is used to access kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). + :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers. :type dtype: numpy.float32 or numpy.float64 @@ -127,8 +129,8 @@ def _compute_K(self, F, X, variance, X2=None): :param F: MXNet computation type :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :param variance: the variance parameter. 
:type variance: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/gp/kernels/stationary.py b/mxfusion/components/distributions/gp/kernels/stationary.py index c95b312..75e21ad 100644 --- a/mxfusion/components/distributions/gp/kernels/stationary.py +++ b/mxfusion/components/distributions/gp/kernels/stationary.py @@ -31,13 +31,14 @@ class StationaryKernel(NativeKernel): In this implementation, r is scaled by the lengthscales parameter(s): .. math:: r2(x, x') = \\sum_{q=1}^Q \\frac{(x_q - x'_q)^2}{\\ell_q^2}. - By default, there's only one lengthscale: separate lengthscales for each dimension can be enables by setting ARD=True. + By default, there's only one lengthscale: separate lengthscales for each dimension can be enabled by setting + ARD=True. :param input_dim: the number of dimensions of the kernel. (The total number of active dimensions). :type input_dim: int - :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided by a lengthscale for individual - dimensions. + :param ARD: a binary switch for Automatic Relevance Determination (ARD). If true, the squared distance is divided + by a lengthscale for individual dimensions. :type ARD: boolean :param variance: the initial value for the variance parameter (scalar), which scales the whole covariance matrix. :type variance: float or MXNet NDArray @@ -45,7 +46,8 @@ class StationaryKernel(NativeKernel): :type lengthscale: float or MXNet NDArray :param name: the name of the kernel. The name is used to access kernel parameters. :type name: str - :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. (default: None, taking all the dimensions). + :param active_dims: The dimensions of the inputs that are taken for the covariance matrix computation. + (default: None, taking all the dimensions). :type active_dims: [int] or None :param dtype: the data type for float point numbers.
:type dtype: numpy.float32 or numpy.float64 @@ -81,8 +83,8 @@ def _compute_R2(self, F, X, lengthscale, variance, X2=None): :param F: MXNet computation type . :param X: the first set of inputs to the kernel. :type X: MXNet NDArray or MXNet Symbol - :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square covariance matrix of X. In other words, - X2 is internally treated as X. + :param X2: (optional) the second set of arguments to the kernel. If X2 is None, this computes a square + covariance matrix of X. In other words, X2 is internally treated as X. :type X2: MXNet NDArray or MXNet Symbol :return: The squared distance. :rtype: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/laplace.py b/mxfusion/components/distributions/laplace.py index 3063a2f..7fbc03f 100644 --- a/mxfusion/components/distributions/laplace.py +++ b/mxfusion/components/distributions/laplace.py @@ -54,8 +54,7 @@ def log_pdf_impl(self, location, scale, random_variable, F=None): F.abs(F.broadcast_minus(random_variable, location)), scale)) * self.log_pdf_scaling return logL - def draw_samples_impl(self, location, scale, rv_shape, num_samples=1, - F=None): + def draw_samples_impl(self, location, scale, rv_shape, num_samples=1, F=None): """ Draw samples from the Laplace distribution. @@ -66,7 +65,7 @@ def draw_samples_impl(self, location, scale, rv_shape, num_samples=1, :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the Laplace distribution. 
:rtypes: MXNet NDArray or MXNet Symbol @@ -78,8 +77,7 @@ def draw_samples_impl(self, location, scale, rv_shape, num_samples=1, scale), location) @staticmethod - def define_variable(location=0., scale=1., shape=None, rand_gen=None, - dtype=None, ctx=None): + def define_variable(location=0., scale=1., shape=None, rand_gen=None, dtype=None, ctx=None): """ Creates and returns a random variable drawn from a Laplace distribution. diff --git a/mxfusion/components/distributions/normal.py b/mxfusion/components/distributions/normal.py index 3fb7393..1d62fb4 100644 --- a/mxfusion/components/distributions/normal.py +++ b/mxfusion/components/distributions/normal.py @@ -25,8 +25,9 @@ class Normal(UnivariateDistribution): """ - The one-dimensional normal distribution. The normal distribution can be defined over a scalar random variable or an array of random variables. In case - of an array of random variables, the mean and variance are broadcasted to the shape of the output random variable (array). + The one-dimensional normal distribution. The normal distribution can be defined over a scalar random variable or an + array of random variables. In case of an array of random variables, the mean and variance are broadcasted to the + shape of the output random variable (array). :param mean: Mean of the normal distribution. :type mean: Variable @@ -68,8 +69,7 @@ def log_pdf_impl(self, mean, variance, random_variable, F=None): F.broadcast_minus(random_variable, mean)), -2 * variance)) * self.log_pdf_scaling return logL - def draw_samples_impl(self, mean, variance, rv_shape, num_samples=1, - F=None): + def draw_samples_impl(self, mean, variance, rv_shape, num_samples=1, F=None): """ Draw samples from the normal distribution. @@ -80,7 +80,7 @@ def draw_samples_impl(self, mean, variance, rv_shape, num_samples=1, :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). 
- :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the normal distribution. :rtypes: MXNet NDArray or MXNet Symbol @@ -177,8 +177,7 @@ def log_pdf_impl(self, mean, covariance, random_variable, F=None): sqnorm_z = - F.sum(F.square(zvec), axis=-1) return (0.5 * (sqnorm_z - (N * np.log(2 * np.pi))) + logdetl)* self.log_pdf_scaling - def draw_samples_impl(self, mean, covariance, rv_shape, num_samples=1, - F=None): + def draw_samples_impl(self, mean, covariance, rv_shape, num_samples=1, F=None): """ Draw a number of samples from the normal distribution. @@ -189,7 +188,7 @@ def draw_samples_impl(self, mean, covariance, rv_shape, num_samples=1, :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the normal distribution :rtypes: MXNet NDArray or MXNet Symbol @@ -203,8 +202,7 @@ def draw_samples_impl(self, mean, covariance, rv_shape, num_samples=1, return F.broadcast_add(lmat_eps.sum(-1), mean) @staticmethod - def define_variable(shape, mean=0., covariance=None, rand_gen=None, - minibatch_ratio=1., dtype=None, ctx=None): + def define_variable(shape, mean=0., covariance=None, rand_gen=None, minibatch_ratio=1., dtype=None, ctx=None): """ Creates and returns a random variable drawn from a normal distribution. @@ -285,8 +283,7 @@ def log_pdf_impl(self, mean, precision, random_variable, F=None): F.broadcast_minus(random_variable, mean)), -precision / 2)) * self.log_pdf_scaling return logL - def draw_samples_impl(self, mean, precision, rv_shape, num_samples=1, - F=None): + def draw_samples_impl(self, mean, precision, rv_shape, num_samples=1, F=None): """ Draw samples from the normal distribution. 
@@ -297,7 +294,7 @@ def draw_samples_impl(self, mean, precision, rv_shape, num_samples=1, :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the normal distribution. :rtypes: MXNet NDArray or MXNet Symbol @@ -396,8 +393,7 @@ def log_pdf_impl(self, mean, precision, random_variable, F=None): return -0.5 * (sqnorm_z + c + logdetl) * self.log_pdf_scaling - def draw_samples_impl(self, mean, precision, rv_shape, num_samples=1, - F=None): + def draw_samples_impl(self, mean, precision, rv_shape, num_samples=1, F=None): """ Draw a number of samples from the normal distribution. @@ -408,7 +404,7 @@ def draw_samples_impl(self, mean, precision, rv_shape, num_samples=1, :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the normal distribution :rtypes: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/pointmass.py b/mxfusion/components/distributions/pointmass.py index 3f38c2c..68124cf 100644 --- a/mxfusion/components/distributions/pointmass.py +++ b/mxfusion/components/distributions/pointmass.py @@ -21,7 +21,7 @@ class PointMass(UnivariateDistribution): """ The Point Mass distribution. - :param value: the location of the point mass. + :param location: the location of the point mass. 
""" def __init__(self, location, rand_gen=None, dtype=None, ctx=None): inputs = [('location', location)] @@ -51,13 +51,18 @@ def draw_samples_impl(self, location, rv_shape, num_samples=1, F=None): location, shape=(num_samples,)+location.shape[1:]) @staticmethod - def define_variable(location, shape=None, rand_gen=None, dtype=None, - ctx=None): + def define_variable(location, shape=None, rand_gen=None, dtype=None, ctx=None): """ Creates and returns a random variable drawn from a Normal distribution. :param location: the location of the point mass. :param shape: Shape of random variables drawn from the distribution. If non-scalar, each variable is drawn iid. + :param rand_gen: the random generator (default: MXNetRandomGenerator). + :type rand_gen: RandomGenerator + :param dtype: the data type for float point numbers. + :type dtype: numpy.float32 or numpy.float64 + :param ctx: the mxnet context (default: None/current context). + :type ctx: None or mxnet.cpu or mxnet.gpu :returns: RandomVariable drawn from the distribution specified. """ diff --git a/mxfusion/components/distributions/random_gen.py b/mxfusion/components/distributions/random_gen.py index a155da4..58c7a09 100644 --- a/mxfusion/components/distributions/random_gen.py +++ b/mxfusion/components/distributions/random_gen.py @@ -39,7 +39,6 @@ def sample_multinomial(data, get_prob=True, dtype='int32', F=None): def sample_bernoulli(prob_true=0.5, dtype='bool', F=None): pass - @staticmethod def sample_uniform(low=0., high=1., shape=None, dtype=None, out=None, ctx=None, F=None): pass @@ -48,6 +47,7 @@ def sample_uniform(low=0., high=1., shape=None, dtype=None, out=None, ctx=None, def sample_laplace(location=0., scale=1., shape=None, dtype=None, out=None, ctx=None, F=None): pass + class MXNetRandomGenerator(RandomGenerator): """ The MXNet pseudo-random number generator. 
@@ -98,8 +98,7 @@ def sample_normal(loc=0, scale=1, shape=None, dtype=None, out=None, ctx=None, F= shape=shape, dtype=dtype, out=out, ctx=ctx, F=F) @staticmethod - def sample_multinomial(data, shape=None, get_prob=False, dtype='int32', - F=None): + def sample_multinomial(data, shape=None, get_prob=False, dtype='int32', F=None): """ Sample Multinomial distributed variables @@ -107,6 +106,7 @@ def sample_multinomial(data, shape=None, get_prob=False, dtype='int32', `k` is the number of possible outcomes of each multinomial distribution. For example, data with shape `(m, n, k)` specifies `m*n` multinomial distributions each with `k` possible outcomes. + :param shape: Shape of the random variable :param get_prob: If true, a second array containing log likelihood of the drawn samples will also be returned. This is usually used for reinforcement learning, where you can provide diff --git a/mxfusion/components/distributions/uniform.py b/mxfusion/components/distributions/uniform.py index 8c0921c..a17f2eb 100644 --- a/mxfusion/components/distributions/uniform.py +++ b/mxfusion/components/distributions/uniform.py @@ -73,7 +73,7 @@ def draw_samples_impl(self, low, high, rv_shape, num_samples=1, F=None): :param rv_shape: the shape of each sample. :type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the Uniform distribution. :rtypes: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/distributions/wishart.py b/mxfusion/components/distributions/wishart.py index 4b06901..1f1ef57 100644 --- a/mxfusion/components/distributions/wishart.py +++ b/mxfusion/components/distributions/wishart.py @@ -113,7 +113,7 @@ def draw_samples_impl(self, degrees_of_freedom, scale, rv_shape, num_samples=1, :param rv_shape: the shape of each sample. 
:type rv_shape: tuple :param num_samples: the number of drawn samples (default: one). - :int num_samples: int + :type num_samples: int :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :returns: a set samples of the Wishart distribution :rtypes: MXNet NDArray or MXNet Symbol diff --git a/mxfusion/components/factor.py b/mxfusion/components/factor.py index 514dfb6..3c96621 100644 --- a/mxfusion/components/factor.py +++ b/mxfusion/components/factor.py @@ -45,17 +45,19 @@ def _define_variable_from_constant(v): elif isinstance(v, NDArray): return Variable(value=v) else: - raise ModelSpecificationError('The inputs/outputs of a factor can only be a int, float, MXNet NDArray or Variable, but get '+str(v)+'.') + raise ModelSpecificationError('The inputs/outputs of a factor can only be a int, float, ' + 'MXNet NDArray or Variable, but get '+str(v)+'.') class Factor(ModelComponent): """ - A factor represents a relation among multiple variables in a model such as a distribution, a function or a module. It consists of a list of output - variables and optionally a list of input variables. + A factor represents a relation among multiple variables in a model such as a distribution, a function or a module. + It consists of a list of output variables and optionally a list of input variables. - The ``inputs`` and ``outputs`` argument of ``__init__`` holds the input and output of the factor, which are represented in Python dict. The key of a variable in - the dict is the name of the variable referred in the context of the factor, e.g., the mean and variance of a normal distribution. The value of a - variable is the reference to the variable in memory. Both input and output variables are accessible as class attributes. + The ``inputs`` and ``outputs`` argument of ``__init__`` holds the input and output of the factor, which are + represented in Python dict. 
The key of a variable in the dict is the name of the variable referred in the context + of the factor, e.g., the mean and variance of a normal distribution. The value of a variable is the reference to + the variable in memory. Both input and output variables are accessible as class attributes. The ``inputs`` and ``outputs`` argument of ``__init__`` can be: @@ -74,9 +76,11 @@ class Factor(ModelComponent): def __getattr__(self, value): if value.startswith("__"): """ - When python copies objects, it begins by checking for ``__setstate__()`` which doesn't exist, so it calls ``__getattr__()``. Our implementation then - calls the ``self.inputs`` getter before the object is fully prepared because ``__init__()`` never gets called during the copy. This causes an infinite - recursion to ``__getattr__()``. By skipping magic methods with "__" prefix, we allow the object to initialize correctly during copying. + When python copies objects, it begins by checking for ``__setstate__()`` which doesn't exist, so it calls + ``__getattr__()``. Our implementation then calls the ``self.inputs`` getter before the object is fully + prepared because ``__init__()`` never gets called during the copy. This causes an infinite recursion to + ``__getattr__()``. By skipping magic methods with "__" prefix, we allow the object to initialize correctly + during copying. # TODO this is very inefficient, can be improved. """ @@ -118,7 +122,8 @@ def replicate_self(self, attribute_map=None): """ This functions is a copy constructor for the object. In order to perform copy construction we first call ``__new__()`` on the class which creates a blank object. - We then initialize that object using the method's standard init procedures, and do any extra copying of attributes. + We then initialize that object using the method's standard init procedures, and do any extra copying of + attributes. Replicates this Factor, using new inputs, outputs, and a new uuid. 
Used during model replication to functionally replicate a factor into a new graph. diff --git a/mxfusion/components/functions/function_evaluation.py b/mxfusion/components/functions/function_evaluation.py index ec982fa..164fa10 100644 --- a/mxfusion/components/functions/function_evaluation.py +++ b/mxfusion/components/functions/function_evaluation.py @@ -46,34 +46,38 @@ def replicate_self(self, attribute_map=None): def eval(self, F, variables, always_return_tuple=False): """ - Evaluate the function with the pre-specified input arguments in the model defintion. All the input arguments are automatically collected from a dictionary of variables according to the UUIDs of the input arguments. + Evaluate the function with the pre-specified input arguments in the model defintion. All the input arguments + are automatically collected from a dictionary of variables according to the UUIDs of the input arguments. :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray). :param variables: the set of variables where the dependent variables are collected from. :type variables: {str(UUID): MXNet NDArray or Symbol} - :param always_return_tuple: whether to always return the function outcome in a tuple, even if there is only one output variable. This makes programming easy, as the downstream code can consistently expect a tuple. + :param always_return_tuple: whether to always return the function outcome in a tuple, even if there is only + one output variable. This makes programming easy, as the downstream code can consistently expect a tuple. 
:type always_return_tuple: boolean :returns: the outcome of the function evaluation :rtypes: MXNet NDArray or MXNet Symbol or [MXNet NDArray or MXNet Symbol] """ - kwargs = {name: variables[var.uuid] for name, var in self.inputs - if not var.isInherited or var.type == VariableType.RANDVAR} + if self.broadcastable: # If some of the inputs are samples and the function is # broadcastable, evaluate the function with the inputs that are # broadcasted to the right shape. + kwargs = {name: variables[var.uuid] for name, var in self.inputs if not var.isInherited} kwargs = broadcast_samples_dict(F, kwargs) + kwargs.update({name: variables[var.uuid][0] for name, var in self.inputs if var.isInherited}) results = self.eval_impl(F=F, **kwargs) results = results if isinstance(results, (list, tuple)) \ else [results] else: + kwargs = {name: variables[var.uuid] for name, var in self.inputs} # If some of the inputs are samples and the function is *not* # broadcastable, evaluate the function with each set of samples # and concatenate the output variables. - nSamples = max([get_num_samples(F, v) for v in kwargs.values()]) + num_samples = max([get_num_samples(F, v) for v in kwargs.values()]) results = None - for sample_idx in range(nSamples): + for sample_idx in range(num_samples): r = self.eval_impl(F=F, **{ n: v[sample_idx] if array_has_samples(F, v) else v[0] for n, v in kwargs.items()}) @@ -86,7 +90,7 @@ def eval(self, F, variables, always_return_tuple=False): else: for r_list, r_i in zip(results, r): r_list.append(r_i) - if nSamples == 1: + if num_samples == 1: results = [r[0] for r in results] else: results = [F.concat(*r, dim=0) for r in results] @@ -115,10 +119,10 @@ class FunctionEvaluationWithParameters(FunctionEvaluation): The evaluation of a function with internal function parameters. 
:param func: the function that this evaluation is generated from - :param inputs: MXFusion.components.functions.MXFusionFunction - :type inputs: {str : Variable} - :param outputs: the output variables of the function. - :type outputs: {str : Variable} + :param input_variables: MXFusion.components.functions.MXFusionFunction + :type input_variables: {str : Variable} + :param output_variables: the output variables of the function. + :type output_variables: {str : Variable} :param broadcastable: Whether the function supports broadcasting with the additional dimension for samples. :type: boolean """ @@ -156,9 +160,9 @@ def eval_impl(self, F, **input_kws): Invokes the MXNet Gluon block with the arguments passed in. :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray) - :param **input_kws: the dict of inputs to the functions. The key in the dict should match with the name of inputs specified in the inputs - of FunctionEvaluation. - :type **input_kws: {variable name: MXNet NDArray or MXNet Symbol} + :param input_kws: the dict of inputs to the functions. The key in the dict should match with the name of + inputs specified in the inputs of FunctionEvaluation. 
+ :type input_kws: {variable name: MXNet NDArray or MXNet Symbol} :returns: the return value of the function :rtypes: MXNet NDArray or MXNet Symbol """ diff --git a/mxfusion/components/functions/gluon_func_eval.py b/mxfusion/components/functions/gluon_func_eval.py index 45a9d99..78886e2 100644 --- a/mxfusion/components/functions/gluon_func_eval.py +++ b/mxfusion/components/functions/gluon_func_eval.py @@ -36,22 +36,3 @@ def __init__(self, func, input_variables, output_variables, func=func, input_variables=input_variables, output_variables=output_variables, broadcastable=broadcastable ) - - @property - def _input_to_gluon_names(self): - return [k for k, v in self.inputs if (not v.isInherited) or - v.type != VariableType.PARAMETER] - - def eval_impl(self, F, **input_kws): - """ - Invokes the MXNet Gluon block with the arguments passed in. - - :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray) - :param **input_kws: the dict of inputs to the functions. The key in the dict should match with the name of inputs specified in the inputs - of FunctionEvaluation. - :type **input_kws: {variable name: MXNet NDArray or MXNet Symbol} - :returns: the return value of the function - :rtypes: MXNet NDArray or MXNet Symbol - """ - inputs_func = {k: input_kws[k] for k in self._input_to_gluon_names} - return self._func.eval(F, **inputs_func) diff --git a/mxfusion/components/functions/mxfusion_function.py b/mxfusion/components/functions/mxfusion_function.py index 2a86fba..7616cf8 100644 --- a/mxfusion/components/functions/mxfusion_function.py +++ b/mxfusion/components/functions/mxfusion_function.py @@ -43,10 +43,10 @@ def eval(self, F, **input_kws): The method handling the execution of the function. :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray) - :param **input_kws: the dict of inputs to the functions. The key in the + :param input_kws: the dict of inputs to the functions. 
The key in the dict should match with the name of inputs specified in the inputs of FunctionEvaluation. - :type **input_kws: {variable name: MXNet NDArray or MXNet Symbol} + :type input_kws: {variable name: MXNet NDArray or MXNet Symbol} :returns: the return value of the function :rtypes: MXNet NDArray or MXNet Symbol """ diff --git a/mxfusion/components/functions/mxfusion_gluon_function.py b/mxfusion/components/functions/mxfusion_gluon_function.py index 47f8a6d..d242711 100644 --- a/mxfusion/components/functions/mxfusion_gluon_function.py +++ b/mxfusion/components/functions/mxfusion_gluon_function.py @@ -24,8 +24,9 @@ class MXFusionGluonFunction(MXFusionFunction): """ - The wrapper of a MXNet Gluon block in MXFusion. It automatically fetches all the Gluon parameters in its ParameterDict. When this function - wrapper is called in Model definition, it returns a factor corresponding to the function evaluation. + The wrapper of a MXNet Gluon block in MXFusion. It automatically fetches all the Gluon parameters in its + ParameterDict. When this function wrapper is called in Model definition, it returns a factor corresponding to + the function evaluation. :param block: The MXNet Gluon block to be wrapped. :type block: mxnet.gluon.Block or mxnet.gluon.HybridBlock @@ -98,9 +99,10 @@ def eval(self, F, **input_kws): Invokes the MXNet Gluon block with the arguments passed in. :param F: the MXNet computation mode (mxnet.symbol or mxnet.ndarray) - :param **input_kws: the dict of inputs to the functions. The key in the dict should match with the name of inputs specified in the inputs + :param input_kws: the dict of inputs to the functions. The key in the dict should match with the name of inputs + specified in the inputs of FunctionEvaluation. 
- :type **input_kws: {variable name: MXNet NDArray or MXNet Symbol} + :type input_kws: {variable name: MXNet NDArray or MXNet Symbol} :returns: the return value of the function :rtypes: MXNet NDArray or MXNet Symbol """ @@ -127,7 +129,8 @@ def __call__(self, *args, **kwargs): broadcastable = self.broadcastable for bv in kwargs.values(): if bv.type != VariableType.PARAMETER and self.broadcastable: - # Broadcasting function evaluation can not be applied to the Gluon block with gluon block parameters as random variables. + # Broadcasting function evaluation can not be applied to the Gluon block with gluon block + # parameters as random variables. broadcastable = False break @@ -155,39 +158,23 @@ def _create_variables_from_gluon_block(self, block): params = block.collect_params() vs = {} for param in params.values(): - v = Variable(isInherited=True, shape=param.shape) + v = Variable(isInherited=True, shape=param.shape, initial_value=param.data()) v.inherited_name = param.name vs[v.inherited_name] = v return vs - def collect_gluon_parameters(self): - """ - Return the parameters of the MXNet Gluon block that have *not* been set a prior distribution. - - :returns: the parameters of the MXNet Gluon block without a prior distribution. - :rtype: MXNet.gluon.ParameterDict - """ - params = ParameterDict() - gluon_params = self._gluon_block.collect_params() - params.update({var_name: gluon_params[var_name] for var_name, var in self._gluon_parameters.items() if var.type == VariableType.PARAMETER}) - return params - - def collect_params(self): - """ - Return a variable set / dict. Used for the function.collect_params.set_prior() functionality. 
- """ - # TODO: implement VariableSet - raise NotImplementedError - def _override_block_parameters(self, input_kws): """ - When a probabilistic distribution is defined for the parameters of a Gluon block (in ParameterDict), a special treatment is necessary - because otherwise these parameters will be directly exposed to a gradient optimizer as free parameters. + When a probabilistic distribution is defined for the parameters of a Gluon block (in ParameterDict), a special + treatment is necessary because otherwise these parameters will be directly exposed to a gradient optimizer as + free parameters. - For each parameters of the Gluon bock with probabilistic distribution, this method dynamically sets its values as the outcome of - upstream computation and ensure the correct gradient can be estimated via automatic differentiation. + For each parameters of the Gluon bock with probabilistic distribution, this method dynamically sets its values + as the outcome of upstream computation and ensure the correct gradient can be estimated via automatic + differentiation. - :param **input_kws: the dict of inputs to the functions. The key in the dict should match with the name of inputs specified in the + :param **input_kws: the dict of inputs to the functions. The key in the dict should match with the name of + inputs specified in the inputs of FunctionEvaluation. 
:type **input_kws: {variable name: MXNet NDArray or MXNet Symbol} """ diff --git a/mxfusion/components/functions/operators/operator_impl.py b/mxfusion/components/functions/operators/operator_impl.py index 9fba608..2d7781b 100644 --- a/mxfusion/components/functions/operators/operator_impl.py +++ b/mxfusion/components/functions/operators/operator_impl.py @@ -22,57 +22,77 @@ """ Basic Arithmetic """ + + @MXNetOperatorDecorator(name='add', args=['x', 'y'], inputs=['x', 'y']) def add(F, x, y): return F.add(x, y) + @MXNetOperatorDecorator(name='subtract', args=['x', 'y'], inputs=['x', 'y']) def subtract(F, x, y): return F.subtract(x, y) + @MXNetOperatorDecorator(name='multiply', args=['x', 'y'], inputs=['x', 'y']) def multiply(F, x, y): return F.multiply(x, y) + @MXNetOperatorDecorator(name='divide', args=['x', 'y'], inputs=['x', 'y']) def divide(F, x, y): return F.divide(x, y) + @MXNetOperatorDecorator(name='power', args=['x', 'y'], inputs=['x', 'y']) def power(F, x, y): return F.power(x, y) + """ Elementwise Operations """ + + @MXNetOperatorDecorator(name='square', args=['data'], inputs=['data']) def square(F, data): return F.square(data) + @MXNetOperatorDecorator(name='exp', args=['data'], inputs=['data']) def exp(F, data): return F.exp(data) + @MXNetOperatorDecorator(name='log', args=['data'], inputs=['data']) def log(F, data): return F.log(data) + """ Aggregation """ + + @MXNetOperatorDecorator(name='sum', args=['data', 'axis'], inputs=['data']) def sum(F, data, axis=None): return F.sum(data, axis) + @MXNetOperatorDecorator(name='mean', args=['data', 'axis'], inputs=['data']) def mean(F, data, axis=None): return F.mean(data, axis) + @MXNetOperatorDecorator(name='prod', args=['data', 'axis'], inputs=['data']) def prod(F, data, axis=None): return F.prod(data, axis) + """ Matrix Operations """ + + @MXNetOperatorDecorator(name='dot', args=['x', 'y'], inputs=['x', 'y']) def dot(F, x, y): return F.linalg.gemm2(x, y) + # TODO Bring in the axis arguments once it's in the 
release version of MXNet @MXNetOperatorDecorator(name='diag', args=['data', 'k', 'axis1', 'axis2'], inputs=['data']) def diag(F, data, k=0, axis1=None, axis2=None): @@ -80,11 +100,15 @@ def diag(F, data, k=0, axis1=None, axis2=None): raise Exception("axis1 and axis2 are not implemented yet.") return F.diag(data, k) + """ Matrix Manipulations """ + + @MXNetOperatorDecorator(name='reshape', args=['data', 'shape', 'reverse'], inputs=['data']) def reshape(F, data, shape, reverse=False): return F.reshape(data=data, shape=shape, reverse=reverse) + @MXNetOperatorDecorator(name='transpose', args=['data', 'axes'], inputs=['data']) def transpose(F, data, axes=None): axes = axes if axes is not None else [] @@ -96,7 +120,8 @@ def transpose(F, data, axes=None): def broadcast_to(data, shape): """ - This operator broadcast a variable to a target shape. The broadcasting rule is the same as [the numpy broadcasting rule](https://docs.scipy.org/doc/numpy-1.13.0/user/basics.broadcasting.html). See the following example: + This operator broadcast a variable to a target shape. The broadcasting rule is the same as [the numpy broadcasting + rule](https://docs.scipy.org/doc/numpy-1.13.0/user/basics.broadcasting.html). See the following example: ```python m.x = Gaussian.define_variable(mean=broadcast_to(array([0]), (2,)), diff --git a/mxfusion/components/functions/operators/operators.py b/mxfusion/components/functions/operators/operators.py index cf7e605..1c6a44a 100644 --- a/mxfusion/components/functions/operators/operators.py +++ b/mxfusion/components/functions/operators/operators.py @@ -21,7 +21,8 @@ class Operator(FunctionEvaluation): """ Abstract Operator object for using MXNet operators in MXFusion space. - Child classes implement the eval method with their operator and access necessary state through the properties dictionary. + Child classes implement the eval method with their operator and access necessary state through the + properties dictionary. 
""" def __init__(self, inputs, outputs, operator_name, properties=None, broadcastable=False): @@ -57,7 +58,8 @@ def __init__(self, name, args, inputs, num_outputs=1, broadcastable=False): :type name: string :param args: The names of the arguments for the mxnet operator in order. :type args: list of strings - :param inputs: The inputs to the MXNet operator that could have gradient's chained through them. I.E. the mx.nd.array or mx.sym.array parameters. This will be a subset of args (possibly the same set). + :param inputs: The inputs to the MXNet operator that could have gradient's chained through them. + I.E. the mx.nd.array or mx.sym.array parameters. This will be a subset of args (possibly the same set). :type inputs: list of strings :param num_outputs: How many output variables the operator produces. Defaults to 1. :type num_outputs: int @@ -87,7 +89,8 @@ def eval_impl(self, F, **input_kws): return func(F, **input_kws) if not len(all_args) >= len(self.input_names): - raise ModelSpecificationError("Must pass in arguments matching the input names {} but received {}.".format(self.input_names, all_args)) + raise ModelSpecificationError("Must pass in arguments matching the input names {} but received {}." + .format(self.input_names, all_args)) op = CustomOperator( inputs=[(n, all_args[n]) for n in self.input_names], diff --git a/mxfusion/components/model_component.py b/mxfusion/components/model_component.py index 0d6c569..82db1fa 100644 --- a/mxfusion/components/model_component.py +++ b/mxfusion/components/model_component.py @@ -31,7 +31,8 @@ class ModelComponent(object): **Mode 2 - Graph mode** If a node is attached to a FactorGraph, it does not store direct references to its successors and predecessors. - When accessed, the predecessors/successors properties directly query the graph they are attached to to find out what the respective neighbor nodes are. 
+ When accessed, the predecessors/successors properties directly query the graph they are attached to to find out + what the respective neighbor nodes are. """ def __init__(self): @@ -73,9 +74,11 @@ def graph(self): @graph.setter def graph(self, graph): """ - Attaches the node to a graph, switching from Bidirectional mode to Graph mode if it is not already in Graph mode. + Attaches the node to a graph, switching from Bidirectional mode to Graph mode if it is not already + in Graph mode. - A node cannot be re-attached to a different graph once it is attached. Use the ``replicate()`` functionality if you need to do this. + A node cannot be re-attached to a different graph once it is attached. Use the ``replicate()`` functionality + if you need to do this. :param graph: The ``components_graph`` of the ``FactorGraph`` this node is attaching to. :type graph: networkx.DiGraph @@ -105,7 +108,8 @@ def _update_attributes(self): def _align_graph_modes(self, edge_nodes): """ - This function will update the current node and all nodes passed in to be in Graph mode if any of edge_nodes are in Graph mode. + This function will update the current node and all nodes passed in to be in Graph mode if any of edge_nodes are + in Graph mode. :param edge_nodes: All the nodes to align to the same graph mode. I.E. predecessors or successors. :type edge_nodes: List of tuples of name to node e.g. [('random_variable': Variable y)] @@ -146,7 +150,8 @@ def add_predecessor(successor, predecessor, successor_name): if successor.graph is None: successor._predecessors.append((successor_name, predecessor)) if successor.graph is not None: - raise ModelSpecificationError("Internal Error. Cannot add predecessor when a component is attached to a graph.") + raise ModelSpecificationError( + "Internal Error. 
Cannot add predecessor when a component is attached to a graph.") self._align_graph_modes(successors) if self.graph is not None: @@ -186,7 +191,8 @@ def add_successor(predecessor, successor, predecessor_name): if predecessor.graph is None: predecessor._successors.append((predecessor_name, successor)) if predecessor.graph is not None: - raise ModelSpecificationError("Internal Error. Cannot add a successor when a component is attached to a graph.") + raise ModelSpecificationError( + "Internal Error. Cannot add a successor when a component is attached to a graph.") self._align_graph_modes(predecessors) if self.graph is not None: @@ -229,20 +235,23 @@ def _replicate_neighbors(self, var_map, neighbors, recurse_type, replication_fun :param var_map: A mapping from the original model's components to the replicated components. :type var_map: {original_node: new_node} - :param neighbors: Dictionary containing the list of a node's neighbors in one direction (predecessors or successors). + :param neighbors: Dictionary containing the list of a node's neighbors in one direction + (predecessors or successors). :type neighbors: List of tuples of name to node e.g. [('random_variable': Variable y)] - :param recurse_type: Parameter that decides how to replicate the neighbor nodes. Must be one of: 'recursive', 'one_level', or None. + :param recurse_type: Parameter that decides how to replicate the neighbor nodes. Must be one of: 'recursive', + 'one_level', or None. :type recurse_type: String or None - :param replication_function: A function that takes in a ModelComponent and returns an answer for how to replicate that node's predecessors and successors. + :param replication_function: A function that takes in a ModelComponent and returns an answer for how to + replicate that node's predecessors and successors. 
:type replication_function: function """ if recurse_type == 'recursive': replicated_neighbors = [(name, i.replicate(var_map=var_map, replication_function=replication_function)) - for name, i in neighbors] + for name, i in neighbors] elif recurse_type == 'one_level': replicated_neighbors = [(name, i._replicate_self_with_attributes(var_map=var_map)) - for name, i in neighbors] + for name, i in neighbors] elif recurse_type is None: replicated_neighbors = [] else: @@ -253,10 +262,11 @@ def replicate(self, var_map=None, replication_function=None): """ Replicates this component and its neighbors based on the replication_function logic passed in. - :param var_map: A mapping from the original model's components to the replicated components. This is used to track which components - have already been replicated in a dynamic programming style. + :param var_map: A mapping from the original model's components to the replicated components. This is used to + track which components have already been replicated in a dynamic programming style. :type var_map: {original_node: new_node} - :param replication_function: A function that takes in a ModelComponent and returns an answer for how to replicate that node's predecessors and successors. If None, only replicates this node. + :param replication_function: A function that takes in a ModelComponent and returns an answer for how to + replicate that node's predecessors and successors. If None, only replicates this node. 
:type replication_function: function """ var_map = var_map if var_map is not None else {} diff --git a/mxfusion/inference/__init__.py b/mxfusion/inference/__init__.py index e89b8f3..32a391f 100644 --- a/mxfusion/inference/__init__.py +++ b/mxfusion/inference/__init__.py @@ -41,9 +41,10 @@ from .minibatch_loop import MinibatchInferenceLoop from .meanfield import create_Gaussian_meanfield from .forward_sampling import ForwardSampling, VariationalPosteriorForwardSampling, ForwardSamplingAlgorithm -from .grad_based_inference import GradBasedInference +from .grad_based_inference import GradBasedInference, GradTransferInference from .variational import StochasticVariationalInference from .inference_parameters import InferenceParameters from .score_function import ScoreFunctionInference, ScoreFunctionRBInference from .expectation import ExpectationAlgorithm, ExpectationScoreFunctionAlgorithm from .prediction import ModulePredictionAlgorithm +from .pilco_alg import PILCOAlgorithm diff --git a/mxfusion/inference/batch_loop.py b/mxfusion/inference/batch_loop.py index 1061365..35f0078 100644 --- a/mxfusion/inference/batch_loop.py +++ b/mxfusion/inference/batch_loop.py @@ -12,22 +12,6 @@ # permissions and limitations under the License. # ============================================================================== - -# Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved. -# -# Licensed under the Apache License, Version 2.0 (the "License"). -# You may not use this file except in compliance with the License. -# A copy of the License is located at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# or in the "license" file accompanying this file. This file is distributed -# on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either -# express or implied. See the License for the specific language governing -# permissions and limitations under the License. 
-# ============================================================================== - - import mxnet as mx from .grad_loop import GradLoop @@ -52,6 +36,8 @@ def run(self, infr_executor, data, param_dict, ctx, optimizer='adam', :type optimizer: str :param learning_rate: the learning rate of the gradient optimizer (default: 0.001) :type learning_rate: float + :param n_prints: number of messages to print + :type n_prints: int :param max_iter: the maximum number of iterations of gradient optimization :type max_iter: int :param verbose: whether to print per-iteration messages. @@ -66,10 +52,10 @@ def run(self, infr_executor, data, param_dict, ctx, optimizer='adam', with mx.autograd.record(): loss, loss_for_gradient = infr_executor(mx.nd.zeros(1, ctx=ctx), *data) loss_for_gradient.backward() + if verbose: - print('\rIteration {} loss: {}'.format(i + 1, loss.asscalar()), - end='') - if i % iter_step == 0 and i > 0: + print('\rIteration {} loss: {}\t\t\t\t'.format(i + 1, loss.asscalar()), end='') + if ((i+1) % iter_step == 0 and i > 0) or i == max_iter-1: print() trainer.step(batch_size=1, ignore_stale_grad=True) loss = infr_executor(mx.nd.zeros(1, ctx=ctx), *data) diff --git a/mxfusion/inference/expectation.py b/mxfusion/inference/expectation.py index ae71a31..6236c0e 100644 --- a/mxfusion/inference/expectation.py +++ b/mxfusion/inference/expectation.py @@ -101,7 +101,10 @@ def compute(self, F, variables): gradient_lambda = F.mean(q_z_lambda * F.stop_gradient(p_x_z), axis=0) - gradient_theta = F.mean(p_x_z, axis=0) # TODO known issue. This will double count the gradient of any distribution using the reparameterization trick (i.e. Normal). Issue #91 + # TODO known issue. + # This will double count the gradient of any distribution using the + # reparameterization trick (i.e. Normal). 
Issue #91 + gradient_theta = F.mean(p_x_z, axis=0) gradient_log_L = gradient_lambda + gradient_theta diff --git a/mxfusion/inference/grad_based_inference.py b/mxfusion/inference/grad_based_inference.py index f52495e..5935538 100644 --- a/mxfusion/inference/grad_based_inference.py +++ b/mxfusion/inference/grad_based_inference.py @@ -15,20 +15,18 @@ from .inference import Inference from .batch_loop import BatchInferenceLoop +from ..util.inference import discover_shape_constants, init_outcomes +from .minibatch_loop import MinibatchInferenceLoop class GradBasedInference(Inference): """ The abstract class for gradient-based inference methods. - An inference method consists of a few components: the applied inference algorithm, the model definition (optionally a definition of posterior - approximation), the inference parameters. + An inference method consists of a few components: the applied inference algorithm, the model definition + (optionally a definition of posterior approximation), the inference parameters. :param inference_algorithm: The applied inference algorithm :type inference_algorithm: InferenceAlgorithm - :param graphs: a list of graph definitions required by the inference method. It includes the model definition and necessary posterior approximation. - :type graphs: [FactorGraph] - :param observed: A list of observed variables - :type observed: [Variable] :param grad_loop: The reference to the main loop of gradient optimization :type grad_loop: GradLoop :param constants: Specify a list of model variables as constants @@ -79,14 +77,64 @@ def run(self, optimizer='adam', learning_rate=1e-3, max_iter=2000, :type max_iter: int :param verbose: whether to print per-iteration messages. :type verbose: boolean - :param **kwargs: The keyword arguments specify the data for inferences. The key of each argument is the name of the corresponding - variable in model definition and the value of the argument is the data in numpy array format. 
+ :param kwargs: The keyword arguments specify the data for inferences. The key of each argument is the name of + the corresponding variable in model definition and the value of the argument is the data in numpy array format. """ data = [kwargs[v] for v in self.observed_variable_names] self.initialize(**kwargs) infr = self.create_executor() - return self._grad_loop.run( - infr_executor=infr, data=data, param_dict=self.params.param_dict, - ctx=self.mxnet_context, optimizer=optimizer, - learning_rate=learning_rate, max_iter=max_iter, verbose=verbose) + + if isinstance(self._grad_loop, MinibatchInferenceLoop): + def update_shape_constants(data_batch): + data_shapes = {i: d.shape for i, d in zip(self.observed_variable_UUIDs, + data_batch)} + shape_constants = discover_shape_constants(data_shapes, self._graphs) + self.params.update_constants(shape_constants) + + return self._grad_loop.run( + infr_executor=infr, data=data, param_dict=self.params.param_dict, + ctx=self.mxnet_context, optimizer=optimizer, + learning_rate=learning_rate, max_iter=max_iter, verbose=verbose, + update_shape_constants=update_shape_constants) + else: + return self._grad_loop.run( + infr_executor=infr, data=data, param_dict=self.params.param_dict, + ctx=self.mxnet_context, optimizer=optimizer, + learning_rate=learning_rate, max_iter=max_iter, verbose=verbose) + +class GradTransferInference(GradBasedInference): + """ + The abstract Inference method for transferring the outcome of one inference + method to another. + + :param inference_algorithm: The applied inference algorithm + :type inference_algorithm: InferenceAlgorithm + :param train_params: + :param constants: Specify a list of model variables as constants + :type constants: {Variable: mxnet.ndarray} + :param hybridize: Whether to hybridize the MXNet Gluon block of the inference method. 
+ :type hybridize: boolean + :param dtype: data type for internal numerical representation + :type dtype: {numpy.float64, numpy.float32, 'float64', 'float32'} + :param context: The MXNet context + :type context: {mxnet.cpu or mxnet.gpu} + """ + + def __init__(self, inference_algorithm, infr_params, train_params, + grad_loop=None, var_tie=None, + constants=None, hybridize=False, + dtype=None, context=None): + self._var_tie = var_tie if var_tie is not None else {} + self._inherited_params = infr_params + self.train_params = train_params + super(GradTransferInference, self).__init__( + inference_algorithm=inference_algorithm, + grad_loop=grad_loop, constants=constants, + hybridize=hybridize, dtype=dtype, context=context) + + def _initialize_params(self): + self.params.initialize_with_carryover_params( + self._graphs, self.observed_variable_UUIDs, self._var_tie, + init_outcomes(self._inherited_params)) + self.params.fix_all() diff --git a/mxfusion/inference/inference.py b/mxfusion/inference/inference.py index fe6e686..fe2dc6f 100644 --- a/mxfusion/inference/inference.py +++ b/mxfusion/inference/inference.py @@ -21,7 +21,7 @@ import zipfile from .inference_parameters import InferenceParameters from ..common.config import get_default_device, get_default_dtype -from ..common.exceptions import InferenceError +from ..common.exceptions import InferenceError, SerializationError from ..util.inference import discover_shape_constants, init_outcomes from ..models import FactorGraph, Model, Posterior from ..util.serialization import ModelComponentEncoder, make_numpy, load_json_from_zip, load_parameters, \ @@ -61,7 +61,8 @@ def __init__(self, inference_algorithm, constants=None, def print_params(self): """ - Returns a string with the inference parameters nicely formatted for display, showing which model they came from and their name + uuid. + Returns a string with the inference parameters nicely formatted for display, showing which model they came from + and their name + uuid. 
Format: > infr.print_params() @@ -158,8 +159,9 @@ def run(self, **kwargs): """ Run the inference method. - :param **kwargs: The keyword arguments specify the data for inference self. The key of each argument is the name of the corresponding - variable in model definition and the value of the argument is the data in numpy array format. + :param kwargs: The keyword arguments specify the data for inference self. The key of each argument is the name + of the corresponding variable in model definition and the value of the argument is the data in numpy + array format. :returns: the samples of target variables (if not specified, the samples of all the latent variables) :rtype: {UUID: samples} """ @@ -232,8 +234,8 @@ def load_configuration(self, configuration, uuid_map): using the uuid_map parameter to store the correct current observed variables. - :param config_file: The loaded configuration dictionary - :type config_file: str + :param configuration: The loaded configuration dictionary + :type configuration: dict :param uuid_map: A map of previous/loaded model component uuids to their current variable in the loaded graph. :type uuid_map: { current_model_uuid : loaded_previous_uuid} @@ -243,10 +245,10 @@ def load_configuration(self, configuration, uuid_map): def get_serializable(self): """ - Returns the mimimum set of properties that the object needs to save in order to be + Returns the minimum set of properties that the object needs to save in order to be serialized down and loaded back in properly. :returns: A dictionary of configuration properties needed to serialize and reload this inference method. - :rtypes: Dictionary that is JSON serializable. + :rtype: Dictionary that is JSON serializable. 
""" return {'observed': self.observed_variable_UUIDs} @@ -271,8 +273,7 @@ def save(self, zip_filename=DEFAULT_ZIP): mxnet_parameters, mxnet_constants, variable_constants = self.params.get_serializable() configuration = self.get_serializable() graphs = [g.as_json()for g in self._graphs] - version_dict = {"serialization_version": - SERIALIZATION_VERSION} + version_dict = {"serialization_version": SERIALIZATION_VERSION} files_to_save = [] objects = [graphs, mxnet_parameters, mxnet_constants, @@ -338,6 +339,7 @@ def generate_executor(self, **kw): data_shapes = [kw[v] for v in self.observed_variable_names] if not self._initialized: + # TODO This function isn't defined anywhere? self._initialize_run(self._var_tie, self._inherited_params, data_shapes) self._initialized = True diff --git a/mxfusion/inference/inference_alg.py b/mxfusion/inference/inference_alg.py index 8ed624d..573fbe9 100644 --- a/mxfusion/inference/inference_alg.py +++ b/mxfusion/inference/inference_alg.py @@ -30,10 +30,11 @@ class ObjectiveBlock(HybridBlock): :type infr_method: a pointer to a function :param constants: the variables with constant values :type constants: {Variable UUID: int or float or mxnet.ndarray} - :param data_def: a list of variable UUID, which corresponds to the order of variables expected as the positional arguments in "hybrid_forward". + :param data_def: a list of variable UUID, which corresponds to the order of variables expected as the positional + arguments in "hybrid_forward". :type data_def: [UUID] :param var_trans: the transformations applied variables - :type var_trains: {UUID: VariableTransformation} + :type var_trans: {UUID: VariableTransformation} :param var_ties: A dictionary of variables that are tied and use the MXNet Parameter of the dict value uuid. :type var_ties: { UUID of source variable: UUID of target variable} :param excluded: a set of variables excluded from being set as Block parameters. 
@@ -58,7 +59,7 @@ def __init__(self, infr_method, constants, data_def, var_trans, var_ties, def hybrid_forward(self, F, x, *args, **kw): """ - This function does all the preprocesses and postprocesses for the execution of a InferenceAlgorithm. + This function does all the pre-processes and post-processes for the execution of a InferenceAlgorithm. :param F: the MXNet computation mode :type F: mxnet.symbol or mxnet.ndarray @@ -94,14 +95,6 @@ class InferenceAlgorithm(ABC): The abstract class for an inference algorithm. A concrete inference algorithm will inherit this class and overload the "compute" function with the actual computation logic. - - :param model: the definition of the probabilistic model - :type model: Model - :param observed: A list of observed variables - :type observed: [Variable] - :param extra_graphs: a list of extra FactorGraph used in the inference - algorithm. - :type extra_graphs: [FactorGraph] """ def replicate_self(self, model, extra_graphs=None): @@ -115,8 +108,17 @@ def replicate_self(self, model, extra_graphs=None): replicant._observed_names = [v.name for v in observed] return replicant - def __init__(self, model, observed, extra_graphs=None): + """ + Initialize the algorithm + + :param model: the definition of the probabilistic model + :type model: Model + :param observed: A list of observed variables + :type observed: [Variable] + :param extra_graphs: a list of extra FactorGraph used in the inference algorithm. + :type extra_graphs: [FactorGraph] + """ self._model_graph = model self._extra_graphs = extra_graphs if extra_graphs is not None else [] self._graphs = [model] if extra_graphs is None else \ @@ -162,11 +164,15 @@ def graphs(self): def prepare_executor(self, rv_scaling=None): """ - Prepare the creation of an executor. This includes collecting the list of variable transformations and the list of the variables that are inherited from external Gluon blocks, and setting log_pdf_scaling for random variables. 
+ Prepare the creation of an executor. This includes collecting the list of variable transformations and the list + of the variables that are inherited from external Gluon blocks, and setting log_pdf_scaling for random + variables. - :param rv_scaling: The scaling of log_pdf of the random variables that are set by users for data sub-sampling or mini-batch learning. + :param rv_scaling: The scaling of log_pdf of the random variables that are set by users for data sub-sampling + or mini-batch learning. :type rv_scaling: {UUID: float} - :returns: the list of the variable transformations and the list of the variables that are excluded from being set as Gluon block parameters (see the excluded argument of __init__ of ObjectiveBlock). + :returns: the list of the variable transformations and the list of the variables that are excluded from being + set as Gluon block parameters (see the excluded argument of __init__ of ObjectiveBlock). :rtypes: {str(UUID): Transformation}, set(str(UUID)) """ excluded = set() @@ -176,8 +182,6 @@ def prepare_executor(self, rv_scaling=None): for v in g.variables.values(): if v.type == VariableType.PARAMETER and v.transformation is not None: var_trans[v.uuid] = v.transformation - if v.type == VariableType.PARAMETER and v.isInherited: - excluded.add(v.uuid) if v.type == VariableType.RANDVAR: if v.uuid in rv_scaling: v.factor.log_pdf_scaling = rv_scaling[v.uuid] @@ -197,7 +201,8 @@ def create_executor(self, data_def, params, var_ties, rv_scaling=None): :type params: InferenceParameters :param var_ties: A dictionary of variables that are tied and use the MXNet Parameter of the dict value uuid. :type var_ties: { UUID of source variable: UUID of target variable} - :param rv_scaling: The scaling of log_pdf of the random variables that are set by users for data sub-sampling or mini-batch learning. + :param rv_scaling: The scaling of log_pdf of the random variables that are set by users for data sub-sampling + or mini-batch learning. 
:type rv_scaling: {UUID: float} :returns: the Gluon block computing the outcome of inference :rtype: mxnet.gluon.HybridBlock @@ -230,7 +235,8 @@ def compute(self, F, variables): def set_parameter(self, variables, target_variable, target_value): """ - Set the value of a variable as the artifacts of this inference algorithm. This triggers to set the value to the corresponding variable into InferenceParameters at the end of inference. + Set the value of a variable as the artifacts of this inference algorithm. This triggers to set the value to the + corresponding variable into InferenceParameters at the end of inference. :param variables: the set of MXNet arrays that holds the values of all the variables at runtime. @@ -257,8 +263,7 @@ class SamplingAlgorithm(InferenceAlgorithm): :type num_samples: int :param target_variables: (optional) the target variables to sample :type target_variables: [UUID] - :param extra_graphs: a list of extra FactorGraph used in the inference - algorithm. + :param extra_graphs: a list of extra FactorGraph used in the inference algorithm. :type extra_graphs: [FactorGraph] """ @@ -273,7 +278,8 @@ def compute(self, F, variables): """ The abstract method for the computation of the inference algorithm. - If inference algorithm is used for gradient based optimizations, it should return two values. The first for the loss function, the second the gradient of the loss function. + If inference algorithm is used for gradient based optimizations, it should return two values. + The first for the loss function, the second the gradient of the loss function. :param F: the execution context (mxnet.ndarray or mxnet.symbol) :type F: Python module @@ -281,6 +287,7 @@ def compute(self, F, variables): variables at runtime. :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} :returns: the outcome of the inference algorithm - :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol. If gradient based, will return two values. 
The first the loss function, the second the gradient of the loss function. + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol. If gradient based, will return two values. + The first the loss function, the second the gradient of the loss function. """ raise NotImplementedError diff --git a/mxfusion/inference/inference_parameters.py b/mxfusion/inference/inference_parameters.py index 398c309..768ae74 100644 --- a/mxfusion/inference/inference_parameters.py +++ b/mxfusion/inference/inference_parameters.py @@ -14,16 +14,13 @@ import warnings -import numpy as np import mxnet as mx from mxnet import initializer -from mxnet import ndarray from mxnet.gluon import ParameterDict from ..components.variables import VariableType, Variable from ..components import ModelComponent from ..util.inference import realize_shape from ..common.config import get_default_device, get_default_dtype -from ..components.functions.gluon_func_eval import GluonFunctionEvaluation class InferenceParameters(object): @@ -75,18 +72,11 @@ def initialize_params(self, graphs, observed_uuid): self._params = ParameterDict() for g in graphs: - # load in parameterdict from external gluon blocks. 
- for f in g.functions.values(): - if isinstance(f, GluonFunctionEvaluation): - self._params.update( - f.function.collect_gluon_parameters()) - for var in g.get_constants(): self._constants[var.uuid] = var.constant excluded = set(self._constants.keys()).union(observed_uuid) - for var in g.get_parameters(excluded=excluded, - include_inherited=False): + for var in g.get_parameters(excluded=excluded): var_shape = realize_shape(var.shape, self._constants) init = initializer.Constant(var.initial_value_before_transformation) \ if var.initial_value is not None else None @@ -146,6 +136,10 @@ def initialize_with_carryover_params(self, graphs, observed_uuid, var_ties, # if to_var_uuid in carryover.param_dict} self._params.update(carryover_pairs) + def fix_all(self): + for p in self.param_dict.values(): + p.grad_req = 'null' + @property def param_dict(self): return self._params @@ -161,8 +155,7 @@ def var_ties(self): def __getitem__(self, key, ctx=None): if not isinstance(key, Variable): raise KeyError("The access key of inference parameter needs to be Variable, but got "+str(type(key))+".") - pkey = key.inherited_name if key.isInherited else key.uuid - val = self._params.get(pkey).data(ctx) + val = self._params.get(key.uuid).data(ctx) if key.transformation is not None: val = key.transformation.transform(val) return val diff --git a/mxfusion/inference/meanfield.py b/mxfusion/inference/meanfield.py index 537bec1..68e2350 100644 --- a/mxfusion/inference/meanfield.py +++ b/mxfusion/inference/meanfield.py @@ -25,8 +25,8 @@ def create_Gaussian_meanfield(model, observed, dtype=None): """ Create the Meanfield posterior for Variational Inference. 
- :param model_graph: the definition of the probabilistic model - :type model_graph: Model + :param model: the definition of the probabilistic model + :type model: Model :param observed: A list of observed variables :type observed: [Variable] :returns: the resulting posterior representation diff --git a/mxfusion/inference/minibatch_loop.py b/mxfusion/inference/minibatch_loop.py index e196824..517cd0c 100644 --- a/mxfusion/inference/minibatch_loop.py +++ b/mxfusion/inference/minibatch_loop.py @@ -14,8 +14,8 @@ import mxnet as mx -from .grad_loop import GradLoop from mxnet.gluon.data import ArrayDataset +from .grad_loop import GradLoop class MinibatchInferenceLoop(GradLoop): @@ -40,7 +40,7 @@ def __init__(self, batch_size=100, rv_scaling=None): if rv_scaling is not None else rv_scaling def run(self, infr_executor, data, param_dict, ctx, optimizer='adam', - learning_rate=1e-3, max_iter=1000, verbose=False): + learning_rate=1e-3, max_iter=1000, verbose=False, update_shape_constants=None): """ :param infr_executor: The MXNet function that computes the training objective. :type infr_executor: MXNet Gluon Block @@ -58,6 +58,8 @@ def run(self, infr_executor, data, param_dict, ctx, optimizer='adam', :type max_iter: int :param verbose: whether to print per-iteration messages. 
:type verbose: boolean + :param update_shape_constants: The callback function to update the shape constants according to the size of minibatch + :type update_shape_constants: Python function """ if isinstance(data, mx.gluon.data.DataLoader): @@ -74,6 +76,10 @@ def run(self, infr_executor, data, param_dict, ctx, optimizer='adam', L_e = 0 n_batches = 0 for i, data_batch in enumerate(data_loader): + if not isinstance(data_batch, list or tuple): + data_batch = [data_batch] + if update_shape_constants is not None: + update_shape_constants(data_batch) with mx.autograd.record(): loss, loss_for_gradient = infr_executor(mx.nd.zeros(1, ctx=ctx), *data_batch) loss_for_gradient.backward() diff --git a/mxfusion/inference/pilco_alg.py b/mxfusion/inference/pilco_alg.py new file mode 100644 index 0000000..04d83ed --- /dev/null +++ b/mxfusion/inference/pilco_alg.py @@ -0,0 +1,92 @@ +# Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"). +# You may not use this file except in compliance with the License. +# A copy of the License is located at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# or in the "license" file accompanying this file. This file is distributed +# on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either +# express or implied. See the License for the specific language governing +# permissions and limitations under the License. +# ============================================================================== + +import mxnet as mx + +from .inference_alg import SamplingAlgorithm +from ..common.config import get_default_dtype, get_default_device + + +class PILCOAlgorithm(SamplingAlgorithm): + """ + Sampling-based inference algorithm that returns the expectation of each variable in the model. 
+ + :param model: the definition of the probabilistic model + :type model: Model + :param observed: A list of observed variables + :type observed: [Variable] + :param num_samples: the number of samples used in estimating the variational lower bound + :type num_samples: int + :param target_variables: (optional) the target variables to sample + :type target_variables: [UUID] + :param extra_graphs: a list of extra FactorGraph used in the inference + algorithm. + :type extra_graphs: [FactorGraph] + """ + def __init__(self, model, observed, cost_function, policy, n_time_steps, initial_state_generator, extra_graphs=None, num_samples=3, ctx=None, dtype=None): + """ + :param model: The model to use to generate the next state from a state/action pair. + :param observed: Observed variables for the model. + :param cost_function: The cost function to evaluate state/action pairs on. + :param policy: The policy function to determine what action to take next from a particular state. + :param n_time_steps: How many time steps to roll forward using the model+policy to generate a trajectory. + :param initial_state_generator: Function that generates initial states for the model to begin at. + :param num_samples: How many sample trajectories to compute at once + """ + super(PILCOAlgorithm, self).__init__(model, observed, extra_graphs=extra_graphs) + self.cost_function = cost_function + self.policy = policy + self.initial_state_generator = initial_state_generator + self.n_time_steps = n_time_steps + self.num_samples = num_samples + self.dtype = dtype if dtype is not None else get_default_dtype() + self.mxnet_context = ctx if ctx is not None else get_default_device() + + + def compute(self, F, variables): + """ + Compute the PILCO algorithm's policy computation loop. + + 1. Generates a number of initial state + action pairs + 2. For each state+action pair: + 1. Predict the new state (s_t_plus_1) given the current state and action pair + 2. Compute the cost of being in that state + 3. 
Use the policy to compute the next action (a_t_plus_1) to take from s_t_plus_1 + 4. Repeat n_time_steps into the future, using the previous round's state/action pairs to roll forward. + 3. Return the total cost of all sample trajectories over time. + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. + :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.NDArray or mxnet.Symbol + """ + s_0 = self.initial_state_generator(self.num_samples) + a_0 = self.policy(s_0) + a_t_plus_1 = a_0 + x_t = F.expand_dims(F.concat(s_0, a_0, dim=1), axis=1) + cost = 0 + for t in range(self.n_time_steps): + variables[self.model.X] = x_t + res = self.model.Y.factor.predict(F, variables, targets=[self.model.Y], num_samples=self.num_samples)[0] + s_t_plus_1 = res[0] + + cost = cost + self.cost_function(s_t_plus_1, a_t_plus_1) + + a_t_plus_1 = mx.nd.expand_dims(self.policy(s_t_plus_1), axis=2) + x_t = mx.nd.concat(s_t_plus_1, a_t_plus_1, dim=2) + total_cost = F.sum(cost) + return total_cost, total_cost diff --git a/mxfusion/inference/prediction.py b/mxfusion/inference/prediction.py index 40634a3..7c86d79 100644 --- a/mxfusion/inference/prediction.py +++ b/mxfusion/inference/prediction.py @@ -21,7 +21,8 @@ class ModulePredictionAlgorithm(SamplingAlgorithm): """ - A prediction algorithm for modules. The algorithm evaluates all the functions, draws samples from distributions and runs the predict method on all the modules. + A prediction algorithm for modules. The algorithm evaluates all the functions, draws samples from distributions and + runs the predict method on all the modules. 
:param model: the definition of the probabilistic model :type model: Model @@ -61,7 +62,8 @@ def compute(self, F, variables): if all(known): continue elif any(known): - raise InferenceError("Part of the outputs of the distribution " + f.__class__.__name__ + " has been observed!") + raise InferenceError("Part of the outputs of the distribution " + f.__class__.__name__ + + " has been observed!") outcome_uuid = [v.uuid for _, v in f.outputs] outcome = f.draw_samples( F=F, num_samples=self.num_samples, variables=variables, diff --git a/mxfusion/inference/score_function.py b/mxfusion/inference/score_function.py index b82a983..c96c891 100644 --- a/mxfusion/inference/score_function.py +++ b/mxfusion/inference/score_function.py @@ -85,7 +85,8 @@ class ScoreFunctionRBInference(ScoreFunctionInference): """ Implemented following the [Black Box Variational Inference](https://arxiv.org/abs/1401.0118) paper. - The addition of Rao-Blackwellization and Control Variates (RBCV) requires that the posterior passed in be of meanfield form (i.e. all posterior variables independent.) + The addition of Rao-Blackwellization and Control Variates (RBCV) requires that the posterior passed in be of + meanfield form (i.e. all posterior variables independent.) Terminology: Lambda - Posterior parameters @@ -173,7 +174,6 @@ def compute(self, F, variables): gradient_lambda = F.sum(grad) - # Robbins-Monro sequence?? gradient_log_L = gradient_lambda + gradient_theta @@ -181,10 +181,12 @@ def compute(self, F, variables): def _extract_descendant_blanket_params(self, graph, node): """ - Returns a set of the markov blankets of all of the descendants of the node in the graph, mapped to their parameter form. + Returns a set of the markov blankets of all of the descendants of the node in the graph, + mapped to their parameter form. """ if node.graph != graph.components_graph: - raise InferenceError("Graph of node and graph to find it's descendants in differ. 
These should match so something went wrong.") + raise InferenceError("Graph of node and graph to find it's descendants in differ. " + "These should match so something went wrong.") descendants = graph.get_descendants(node) varset = [graph.get_markov_blanket(d) for d in descendants] diff --git a/mxfusion/inference/variational.py b/mxfusion/inference/variational.py index a438763..eaaa0ab 100644 --- a/mxfusion/inference/variational.py +++ b/mxfusion/inference/variational.py @@ -18,10 +18,8 @@ class VariationalInference(InferenceAlgorithm): """ - The class of the Stochastic Variational Inference (SVI) algorithm. + The base class for Variational Inference (VI) algorithms. - :param num_samples: the number of samples used in estimating the variational lower bound - :type num_samples: int :param model: the definition of the probabilistic model :type model: Model :param posterior: the definition of the variational posterior of the probabilistic model diff --git a/mxfusion/models/factor_graph.py b/mxfusion/models/factor_graph.py index c6fc0c3..b1a5311 100644 --- a/mxfusion/models/factor_graph.py +++ b/mxfusion/models/factor_graph.py @@ -162,8 +162,7 @@ def ordered_factors(self): :rtype: A topologically sorted list of Factors in the graph. """ - return [node for node in nx.topological_sort(self.components_graph) - if isinstance(node, Factor)] + return [node for node in nx.topological_sort(self.components_graph) if isinstance(node, Factor)] @property def roots(self): @@ -192,9 +191,9 @@ def var_ties(self): def log_pdf(self, F, variables, targets=None): """ - Compute the logarithm of the probability/probability density of a set of random variables in the factor graph. The set of random - variables are specified in the "target" argument and any necessary conditional variables are specified in the "conditionals" argument. - Any relevant constants are specified in the "constants" argument. 
+ Compute the logarithm of the probability/probability density of a set of random variables in the factor graph. + The set of random variables are specified in the "target" argument and any necessary conditional variables are + specified in the "conditionals" argument. Any relevant constants are specified in the "constants" argument. :param F: the MXNet computation mode (``mxnet.symbol`` or ``mxnet.ndarray``). :param variables: The set of variables @@ -215,7 +214,9 @@ def log_pdf(self, F, variables, targets=None): outcome_uuid = [v.uuid for _, v in f.outputs] for v, uuid in zip(outcome, outcome_uuid): if uuid in variables: - warnings.warn('Function evaluation in FactorGraph.compute_log_prob_RT: the outcome variable '+str(uuid)+' of the function evaluation '+str(f)+' has already existed in the variable set.') + warnings.warn('Function evaluation in FactorGraph.compute_log_prob_RT: the outcome variable ' + + str(uuid) + ' of the function evaluation ' + str(f) + + ' has already existed in the variable set.') variables[uuid] = v elif isinstance(f, Distribution): if targets is None or f.random_variable.uuid in targets: @@ -232,13 +233,16 @@ def log_pdf(self, F, variables, targets=None): logL = logL + F.sum(expectation(F, f.log_pdf( F=F, variables=variables, targets=module_targets))) else: - raise ModelSpecificationError("There is an object in the factor graph that isn't a factor." + "That shouldn't happen.") + raise ModelSpecificationError("There is an object in the factor graph that isn't a factor." + + "That shouldn't happen.") return logL def draw_samples(self, F, variables, num_samples=1, targets=None): """ - Draw samples from the target variables of the Factor Graph. If the ``targets`` argument is None, draw samples from all the variables - that are *not* in the conditional variables. 
If the ``targets`` argument is given, this method returns a list of samples of variables in the order of the target argument, otherwise it returns a dict of samples where the keys are the UUIDs of variables and the values are the samples. + Draw samples from the target variables of the Factor Graph. If the ``targets`` argument is None, draw samples + from all the variables that are *not* in the conditional variables. If the ``targets`` argument is given, + this method returns a list of samples of variables in the order of the target argument, otherwise it returns a + dict of samples where the keys are the UUIDs of variables and the values are the samples. :param F: the MXNet computation mode (``mxnet.symbol`` or ``mxnet.ndarray``). :param variables: The set of variables @@ -258,7 +262,9 @@ def draw_samples(self, F, variables, num_samples=1, targets=None): outcome_uuid = [v.uuid for _, v in f.outputs] for v, uuid in zip(outcome, outcome_uuid): if uuid in variables: - warnings.warn('Function evaluation in FactorGraph.draw_samples_RT: the outcome of the function evaluation '+str(f)+' has already existed in the variable set.') + warnings.warn('Function evaluation in FactorGraph.draw_samples_RT: ' + 'the outcome of the function evaluation ' + str(f) + + ' has already existed in the variable set.') variables[uuid] = v samples[uuid] = v elif isinstance(f, Distribution): @@ -266,7 +272,8 @@ def draw_samples(self, F, variables, num_samples=1, targets=None): if all(known): continue elif any(known): - raise InferenceError("Part of the outputs of the distribution " + f.__class__.__name__ + " has been observed!") + raise InferenceError("Part of the outputs of the distribution " + + f.__class__.__name__ + " has been observed!") outcome_uuid = [v.uuid for _, v in f.outputs] outcome = f.draw_samples( F=F, num_samples=num_samples, variables=variables, always_return_tuple=True) @@ -282,7 +289,8 @@ def draw_samples(self, F, variables, num_samples=1, targets=None): variables[uuid] = v 
samples[uuid] = v else: - raise ModelSpecificationError("There is an object in the factor graph that isn't a factor." + "That shouldn't happen.") + raise ModelSpecificationError("There is an object in the factor graph that isn't a factor." + + "That shouldn't happen.") if targets: return tuple(samples[uuid] for uuid in targets) else: @@ -302,7 +310,7 @@ def remove_component(self, component): try: self.components_graph.remove_node(component) # implicitly removes edges except NetworkXError as e: - raise ModelSpecificationError("Attempted to remove a node "+str(component)+" that isn't in the graph.") + raise ModelSpecificationError("Attempted to remove a node " + str(component) + " that isn't in the graph.") if component.name is not None: @@ -322,14 +330,18 @@ def _replicate_class(self, **kwargs): def get_markov_blanket(self, node): """ - Gets the Markov Blanket for a node, which is the node's predecessors, the nodes successors, and those successors' other predecessors. + Gets the Markov Blanket for a node, which is the node's predecessors, the nodes successors, and those + successors' other predecessors. """ def get_variable_predecessors(node): return [v2 for k1,v1 in node.predecessors for k2,v2 in v1.predecessors if isinstance(v2, Variable)] + def get_variable_successors(node): return [v2 for k1,v1 in node.successors for k2,v2 in v1.successors if isinstance(v2, Variable)] + def flatten(node_list): return set([p for varset in node_list for p in varset]) + successors = set(get_variable_successors(node)) n = set([node]) pred = set(get_variable_predecessors(node)) @@ -381,8 +393,8 @@ def replace_subgraph(self, target_variable, new_subgraph): def extract_distribution_of(self, variable): """ - Extracts the distribution of the variable passed in, returning a replicated copy of the passed in variable with only its parent - subgraph attached (also replicated). 
+ Extracts the distribution of the variable passed in, returning a replicated copy of the passed in variable with + only its parent subgraph attached (also replicated). :param variable: The variable to extract the distribution from. :type variable: Variable @@ -400,14 +412,23 @@ def extract_distribution_function(component): return predecessor_direction, successor_direction return variable.replicate(replication_function=extract_distribution_function) - def clone(self, leaves=None): + """ + Clones a model, maintaining the same functionality and topology. Replicates all of its ModelComponents, + while maintaining the same UUIDs. + + Starts upward from the leaves and copies everything in the graph recursively. + + :param leaves: If None, use the leaves in this model, otherwise use the provided leaves. + :return: the cloned model + """ new_model = self._replicate_class(name=self.name, verbose=self._verbose) return self._clone(new_model, leaves) def _clone(self, new_model, leaves=None): """ - Clones a model, maintaining the same functionality and topology. Replicates all of its ModelComponents, while maintaining the same UUIDs. + Clones a model, maintaining the same functionality and topology. Replicates all of its ModelComponents, + while maintaining the same UUIDs. Starts upward from the leaves and copies everything in the graph recursively. 
@@ -415,13 +436,12 @@ def _clone(self, new_model, leaves=None): :returns: the cloned model """ - var_map = {} # from old model to new model + var_map = {} # from old model to new model leaves = self.leaves if leaves is None else leaves for v in leaves: if v.name is not None: - new_leaf = v.replicate(var_map=var_map, - replication_function=lambda x: ('recursive', 'recursive')) + new_leaf = v.replicate(var_map=var_map, replication_function=lambda x: ('recursive', 'recursive')) setattr(new_model, v.name, new_leaf) else: v.graph = new_model.graph @@ -430,7 +450,7 @@ def _clone(self, new_model, leaves=None): setattr(new_model, v.name, new_model[v.uuid]) return new_model - def get_parameters(self, excluded=None, include_inherited=False): + def get_parameters(self, excluded=None, include_inherited=True): """ Get all the parameters not in the excluded list. @@ -444,7 +464,8 @@ def get_parameters(self, excluded=None, include_inherited=False): if include_inherited: return [v for v in self.variables.values() if (v.type == VariableType.PARAMETER and v.uuid not in excluded)] else: - return [v for v in self.variables.values() if (v.type == VariableType.PARAMETER and v.uuid not in excluded and not v.isInherited)] + return [v for v in self.variables.values() if (v.type == VariableType.PARAMETER and v.uuid not in excluded + and not v.isInherited)] def get_constants(self): """ @@ -455,44 +476,45 @@ def get_constants(self): """ return [v for v in self.variables.values() if v.type == VariableType.CONSTANT] - @staticmethod - def reconcile_graphs(current_graphs, primary_previous_graph, secondary_previous_graphs=None, primary_current_graph=None): + def reconcile_graphs(current_graphs, primary_previous_graph, secondary_previous_graphs=None, + primary_current_graph=None): """ Reconciles two sets of graphs, matching the model components in the previous graph to the current graph. 
- This is primarily used when loading back a graph from a file and matching it to an existing in-memory graph in order to load the previous - graph's parameters correctly. - - :param current_graphs: A list of the graphs we are reconciling a loaded factor graph against. This must be a fully built set of graphs - generated through the model definition process. - :param primary_previous_graph: A graph which may have been loaded in from a file and be partially specified, or could be a full graph - built through model definition. - :param secondary_previous_graphs: A list of secondary graphs (e.g. posteriors) that share components with the primary_previous_graph. - :param primary_current_graph: Optional parameter to specify the primary_current_graph, otherwise it is taken to be the model in the - current_graphs (which should be unique). + This is primarily used when loading back a graph from a file and matching it to an existing in-memory graph in + order to load the previous graph's parameters correctly. + + :param current_graphs: A list of the graphs we are reconciling a loaded factor graph against. This must be a + fully built set of graphs generated through the model definition process. + :param primary_previous_graph: A graph which may have been loaded in from a file and be partially specified, or + could be a full graph built through model definition. + :param secondary_previous_graphs: A list of secondary graphs (e.g. posteriors) that share components with the + primary_previous_graph. + :param primary_current_graph: Optional parameter to specify the primary_current_graph, otherwise it is taken to + be the model in the current_graphs (which should be unique). 
:rtype: {previous ModelComponent : current ModelComponent} """ def update_with_named_components(previous_components, current_components, component_map, nodes_to_traverse_from): - name_pre = {c.name: c for c in previous_components if c.name} - name_cur = {c.name: c for c in current_components if c.name} + name_pre = {c.name: c for c in previous_components if c.name} + name_cur = {c.name: c for c in current_components if c.name} for name, previous_c in name_pre.items(): current_c = name_cur[name] component_map[previous_c.uuid] = current_c.uuid nodes_to_traverse_from[previous_c.uuid] = current_c.uuid - - from .model import Model component_map = {} nodes_to_traverse_from = {} current_graph = primary_current_graph if primary_current_graph is not None else current_graphs[0] secondary_current_graphs = current_graphs[1:] secondary_previous_graphs = secondary_previous_graphs if secondary_previous_graphs is not None else [] if len(secondary_current_graphs) != len(secondary_previous_graphs): - raise ModelSpecificationError("Different number of secondary graphs passed in {} {}".format(secondary_current_graphs, secondary_previous_graphs)) + raise ModelSpecificationError("Different number of secondary graphs passed in {} {}".format( + secondary_current_graphs, secondary_previous_graphs)) - update_with_named_components(primary_previous_graph.components.values(), current_graph.components.values(), component_map, nodes_to_traverse_from) + update_with_named_components(primary_previous_graph.components.values(), current_graph.components.values(), + component_map, nodes_to_traverse_from) # Reconcile the primary graph FactorGraph._reconcile_graph(nodes_to_traverse_from, component_map, @@ -503,7 +525,8 @@ def update_with_named_components(previous_components, current_components, compon secondary_previous_graphs): nodes_to_traverse_from = {pc: cc for pc, cc in component_map.items() if pc in pg.components.keys()} - update_with_named_components(pg.components.values(), 
cg.components.values(), component_map, nodes_to_traverse_from) + update_with_named_components(pg.components.values(), cg.components.values(), component_map, + nodes_to_traverse_from) FactorGraph._reconcile_graph( nodes_to_traverse_from, component_map, cg, pg) @@ -513,14 +536,16 @@ def update_with_named_components(previous_components, current_components, compon @staticmethod def _reconcile_graph(nodes_to_traverse_from, component_map, current_graph, previous_graph): """ - Traverses the components (breadth first) in nodes_to_traverse_from of the current_graph/previous_graph, matching components where possible and generating - new calls to _reconcile_graph where the graph is still incompletely traversed. This method makes no attempt to resolve ambiguities - in naming between the graphs and request the user to more completely specify names in their graph if such an ambiguity exists. Such + Traverses the components (breadth first) in nodes_to_traverse_from of the current_graph/previous_graph, + matching components where possible and generating new calls to _reconcile_graph where the graph is still + incompletely traversed. This method makes no attempt to resolve ambiguities in naming between the graphs and + request the user to more completely specify names in their graph if such an ambiguity exists. Such naming can be more completely specified by attaching names to each leaf node in the original graph. :param nodes_to_traverse_from: A list of items to traverse the graph upwards from. :type nodes_to_traverse_from: [previous ModelComponents] - :param component_map: The current mapping from the previous graph's MCs to the current_graph's MCs. This is used and modified during reconciliation. + :param component_map: The current mapping from the previous graph's MCs to the current_graph's MCs. + This is used and modified during reconciliation. 
:type component_map: {previous_graph ModelComponent : current_graph ModelComponent} :param current_graph: The current graph to match components against. :type current_graph: FactorGraph @@ -540,8 +565,10 @@ def reconcile_direction(direction, previous_c, current_c, new_level, component_m for edge_name, node in previous_neighbors: if node.uuid not in component_map: if edge_name in duplicate_names: - # TODO if all the other parts of the ambiguity are resolved, we have the answer still. Otherwise throw an exception - raise Exception("Multiple edges connecting unnamed nodes have the same name, this isn't supported currently.") # TODO Support the ambiguities :) + # TODO if all the other parts of the ambiguity are resolved, we have the answer still. + # Otherwise throw an exception + raise Exception("Multiple edges connecting unnamed nodes have the same name, " + "this isn't supported currently.") # TODO Support the ambiguities :) current_node = [item for name, item in current_neighbors if edge_name == name][0] component_map[node.uuid] = current_node.uuid new_level[node.uuid] = current_node.uuid @@ -550,10 +577,13 @@ def reconcile_direction(direction, previous_c, current_c, new_level, component_m component_map.update(module_component_map) new_level = {} for previous_c, current_c in nodes_to_traverse_from.items(): - reconcile_direction('predecessor', previous_graph[previous_c], current_graph[current_c], new_level, component_map) + reconcile_direction('predecessor', previous_graph[previous_c], current_graph[current_c], new_level, + component_map) """ - TODO Reconciling in both directions currently breaks the reconciliation process and can cause multiple previous_uuid's to map to the same current_uuid. It's unclear why that happens. - This shouldn't be necessary until we implement multi-output Factors though (and even then, only if not all the outputs are in a named chain). 
+ TODO Reconciling in both directions currently breaks the reconciliation process and can cause multiple + previous_uuid's to map to the same current_uuid. It's unclear why that happens. This shouldn't be necessary + until we implement multi-output Factors though (and even then, only if not all the outputs are in a + named chain). """ # reconcile_direction('successor', previous_graph[c], current_graph[current_c], new_level, component_map) if len(new_level) > 0: @@ -575,14 +605,15 @@ def load_from_json(self, json_graph): @staticmethod def load_graphs(graphs_list, existing_graphs=None): """ - Method to load back in a graph. The graphs should have been saved down using the save method, and be a JSON representation of the graph - generated by the [networkx](https://networkx.github.io) library. + Method to load back in a graph. The graphs should have been saved down using the save method, and be a JSON + representation of the graph generated by the [networkx](https://networkx.github.io) library. :param graphs_list: A list of raw json dicts loaded in from memory representing the FactorGraphs to create. :type graphs_list: list of dicts loaded in using the ModelComponentDecoder class. """ import json - existing_graphs = existing_graphs if existing_graphs is not None else [FactorGraph(graph['name']) for graph in graphs_list] + existing_graphs = existing_graphs if existing_graphs is not None else [FactorGraph(graph['name']) + for graph in graphs_list] return [existing_graph.load_from_json(graph) for existing_graph, graph in zip(existing_graphs, graphs_list)] def as_json(self): @@ -598,8 +629,8 @@ def as_json(self): @staticmethod def save(graph_file, json_graphs): """ - Method to save this graph down into a file. The graph file will be saved down as a JSON representation of the graph generated by the - [networkx](https://networkx.github.io) library. + Method to save this graph down into a file. 
The graph file will be saved down as a JSON representation of the + graph generated by the [networkx](https://networkx.github.io) library. :param graph_file: The file containing the primary model to load back for this inference algorithm. :type graph_file: str of filename diff --git a/mxfusion/modules/gp_modules/__init__.py b/mxfusion/modules/gp_modules/__init__.py index 14ee835..b4a9bb5 100644 --- a/mxfusion/modules/gp_modules/__init__.py +++ b/mxfusion/modules/gp_modules/__init__.py @@ -28,6 +28,6 @@ __all__ = ['gp_regression', 'sparsegp_regression', 'svgp_regression'] -from .gp_regression import GPRegression -from .sparsegp_regression import SparseGPRegression +from .gp_regression import GPRegression, GPRegressionSamplingPrediction +from .sparsegp_regression import SparseGPRegression, SparseGPRegressionSamplingPrediction from .svgp_regression import SVGPRegression diff --git a/mxfusion/modules/gp_modules/gp_regression.py b/mxfusion/modules/gp_modules/gp_regression.py index a3de449..7ba80c6 100644 --- a/mxfusion/modules/gp_modules/gp_regression.py +++ b/mxfusion/modules/gp_modules/gp_regression.py @@ -40,6 +40,7 @@ def __init__(self, model, posterior, observed, jitter=0.): self.jitter = jitter def compute(self, F, variables): + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] Y = variables[self.model.Y] noise_var = variables[self.model.noise_var] @@ -59,8 +60,8 @@ def compute(self, F, variables): self.jitter L = F.linalg.potrf(K) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] Y = Y - mean LinvY = F.linalg.trsm(L, Y) logdet_l = F.linalg.sumlogdiag(F.abs(L)) @@ -89,6 +90,18 @@ def __init__(self, model, observed, num_samples=1, target_variables=None, rand_gen def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the 
set of MXNet arrays that holds the values of + variables at runtime. + :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] noise_var = variables[self.model.noise_var] N = X.shape[-2] @@ -110,8 +123,8 @@ def compute(self, F, variables): dtype=self.model.F.factor.dtype) y_samples = F.linalg.trmm(L, die) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] y_samples = y_samples + mean samples = {self.model.Y.uuid: y_samples} @@ -131,6 +144,18 @@ def __init__(self, model, posterior, observed, noise_free=True, self.diagonal_variance = diagonal_variance def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. + :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] N = X.shape[-2] noise_var = variables[self.model.noise_var] @@ -147,8 +172,8 @@ def compute(self, F, variables): LinvKxt = F.linalg.trsm(L, Kxt) mu = F.linalg.gemm2(LinvKxt, LinvY, True, False) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] mu = mu + mean if self.diagonal_variance: @@ -172,6 +197,9 @@ def compute(self, F, variables): class GPRegressionSamplingPrediction(SamplingAlgorithm): + """ + The method for drawing samples from the posterior distribution of a Gaussian process regression model. 
+ """ def __init__(self, model, posterior, observed, rand_gen=None, noise_free=True, diagonal_variance=True, jitter=0.): super(GPRegressionSamplingPrediction, self).__init__( @@ -183,6 +211,18 @@ def __init__(self, model, posterior, observed, rand_gen=None, self.jitter = jitter def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. + :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] N = X.shape[-2] noise_var = variables[self.model.noise_var] @@ -199,8 +239,8 @@ def compute(self, F, variables): LinvKxt = F.linalg.trsm(L, Kxt) mu = F.linalg.gemm2(LinvKxt, LinvY, True, False) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] mu = mu + mean if self.diagonal_variance: @@ -247,8 +287,8 @@ class GPRegression(Module): :type kernel: Kernel :param noise_var: the variance of the Gaussian likelihood :type noise_var: Variable - :param mean_func: the mean function of Gaussian process. - :type mean_func: MXFusionFunction + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. 
@@ -257,7 +297,7 @@ class GPRegression(Module): :type ctx: None or mxnet.cpu or mxnet.gpu """ - def __init__(self, X, kernel, noise_var, mean_func=None, rand_gen=None, + def __init__(self, X, kernel, noise_var, mean=None, rand_gen=None, dtype=None, ctx=None): if not isinstance(X, Variable): X = Variable(value=X) @@ -265,21 +305,26 @@ def __init__(self, X, kernel, noise_var, mean_func=None, rand_gen=None, noise_var = Variable(value=noise_var) inputs = [('X', X), ('noise_var', noise_var)] input_names = [k for k, _ in inputs] + if mean is not None: + inputs.append(('mean', mean)) + input_names.append('mean') + self._has_mean = True + else: + self._has_mean = False output_names = ['random_variable'] super(GPRegression, self).__init__( inputs=inputs, outputs=None, input_names=input_names, output_names=output_names, rand_gen=rand_gen, dtype=dtype, ctx=ctx) - self.mean_func = mean_func self.kernel = kernel - def _generate_outputs(self, output_shapes=None): + def _generate_outputs(self, output_shapes): """ Generate the output of the module with given output_shapes. 
- :param output_shape: the shapes of all the output variables - :type output_shape: {str: tuple} + :param output_shapes: the shapes of all the output variables + :type output_shapes: {str: tuple} """ - if output_shapes is None: + if output_shapes['random_variable'] is None: Y_shape = self.X.shape[:-1] + (1,) else: Y_shape = output_shapes['random_variable'] @@ -293,15 +338,19 @@ def _build_module_graphs(self): graph = Model(name='gp_regression') graph.X = self.X.replicate_self() graph.noise_var = self.noise_var.replicate_self() + if self._has_mean: + mean = self.mean.replicate_self() + graph.mean = mean + else: + mean = None graph.F = GaussianProcess.define_variable( X=graph.X, kernel=self.kernel, shape=Y.shape, - mean_func=self.mean_func, rand_gen=self._rand_gen, + mean=mean, rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx) graph.Y = Y.replicate_self() graph.Y.set_prior(Normal( mean=graph.F, variance=broadcast_to(graph.noise_var, graph.Y.shape), rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx)) - graph.mean_func = self.mean_func graph.kernel = graph.F.factor.kernel # The posterior graph is used to store parameters for prediction post = Posterior(graph) @@ -321,8 +370,7 @@ def _attach_default_inference_algorithms(self): [v for k, v in self.outputs] self.attach_log_pdf_algorithms( targets=self.output_names, conditionals=self.input_names, - algorithm=GPRegressionLogPdf(self._module_graph, self._extra_graphs[0], - observed), + algorithm=GPRegressionLogPdf(self._module_graph, self._extra_graphs[0], observed), alg_name='gp_log_pdf') observed = [v for k, v in self.inputs] @@ -339,7 +387,7 @@ def _attach_default_inference_algorithms(self): alg_name='gp_predict') @staticmethod - def define_variable(X, kernel, noise_var, shape=None, mean_func=None, + def define_variable(X, kernel, noise_var, shape=None, mean=None, rand_gen=None, dtype=None, ctx=None): """ Creates and returns a variable drawn from a Gaussian process regression. 
@@ -354,8 +402,8 @@ def define_variable(X, kernel, noise_var, shape=None, mean_func=None, :param shape: the shape of the random variable(s) (the default shape is the same shape as *X* but the last dimension is changed to one.) :type shape: tuple or [tuple] - :param mean_func: the mean function of Gaussian process - :type mean_func: MXFusionFunction + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator) :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers @@ -364,7 +412,7 @@ def define_variable(X, kernel, noise_var, shape=None, mean_func=None, :type ctx: None or mxnet.cpu or mxnet.gpu """ gp = GPRegression( - X=X, kernel=kernel, noise_var=noise_var, mean_func=mean_func, + X=X, kernel=kernel, noise_var=noise_var, mean=mean, rand_gen=rand_gen, dtype=dtype, ctx=ctx) gp._generate_outputs({'random_variable': shape}) return gp.random_variable @@ -376,5 +424,5 @@ def replicate_self(self, attribute_map=None): rep = super(GPRegression, self).replicate_self(attribute_map) rep.kernel = self.kernel.replicate_self(attribute_map) - rep.mean_func = None if self.mean_func is None else self.mean_func.replicate_self(attribute_map) + rep._has_mean = self._has_mean return rep diff --git a/mxfusion/modules/gp_modules/sparsegp_regression.py b/mxfusion/modules/gp_modules/sparsegp_regression.py index 3379243..57b7e48 100644 --- a/mxfusion/modules/gp_modules/sparsegp_regression.py +++ b/mxfusion/modules/gp_modules/sparsegp_regression.py @@ -40,6 +40,18 @@ def __init__(self, model, posterior, observed, jitter=0.): self.jitter = jitter def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. 
+ :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] Y = variables[self.model.Y] Z = variables[self.model.inducing_inputs] @@ -69,8 +81,8 @@ def compute(self, F, variables): F.broadcast_div(F.linalg.syrk(LinvKuf), noise_var_m) LA = F.linalg.potrf(A) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] Y = Y - mean LAInvLinvKufY = F.linalg.trsm(LA, F.linalg.gemm2(LinvKuf, Y)) @@ -105,6 +117,18 @@ def __init__(self, model, posterior, observed, target_variables=None, self.diagonal_variance = diagonal_variance def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. 
+ :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] N = X.shape[-2] Z = variables[self.model.inducing_inputs] @@ -121,8 +145,8 @@ def compute(self, F, variables): Kxt = kern.K(F, Z, X, **kern_params) mu = F.linalg.gemm2(Kxt, wv, True, False) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] mu = mu + mean LinvKxt = F.linalg.trsm(L, Kxt) @@ -162,6 +186,18 @@ def __init__(self, model, posterior, observed, rand_gen=None, self.jitter = jitter def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. + :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] N = X.shape[-2] Z = variables[self.model.inducing_inputs] @@ -178,8 +214,8 @@ def compute(self, F, variables): Kxt = kern.K(F, Z, X, **kern_params) mu = F.linalg.gemm2(Kxt, wv, True, False) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] mu = mu + mean LinvKxt = F.linalg.trsm(L, Kxt) @@ -231,12 +267,13 @@ class SparseGPRegression(Module): :type kernel: Kernel :param noise_var: the variance of the Gaussian likelihood :type noise_var: Variable - :param inducing_inputs: the inducing inputs of the sparse GP (optional). This variable will be auto-generated if not specified. + :param inducing_inputs: the inducing inputs of the sparse GP (optional). 
This variable will be auto-generated + if not specified. :type inducing_inputs: Variable - :param inducing_num: the number of inducing points of sparse GP (default: 10) - :type inducing_num: int - :param mean_func: the mean function of Gaussian process. - :type mean_func: MXFusionFunction + :param num_inducing: the number of inducing points of sparse GP (default: 10) + :type num_inducing: int + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. @@ -246,7 +283,7 @@ class SparseGPRegression(Module): """ def __init__(self, X, kernel, noise_var, inducing_inputs=None, - num_inducing=10, mean_func=None, + num_inducing=10, mean=None, rand_gen=None, dtype=None, ctx=None): if not isinstance(X, Variable): X = Variable(value=X) @@ -257,21 +294,26 @@ def __init__(self, X, kernel, noise_var, inducing_inputs=None, inputs = [('X', X), ('inducing_inputs', inducing_inputs), ('noise_var', noise_var)] input_names = [k for k, _ in inputs] + if mean is not None: + inputs.append(('mean', mean)) + input_names.append('mean') + self._has_mean = True + else: + self._has_mean = False output_names = ['random_variable'] super(SparseGPRegression, self).__init__( inputs=inputs, outputs=None, input_names=input_names, output_names=output_names, rand_gen=rand_gen, dtype=dtype, ctx=ctx) - self.mean_func = mean_func self.kernel = kernel def _generate_outputs(self, output_shapes=None): """ Generate the output of the module with given output_shapes. 
- :param output_shape: the shapes of all the output variables - :type output_shape: {str: tuple} + :param output_shapes: the shapes of all the output variables + :type output_shapes: {str: tuple} """ - if output_shapes is None: + if output_shapes['random_variable'] is None: Y_shape = self.X.shape[:-1] + (1,) else: Y_shape = output_shapes['random_variable'] @@ -290,25 +332,24 @@ def _build_module_graphs(self): graph.U = GaussianProcess.define_variable( X=graph.inducing_inputs, kernel=self.kernel, shape=(graph.inducing_inputs.shape[0], Y.shape[-1]), - mean_func=self.mean_func, rand_gen=self._rand_gen, dtype=self.dtype, - ctx=self.ctx) + rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx) + if self._has_mean: + mean = self.mean.replicate_self() + graph.mean = mean + else: + mean = None graph.F = ConditionalGaussianProcess.define_variable( X=graph.X, X_cond=graph.inducing_inputs, Y_cond=graph.U, - kernel=self.kernel, shape=Y.shape, mean_func=self.mean_func, + kernel=self.kernel, shape=Y.shape, mean=mean, rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx) graph.Y = Y.replicate_self() graph.Y.set_prior(Normal( mean=graph.F, variance=broadcast_to(graph.noise_var, graph.Y.shape), rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx)) - graph.mean_func = self.mean_func graph.kernel = graph.U.factor.kernel post = Posterior(graph) - # TODO: allow cloning kernel to be in both model and posterior. - # post.F.assign_factor(ConditionalGaussianProcess( - # X=post.X, X_cond=post.inducing_inputs, Y_cond=post.U, - # kernel=self.kernel, mean_func=self.mean_func, - # rand_gen=self.rand_gen, dtype=self.dtype, ctx=self.ctx)) - # post.U.assign_factor(MultivariateNormal()) + # The posterior graph here is used as the place holder + # intermediate inference results, which will be used for prediction. 
post.L = Variable(shape=(M, M)) post.LA = Variable(shape=(M, M)) post.wv = Variable(shape=(M, Y.shape[-1])) @@ -325,7 +366,8 @@ def _attach_default_inference_algorithms(self): [v for k, v in self.outputs] self.attach_log_pdf_algorithms( targets=self.output_names, conditionals=self.input_names, - algorithm=SparseGPRegressionLogPdf(self._module_graph, self._extra_graphs[0], observed), alg_name='sgp_log_pdf') + algorithm=SparseGPRegressionLogPdf(self._module_graph, self._extra_graphs[0], observed), + alg_name='sgp_log_pdf') observed = [v for k, v in self.inputs] self.attach_draw_samples_algorithms( @@ -342,7 +384,7 @@ def _attach_default_inference_algorithms(self): @staticmethod def define_variable(X, kernel, noise_var, shape=None, inducing_inputs=None, - num_inducing=10, mean_func=None, rand_gen=None, + num_inducing=10, mean=None, rand_gen=None, dtype=None, ctx=None): """ Creates and returns a variable drawn from a sparse Gaussian process regression. @@ -356,12 +398,13 @@ def define_variable(X, kernel, noise_var, shape=None, inducing_inputs=None, :param shape: the shape of the random variable(s) (the default shape is the same shape as *X* but the last dimension is changed to one.) :type shape: tuple or [tuple] - :param inducing_inputs: the inducing inputs of the sparse GP (optional). This variable will be auto-generated if not specified. + :param inducing_inputs: the inducing inputs of the sparse GP (optional). This variable will be auto-generated + if not specified. :type inducing_inputs: Variable - :param inducing_num: the number of inducing points of sparse GP (default: 10) - :type inducing_num: int - :param mean_func: the mean function of Gaussian process. - :type mean_func: MXFusionFunction + :param num_inducing: the number of inducing points of sparse GP (default: 10) + :type num_inducing: int + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). 
:type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. @@ -372,7 +415,7 @@ def define_variable(X, kernel, noise_var, shape=None, inducing_inputs=None, gp = SparseGPRegression( X=X, kernel=kernel, noise_var=noise_var, inducing_inputs=inducing_inputs, num_inducing=num_inducing, - mean_func=mean_func, rand_gen=rand_gen, dtype=dtype, ctx=ctx) + mean=mean, rand_gen=rand_gen, dtype=dtype, ctx=ctx) gp._generate_outputs({'random_variable': shape}) return gp.random_variable @@ -383,5 +426,5 @@ def replicate_self(self, attribute_map=None): rep = super(SparseGPRegression, self).replicate_self(attribute_map) rep.kernel = self.kernel.replicate_self(attribute_map) - rep.mean_func = None if self.mean_func is None else self.mean_func.replicate_self(attribute_map) + rep._has_mean = self._has_mean return rep diff --git a/mxfusion/modules/gp_modules/svgp_regression.py b/mxfusion/modules/gp_modules/svgp_regression.py index 5161d74..bfbda08 100644 --- a/mxfusion/modules/gp_modules/svgp_regression.py +++ b/mxfusion/modules/gp_modules/svgp_regression.py @@ -31,7 +31,8 @@ class SVGPRegressionLogPdf(VariationalInference): """ - The inference algorithm for computing the variational lower bound of the stochastic variational Gaussian process with Gaussian likelihood. + The inference algorithm for computing the variational lower bound of the stochastic variational Gaussian process + with Gaussian likelihood. 
""" def __init__(self, model, posterior, observed, jitter=0.): super(SVGPRegressionLogPdf, self).__init__( @@ -40,6 +41,7 @@ def __init__(self, model, posterior, observed, jitter=0.): self.jitter = jitter def compute(self, F, variables): + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] Y = variables[self.model.Y] Z = variables[self.model.inducing_inputs] @@ -56,7 +58,13 @@ def compute(self, F, variables): X, Y, Z, noise_var, mu, S_W, S_diag, kern_params = arrays_as_samples( F, [X, Y, Z, noise_var, mu, S_W, S_diag, kern_params]) - noise_var_m = F.expand_dims(noise_var, axis=-2) + if noise_var.ndim == 2: # it is heteroscedastic noise, when ndim == 3 + noise_var = F.expand_dims(noise_var, axis=-2) + + if noise_var.shape[-1] == 1: + beta_sum = D*F.sum(1/noise_var, axis=-1) + else: + beta_sum = F.sum(1/noise_var, axis=-1) Kuu = kern.K(F, Z, **kern_params) if self.jitter > 0.: @@ -67,33 +75,35 @@ def compute(self, F, variables): S = F.linalg.syrk(S_W) + make_diagonal(F, S_diag) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] Y = Y - mean - psi1Y = F.linalg.gemm2(Kuf, Y, False, False) + psi1Y = F.linalg.gemm2(Kuf, Y/noise_var, False, False) L = F.linalg.potrf(Kuu) Ls = F.linalg.potrf(S) LinvLs = F.linalg.trsm(L, Ls) Linvmu = F.linalg.trsm(L, mu) LinvKuf = F.linalg.trsm(L, Kuf) - LinvKufY = F.linalg.trsm(L, psi1Y)/noise_var_m - LmInvPsi2LmInvT = F.linalg.syrk(LinvKuf)/noise_var_m - LinvSLinvT = F.linalg.syrk(LinvLs) - LmInvSmuLmInvT = LinvSLinvT*D + F.linalg.syrk(Linvmu) + KfuKuuInvmu = F.linalg.gemm2(LinvKuf, Linvmu, True, False) + KfuKuuInvLs = F.linalg.gemm2(LinvKuf, LinvLs, True, False) + + LinvKufY = F.linalg.trsm(L, psi1Y) KL_u = (M/2. + F.linalg.sumlogdiag(Ls))*D - F.linalg.sumlogdiag(L)*D\ - F.sum(F.sum(F.square(LinvLs), axis=-1), axis=-1)/2.*D \ - F.sum(F.sum(F.square(Linvmu), axis=-1), axis=-1)/2. logL = -F.sum(F.sum(F.square(Y)/noise_var + np.log(2. 
* np.pi) + - F.log(noise_var_m), axis=-1), axis=-1)/2. - logL = logL - D/2.*F.sum(Kff_diag/noise_var, axis=-1) - logL = logL - F.sum(F.sum(LmInvSmuLmInvT*LmInvPsi2LmInvT, axis=-1), + F.log(noise_var), axis=-1), axis=-1)/2. + logL = logL - F.sum(Kff_diag*beta_sum, axis=-1)/2. + logL = logL - F.sum(F.sum(F.square(KfuKuuInvmu)/noise_var, axis=-1), + axis=-1)/2. + logL = logL - F.sum(F.sum(F.square(KfuKuuInvLs)*F.expand_dims(beta_sum, axis=-1), axis=-1), + axis=-1)/2. + logL = logL + F.sum(F.sum(F.square(LinvKuf)*F.expand_dims(beta_sum, axis=-2), axis=-1), axis=-1)/2. - logL = logL + F.sum(F.sum(F.square(LinvKuf)/noise_var_m, axis=-1), - axis=-1)*D/2. logL = logL + F.sum(F.sum(Linvmu*LinvKufY, axis=-1), axis=-1) logL = self.log_pdf_scaling*logL + KL_u return logL @@ -109,6 +119,18 @@ def __init__(self, model, posterior, observed, noise_free=True, self.diagonal_variance = diagonal_variance def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. 
+ :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] N = X.shape[-2] Z = variables[self.model.inducing_inputs] @@ -135,8 +157,8 @@ def compute(self, F, variables): Kxt = kern.K(F, Z, X, **kern_params) mu = F.linalg.gemm2(Kxt, wv, True, False) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] mu = mu + mean LinvKxt = F.linalg.trsm(L, Kxt) @@ -145,15 +167,19 @@ def compute(self, F, variables): tmp = F.linalg.gemm2(LinvSLinvT, LinvKxt) var = Ktt - F.sum(F.square(LinvKxt), axis=-2) + \ F.sum(tmp*LinvKxt, axis=-2) + var = F.expand_dims(var, axis=-1) if not self.noise_free: - var += noise_var + var = var + noise_var else: Ktt = kern.K(F, X, **kern_params) tmp = F.linalg.gemm2(LinvSLinvT, LinvKxt) var = Ktt - F.linalg.syrk(LinvKxt, True) + \ F.linalg.gemm2(LinvKxt, tmp, True, False) + var = F.expand_dims(var, axis=-1) if not self.noise_free: - var += F.eye(N, dtype=X.dtype) * noise_var + var = var + \ + F.reshape(F.eye(N, dtype=X.dtype), shape=(1, N, N, 1)) * \ + F.expand_dims(noise_var, axis=-2) outcomes = {self.model.Y.uuid: (mu, var)} @@ -175,6 +201,18 @@ def __init__(self, model, posterior, observed, rand_gen=None, self.jitter = jitter def compute(self, F, variables): + """ + The method for the computation of the sampling algorithm + + :param F: the execution context (mxnet.ndarray or mxnet.symbol) + :type F: Python module + :param variables: the set of MXNet arrays that holds the values of + variables at runtime. 
+ :type variables: {str(UUID): MXNet NDArray or MXNet Symbol} + :returns: the outcome of the inference algorithm + :rtype: mxnet.ndarray.ndarray.NDArray or mxnet.symbol.symbol.Symbol + """ + has_mean = self.model.F.factor.has_mean X = variables[self.model.X] N = X.shape[-2] Z = variables[self.model.inducing_inputs] @@ -186,6 +224,9 @@ def compute(self, F, variables): kern = self.model.kernel kern_params = kern.fetch_parameters(variables) + X, Z, noise_var, mu, S_W, S_diag, kern_params = arrays_as_samples( + F, [X, Z, noise_var, mu, S_W, S_diag, kern_params]) + S = F.linalg.syrk(S_W) + make_diagonal(F, S_diag) Kuu = kern.K(F, Z, **kern_params) @@ -201,8 +242,8 @@ def compute(self, F, variables): Kxt = kern.K(F, Z, X, **kern_params) mu = F.linalg.gemm2(Kxt, wv, True, False) - if self.model.mean_func is not None: - mean = self.model.mean_func(F, X) + if has_mean: + mean = variables[self.model.mean] mu = mu + mean LinvKxt = F.linalg.trsm(L, Kxt) @@ -213,7 +254,8 @@ def compute(self, F, variables): F.sum(tmp*LinvKxt, axis=-2) if not self.noise_free: var += noise_var - die = self._rand_gen.sample_normal(shape=(self.num_samples,) + mu.shape[1:], dtype=self.model.F.factor.dtype) + die = self._rand_gen.sample_normal(shape=(self.num_samples,) + mu.shape[1:], + dtype=self.model.F.factor.dtype) samples = mu + die * F.sqrt(F.expand_dims(var, axis=-1)) else: Ktt = kern.K(F, X, **kern_params) @@ -250,12 +292,13 @@ class SVGPRegression(Module): :type kernel: Kernel :param noise_var: the variance of the Gaussian likelihood :type noise_var: Variable - :param inducing_inputs: the inducing inputs of the sparse GP (optional). This variable will be auto-generated if not specified. + :param inducing_inputs: the inducing inputs of the sparse GP (optional). This variable will be auto-generated + if not specified. 
:type inducing_inputs: Variable - :param inducing_num: the number of inducing points of sparse GP (default: 10) - :type inducing_num: int - :param mean_func: the mean function of Gaussian process. - :type mean_func: MXFusionFunction + :param num_inducing: the number of inducing points of sparse GP (default: 10) + :type num_inducing: int + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. @@ -265,32 +308,39 @@ class SVGPRegression(Module): """ def __init__(self, X, kernel, noise_var, inducing_inputs=None, - num_inducing=10, mean_func=None, + num_inducing=10, mean=None, rand_gen=None, dtype=None, ctx=None): if not isinstance(X, Variable): X = Variable(value=X) if not isinstance(noise_var, Variable): noise_var = Variable(value=noise_var) if inducing_inputs is None: - inducing_inputs = Variable(shape=(num_inducing, kernel.input_dim)) + inducing_inputs = Variable( + shape=(num_inducing, kernel.input_dim), + initial_value=np.random.randn(num_inducing, kernel.input_dim)) inputs = [('X', X), ('inducing_inputs', inducing_inputs), ('noise_var', noise_var)] input_names = [k for k, _ in inputs] + if mean is not None: + inputs.append(('mean', mean)) + input_names.append('mean') + self._has_mean = True + else: + self._has_mean = False output_names = ['random_variable'] super(SVGPRegression, self).__init__( inputs=inputs, outputs=None, input_names=input_names, output_names=output_names, dtype=dtype, ctx=ctx) - self.mean_func = mean_func self.kernel = kernel def _generate_outputs(self, output_shapes=None): """ Generate the output of the module with given output_shapes. 
- :param output_shape: the shapes of all the output variables - :type output_shape: {str: tuple} + :param output_shapes: the shapes of all the output variables + :type output_shapes: {str: tuple} """ - if output_shapes is None: + if output_shapes['random_variable'] is None: Y_shape = self.X.shape[:-1] + (1,) else: Y_shape = output_shapes['random_variable'] @@ -309,17 +359,20 @@ def _build_module_graphs(self): graph.U = GaussianProcess.define_variable( X=graph.inducing_inputs, kernel=self.kernel, shape=(graph.inducing_inputs.shape[0], Y.shape[-1]), - mean_func=self.mean_func, rand_gen=self._rand_gen, dtype=self.dtype, - ctx=self.ctx) + rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx) + if self._has_mean: + mean = self.mean.replicate_self() + graph.mean = mean + else: + mean = None graph.F = ConditionalGaussianProcess.define_variable( X=graph.X, X_cond=graph.inducing_inputs, Y_cond=graph.U, - kernel=self.kernel, shape=Y.shape, mean_func=self.mean_func, + kernel=self.kernel, shape=Y.shape, mean=mean, rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx) graph.Y = Y.replicate_self() graph.Y.set_prior(Normal( mean=graph.F, variance=broadcast_to(graph.noise_var, graph.Y.shape), rand_gen=self._rand_gen, dtype=self.dtype, ctx=self.ctx)) - graph.mean_func = self.mean_func graph.kernel = graph.U.factor.kernel post = Posterior(graph) post.qU_cov_diag = Variable(shape=(M,), transformation=PositiveTransformation()) @@ -357,10 +410,11 @@ def _attach_default_inference_algorithms(self): @staticmethod def define_variable(X, kernel, noise_var, shape=None, inducing_inputs=None, - num_inducing=10, mean_func=None, rand_gen=None, + num_inducing=10, mean=None, rand_gen=None, dtype=None, ctx=None): """ - Creates and returns a variable drawn from a Stochastic variational sparse Gaussian process regression with Gaussian likelihood. + Creates and returns a variable drawn from a Stochastic variational sparse Gaussian process regression with + Gaussian likelihood. 
:param X: the input variables on which the random variables are conditioned. :type X: Variable @@ -371,12 +425,13 @@ def define_variable(X, kernel, noise_var, shape=None, inducing_inputs=None, :param shape: the shape of the random variable(s) (the default shape is the same shape as *X* but the last dimension is changed to one.) :type shape: tuple or [tuple] - :param inducing_inputs: the inducing inputs of the sparse GP (optional). This variable will be auto-generated if not specified. + :param inducing_inputs: the inducing inputs of the sparse GP (optional). This variable will be auto-generated + if not specified. :type inducing_inputs: Variable - :param inducing_num: the number of inducing points of sparse GP (default: 10) - :type inducing_num: int - :param mean_func: the mean function of Gaussian process. - :type mean_func: MXFusionFunction + :param num_inducing: the number of inducing points of sparse GP (default: 10) + :type num_inducing: int + :param mean: the mean of Gaussian process. + :type mean: Variable :param rand_gen: the random generator (default: MXNetRandomGenerator). :type rand_gen: RandomGenerator :param dtype: the data type for float point numbers. 
@@ -387,7 +442,7 @@ def define_variable(X, kernel, noise_var, shape=None, inducing_inputs=None, gp = SVGPRegression( X=X, kernel=kernel, noise_var=noise_var, inducing_inputs=inducing_inputs, num_inducing=num_inducing, - mean_func=mean_func, rand_gen=rand_gen, dtype=dtype, ctx=ctx) + mean=mean, rand_gen=rand_gen, dtype=dtype, ctx=ctx) gp._generate_outputs({'random_variable': shape}) return gp.random_variable @@ -398,5 +453,5 @@ def replicate_self(self, attribute_map=None): rep = super(SVGPRegression, self).replicate_self(attribute_map) rep.kernel = self.kernel.replicate_self(attribute_map) - rep.mean_func = None if self.mean_func is None else self.mean_func.replicate_self(attribute_map) + rep._has_mean = self._has_mean return rep diff --git a/mxfusion/modules/module.py b/mxfusion/modules/module.py index 588b762..bbedbd4 100644 --- a/mxfusion/modules/module.py +++ b/mxfusion/modules/module.py @@ -55,8 +55,7 @@ def __init__(self, inputs, outputs, input_names, super(Module, self).__init__( inputs=inputs, outputs=outputs, input_names=input_names, output_names=output_names) - self._rand_gen = MXNetRandomGenerator if rand_gen is None else \ - rand_gen + self._rand_gen = MXNetRandomGenerator if rand_gen is None else rand_gen self.dtype = get_default_dtype() if dtype is None else dtype self.ctx = ctx self._module_graph = None @@ -77,18 +76,20 @@ def __getitem__(self, key): if key in g: return g[key] return self._module_graph[key] + def _generate_outputs(self, output_shapes): """ Generate the output of the module with given output_shapes. - :param output_shape: the shapes of all the output variables - :type output_shape: {str: tuple} + :param output_shapes: the shapes of all the output variables + :type output_shapes: {str: tuple} """ raise NotImplementedError def _build_module_graphs(self): """ - The internal method for constructing the internal factor graphs of the module. This method needs to be overridden by specific probabilistic modules. 
+ The internal method for constructing the internal factor graphs of the module. + This method needs to be overridden by specific probabilistic modules. :returns: model, extra factor graphs :rtypes: Model, [FactorGraph] @@ -97,19 +98,20 @@ def _build_module_graphs(self): def _attach_default_inference_algorithms(self): """ - The internal method for attaching default inference algorithms of the module. This method needs to be overridden by specific probabilistic modules. + The internal method for attaching default inference algorithms of the module. + This method needs to be overridden by specific probabilistic modules. """ raise NotImplementedError def set_outputs(self, variables): """ - This method overrides the set_outputs method of Factor. It triggers the initialization produces of a probabilistic module including building the factor graphs and attaching default inference algorithms. + This method overrides the set_outputs method of Factor. It triggers the initialization produces of a + probabilistic module including building the factor graphs and attaching default inference algorithms. :param variables: The list of variables to be set as the outputs of the module - :type variable: Variable or (Variable,) + :type variables: Variable or (Variable,) """ - variables = [variables] if not isinstance(variables, (list, tuple)) \ - else variables + variables = [variables] if not isinstance(variables, (list, tuple)) else variables outputs = {name: variable for name, variable in zip(self.output_names, variables)} self.successors = [(k, v) for k, v in outputs.items()] @@ -188,8 +190,7 @@ def get_names_from_uuid(self, uuids): return tuple(sorted([uuid_to_names[uuid] for uuid in uuids if uuid in uuid_to_names])) - def attach_log_pdf_algorithms(self, targets, conditionals, algorithm, - alg_name=None): + def attach_log_pdf_algorithms(self, targets, conditionals, algorithm, alg_name=None): """ Attach an inference algorithm for computing the log_pdf of the module. 
@@ -200,11 +201,12 @@ def attach_log_pdf_algorithms(self, targets, conditionals, algorithm, :param algorithm: the inference algorithm to compute log probability of the module. :type algorithm: InferenceAlgorithm + :param alg_name: The name of the algorithm + :type alg_name: str """ self._attach_algorithm(self._log_pdf_algorithms, targets, conditionals, algorithm, alg_name) - def attach_draw_samples_algorithms(self, targets, conditionals, algorithm, - alg_name=None): + def attach_draw_samples_algorithms(self, targets, conditionals, algorithm, alg_name=None): """ Attach an inference algorithm for drawing samples from the module. @@ -214,12 +216,12 @@ def attach_draw_samples_algorithms(self, targets, conditionals, algorithm, :type conditionals: tuple of str :param algorithm: the inference algorithm to draw samples of the chosen target variables from the module. :type algorithm: InferenceAlgorithm + :param alg_name: The name of the algorithm + :type alg_name: str """ self._attach_algorithm(self._draw_samples_algorithms, targets, conditionals, algorithm, alg_name) - - def attach_prediction_algorithms(self, targets, conditionals, algorithm, - alg_name=None): + def attach_prediction_algorithms(self, targets, conditionals, algorithm, alg_name=None): """ Attach an inference algorithm for prediction from the module. @@ -229,6 +231,8 @@ def attach_prediction_algorithms(self, targets, conditionals, algorithm, :type conditionals: tuple of str :param algorithm: the inference algorithm to predict the chosen target variables from the module. 
:type algorithm: InferenceAlgorithm + :param alg_name: The name of the algorithm + :type alg_name: str """ self._attach_algorithm(self._prediction_algorithms, targets, conditionals, algorithm, alg_name) @@ -257,7 +261,8 @@ def _preprocess_attach_parameters(self, targets, conditionals): def _set_algorithm_name(self, alg_name, algorithm): """ - Sets the attribute of self with the algorithm name, overriding an old algorithm that had the same name. If something other than an InferenceAlgorithm has that name, prints a warning and returns None for alg_name. + Sets the attribute of self with the algorithm name, overriding an old algorithm that had the same name. + If something other than an InferenceAlgorithm has that name, prints a warning and returns None for alg_name. """ from ..inference.inference_alg import InferenceAlgorithm @@ -267,14 +272,17 @@ def _set_algorithm_name(self, alg_name, algorithm): elif isinstance(getattr(self, alg_name), InferenceAlgorithm): setattr(self, alg_name, algorithm) else: - warnings.warn('Something ({}) in this module ({}) is already using the attribute \"{}\". Skipping setting that name to the algorithm.'.format(str(getattr(self, alg_name)),str(self), str(alg_name))) + warnings.warn('Something ({}) in this module ({}) is already using the attribute \"{}\". ' + 'Skipping setting that name to the algorithm.'.format(str(getattr(self, alg_name)), + str(self), str(alg_name))) alg_name = None return alg_name def _attach_duplicate_conditional_algorithm(self, algorithms, targets, conditionals, algorithm, alg_name): """ Mutates the algorithms object, adding the new algorithm to it. - Also removes the name of an old inference algorithm if it had the same (targets, conditional) pair as the new algorithm. + Also removes the name of an old inference algorithm if it had the same (targets, conditional) + pair as the new algorithm. 
""" methods = algorithms[conditionals] no_match = True @@ -295,9 +303,9 @@ def _attach_duplicate_conditional_algorithm(self, algorithms, targets, condition def log_pdf(self, F, variables, targets=None): """ - Compute the logarithm of the probability/probability density of a set of random variables in the Module. The set of random - variables are specified in the "target" argument and any necessary conditional variables are specified in the "conditionals" argument. - Any relevant constants are specified in the "constants" argument. + Compute the logarithm of the probability/probability density of a set of random variables in the Module. + The set of random variables are specified in the "target" argument and any necessary conditional variables + are specified in the "conditionals" argument. Any relevant constants are specified in the "constants" argument. :param F: the MXNet computation mode (``mxnet.symbol`` or ``mxnet.ndarray``). :param variables: The set of variables @@ -307,15 +315,18 @@ def log_pdf(self, F, variables, targets=None): :returns: the sum of the log probability of all the target variables. :rtype: mxnet NDArray or mxnet Symbol """ - alg = self._get_algorithm_for_target_conditional_pair(self._log_pdf_algorithms, targets, variables, exact_match=True) + alg = self._get_algorithm_for_target_conditional_pair(self._log_pdf_algorithms, targets, variables, + exact_match=True) alg.log_pdf_scaling = self.log_pdf_scaling result = alg.compute(F, variables) return result def draw_samples(self, F, variables, num_samples=1, targets=None): """ - Draw samples from the target variables of the Module. If the ``targets`` argument is None, draw samples from all the variables - that are *not* in the conditional variables. If the ``targets`` argument is given, this method returns a list of samples of variables in the order of the target argument, otherwise it returns a dict of samples where the keys are the UUIDs of variables and the values are the samples. 
+ Draw samples from the target variables of the Module. If the ``targets`` argument is None, draw samples from + all the variables that are *not* in the conditional variables. If the ``targets`` argument is given, this + method returns a list of samples of variables in the order of the target argument, otherwise it returns a dict + of samples where the keys are the UUIDs of variables and the values are the samples. :param F: the MXNet computation mode (``mxnet.symbol`` or ``mxnet.ndarray``). :param variables: The set of variables @@ -339,14 +350,15 @@ def predict(self, F, variables, num_samples=1, targets=None): :param F: the MXNet computation mode (``mxnet.symbol`` or ``mxnet.ndarray``). :param variables: The set of variables :type variables: {UUID : MXNet NDArray or MXNet Symbol} - :param num_samples: The number of samples to draw for the target variables if sampling is used for prediction. (optional) + :param num_samples: The number of samples to draw for the target variables if sampling is used for prediction. + (optional) :type num_samples: int :param targets: a list of Variables to predict. :type targets: [UUID] :returns: the sum of the log probability of all the target variables. :rtype: mxnet NDArray or mxnet Symbol """ - alg = self._get_algorithm_for_target_conditional_pair(self._prediction_algorithms, targets, variables) + alg = self._get_algorithm_for_target_conditional_pair(self._prediction_algorithms, targets, variables, exact_match=True) alg.num_samples = num_samples alg.target_variables = targets return alg.compute(F, variables) @@ -354,14 +366,16 @@ def predict(self, F, variables, num_samples=1, targets=None): def _get_algorithm_for_target_conditional_pair(self, algorithms, targets, variables, exact_match=False): """ Searches through the algorithms to find the right algorithm for the target/conditional pair. 
- :param exact_match: This indicates whether the targets passed in must be precisely those in the algorithm, or whether a subset of targets will suffice. + :param exact_match: This indicates whether the targets passed in must be precisely those in the algorithm, + or whether a subset of targets will suffice. """ if targets is None: target_names = tuple(sorted(self.output_names.copy())) else: target_names = self.get_names_from_uuid(targets) conditionals_names = self.get_names_from_uuid(variables.keys()) - conditionals_names = conditionals_names if not exact_match else tuple(sorted(set(conditionals_names) - set(target_names))) + conditionals_names = conditionals_names if not exact_match else \ + tuple(sorted(set(conditionals_names) - set(target_names))) if conditionals_names in algorithms: algs = algorithms[conditionals_names] @@ -372,15 +386,21 @@ def _get_algorithm_for_target_conditional_pair(self, algorithms, targets, variab if exact_match and target_names == set(t): return alg - raise ModelSpecificationError("The targets-conditionals pattern for draw_samples computation "+str((target_names, conditionals_names))+" cannot find a matched inference algorithm.") + raise ModelSpecificationError("The targets-conditionals pattern for draw_samples computation " + + str((target_names, conditionals_names)) + + " cannot find a matched inference algorithm.") def prepare_executor(self, rv_scaling=None): """ - Prepare the creation of an executor. This includes collecting the list of variable transformations and the list of the variables that are inherited from external Gluon blocks, and setting log_pdf_scaling for random variables. + Prepare the creation of an executor. This includes collecting the list of variable transformations and the list + of the variables that are inherited from external Gluon blocks, and setting log_pdf_scaling for + random variables. 
- :param rv_scaling: The scaling of log_pdf of the random variables that are set by users for data sub-sampling or mini-batch learning. + :param rv_scaling: The scaling of log_pdf of the random variables that are set by users for data sub-sampling + or mini-batch learning. :type rv_scaling: {UUID: float} - :returns: the list of the variable transformations and the list of the variables that are excluded from being set as Gluon block parameters (see the excluded argument of __init__ of ObjectiveBlock). + :returns: the list of the variable transformations and the list of the variables that are excluded from being + set as Gluon block parameters (see the excluded argument of __init__ of ObjectiveBlock). :rtypes: {str(UUID): Transformation}, set(str(UUID)) """ excluded = set() @@ -390,8 +410,6 @@ def prepare_executor(self, rv_scaling=None): for v in g.variables.values(): if v.type == VariableType.PARAMETER and v.transformation is not None: var_trans[v.uuid] = v.transformation - if v.type == VariableType.PARAMETER and v.isInherited: - excluded.add(v.uuid) if v.type == VariableType.RANDVAR: if v.uuid in rv_scaling: v.factor.log_pdf_scaling = rv_scaling[v.uuid] @@ -407,8 +425,11 @@ def _clone_algorithms(self, algorithms, replicant): for conditionals, algorithms in algorithms.items(): for targets, algorithm, alg_name in algorithms: graphs_index = {g: i for i,g in enumerate(self._extra_graphs)} - extra_graphs = [replicant._extra_graphs[graphs_index[graph]] for graph in algorithm.graphs if graph in graphs_index] - algs[conditionals] = (targets, algorithm.replicate_self(replicant._module_graph, extra_graphs), alg_name) + extra_graphs = [replicant._extra_graphs[graphs_index[graph]] for graph in algorithm.graphs + if graph in graphs_index] + algs[conditionals] = (targets, + algorithm.replicate_self(replicant._module_graph, extra_graphs), + alg_name) return algs def reconcile_with_module(self, previous_module): @@ -417,7 +438,9 @@ def reconcile_with_module(self, 
previous_module): primary_previous_graph = previous_module._module_graph secondary_previous_graphs = previous_module._extra_graphs primary_current_graph = self._module_graph - component_map = FactorGraph.reconcile_graphs(current_graphs, primary_previous_graph, secondary_previous_graphs=secondary_previous_graphs, primary_current_graph=primary_current_graph) + component_map = FactorGraph.reconcile_graphs(current_graphs, primary_previous_graph, + secondary_previous_graphs=secondary_previous_graphs, + primary_current_graph=primary_current_graph) return component_map def replicate_self(self, attribute_map=None): @@ -445,10 +468,10 @@ def load_module(self, module_json): from ..models import FactorGraph self._module_graph = FactorGraph(module_json['graphs'][0]['name']).load_from_json(module_json['graphs'][0]) if len(module_json['graphs']) > 1: - self._extra_graphs = [FactorGraph(extra_graph['name']).load_from_json(extra_graph) for extra_graph in module_json['graphs'][1:]] + self._extra_graphs = [FactorGraph(extra_graph['name']).load_from_json(extra_graph) + for extra_graph in module_json['graphs'][1:]] return self - def as_json(self): mod_dict = super(Module, self).as_json() graphs = [g.as_json()for g in [self._module_graph] + self._extra_graphs] diff --git a/mxfusion/util/testutils.py b/mxfusion/util/testutils.py index f699d04..bf9b9a8 100644 --- a/mxfusion/util/testutils.py +++ b/mxfusion/util/testutils.py @@ -215,3 +215,18 @@ def plot_bivariate(samples, dist, buffer=0, **kwargs): ax.contour(x, y, z, levels=10, linewidth=10) ax.scatter(samples[:, 0], samples[:, 1], alpha=0.05) plt.show() + + +def make_spd_matrix(dim): + """ + Generate a random symmetric, positive-definite matrix. + + :param dim: The matrix dimension (matrix is square). + :type dim: int + :return X: The random symmetric, positive-definite matrix. 
+ :rtype: array of shape [n_dim, n_dim] + """ + A = np.random.rand(dim, dim) + U, s, V = np.linalg.svd(np.dot(A.T, A)) + X = np.dot(np.dot(U, 1.0 + np.diag(np.random.rand(dim))), V) + return X diff --git a/requirements/test_requirements.txt b/requirements/test_requirements.txt index 4c7d901..2553dea 100644 --- a/requirements/test_requirements.txt +++ b/requirements/test_requirements.txt @@ -6,5 +6,4 @@ pytest-cov>=2.5.1 scipy>=1.1.0 GPy>=1.9.6 matplotlib -scikit-learn>=0.20.0 mxnet>=1.3 diff --git a/testing/components/distributions/gp/cond_gp_test.py b/testing/components/distributions/gp/cond_gp_test.py index 1cacbb8..b82cbb3 100644 --- a/testing/components/distributions/gp/cond_gp_test.py +++ b/testing/components/distributions/gp/cond_gp_test.py @@ -15,14 +15,17 @@ import pytest import mxnet as mx +import mxnet.gluon.nn as nn import numpy as np from mxfusion.models import Model from mxfusion.components.variables.runtime_variable import array_has_samples, get_num_samples from mxfusion.components.distributions import ConditionalGaussianProcess from mxfusion.components.distributions.gp.kernels import RBF from mxfusion.components.variables import Variable +from mxfusion.components.functions import MXFusionGluonFunction from mxfusion.util.testutils import prepare_mxnet_array from mxfusion.util.testutils import MockMXNetRandomGenerator +from mxfusion.common.exceptions import ModelSpecificationError from scipy.stats import multivariate_normal import matplotlib matplotlib.use('Agg') @@ -88,6 +91,78 @@ def test_log_pdf(self, dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_cond, assert get_num_samples(mx.nd, log_pdf_rt) == num_samples assert np.allclose(log_pdf_np, log_pdf_rt) + @pytest.mark.parametrize("dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_cond, Y_cond_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv, rv_isSamples, num_samples", [ + (np.float64, np.random.rand(5,2), False, np.random.rand(8,2), False, 
np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, np.random.rand(3,5,1), True, 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(8,2), False, np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, np.random.rand(5,1), False, 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(8,2), False, np.random.rand(3,8,1), True, np.random.rand(3,2)+0.1, True, np.random.rand(3,1)+0.1, True, np.random.rand(3,5,1), True, 3), + (np.float64, np.random.rand(5,2), False, np.random.rand(8,2), False, np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, np.random.rand(5,1), False, 1), + ]) + def test_log_pdf_w_mean(self, dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_cond, Y_cond_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, + rv, rv_isSamples, num_samples): + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(rv.shape[-1], flatten=False, activation="tanh", + in_units=X.shape[-1], dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + from scipy.linalg.lapack import dtrtrs + X_mx = prepare_mxnet_array(X, X_isSamples, dtype) + X_cond_mx = prepare_mxnet_array(X_cond, X_cond_isSamples, dtype) + Y_cond_mx = prepare_mxnet_array(Y_cond, Y_cond_isSamples, dtype) + rbf_lengthscale_mx = prepare_mxnet_array(rbf_lengthscale, rbf_lengthscale_isSamples, dtype) + rbf_variance_mx = prepare_mxnet_array(rbf_variance, rbf_variance_isSamples, dtype) + rv_mx = prepare_mxnet_array(rv, rv_isSamples, dtype) + rv_shape = rv.shape[1:] if rv_isSamples else rv.shape + mean_mx = net(X_mx) + mean_np = mean_mx.asnumpy() + mean_cond_mx = net(X_cond_mx) + mean_cond_np = mean_cond_mx.asnumpy() + + rbf = RBF(2, True, 1., 1., 'rbf', None, dtype) + X_var = Variable(shape=(5,2)) + X_cond_var = Variable(shape=(8,2)) + Y_cond_var = Variable(shape=(8,1)) + mean_func = MXFusionGluonFunction(net, 
num_outputs=1, + broadcastable=True) + mean_var = mean_func(X_var) + mean_cond_var = mean_func(X_cond_var) + gp = ConditionalGaussianProcess.define_variable(X=X_var, X_cond=X_cond_var, Y_cond=Y_cond_var, mean=mean_var, mean_cond=mean_cond_var, kernel=rbf, shape=rv_shape, dtype=dtype).factor + + variables = {gp.X.uuid: X_mx, gp.X_cond.uuid: X_cond_mx, gp.Y_cond.uuid: Y_cond_mx, gp.rbf_lengthscale.uuid: rbf_lengthscale_mx, gp.rbf_variance.uuid: rbf_variance_mx, gp.random_variable.uuid: rv_mx, gp.mean.uuid: mean_mx, gp.mean_cond.uuid: mean_cond_mx} + log_pdf_rt = gp.log_pdf(F=mx.nd, variables=variables).asnumpy() + + log_pdf_np = [] + for i in range(num_samples): + X_i = X[i] if X_isSamples else X + X_cond_i = X_cond[i] if X_cond_isSamples else X_cond + Y_cond_i = Y_cond[i] if Y_cond_isSamples else Y_cond + Y_cond_i = Y_cond_i - mean_cond_np[i] if X_cond_isSamples else Y_cond_i - mean_cond_np[0] + lengthscale_i = rbf_lengthscale[i] if rbf_lengthscale_isSamples else rbf_lengthscale + variance_i = rbf_variance[i] if rbf_variance_isSamples else rbf_variance + rv_i = rv[i] if rv_isSamples else rv + rv_i = rv_i - mean_np[i] if X_isSamples else rv_i - mean_np[0] + rbf_np = GPy.kern.RBF(input_dim=2, ARD=True) + rbf_np.lengthscale = lengthscale_i + rbf_np.variance = variance_i + K_np = rbf_np.K(X_i) + Kc_np = rbf_np.K(X_cond_i, X_i) + Kcc_np = rbf_np.K(X_cond_i) + + L = np.linalg.cholesky(Kcc_np) + LInvY = dtrtrs(L, Y_cond_i, lower=1, trans=0)[0] + LinvKxt = dtrtrs(L, Kc_np, lower=1, trans=0)[0] + + mu = LinvKxt.T.dot(LInvY) + cov = K_np - LinvKxt.T.dot(LinvKxt) + log_pdf_np.append(multivariate_normal.logpdf(rv_i[:,0], mean=mu[:,0], cov=cov)) + log_pdf_np = np.array(log_pdf_np) + isSamples_any = any([X_isSamples, rbf_lengthscale_isSamples, rbf_variance_isSamples, rv_isSamples]) + assert np.issubdtype(log_pdf_rt.dtype, dtype) + assert array_has_samples(mx.nd, log_pdf_rt) == isSamples_any + if isSamples_any: + assert get_num_samples(mx.nd, log_pdf_rt) == num_samples + assert 
np.allclose(log_pdf_np, log_pdf_rt) + @pytest.mark.parametrize("dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_cond, Y_cond_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv_shape, num_samples", [ (np.float64, np.random.rand(5,2), False, np.random.rand(8,2), False, np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), (np.float64, np.random.rand(3,5,2), True, np.random.rand(3,8,2), True, np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), @@ -142,7 +217,77 @@ def test_draw_samples(self, dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_c samples_np = np.array(samples_np) assert np.issubdtype(samples_rt.dtype, dtype) assert get_num_samples(mx.nd, samples_rt) == num_samples - print(samples_np, samples_rt) + assert np.allclose(samples_np, samples_rt) + + @pytest.mark.parametrize("dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_cond, Y_cond_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv_shape, num_samples", [ + (np.float64, np.random.rand(5,2), False, np.random.rand(8,2), False, np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(3,8,2), True, np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(3,8,2), True, np.random.rand(3,8,1), True, np.random.rand(3,2)+0.1, True, np.random.rand(3,1)+0.1, True, (5,1), 3), + (np.float64, np.random.rand(5,2), False, np.random.rand(8,2), False, np.random.rand(8,1), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 1), + ]) + def test_draw_samples_w_mean(self, dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_cond, Y_cond_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, 
+ rv_shape, num_samples): + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(rv_shape[-1], flatten=False, activation="tanh", + in_units=X.shape[-1], dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + from scipy.linalg.lapack import dtrtrs + X_mx = prepare_mxnet_array(X, X_isSamples, dtype) + X_cond_mx = prepare_mxnet_array(X_cond, X_cond_isSamples, dtype) + Y_cond_mx = prepare_mxnet_array(Y_cond, Y_cond_isSamples, dtype) + rbf_lengthscale_mx = prepare_mxnet_array(rbf_lengthscale, rbf_lengthscale_isSamples, dtype) + rbf_variance_mx = prepare_mxnet_array(rbf_variance, rbf_variance_isSamples, dtype) + mean_mx = net(X_mx) + mean_np = mean_mx.asnumpy() + mean_cond_mx = net(X_cond_mx) + mean_cond_np = mean_cond_mx.asnumpy() + + rand = np.random.randn(num_samples, *rv_shape) + rand_gen = MockMXNetRandomGenerator(mx.nd.array(rand.flatten(), dtype=dtype)) + + rbf = RBF(2, True, 1., 1., 'rbf', None, dtype) + X_var = Variable(shape=(5,2)) + X_cond_var = Variable(shape=(8,2)) + Y_cond_var = Variable(shape=(8,1)) + mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + mean_var = mean_func(X_var) + mean_cond_var = mean_func(X_cond_var) + gp = ConditionalGaussianProcess.define_variable(X=X_var, X_cond=X_cond_var, Y_cond=Y_cond_var, mean=mean_var, mean_cond=mean_cond_var, kernel=rbf, shape=rv_shape, dtype=dtype, rand_gen=rand_gen).factor + + variables = {gp.X.uuid: X_mx, gp.X_cond.uuid: X_cond_mx, gp.Y_cond.uuid: Y_cond_mx, gp.rbf_lengthscale.uuid: rbf_lengthscale_mx, gp.rbf_variance.uuid: rbf_variance_mx, gp.mean.uuid: mean_mx, gp.mean_cond.uuid: mean_cond_mx} + samples_rt = gp.draw_samples(F=mx.nd, variables=variables, num_samples=num_samples).asnumpy() + + samples_np = [] + for i in range(num_samples): + X_i = X[i] if X_isSamples else X + X_cond_i = X_cond[i] if X_cond_isSamples else X_cond + Y_cond_i = Y_cond[i] if Y_cond_isSamples else Y_cond + Y_cond_i = Y_cond_i - mean_cond_np[i] if X_cond_isSamples 
else Y_cond_i - mean_cond_np[0] + lengthscale_i = rbf_lengthscale[i] if rbf_lengthscale_isSamples else rbf_lengthscale + variance_i = rbf_variance[i] if rbf_variance_isSamples else rbf_variance + rand_i = rand[i] + rbf_np = GPy.kern.RBF(input_dim=2, ARD=True) + rbf_np.lengthscale = lengthscale_i + rbf_np.variance = variance_i + K_np = rbf_np.K(X_i) + Kc_np = rbf_np.K(X_cond_i, X_i) + Kcc_np = rbf_np.K(X_cond_i) + + L = np.linalg.cholesky(Kcc_np) + LInvY = dtrtrs(L, Y_cond_i, lower=1, trans=0)[0] + LinvKxt = dtrtrs(L, Kc_np, lower=1, trans=0)[0] + + mu = LinvKxt.T.dot(LInvY) + cov = K_np - LinvKxt.T.dot(LinvKxt) + L_cov_np = np.linalg.cholesky(cov) + sample_np = mu + L_cov_np.dot(rand_i) + samples_np.append(sample_np) + samples_np = np.array(samples_np)+mean_np + assert np.issubdtype(samples_rt.dtype, dtype) + assert get_num_samples(mx.nd, samples_rt) == num_samples assert np.allclose(samples_np, samples_rt) @pytest.mark.parametrize("dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_cond, Y_cond_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv, rv_isSamples, num_samples", [ @@ -200,3 +345,24 @@ def test_clone_cond_gp(self, dtype, X, X_isSamples, X_cond, X_cond_isSamples, Y_ if isSamples_any: assert get_num_samples(mx.nd, log_pdf_rt) == num_samples assert np.allclose(log_pdf_np, log_pdf_rt) + + def test_mean_argument(self): + + with pytest.raises(ModelSpecificationError): + dtype='float64' + + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(1, flatten=False, activation="tanh", + in_units=2, dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + rbf = RBF(2, True, 1., 1., 'rbf', None, dtype) + X_var = Variable(shape=(5, 2)) + X_cond_var = Variable(shape=(8, 2)) + Y_cond_var = Variable(shape=(8, 1)) + mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + mean_var = mean_func(X_var) + mean_cond_var = mean_func(X_cond_var) + gp = 
ConditionalGaussianProcess.define_variable(X=X_var, X_cond=X_cond_var, Y_cond=Y_cond_var, mean_cond=mean_cond_var, kernel=rbf, shape=(5, 1), dtype=dtype) diff --git a/testing/components/distributions/gp/gp_test.py b/testing/components/distributions/gp/gp_test.py index 28b99c5..caa64b1 100644 --- a/testing/components/distributions/gp/gp_test.py +++ b/testing/components/distributions/gp/gp_test.py @@ -15,12 +15,14 @@ import pytest import mxnet as mx +import mxnet.gluon.nn as nn import numpy as np from mxfusion.models import Model from mxfusion.components.variables.runtime_variable import array_has_samples, get_num_samples from mxfusion.components.distributions import GaussianProcess from mxfusion.components.distributions.gp.kernels import RBF from mxfusion.components import Variable +from mxfusion.components.functions import MXFusionGluonFunction from mxfusion.util.testutils import prepare_mxnet_array from mxfusion.util.testutils import MockMXNetRandomGenerator from scipy.stats import multivariate_normal @@ -72,6 +74,61 @@ def test_log_pdf(self, dtype, X, X_isSamples, rbf_lengthscale, rbf_lengthscale_i assert get_num_samples(mx.nd, log_pdf_rt) == num_samples assert np.allclose(log_pdf_np, log_pdf_rt) + + @pytest.mark.parametrize("dtype, X, X_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv, rv_isSamples, num_samples", [ + (np.float64, np.random.rand(5,2), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, np.random.rand(3,5,1), True, 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, np.random.rand(5,1), False, 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(3,2)+0.1, True, np.random.rand(3,1)+0.1, True, np.random.rand(3,5,1), True, 3), + (np.float64, np.random.rand(5,2), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, np.random.rand(5,1), False, 1), + ]) + def test_log_pdf_w_mean(self, dtype, X, X_isSamples, 
rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, + rv, rv_isSamples, num_samples): + + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(rv.shape[-1], flatten=False, activation="tanh", + in_units=X.shape[-1], dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + X_mx = prepare_mxnet_array(X, X_isSamples, dtype) + rbf_lengthscale_mx = prepare_mxnet_array(rbf_lengthscale, rbf_lengthscale_isSamples, dtype) + rbf_variance_mx = prepare_mxnet_array(rbf_variance, rbf_variance_isSamples, dtype) + rv_mx = prepare_mxnet_array(rv, rv_isSamples, dtype) + rv_shape = rv.shape[1:] if rv_isSamples else rv.shape + mean_mx = net(X_mx) + mean_np = mean_mx.asnumpy() + + rbf = RBF(2, True, 1., 1., 'rbf', None, dtype) + X_var = Variable(shape=(5,2)) + mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + mean_var = mean_func(X_var) + gp = GaussianProcess.define_variable(X=X_var, kernel=rbf, shape=rv_shape, mean=mean_var, dtype=dtype).factor + + variables = {gp.X.uuid: X_mx, gp.rbf_lengthscale.uuid: rbf_lengthscale_mx, gp.rbf_variance.uuid: rbf_variance_mx, gp.random_variable.uuid: rv_mx, gp.mean.uuid: mean_mx} + log_pdf_rt = gp.log_pdf(F=mx.nd, variables=variables).asnumpy() + + log_pdf_np = [] + for i in range(num_samples): + X_i = X[i] if X_isSamples else X + lengthscale_i = rbf_lengthscale[i] if rbf_lengthscale_isSamples else rbf_lengthscale + variance_i = rbf_variance[i] if rbf_variance_isSamples else rbf_variance + rv_i = rv[i] if rv_isSamples else rv + rv_i = rv_i - mean_np[i] if X_isSamples else rv_i - mean_np[0] + rbf_np = GPy.kern.RBF(input_dim=2, ARD=True) + rbf_np.lengthscale = lengthscale_i + rbf_np.variance = variance_i + K_np = rbf_np.K(X_i) + log_pdf_np.append(multivariate_normal.logpdf(rv_i[:,0], mean=None, cov=K_np)) + log_pdf_np = np.array(log_pdf_np) + isSamples_any = any([X_isSamples, rbf_lengthscale_isSamples, rbf_variance_isSamples, rv_isSamples]) + assert 
np.issubdtype(log_pdf_rt.dtype, dtype) + assert array_has_samples(mx.nd, log_pdf_rt) == isSamples_any + if isSamples_any: + assert get_num_samples(mx.nd, log_pdf_rt) == num_samples + assert np.allclose(log_pdf_np, log_pdf_rt) + + @pytest.mark.parametrize("dtype, X, X_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv_shape, num_samples", [ (np.float64, np.random.rand(5,2), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), (np.float64, np.random.rand(3,5,2), True, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), @@ -114,6 +171,60 @@ def test_draw_samples(self, dtype, X, X_isSamples, rbf_lengthscale, rbf_lengthsc assert np.allclose(samples_np, samples_rt) + @pytest.mark.parametrize("dtype, X, X_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv_shape, num_samples", [ + (np.float64, np.random.rand(5,2), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 3), + (np.float64, np.random.rand(3,5,2), True, np.random.rand(3,2)+0.1, True, np.random.rand(3,1)+0.1, True, (5,1), 3), + (np.float64, np.random.rand(5,2), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, (5,1), 1), + ]) + def test_draw_samples_w_mean(self, dtype, X, X_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, + rv_shape, num_samples): + + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(rv_shape[-1], flatten=False, activation="tanh", + in_units=X.shape[-1], dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + X_mx = prepare_mxnet_array(X, X_isSamples, dtype) + rbf_lengthscale_mx = prepare_mxnet_array(rbf_lengthscale, rbf_lengthscale_isSamples, dtype) + rbf_variance_mx = prepare_mxnet_array(rbf_variance, rbf_variance_isSamples, 
dtype) + mean_mx = net(X_mx) + mean_np = mean_mx.asnumpy() + + rand = np.random.randn(num_samples, *rv_shape) + rand_gen = MockMXNetRandomGenerator(mx.nd.array(rand.flatten(), dtype=dtype)) + + rbf = RBF(2, True, 1., 1., 'rbf', None, dtype) + X_var = Variable(shape=(5,2)) + mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + mean_var = mean_func(X_var) + gp = GaussianProcess.define_variable(X=X_var, kernel=rbf, shape=rv_shape, mean=mean_var, dtype=dtype, rand_gen=rand_gen).factor + + variables = {gp.X.uuid: X_mx, gp.rbf_lengthscale.uuid: rbf_lengthscale_mx, gp.rbf_variance.uuid: rbf_variance_mx, gp.mean.uuid: mean_mx} + samples_rt = gp.draw_samples(F=mx.nd, variables=variables, num_samples=num_samples).asnumpy() + + samples_np = [] + for i in range(num_samples): + X_i = X[i] if X_isSamples else X + lengthscale_i = rbf_lengthscale[i] if rbf_lengthscale_isSamples else rbf_lengthscale + variance_i = rbf_variance[i] if rbf_variance_isSamples else rbf_variance + rand_i = rand[i] + rbf_np = GPy.kern.RBF(input_dim=2, ARD=True) + rbf_np.lengthscale = lengthscale_i + rbf_np.variance = variance_i + K_np = rbf_np.K(X_i) + L_np = np.linalg.cholesky(K_np) + sample_np = L_np.dot(rand_i) + samples_np.append(sample_np) + samples_np = np.array(samples_np)+mean_np + + assert np.issubdtype(samples_rt.dtype, dtype) + assert get_num_samples(mx.nd, samples_rt) == num_samples + assert np.allclose(samples_np, samples_rt) + + @pytest.mark.parametrize("dtype, X, X_isSamples, rbf_lengthscale, rbf_lengthscale_isSamples, rbf_variance, rbf_variance_isSamples, rv, rv_isSamples, num_samples", [ (np.float64, np.random.rand(5,2), False, np.random.rand(2)+0.1, False, np.random.rand(1)+0.1, False, np.random.rand(3,5,1), True, 3), ]) diff --git a/testing/components/distributions/wishart_test.py b/testing/components/distributions/wishart_test.py index 873d6f3..d982c90 100644 --- a/testing/components/distributions/wishart_test.py +++ 
b/testing/components/distributions/wishart_test.py @@ -15,46 +15,48 @@ import pytest import mxnet as mx -from sklearn.datasets import make_spd_matrix import numpy as np from scipy.stats import wishart, chi2 from mxfusion.components.distributions import Wishart from mxfusion.components.variables.runtime_variable import add_sample_dimension, array_has_samples, get_num_samples -from mxfusion.util.testutils import MockMXNetRandomGenerator, numpy_array_reshape, plot_univariate +from mxfusion.util.testutils import MockMXNetRandomGenerator, numpy_array_reshape, plot_univariate, make_spd_matrix -def make_spd_matrices_3d(num_samples, num_dimensions, random_state): +def make_spd_matrices_3d(num_samples, num_dimensions, random_seed): matrices = np.zeros((num_samples, num_dimensions, num_dimensions)) + np.random.seed(random_seed) for i in range(num_samples): - matrices[i, :, :] = make_spd_matrix(num_dimensions, random_state=random_state) + matrices[i, :, :] = make_spd_matrix(num_dimensions) return matrices -def make_spd_matrices_4d(num_samples, num_data_points, num_dimensions, random_state): +def make_spd_matrices_4d(num_samples, num_data_points, num_dimensions, random_seed): matrices = np.zeros((num_samples, num_data_points, num_dimensions, num_dimensions)) + np.random.seed(random_seed) for i in range(num_samples): for j in range(num_data_points): - matrices[i, j, :, :] = make_spd_matrix(num_dimensions, random_state=random_state) + matrices[i, j, :, :] = make_spd_matrix(num_dimensions) return matrices @pytest.mark.usefixtures("set_seed") class TestWishartDistribution(object): - @pytest.mark.parametrize("dtype_dof, dtype, degrees_of_freedom, random_state, scale_is_samples, " + @pytest.mark.parametrize("dtype_dof, dtype, degrees_of_freedom, random_seed, scale_is_samples, " "rv_is_samples, num_data_points, num_samples, broadcast", [ (np.int32, np.float32, 2, 0, True, True, 3, 6, False), ]) - def test_log_pdf(self, dtype_dof, dtype, degrees_of_freedom, random_state, + def 
test_log_pdf(self, dtype_dof, dtype, degrees_of_freedom, random_seed, scale_is_samples, rv_is_samples, num_data_points, num_samples, broadcast): # Create positive semi-definite matrices - rv = make_spd_matrices_4d(num_samples, num_data_points, degrees_of_freedom, random_state=random_state) + np.random.seed(random_seed) + rv = make_spd_matrices_4d(num_samples, num_data_points, degrees_of_freedom, random_seed=random_seed) if broadcast: - scale = make_spd_matrix(n_dim=degrees_of_freedom, random_state=random_state) + scale = make_spd_matrix(dim=degrees_of_freedom) else: - scale = make_spd_matrices_4d(num_samples, num_data_points, degrees_of_freedom, random_state=random_state) + scale = make_spd_matrices_4d(num_samples, num_data_points, degrees_of_freedom, random_seed=random_seed) degrees_of_freedom_mx = mx.nd.array([degrees_of_freedom], dtype=dtype_dof) degrees_of_freedom = degrees_of_freedom_mx.asnumpy()[0] # ensures the correct dtype @@ -100,12 +102,11 @@ def test_log_pdf(self, dtype_dof, dtype, degrees_of_freedom, random_state, @pytest.mark.parametrize( "dtype_dof, dtype, degrees_of_freedom, scale, scale_is_samples, rv_shape, num_samples", [ - (np.int64, np.float64, 3, make_spd_matrix(3, 0), False, (3, 3), 5), + (np.int64, np.float64, 3, make_spd_matrix(3), False, (3, 3), 5), (np.int64, np.float64, 3, make_spd_matrices_4d(5, 5, 3, 0), True, (5, 3, 3), 5), ]) def test_draw_samples_no_broadcast(self, dtype_dof, dtype, degrees_of_freedom, scale, scale_is_samples, rv_shape, num_samples): - degrees_of_freedom_mx = mx.nd.array([degrees_of_freedom], dtype=dtype_dof) scale_mx = mx.nd.array(scale, dtype=dtype) if not scale_is_samples: diff --git a/testing/components/factor_test.py b/testing/components/factor_test.py index f93486c..4e9b95a 100644 --- a/testing/components/factor_test.py +++ b/testing/components/factor_test.py @@ -41,7 +41,8 @@ def test_replicate_function_only_self(self): self.D = 10 self.net = nn.HybridSequential() with self.net.name_scope(): - 
self.net.add(nn.Dense(self.D, activation="relu")) + self.net.add(nn.Dense(self.D, in_units=1, activation="relu")) + self.net.initialize() m = mf.models.Model(verbose=False) f = MXFusionGluonFunction(self.net, num_outputs=1) diff --git a/testing/components/functions/mxfusion_gluon_function_test.py b/testing/components/functions/mxfusion_gluon_function_test.py index 576b579..8b5d8aa 100644 --- a/testing/components/functions/mxfusion_gluon_function_test.py +++ b/testing/components/functions/mxfusion_gluon_function_test.py @@ -22,6 +22,8 @@ from mxfusion.components.functions.mxfusion_gluon_function import MXFusionGluonFunction from mxfusion.components import Variable from mxfusion.components.variables.runtime_variable import add_sample_dimension, array_has_samples +from mxfusion import Model +from mxfusion.inference import Inference, ForwardSamplingAlgorithm @pytest.mark.usefixtures("set_seed") @@ -33,7 +35,8 @@ def setUp(self): self.D = 10 self.net = nn.HybridSequential() with self.net.name_scope(): - self.net.add(nn.Dense(self.D, activation="relu")) + self.net.add(nn.Dense(self.D, in_units=1, activation="relu")) + self.net.initialize() def _make_gluon_function_evaluation(self, dtype, broadcastable): class Dot(HybridBlock): @@ -162,3 +165,15 @@ def test_success(self): x = Variable() y = f(x) #z = y.value.eval({'x' : mx.nd.ones(self.D)}) + + def test_gluon_parameters(self): + self.setUp() + + m = Model() + m.x = Variable(shape=(1,1)) + m.f = MXFusionGluonFunction(self.net, num_outputs=1) + m.y = m.f(m.x) + + infr = Inference(ForwardSamplingAlgorithm(m, observed=[m.x])) + infr.run(x=mx.nd.ones((1, 1))) + assert all([v.uuid in infr.params.param_dict for v in m.f.parameters.values()]) diff --git a/testing/inference/inference_serialization_test.py b/testing/inference/inference_serialization_test.py index 64c5a3a..68dd276 100644 --- a/testing/inference/inference_serialization_test.py +++ b/testing/inference/inference_serialization_test.py @@ -24,7 +24,8 @@ from 
mxfusion.components.functions import MXFusionGluonFunction from mxfusion.common.config import get_default_dtype from mxfusion.components.functions.operators import broadcast_to -from mxfusion import Variable +from mxfusion import Variable, Model +from mxfusion.inference import Inference, ForwardSamplingAlgorithm class InferenceSerializationTests(unittest.TestCase): @@ -64,6 +65,14 @@ def make_net(self): net.initialize(mx.init.Xavier(magnitude=3)) return net + def make_simple_gluon_model(self): + net = self.make_net() + m = Model() + m.x = Variable(shape=(1, 1)) + m.f = MXFusionGluonFunction(net, num_outputs=1) + m.y = m.f(m.x) + return m + def make_gpregr_model(self, lengthscale, variance, noise_var): from mxfusion.models import Model from mxfusion.components.variables import Variable, PositiveTransformation @@ -210,3 +219,20 @@ def test_gp_module_save_and_load(self): loss2, _ = infr2.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) os.remove(self.ZIPNAME) + + def test_gluon_func_save_and_load(self): + m = self.make_simple_gluon_model() + infr = Inference(ForwardSamplingAlgorithm(m, observed=[m.x])) + infr.run(x=mx.nd.ones((1, 1))) + infr.save(self.ZIPNAME) + + m2 = self.make_simple_gluon_model() + infr2 = Inference(ForwardSamplingAlgorithm(m2, observed=[m2.x])) + infr2.run(x=mx.nd.ones((1, 1))) + infr2.load(self.ZIPNAME) + infr2.run(x=mx.nd.ones((1, 1))) + + for n in m.f.parameter_names: + assert np.allclose(infr.params[getattr(m.y.factor, n)].asnumpy(), infr2.params[getattr(m2.y.factor, n)].asnumpy()) + + os.remove(self.ZIPNAME) diff --git a/testing/inference/pilco_test.py b/testing/inference/pilco_test.py new file mode 100644 index 0000000..ac35f9e --- /dev/null +++ b/testing/inference/pilco_test.py @@ -0,0 +1,183 @@ +# Copyright 2018 Amazon.com, Inc. or its affiliates. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"). +# You may not use this file except in compliance with the License. 
+# A copy of the License is located at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# or in the "license" file accompanying this file. This file is distributed +# on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either +# express or implied. See the License for the specific language governing +# permissions and limitations under the License. +# ============================================================================== + +import numpy as np +import pytest +import mxnet as mx +from mxfusion import Model, Variable +from mxfusion.components.variables import PositiveTransformation +from mxfusion.components.distributions.gp.kernels import RBF +from mxfusion.modules.gp_modules import GPRegression +from mxfusion.inference import GradBasedInference, MAP +from mxnet.gluon import HybridBlock +from mxnet.gluon.nn import Dense +from mxfusion.inference import GradTransferInference +from mxfusion.inference.pilco_alg import PILCOAlgorithm + +class NNController(HybridBlock): + def __init__(self, prefix=None, params=None, in_units=100, obs_space_high=3): + super(NNController, self).__init__(prefix=prefix, params=params) + self.dense1 = Dense(100, in_units=obs_space_high, activation='relu') + self.dense2 = Dense(1, in_units=100, activation='tanh') + def hybrid_forward(self, F, x): + out = self.dense2(self.dense1(x))*2 + return out + +class CostFunction(mx.gluon.HybridBlock): + """ + The goal is to get the pendulum upright and stable as quickly as possible. + Taken from the code for Pendulum. + """ + def hybrid_forward(self, F, state, action): + """ + :param state: [np.cos(theta), np.sin(theta), ~ momentum(theta)] + a -> 0 when pendulum is upright, largest when pendulum is hanging down completely. + b -> penalty for taking action + c -> penalty for pendulum momentum + """ + a_scale = 2. 
+ b_scale = .001 + c_scale = .1 + a = F.sum(a_scale * (state[:,:,0:1] -1) ** 2, axis=-1) + b = F.sum(b_scale * action ** 2, axis=-1) + c = F.sum(c_scale * state[:,:,2:3] ** 2, axis=-1) + return (a + c + b) + +@pytest.mark.usefixtures("set_seed") +class TestPILCOInference(object): + """ + Test class that tests the MXFusion.inference.PILCOAlgorithm and MXFusion.inference.GradTransferInference classes. + """ + + def run_one_episode(self): + reward_shape = (1,) + observations_shape = (200,3) # steps, obs shape + actions_shape = (199,1) # steps - 1, action shape + return np.random.rand(*reward_shape), np.random.rand(*observations_shape), np.random.rand(*actions_shape) + + def prepare_data(self, state_list, action_list, win_in): + """ + Prepares a list of states and a list of actions as inputs to the Gaussian Process for training. + """ + + X_list = [] + Y_list = [] + + for state_array, action_array in zip(state_list, action_list): + # the state and action array shape should be aligned. + assert state_array.shape[0]-1 == action_array.shape[0] + + for i in range(state_array.shape[0]-win_in): + Y_list.append(state_array[i+win_in:i+win_in+1]) + X_list.append(np.hstack([state_array[i:i+win_in].flatten(), action_array[i:i+win_in].flatten()])) + X = np.vstack(X_list) + Y = np.vstack(Y_list) + return X, Y + + + def fit_model(self, state_list, action_list, win_in, verbose=True, max_iter=1000): + """ + Fits a Gaussian Process model to the state / action pairs passed in. + This creates a model of the environment which is used during + policy optimization instead of querying the environment directly. + + See mxfusion.modules.gp_modules for additional types of GP models to fit, + including Sparse GP and Stochastic Variational Inference Sparse GP. 
+ """ + X, Y = self.prepare_data(state_list, action_list, win_in) + + m = Model() + m.N = Variable() + m.X = Variable(shape=(m.N, X.shape[-1])) + m.noise_var = Variable(shape=(1,), transformation=PositiveTransformation(), + initial_value=0.01) + m.kernel = RBF(input_dim=X.shape[-1], variance=1, lengthscale=1, ARD=True) + m.Y = GPRegression.define_variable( + X=m.X, kernel=m.kernel, noise_var=m.noise_var, + shape=(m.N, Y.shape[-1])) + m.Y.factor.gp_log_pdf.jitter = 1e-6 + + infr = GradBasedInference( + inference_algorithm=MAP(model=m, observed=[m.X, m.Y])) + infr.run(X=mx.nd.array(X), + Y=mx.nd.array(Y), + max_iter=max_iter, learning_rate=0.1, verbose=verbose) + return m, infr, X, Y + + def optimize_policy(self, alg, policy, cost_func, model, infr, + model_data_X, model_data_Y, + initial_state_generator, num_grad_steps, + learning_rate=1e-2, num_time_steps=100, + num_samples=10, verbose=True): + """ + Takes as primary inputs a policy, cost function, and trained model. + Optimizes the policy for num_grad_steps number of iterations. 
+ """ + mb_alg = alg( + model=model, observed=[model.X, model.Y], + cost_function=cost_func, + policy=policy, n_time_steps=num_time_steps, + initial_state_generator=initial_state_generator, + num_samples=num_samples) + + infr_pred = GradTransferInference( + mb_alg, infr_params=infr.params, train_params=policy.collect_params()) + infr_pred.run( + max_iter=num_grad_steps, + X=mx.nd.array(model_data_X), + Y=mx.nd.array(model_data_Y), + verbose=verbose, learning_rate=learning_rate) + return policy + + def initial_state_generator(self, num_initial_states, obs_space_shape=3): + """ + Starts from valid states by drawing theta and momentum + then computing np.cos(theta) and np.sin(theta) for state[0:2]. + """ + return mx.nd.array( + [np.random.rand(obs_space_shape) for i in range(num_initial_states)]) + + + @pytest.mark.parametrize("pilco_alg", [ + (PILCOAlgorithm)]) + def test_pilco_basic_passthrough(self, pilco_alg): + policy = NNController() + policy.collect_params().initialize(mx.initializer.Xavier(magnitude=1)) + cost = CostFunction() + num_episode = 2 # how many model fit + policy optimization episodes to run + num_samples = 2 # how many sample trajectories the policy optimization loop uses + num_grad_steps = 2 # how many gradient steps the optimizer takes per episode + num_time_steps = 2 # how far to roll out each sample trajectory + learning_rate = 1e-3 # learning rate for the policy optimization + + all_states = [] + all_actions = [] + + for i_ep in range(num_episode): + # Run an episode and collect data. + policy_func = lambda x: policy(mx.nd.expand_dims(mx.nd.array(x), axis=0)).asnumpy()[0] + total_reward, states, actions = self.run_one_episode() + all_states.append(states) + all_actions.append(actions) + + # Fit a model. + model, infr, model_data_X, model_data_Y = self.fit_model( + all_states, all_actions, win_in=1, verbose=True, max_iter=5) + + # Optimize the policy. 
+ policy = self.optimize_policy(pilco_alg, + policy, cost, model, infr, model_data_X, model_data_Y, + self.initial_state_generator, num_grad_steps=num_grad_steps, + num_samples=num_samples, learning_rate=learning_rate, + num_time_steps=num_time_steps) diff --git a/testing/models/factor_graph_test.py b/testing/models/factor_graph_test.py index 641a9a9..1055d24 100644 --- a/testing/models/factor_graph_test.py +++ b/testing/models/factor_graph_test.py @@ -68,9 +68,9 @@ def make_net(self): D = 100 net = nn.HybridSequential(prefix='hybrid0_') with net.name_scope(): - net.add(nn.Dense(D, activation="tanh")) - net.add(nn.Dense(D, activation="tanh")) - net.add(nn.Dense(2, flatten=True)) + net.add(nn.Dense(D, in_units=10, activation="tanh", flatten=False)) + net.add(nn.Dense(D, in_units=D, activation="tanh", flatten=False)) + net.add(nn.Dense(2, in_units=D, flatten=False)) net.initialize(mx.init.Xavier(magnitude=3)) return net @@ -96,7 +96,8 @@ def setUp(self): self.D = 10 self.basic_net = nn.HybridSequential() with self.basic_net.name_scope(): - self.basic_net.add(nn.Dense(self.D, activation="relu")) + self.basic_net.add(nn.Dense(self.D, in_units=10, activation="relu")) + self.basic_net.initialize() self.bnn_net = self.make_net() def test_bnn_model(self): @@ -291,8 +292,8 @@ def test_reconcile_gp_model(self): self.assertTrue(len(component_map) == len(set(m1.components).union(set(m1.Y.factor._module_graph.components)).union(set(m1.Y.factor._extra_graphs[0].components)))) def test_reconcile_model_and_posterior(self): - x = np.random.rand(1000, 1) - y = np.random.rand(1000, 1) + x = np.random.rand(1000, 10) + y = np.random.rand(1000, 10) x_nd, y_nd = mx.nd.array(y), mx.nd.array(x) net1 = self.make_net() diff --git a/testing/modules/gpregression_test.py b/testing/modules/gpregression_test.py index 8bf7ed2..b982a1e 100644 --- a/testing/modules/gpregression_test.py +++ b/testing/modules/gpregression_test.py @@ -13,18 +13,18 @@ # 
============================================================================== -import pytest import warnings import mxnet as mx +import mxnet.gluon.nn as nn import numpy as np from mxfusion.models import Model from mxfusion.modules.gp_modules import GPRegression from mxfusion.components.distributions.gp.kernels import RBF, White from mxfusion.components.distributions import GaussianProcess, Normal from mxfusion.components import Variable -from mxfusion.inference import Inference, MAP, ModulePredictionAlgorithm, TransferInference, create_Gaussian_meanfield, StochasticVariationalInference, GradBasedInference, ForwardSamplingAlgorithm, ModulePredictionAlgorithm +from mxfusion.components.functions import MXFusionGluonFunction +from mxfusion.inference import Inference, MAP, TransferInference, create_Gaussian_meanfield, StochasticVariationalInference, GradBasedInference, ForwardSamplingAlgorithm, ModulePredictionAlgorithm from mxfusion.components.variables.var_trans import PositiveTransformation -from mxfusion.inference.forward_sampling import ForwardSamplingAlgorithm from mxfusion.util.testutils import MockMXNetRandomGenerator from mxfusion.modules.gp_modules.gp_regression import GPRegressionSamplingPrediction @@ -57,6 +57,25 @@ def gen_mxfusion_model(self, dtype, D, noise_var, lengthscale, variance, m.Y = GPRegression.define_variable(X=m.X, kernel=kernel, noise_var=m.noise_var, shape=(m.N, D), dtype=dtype, rand_gen=rand_gen) return m + def gen_mxfusion_model_w_mean(self, dtype, D, noise_var, lengthscale, + variance, rand_gen=None): + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(D, flatten=False, activation="tanh", + in_units=3, dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + m = Model() + m.N = Variable() + m.X = Variable(shape=(m.N, 3)) + m.noise_var = Variable(transformation=PositiveTransformation(), initial_value=mx.nd.array(noise_var, dtype=dtype)) + kernel = RBF(input_dim=3, ARD=True, 
variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) + m.mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + m.Y = GPRegression.define_variable(X=m.X, kernel=kernel, mean=m.mean_func(m.X), noise_var=m.noise_var, shape=(m.N, D), dtype=dtype, rand_gen=rand_gen) + m.Y.factor.gp_log_pdf.jitter = 1e-6 + return m, net + def test_log_pdf(self): D, X, Y, noise_var, lengthscale, variance = self.gen_data() @@ -76,6 +95,28 @@ def test_log_pdf(self): assert np.allclose(l_mf.asnumpy(), l_gpy) + def test_log_pdf_w_mean(self): + D, X, Y, noise_var, lengthscale, variance = self.gen_data() + + # MXFusion log-likelihood + dtype = 'float64' + m, net = self.gen_mxfusion_model_w_mean( + dtype, D, noise_var, lengthscale, variance) + + mean = net(mx.nd.array(X, dtype=dtype)).asnumpy() + + # GPy log-likelihood + m_gpy = GPy.models.GPRegression(X=X, Y=Y-mean, kernel=GPy.kern.RBF(3, ARD=True, lengthscale=lengthscale, variance=variance), noise_var=noise_var) + l_gpy = m_gpy.log_likelihood() + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + l_mf = -loss + + assert np.allclose(l_mf.asnumpy(), l_gpy) + def test_draw_samples(self): D, X, Y, noise_var, lengthscale, variance = self.gen_data() dtype = 'float64' @@ -99,6 +140,32 @@ def test_draw_samples(self): assert np.allclose(samples, samples_2), (samples, samples_2) + def test_draw_samples_w_mean(self): + D, X, Y, noise_var, lengthscale, variance = self.gen_data() + dtype = 'float64' + + rand_gen = MockMXNetRandomGenerator(mx.nd.array(np.random.rand(20*D), dtype=dtype)) + + m, net = self.gen_mxfusion_model_w_mean(dtype, D, noise_var, lengthscale, variance, rand_gen) + + observed = [m.X] + infr = Inference(ForwardSamplingAlgorithm( + m, observed, num_samples=2, target_variables=[m.Y]), dtype=dtype) + + samples = infr.run(X=mx.nd.array(X, 
dtype=dtype), Y=mx.nd.array(Y, dtype=dtype))[0].asnumpy() + + kern = RBF(3, True, name='rbf', dtype=dtype) + White(3, dtype=dtype) + X_var = Variable(shape=(10, 3)) + mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + mean_var = mean_func(X_var) + gp = GaussianProcess.define_variable(X=X_var, kernel=kern, mean=mean_var, shape=(10, D), dtype=dtype, rand_gen=rand_gen).factor + + variables = {gp.X.uuid: mx.nd.expand_dims(mx.nd.array(X, dtype=dtype), axis=0), gp.add_rbf_lengthscale.uuid: mx.nd.expand_dims(mx.nd.array(lengthscale, dtype=dtype), axis=0), gp.add_rbf_variance.uuid: mx.nd.expand_dims(mx.nd.array(variance, dtype=dtype), axis=0), gp.add_white_variance.uuid: mx.nd.expand_dims(mx.nd.array(noise_var, dtype=dtype), axis=0), mean_var.uuid: mx.nd.expand_dims(net(mx.nd.array(X, dtype=dtype)), axis=0)} + samples_2 = gp.draw_samples(F=mx.nd, variables=variables, num_samples=2).asnumpy() + + assert np.allclose(samples, samples_2), (samples, samples_2) + def test_prediction(self): D, X, Y, noise_var, lengthscale, variance = self.gen_data() Xt = np.random.rand(20, 3) @@ -154,16 +221,41 @@ def test_prediction(self): infr2.inference_algorithm.model.Y.factor.gp_predict.noise_free = False res = infr2.run(X=mx.nd.array(Xt, dtype=dtype))[0] mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] - print((var_gpy, var_mf)) assert np.allclose(mu_gpy, mu_mf), (mu_gpy, mu_mf) assert np.allclose(var_gpy, var_mf), (var_gpy, var_mf) - def test_sampling_prediction(self): + def test_prediction_w_mean(self): D, X, Y, noise_var, lengthscale, variance = self.gen_data() Xt = np.random.rand(20, 3) + dtype = 'float64' - m_gpy = GPy.models.GPRegression(X=X, Y=Y, kernel=GPy.kern.RBF(3, ARD=True, lengthscale=lengthscale, variance=variance), noise_var=noise_var) + m, net = self.gen_mxfusion_model_w_mean( + dtype, D, noise_var, lengthscale, variance) + + mean = net(mx.nd.array(X, dtype=dtype)).asnumpy() + mean_t = net(mx.nd.array(Xt, dtype=dtype)).asnumpy() + + m_gpy = 
GPy.models.GPRegression(X=X, Y=Y-mean, kernel=GPy.kern.RBF(3, ARD=True, lengthscale=lengthscale, variance=variance), noise_var=noise_var) + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + + # noise_free, diagonal + mu_gpy, var_gpy = m_gpy.predict_noiseless(Xt) + mu_gpy += mean_t + + infr2 = TransferInference(ModulePredictionAlgorithm(m, observed=[m.X], target_variables=[m.Y]), infr_params=infr.params, dtype=np.float64) + res = infr2.run(X=mx.nd.array(Xt, dtype=dtype))[0] + mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] + + assert np.allclose(mu_gpy, mu_mf, rtol=1e-04, atol=1e-05), (mu_gpy, mu_mf) + assert np.allclose(var_gpy[:,0], var_mf, rtol=1e-04, atol=1e-05), (var_gpy[:,0], var_mf) + + def test_sampling_prediction(self): + D, X, Y, noise_var, lengthscale, variance = self.gen_data() + Xt = np.random.rand(20, 3) dtype = 'float64' m = self.gen_mxfusion_model(dtype, D, noise_var, lengthscale, variance) @@ -171,7 +263,7 @@ def test_sampling_prediction(self): observed = [m.X, m.Y] infr = Inference(MAP(model=m, observed=observed), dtype=dtype) - loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype), max_iter=1) infr_pred = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y], num_samples=5), infr_params=infr.params) @@ -182,11 +274,38 @@ def test_sampling_prediction(self): gp._module_graph, gp._extra_graphs[0], [gp._module_graph.X]), alg_name='gp_predict') gp.gp_predict.diagonal_variance = False + gp.gp_predict.noise_free = False gp.gp_predict.jitter = 1e-6 y_samples = infr_pred.run(X=mx.nd.array(Xt, dtype=dtype))[0].asnumpy() # TODO: Check the correctness of the sampling + def test_sampling_prediction_w_mean(self): + D, X, Y, noise_var, lengthscale, variance = self.gen_data() + Xt = 
np.random.rand(20, 3) + dtype = 'float64' + m, net = self.gen_mxfusion_model_w_mean( + dtype, D, noise_var, lengthscale, variance) + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype), max_iter=1) + + infr_pred = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y], num_samples=5), + infr_params=infr.params) + gp = m.Y.factor + gp.attach_prediction_algorithms( + targets=gp.output_names, conditionals=gp.input_names, + algorithm=GPRegressionSamplingPrediction( + gp._module_graph, gp._extra_graphs[0], [gp._module_graph.X]), + alg_name='gp_predict') + gp.gp_predict.diagonal_variance = True + gp.gp_predict.noise_free = False + gp.gp_predict.jitter = 1e-6 + + y_samples = infr_pred.run(X=mx.nd.array(Xt, dtype=dtype))[0].asnumpy() + def test_with_samples(self): from mxfusion.common import config config.DEFAULT_DTYPE = 'float64' @@ -230,7 +349,6 @@ def test_with_samples(self): xt = np.random.rand(13, 3) res = infr_pred2.run(X=mx.nd.array(xt, dtype=dtype))[0] - def test_prediction_print(self): D, X, Y, noise_var, lengthscale, variance = self.gen_data() Xt = np.random.rand(20, 3) @@ -247,3 +365,13 @@ def test_prediction_print(self): loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) print = infr.print_params() assert (len(print) > 1) + + def test_module_clone(self): + D, X, Y, noise_var, lengthscale, variance = self.gen_data() + dtype = 'float64' + + m = Model() + m.N = Variable() + kernel = RBF(input_dim=3, ARD=True, variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) + m.Y = GPRegression.define_variable(X=mx.nd.zeros((2, 3)), kernel=kernel, noise_var=mx.nd.ones((1,)), dtype=dtype) + m.clone() diff --git a/testing/modules/sparsegpregression_test.py b/testing/modules/sparsegpregression_test.py index 891ffbe..6639c8e 100644 --- 
a/testing/modules/sparsegpregression_test.py +++ b/testing/modules/sparsegpregression_test.py @@ -15,12 +15,14 @@ import pytest import mxnet as mx +import mxnet.gluon.nn as nn import numpy as np from mxfusion.models import Model from mxfusion.modules.gp_modules import SparseGPRegression from mxfusion.components.distributions.gp.kernels import RBF from mxfusion.components.distributions import Normal from mxfusion.components import Variable +from mxfusion.components.functions import MXFusionGluonFunction from mxfusion.inference import Inference, MAP, ModulePredictionAlgorithm, TransferInference, create_Gaussian_meanfield, StochasticVariationalInference, GradBasedInference, ForwardSamplingAlgorithm from mxfusion.components.variables.var_trans import PositiveTransformation from mxfusion.modules.gp_modules.sparsegp_regression import SparseGPRegressionSamplingPrediction @@ -56,6 +58,26 @@ def gen_mxfusion_model(self, dtype, D, Z, noise_var, lengthscale, variance, m.Y.factor.sgp_log_pdf.jitter = 1e-8 return m + def gen_mxfusion_model_w_mean(self, dtype, D, Z, noise_var, lengthscale, + variance, rand_gen=None): + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(D, flatten=False, activation="tanh", + in_units=3, dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + m = Model() + m.N = Variable() + m.X = Variable(shape=(m.N, 3)) + m.Z = Variable(shape=(3, 3), initial_value=mx.nd.array(Z, dtype=dtype)) + m.noise_var = Variable(transformation=PositiveTransformation(), initial_value=mx.nd.array(noise_var, dtype=dtype)) + kernel = RBF(input_dim=3, ARD=True, variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) + m.mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + m.Y = SparseGPRegression.define_variable(X=m.X, kernel=kernel, noise_var=m.noise_var, mean=m.mean_func(m.X), inducing_inputs=m.Z, shape=(m.N, D), dtype=dtype) + m.Y.factor.sgp_log_pdf.jitter = 
1e-8 + return m, net + def test_log_pdf(self): D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() @@ -76,6 +98,42 @@ def test_log_pdf(self): assert np.allclose(l_mf.asnumpy(), l_gpy) + def test_log_pdf_w_mean(self): + D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() + + # MXFusion log-likelihood + dtype = 'float64' + m, net = self.gen_mxfusion_model_w_mean( + dtype, D, Z, noise_var, lengthscale, variance) + + mean = net(mx.nd.array(X, dtype=dtype)).asnumpy() + + # GPy log-likelihood + m_gpy = GPy.models.SparseGPRegression(X=X, Y=Y-mean, Z=Z, kernel=GPy.kern.RBF(3, ARD=True, lengthscale=lengthscale, variance=variance), num_inducing=3) + m_gpy.likelihood.variance = noise_var + l_gpy = m_gpy.log_likelihood() + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + l_mf = -loss + + assert np.allclose(l_mf.asnumpy(), l_gpy) + + def test_draw_samples(self): + D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() + dtype = 'float64' + + m = self.gen_mxfusion_model(dtype, D, Z, noise_var, lengthscale, + variance) + + observed = [m.X] + infr = Inference(ForwardSamplingAlgorithm( + m, observed, num_samples=2, target_variables=[m.Y]), dtype=dtype) + samples = infr.run(X=mx.nd.array(X, dtype=dtype))[0] + assert samples.shape == (2,) + Y.shape + def test_prediction(self): D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() Xt = np.random.rand(20, 3) @@ -137,6 +195,35 @@ def test_prediction(self): assert np.allclose(mu_gpy, mu_mf), (mu_gpy, mu_mf) assert np.allclose(var_gpy, var_mf), (var_gpy, var_mf) + def test_prediction_w_mean(self): + D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() + Xt = np.random.rand(20, 3) + dtype = 'float64' + + m, net = self.gen_mxfusion_model_w_mean( + dtype, D, Z, noise_var, lengthscale, variance) + + mean = net(mx.nd.array(X, dtype=dtype)).asnumpy() + mean_t = 
net(mx.nd.array(Xt, dtype=dtype)).asnumpy() + + m_gpy = GPy.models.SparseGPRegression(X=X, Y=Y-mean, Z=Z, kernel=GPy.kern.RBF(3, ARD=True, lengthscale=lengthscale, variance=variance)) + m_gpy.likelihood.variance = noise_var + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + + # noise_free, diagonal + mu_gpy, var_gpy = m_gpy.predict_noiseless(Xt) + mu_gpy += mean_t + + infr2 = TransferInference(ModulePredictionAlgorithm(m, observed=[m.X], target_variables=[m.Y]), infr_params=infr.params, dtype=np.float64) + res = infr2.run(X=mx.nd.array(Xt, dtype=dtype))[0] + mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] + + assert np.allclose(mu_gpy, mu_mf, rtol=1e-04, atol=1e-05), (mu_gpy, mu_mf) + assert np.allclose(var_gpy[:,0], var_mf, rtol=1e-04, atol=1e-05), (var_gpy[:,0], var_mf) + def test_sampling_prediction(self): D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() Xt = np.random.rand(20, 3) @@ -164,11 +251,38 @@ def test_sampling_prediction(self): gp._module_graph, gp._extra_graphs[0], [gp._module_graph.X]), alg_name='sgp_predict') gp.sgp_predict.diagonal_variance = False + gp.sgp_predict.noise_free = False gp.sgp_predict.jitter = 1e-6 y_samples = infr_pred.run(X=mx.nd.array(Xt, dtype=dtype))[0].asnumpy() - # TODO: Check the correctness of the sampling + def test_sampling_prediction_w_mean(self): + D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() + Xt = np.random.rand(20, 3) + + dtype = 'float64' + m, net = self.gen_mxfusion_model_w_mean( + dtype, D, Z, noise_var, lengthscale, variance) + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + + # noise_free, diagonal + infr_pred = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y], num_samples=5), + 
infr_params=infr.params) + gp = m.Y.factor + gp.attach_prediction_algorithms( + targets=gp.output_names, conditionals=gp.input_names, + algorithm=SparseGPRegressionSamplingPrediction( + gp._module_graph, gp._extra_graphs[0], [gp._module_graph.X]), + alg_name='sgp_predict') + gp.sgp_predict.diagonal_variance = True + gp.sgp_predict.noise_free = False + gp.sgp_predict.jitter = 1e-6 + + y_samples = infr_pred.run(X=mx.nd.array(Xt, dtype=dtype))[0].asnumpy() def test_with_samples(self): from mxfusion.common import config @@ -214,3 +328,13 @@ def test_with_samples(self): infr_pred2 = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y]), infr_params=infr.params) xt = np.random.rand(13, 3) res = infr_pred2.run(X=mx.nd.array(xt, dtype=dtype))[0] + + def test_module_clone(self): + D, X, Y, Z, noise_var, lengthscale, variance = self.gen_data() + dtype = 'float64' + + m = Model() + m.N = Variable() + kernel = RBF(input_dim=3, ARD=True, variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) + m.Y = SparseGPRegression.define_variable(X=mx.nd.zeros((2, 3)), kernel=kernel, noise_var=mx.nd.ones((1,)), dtype=dtype) + m.clone() diff --git a/testing/modules/svgpregression_test.py b/testing/modules/svgpregression_test.py index 416f799..06ce5b8 100644 --- a/testing/modules/svgpregression_test.py +++ b/testing/modules/svgpregression_test.py @@ -16,12 +16,14 @@ import pytest import warnings import mxnet as mx +import mxnet.gluon.nn as nn import numpy as np from mxfusion.models import Model from mxfusion.modules.gp_modules import SVGPRegression from mxfusion.components.distributions.gp.kernels import RBF from mxfusion.components.distributions import Normal from mxfusion.components import Variable +from mxfusion.components.functions import MXFusionGluonFunction from mxfusion.inference import Inference, MAP, ModulePredictionAlgorithm, TransferInference, create_Gaussian_meanfield, 
StochasticVariationalInference, GradBasedInference, ForwardSamplingAlgorithm from mxfusion.components.variables.var_trans import PositiveTransformation from mxfusion.modules.gp_modules.svgp_regression import SVGPRegressionSamplingPrediction @@ -63,8 +65,29 @@ def gen_mxfusion_model(self, dtype, D, Z, noise_var, lengthscale, variance, kernel = RBF(input_dim=3, ARD=True, variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) m.Y = SVGPRegression.define_variable(X=m.X, kernel=kernel, noise_var=m.noise_var, inducing_inputs=m.Z, shape=(m.N, D), dtype=dtype) gp = m.Y.factor + m.Y.factor.svgp_log_pdf.jitter = 1e-8 return m, gp + def gen_mxfusion_model_w_mean(self, dtype, D, Z, noise_var, lengthscale, + variance, rand_gen=None): + net = nn.HybridSequential(prefix='nn_') + with net.name_scope(): + net.add(nn.Dense(D, flatten=False, activation="tanh", + in_units=3, dtype=dtype)) + net.initialize(mx.init.Xavier(magnitude=3)) + + m = Model() + m.N = Variable() + m.X = Variable(shape=(m.N, 3)) + m.Z = Variable(shape=(3, 3), initial_value=mx.nd.array(Z, dtype=dtype)) + m.noise_var = Variable(transformation=PositiveTransformation(), initial_value=mx.nd.array(noise_var, dtype=dtype)) + kernel = RBF(input_dim=3, ARD=True, variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) + m.mean_func = MXFusionGluonFunction(net, num_outputs=1, + broadcastable=True) + m.Y = SVGPRegression.define_variable(X=m.X, kernel=kernel, noise_var=m.noise_var, mean=m.mean_func(m.X), inducing_inputs=m.Z, shape=(m.N, D), dtype=dtype) + gp = m.Y.factor + return m, gp, net + def test_log_pdf(self): D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ qU_cov_W, qU_cov_diag, qU_chol = self.gen_data() @@ -91,6 +114,60 @@ def test_log_pdf(self): assert np.allclose(l_mf.asnumpy(), l_gpy) + def test_log_pdf_w_mean(self): + D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ + qU_cov_W, qU_cov_diag, 
qU_chol = self.gen_data() + dtype = 'float64' + m, gp, net = self.gen_mxfusion_model_w_mean(dtype, D, Z, noise_var, + lengthscale, variance) + mean = net(mx.nd.array(X, dtype=dtype)).asnumpy() + + m_gpy = GPy.core.SVGP(X=X, Y=Y-mean, Z=Z, kernel=GPy.kern.RBF(3, ARD=True, lengthscale=lengthscale, variance=variance), likelihood=GPy.likelihoods.Gaussian(variance=noise_var)) + m_gpy.q_u_mean = qU_mean + m_gpy.q_u_chol = GPy.util.choleskies.triang_to_flat(qU_chol) + + l_gpy = m_gpy.log_likelihood() + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + infr.initialize(X=X.shape, Y=Y.shape) + infr.params[gp._extra_graphs[0].qU_mean] = mx.nd.array(qU_mean, dtype=dtype) + infr.params[gp._extra_graphs[0].qU_cov_W] = mx.nd.array(qU_cov_W, dtype=dtype) + infr.params[gp._extra_graphs[0].qU_cov_diag] = mx.nd.array(qU_cov_diag, dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + l_mf = -loss + + assert np.allclose(l_mf.asnumpy(), l_gpy) + + def test_log_pdf_w_samples_of_noise_var(self): + D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ + qU_cov_W, qU_cov_diag, qU_chol = self.gen_data() + dtype = 'float64' + D = 2 + Y = np.random.rand(10, D) + qU_mean = np.random.rand(3, D) + + m = Model() + m.N = Variable() + m.X = Variable(shape=(m.N, 3)) + m.Z = Variable(shape=(3, 3), initial_value=mx.nd.array(Z, dtype=dtype)) + m.noise_var = Variable(transformation=PositiveTransformation(), shape=(m.N, D)) + kernel = RBF(input_dim=3, ARD=True, variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) + m.Y = SVGPRegression.define_variable(X=m.X, kernel=kernel, noise_var=m.noise_var, inducing_inputs=m.Z, shape=(m.N, D), dtype=dtype) + gp = m.Y.factor + m.Y.factor.svgp_log_pdf.jitter = 1e-8 + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + infr.initialize(X=X.shape, Y=Y.shape) + 
infr.params[gp._extra_graphs[0].qU_mean] = mx.nd.array(qU_mean, dtype=dtype) + infr.params[gp._extra_graphs[0].qU_cov_W] = mx.nd.array(qU_cov_W, dtype=dtype) + infr.params[gp._extra_graphs[0].qU_cov_diag] = mx.nd.array(qU_cov_diag, dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype), max_iter=1) + + def test_prediction(self): D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ qU_cov_W, qU_cov_diag, qU_chol = self.gen_data() @@ -121,7 +198,8 @@ def test_prediction(self): mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] assert np.allclose(mu_gpy, mu_mf), (mu_gpy, mu_mf) - assert np.allclose(var_gpy[:,0], var_mf), (var_gpy[:,0], var_mf) + assert np.allclose(var_gpy, var_mf), (var_gpy, var_mf) + assert var_gpy.shape == var_mf.shape # noisy, diagonal mu_gpy, var_gpy = m_gpy.predict(Xt) @@ -132,9 +210,10 @@ def test_prediction(self): mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] assert np.allclose(mu_gpy, mu_mf), (mu_gpy, mu_mf) - assert np.allclose(var_gpy[:,0], var_mf), (var_gpy[:,0], var_mf) + assert np.allclose(var_gpy, var_mf), (var_gpy, var_mf) + assert var_gpy.shape == var_mf.shape - # TODO: The full covariance matrix prediction with SVGP in GPy may not be correct. Need further investigation. 
+ m.Y.factor.svgp_predict.jitter = 1e-8 # noise_free, full_cov mu_gpy, var_gpy = m_gpy.predict_noiseless(Xt, full_cov=True) @@ -145,10 +224,9 @@ def test_prediction(self): res = infr2.run(X=mx.nd.array(Xt, dtype=dtype))[0] mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] - print(var_gpy.shape, var_mf.shape) - assert np.allclose(mu_gpy, mu_mf), (mu_gpy, mu_mf) - assert np.allclose(var_gpy[:, :, 0], var_mf), (var_gpy[:, :, 0], var_mf) + assert np.allclose(var_gpy, var_mf), (var_gpy, var_mf) + assert var_gpy.shape == var_mf.shape # noisy, full_cov mu_gpy, var_gpy = m_gpy.predict(Xt, full_cov=True) @@ -160,7 +238,55 @@ def test_prediction(self): mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] assert np.allclose(mu_gpy, mu_mf), (mu_gpy, mu_mf) - assert np.allclose(var_gpy[:, :, 0], var_mf), (var_gpy[:, :, 0], var_mf) + assert np.allclose(var_gpy, var_mf), (var_gpy, var_mf) + assert var_gpy.shape == var_mf.shape + + def test_draw_samples(self): + D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ + qU_cov_W, qU_cov_diag, qU_chol = self.gen_data() + dtype = 'float64' + m, gp = self.gen_mxfusion_model(dtype, D, Z, noise_var, lengthscale, + variance) + + observed = [m.X] + infr = Inference(ForwardSamplingAlgorithm( + m, observed, num_samples=2, target_variables=[m.Y]), dtype=dtype) + samples = infr.run(X=mx.nd.array(X, dtype=dtype))[0] + assert samples.shape == (2,) + Y.shape + + def test_prediction_w_mean(self): + D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ + qU_cov_W, qU_cov_diag, qU_chol = self.gen_data() + Xt = np.random.rand(5, 3) + dtype = 'float64' + m, gp, net = self.gen_mxfusion_model_w_mean(dtype, D, Z, noise_var, + lengthscale, variance) + mean = net(mx.nd.array(X, dtype=dtype)).asnumpy() + mean_t = net(mx.nd.array(Xt, dtype=dtype)).asnumpy() + + m_gpy = GPy.core.SVGP(X=X, Y=Y-mean, Z=Z, kernel=GPy.kern.RBF(3, ARD=True, lengthscale=lengthscale, variance=variance), likelihood=GPy.likelihoods.Gaussian(variance=noise_var)) + 
m_gpy.q_u_mean = qU_mean + m_gpy.q_u_chol = GPy.util.choleskies.triang_to_flat(qU_chol) + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + infr.initialize(X=X.shape, Y=Y.shape) + infr.params[gp._extra_graphs[0].qU_mean] = mx.nd.array(qU_mean, dtype=dtype) + infr.params[gp._extra_graphs[0].qU_cov_W] = mx.nd.array(qU_cov_W, dtype=dtype) + infr.params[gp._extra_graphs[0].qU_cov_diag] = mx.nd.array(qU_cov_diag, dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, dtype=dtype)) + + # noise_free, diagonal + mu_gpy, var_gpy = m_gpy.predict_noiseless(Xt) + mu_gpy += mean_t + + infr2 = TransferInference(ModulePredictionAlgorithm(m, observed=[m.X], target_variables=[m.Y]), infr_params=infr.params, dtype=np.float64) + res = infr2.run(X=mx.nd.array(Xt, dtype=dtype))[0] + mu_mf, var_mf = res[0].asnumpy()[0], res[1].asnumpy()[0] + + assert np.allclose(mu_gpy, mu_mf, rtol=1e-04, atol=1e-05), (mu_gpy, mu_mf) + assert np.allclose(var_gpy, var_mf, rtol=1e-04, atol=1e-05), (var_gpy, var_mf) def test_sampling_prediction(self): D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ @@ -194,11 +320,39 @@ def test_sampling_prediction(self): gp._module_graph, gp._extra_graphs[0], [gp._module_graph.X]), alg_name='svgp_predict') gp.svgp_predict.diagonal_variance = False + gp.svgp_predict.noise_free = False gp.svgp_predict.jitter = 1e-6 y_samples = infr_pred.run(X=mx.nd.array(Xt, dtype=dtype))[0].asnumpy() - # TODO: Check the correctness of the sampling + def test_sampling_prediction_w_mean(self): + D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ + qU_cov_W, qU_cov_diag, qU_chol = self.gen_data() + Xt = np.random.rand(20, 3) + + dtype = 'float64' + m, gp, net = self.gen_mxfusion_model_w_mean(dtype, D, Z, noise_var, + lengthscale, variance) + + observed = [m.X, m.Y] + infr = Inference(MAP(model=m, observed=observed), dtype=dtype) + + loss, _ = infr.run(X=mx.nd.array(X, dtype=dtype), Y=mx.nd.array(Y, 
dtype=dtype)) + + # noise_free, diagonal + infr_pred = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y], num_samples=5), + infr_params=infr.params) + gp = m.Y.factor + gp.attach_prediction_algorithms( + targets=gp.output_names, conditionals=gp.input_names, + algorithm=SVGPRegressionSamplingPrediction( + gp._module_graph, gp._extra_graphs[0], [gp._module_graph.X]), + alg_name='svgp_predict') + gp.svgp_predict.diagonal_variance = True + gp.svgp_predict.noise_free = False + gp.svgp_predict.jitter = 1e-6 + + y_samples = infr_pred.run(X=mx.nd.array(Xt, dtype=dtype))[0].asnumpy() def test_with_samples(self): from mxfusion.common import config @@ -250,3 +404,15 @@ def test_with_samples(self): infr_pred2 = TransferInference(ModulePredictionAlgorithm(model=m, observed=[m.X], target_variables=[m.Y]), infr_params=infr.params) xt = np.random.rand(13, 3) res = infr_pred2.run(X=mx.nd.array(xt, dtype=dtype))[0] + + def test_module_clone(self): + D, X, Y, Z, noise_var, lengthscale, variance, qU_mean, \ + qU_cov_W, qU_cov_diag, qU_chol = self.gen_data() + dtype = 'float64' + + m = Model() + m.N = Variable() + m.X = Variable(shape=(m.N, 3)) + kernel = RBF(input_dim=3, ARD=True, variance=mx.nd.array(variance, dtype=dtype), lengthscale=mx.nd.array(lengthscale, dtype=dtype), dtype=dtype) + m.Y = SVGPRegression.define_variable(X=mx.nd.zeros((2, 3)), kernel=kernel, noise_var=mx.nd.ones((1,)), dtype=dtype) + m.clone() diff --git a/testing/util/special_test.py b/testing/util/special_test.py index 7b4822c..7a8cf7f 100644 --- a/testing/util/special_test.py +++ b/testing/util/special_test.py @@ -17,12 +17,11 @@ import mxnet as mx import numpy as np from mxfusion.util.special import log_determinant, log_multivariate_gamma -from sklearn.datasets import make_spd_matrix +from mxfusion.util.testutils import make_spd_matrix from itertools import product from scipy.special import multigammaln -# @pytest.mark.usefixtures("set_seed") class 
TestSpecialFunctions: """ Tests special functions. @@ -31,7 +30,8 @@ class TestSpecialFunctions: @pytest.mark.parametrize("n_dim, random_state", list(product((10, 100, 1000), range(1, 4)))) def test_log_determinant(self, n_dim, random_state): - A = make_spd_matrix(n_dim=n_dim, random_state=random_state) + np.random.seed(random_state) + A = make_spd_matrix(dim=n_dim) assert all(np.linalg.eigvals(A) > 0) a = mx.nd.array(A)