Not adding or removing semicolons

eli-b · eli-b · commit a1b9d3788bc3 · 2014-03-08T15:39:12.000+02:00
diff --git a/Chapter5_LossFunctions/LossFunctions.ipynb b/Chapter5_LossFunctions/LossFunctions.ipynb
@@ -254,13 +254,13 @@
       "\n",
       "@pm.potential\n",
       "def error(true_price=true_price, price_estimate=price_estimate):\n",
-      "    return pm.normal_like(true_price, price_estimate, 1 / (3e3) ** 2)\n",
+      "    return pm.normal_like(true_price, price_estimate, 1 / (3e3) ** 2)\n",
       "\n",
       "\n",
       "mcmc = pm.MCMC([true_price, prize_1, prize_2, price_estimate, error])\n",
       "mcmc.sample(50000, 10000)\n",
       "\n",
-      "price_trace = mcmc.trace(\"true_price\")[:];"
+      "price_trace = mcmc.trace(\"true_price\")[:]"
      ],
      "language": "python",
      "metadata": {},
@@ -299,8 +299,9 @@
       "plt.title(\"Posterior of the true price estimate\")\n",
       "plt.vlines(mu_prior, 0, 1.1 * np.max(_hist[0]), label=\"prior's mean\",\n",
       "           linestyles=\"--\")\n",
-      "plt.vlines(price_trace.mean(), 0, 1.1 * np.max(_hist[0]), label=\"posterior's mean\", linestyles=\"-.\")\n",
-      "plt.legend(loc=\"upper left\");"
+      "plt.vlines(price_trace.mean(), 0, 1.1 * np.max(_hist[0]),\n",
+      "           label=\"posterior's mean\", linestyles=\"-.\")\n",
+      "plt.legend(loc=\"upper left\");"
      ],
      "language": "python",
      "metadata": {},
@@ -361,23 +362,26 @@
       "\n",
       "\n",
       "def showdown_loss(guess, true_price, risk=80000):\n",
-      "    loss = np.zeros_like(true_price)\n",
-      "    ix = true_price < guess\n",
-      "    loss[~ix] = np.abs(guess - true_price[~ix])\n",
-      "    close_mask = [abs(true_price - guess) <= 250]\n",
-      "    loss[close_mask] = -2 * true_price[close_mask]\n",
-      "    loss[ix] = risk\n",
-      "    return loss\n",
+      "    loss = np.zeros_like(true_price)\n",
+      "    ix = true_price < guess\n",
+      "    loss[~ix] = np.abs(guess - true_price[~ix])\n",
+      "    close_mask = abs(true_price - guess) <= 250  # plain boolean mask\n",
+      "    loss[close_mask] = -2 * true_price[close_mask]\n",
+      "    loss[ix] = risk\n",
+      "    return loss\n",
+      "\n",
       "\n",
       "guesses = np.linspace(5000, 50000, 70)\n",
       "risks = np.linspace(30000, 150000, 6)\n",
-      "expected_loss = lambda guess, risk: showdown_loss(guess, price_trace, risk).mean()\n",
+      "expected_loss = lambda guess, risk: \\\n",
+      "    showdown_loss(guess, price_trace, risk).mean()\n",
       "\n",
       "for _p in risks:\n",
       "    results = [expected_loss(_g, _p) for _g in guesses]\n",
       "    plt.plot(guesses, results, label=\"%d\" % _p)\n",
       "\n",
-      "plt.title(\"Expected loss of different guesses, \\nvarious risk-levels of overestimating\")\n",
+      "plt.title(\"Expected loss of different guesses, \\nvarious risk-levels of \"\n",
+      "          \"overestimating\")\n",
       "plt.legend(loc=\"upper left\", title=\"Risk parameter\")\n",
       "plt.xlabel(\"price bid\")\n",
       "plt.ylabel(\"expected loss\")\n",
@@ -420,21 +424,24 @@
       "\n",
       "ax = plt.subplot(111)\n",
       "\n",
+      "\n",
       "for _p in risks:\n",
       "    _color = ax._get_lines.color_cycle.next()\n",
       "    _min_results = sop.fmin(expected_loss, 15000, args=(_p,), disp=False)\n",
       "    _results = [expected_loss(_g, _p) for _g in guesses]\n",
       "    plt.plot(guesses, _results, color=_color)\n",
-      "    plt.scatter(_min_results, 0, s=60, color=_color, label=\"%d\" % _p)\n",
+      "    plt.scatter(_min_results, 0, s=60,\n",
+      "                color=_color, label=\"%d\" % _p)\n",
       "    plt.vlines(_min_results, 0, 120000, color=_color, linestyles=\"--\")\n",
       "    print \"minimum at risk %d: %.2f\" % (_p, _min_results)\n",
       "\n",
-      "plt.title(\"Expected loss & Bayes actions of different guesses, \\n various risk-levels of overestimating\")\n",
+      "plt.title(\"Expected loss & Bayes actions of different guesses, \\n \"\n",
+      "          \"various risk-levels of overestimating\")\n",
       "plt.legend(loc=\"upper left\", scatterpoints=1, title=\"Bayes action at risk:\")\n",
       "plt.xlabel(\"price guess\")\n",
       "plt.ylabel(\"expected loss\")\n",
       "plt.xlim(7000, 30000)\n",
-      "plt.ylim(-1000, 80000);"
+      "plt.ylim(-1000, 80000);"
      ],
      "language": "python",
      "metadata": {},
@@ -575,15 +582,18 @@
       "\n",
       "def stock_loss(true_return, yhat, alpha=100.):\n",
       "    if true_return * yhat < 0:\n",
-      "    # opposite signs, not good\n",
-      "        return alpha * yhat ** 2 - np.sign(true_return) * yhat + abs(true_return)\n",
+      "        # opposite signs, not good\n",
+      "        return alpha * yhat ** 2 - np.sign(true_return) * yhat \\\n",
+      "            + abs(true_return)\n",
       "    else:\n",
       "        return abs(true_return - yhat)\n",
       "\n",
+      "\n",
       "true_value = .05\n",
       "pred = np.linspace(-.04, .12, 75)\n",
       "\n",
-      "plt.plot(pred, [stock_loss(true_value, _p) for _p in pred], label=\"Loss associated with\\n prediction if true value=0.05\", lw=3)\n",
+      "plt.plot(pred, [stock_loss(true_value, _p) for _p in pred],\n",
+      "         label=\"Loss associated with\\n prediction if true value = 0.05\", lw=3)\n",
       "plt.vlines(0, 0, .25, linestyles=\"--\")\n",
       "\n",
       "plt.xlabel(\"prediction\")\n",
@@ -592,9 +602,10 @@
       "plt.ylim(0, 0.25)\n",
       "\n",
       "true_value = -.02\n",
-      "plt.plot(pred, [stock_loss(true_value, _p) for _p in pred], alpha=0.6, label=\"Loss associated with\\n prediction if true value=-0.02\", lw=3)\n",
+      "plt.plot(pred, [stock_loss(true_value, _p) for _p in pred], alpha=0.6,\n",
+      "         label=\"Loss associated with\\n prediction if true value = -0.02\", lw=3)\n",
       "plt.legend()\n",
-      "plt.title(\"Stock returns loss if true value=0.05, -0.02\");"
+      "plt.title(\"Stock returns loss if true value = 0.05, -0.02\");"
      ],
      "language": "python",
      "metadata": {},
@@ -695,7 +706,7 @@
       "mcmc = pm.MCMC([obs, beta, alpha, std, prec])\n",
       "\n",
       "mcmc.sample(100000, 80000)\n",
-      "mcplot(mcmc);"
+      "mcplot(mcmc)"
      ],
      "language": "python",
      "metadata": {},
@@ -800,7 +811,8 @@
       "\n",
       "noise = 1. / np.sqrt(tau_samples) * np.random.randn(N)\n",
       "\n",
-      "possible_outcomes = lambda signal: alpha_samples + beta_samples * signal + noise\n",
+      "possible_outcomes = lambda signal: alpha_samples + beta_samples * signal \\\n",
+      "    + noise\n",
       "\n",
       "\n",
       "opt_predictions = np.zeros(50)\n",
@@ -894,11 +906,12 @@
       "from draw_sky2 import draw_sky\n",
       "\n",
       "n_sky = 3  # choose a file/sky to examine.\n",
-      "data = np.genfromtxt(\"data/Train_Skies/Train_Skies/Training_Sky%d.csv\" % (n_sky),\n",
-      "                     dtype=None,\n",
-      "                     skip_header=1,\n",
-      "                     delimiter=\",\",\n",
-      "                     usecols=[1, 2, 3, 4])\n",
+      "data = np.genfromtxt(\"data/Train_Skies/Train_Skies/\"\n",
+      "                     \"Training_Sky%d.csv\" % (n_sky),\n",
+      "                     dtype=None,\n",
+      "                     skip_header=1,\n",
+      "                     delimiter=\",\",\n",
+      "                     usecols=[1, 2, 3, 4])\n",
       "print \"Data on galaxies in sky %d.\" % n_sky\n",
       "print \"position_x, position_y, e_1, e_2 \"\n",
       "print data[:3]\n",
@@ -952,10 +965,10 @@
       "\n",
       "and in PyMC, \n",
       "\n",
-      "    exp_mass_large = pm.Uniform( \"exp_mass_large\", 40, 180)\n",
+      "    exp_mass_large = pm.Uniform(\"exp_mass_large\", 40, 180)\n",
       "    @pm.deterministic\n",
       "    def mass_large(u = exp_mass_large):\n",
-      "       return np.log( u )\n",
+      "       return np.log(u)\n",
       "\n",
       "(This is what we mean when we say *log*-uniform.) For smaller galaxies, Tim set the mass to be the logarithm of 20. Why did Tim not create a prior for the smaller mass, nor treat it as a unknown? I believe this decision was made to speed up convergence of the algorithm. This is not too restrictive, as by construction the smaller halos have less influence on the galaxies.\n",
       "\n",
@@ -1013,7 +1026,8 @@
       "\n",
       "@pm.deterministic\n",
       "def mean(mass=mass_large, h_pos=halo_position, glx_pos=data[:, :2]):\n",
-      "    return mass / f_distance(glx_pos, h_pos, 240) * tangential_distance(glx_pos, h_pos);"
+      "    return mass / f_distance(glx_pos, h_pos, 240) *\\\n",
+      "        tangential_distance(glx_pos, h_pos)"
      ],
      "language": "python",
      "metadata": {},
@@ -1029,7 +1043,7 @@
       "mcmc = pm.MCMC([ellpty, mean, halo_position, mass_large])\n",
       "map_ = pm.MAP([ellpty, mean, halo_position, mass_large])\n",
       "map_.fit()\n",
-      "mcmc.sample(200000, 140000, 3);"
+      "mcmc.sample(200000, 140000, 3)"
      ],
      "language": "python",
      "metadata": {},
@@ -1101,7 +1115,7 @@
       "                          delimiter=\",\",\n",
       "                          usecols=[1, 2, 3, 4, 5, 6, 7, 8, 9],\n",
       "                          skip_header=1)\n",
-      "print halo_data[n_sky];"
+      "print halo_data[n_sky]"
      ],
      "language": "python",
      "metadata": {},
@@ -1139,9 +1153,9 @@
       "            c=\"k\", s=70)\n",
       "plt.legend(scatterpoints=1, loc=\"lower left\")\n",
       "plt.xlim(0, 4200)\n",
-      "plt.ylim(0, 4200)\n",
+      "plt.ylim(0, 4200)\n",
       "\n",
-      "print \"True halo location:\", halo_data[n_sky][3], halo_data[n_sky][4];"
+      "print \"True halo location:\", halo_data[n_sky][3], halo_data[n_sky][4]"
      ],
      "language": "python",
      "metadata": {},
@@ -1173,7 +1187,7 @@
      "collapsed": false,
      "input": [
       "mean_posterior = t.mean(axis=0).reshape(1, 2)\n",
-      "print mean_posterior;"
+      "print mean_posterior"
      ],
      "language": "python",
      "metadata": {},
@@ -1204,14 +1218,16 @@
       "sky_prediction = mean_posterior\n",
       "\n",
       "print \"Using the mean:\"\n",
-      "main_score(nhalo_all, x_true_all, y_true_all, x_ref_all, y_ref_all, sky_prediction)\n",
+      "main_score(nhalo_all, x_true_all, y_true_all,\n",
+      "           x_ref_all, y_ref_all, sky_prediction)\n",
       "\n",
       "# what's a bad score?\n",
       "print\n",
       "random_guess = np.random.randint(0, 4200, size=(1, 2))\n",
       "print \"Using a random location:\", random_guess\n",
-      "main_score(nhalo_all, x_true_all, y_true_all, x_ref_all, y_ref_all, random_guess)\n",
-      "print;"
+      "main_score(nhalo_all, x_true_all, y_true_all,\n",
+      "           x_ref_all, y_ref_all, random_guess)\n",
+      "print"
      ],
      "language": "python",
      "metadata": {},
@@ -1298,7 +1314,8 @@
       "\n",
       "        _sum = 0\n",
       "        for i in range(n_halos_in_sky):\n",
-      "            _sum += mass[i] / f_distance(glx_pos, h_pos[i, :], fdist_constants[i]) * tangential_distance(glx_pos, h_pos[i, :])\n",
+      "            _sum += mass[i] / f_distance(glx_pos, h_pos[i, :], fdist_constants[i]) *\\\n",
+      "                tangential_distance(glx_pos, h_pos[i, :])\n",
       "\n",
       "        return _sum\n",
       "\n",
@@ -1310,7 +1327,7 @@
       "\n",
       "    mcmc = pm.MCMC([ellpty, mean, halo_positions, mass_large])\n",
       "    mcmc.sample(samples, burn_in, thin)\n",
-      "    return mcmc.trace(\"halo_positions\")[:];"
+      "    return mcmc.trace(\"halo_positions\")[:]"
      ],
      "language": "python",
      "metadata": {},
@@ -1322,11 +1339,12 @@
      "collapsed": false,
      "input": [
       "n_sky = 215\n",
-      "data = np.genfromtxt(\"data/Train_Skies/Train_Skies/Training_Sky%d.csv\" % (n_sky),\n",
-      "                     dtype=None,\n",
-      "                     skip_header=1,\n",
-      "                     delimiter=\",\",\n",
-      "                     usecols=[1, 2, 3, 4]);"
+      "data = np.genfromtxt(\"data/Train_Skies/Train_Skies/\"\n",
+      "                     \"Training_Sky%d.csv\" % (n_sky),\n",
+      "                     dtype=None,\n",
+      "                     skip_header=1,\n",
+      "                     delimiter=\",\",\n",
+      "                     usecols=[1, 2, 3, 4])"
      ],
      "language": "python",
      "metadata": {},
@@ -1341,7 +1359,7 @@
       "samples = 10.5e5\n",
       "traces = halo_posteriors(3, data, samples=samples,\n",
       "                         burn_in=9.5e5,\n",
-      "                         thin=10);"
+      "                         thin=10)"
      ],
      "language": "python",
      "metadata": {},
@@ -1368,6 +1386,7 @@
      "cell_type": "code",
      "collapsed": false,
      "input": [
+      "\n",
       "fig = draw_sky(data)\n",
       "plt.title(\"Galaxy positions and ellipcities of sky %d.\" % n_sky)\n",
       "plt.xlabel(\"x-position\")\n",
@@ -1384,7 +1403,7 @@
       "                label=\"True halo position\",\n",
       "                c=\"k\", s=90)\n",
       "\n",
-      "# plt.legend(scatterpoints=1)\n",
+      "# plt.legend(scatterpoints = 1)\n",
       "plt.xlim(0, 4200)\n",
       "plt.ylim(0, 4200);"
      ],
@@ -1424,22 +1443,26 @@
       "mean_posterior = traces.mean(axis=0).reshape(1, 4)\n",
       "print mean_posterior\n",
       "\n",
+      "\n",
       "nhalo_all = _halo_data[0].reshape(1, 1)\n",
       "x_true_all = _halo_data[3].reshape(1, 1)\n",
       "y_true_all = _halo_data[4].reshape(1, 1)\n",
       "x_ref_all = _halo_data[1].reshape(1, 1)\n",
       "y_ref_all = _halo_data[2].reshape(1, 1)\n",
       "sky_prediction = mean_posterior\n",
       "\n",
+      "\n",
       "print \"Using the mean:\"\n",
-      "main_score([1], x_true_all, y_true_all, x_ref_all, y_ref_all, sky_prediction)\n",
+      "main_score([1], x_true_all, y_true_all,\n",
+      "           x_ref_all, y_ref_all, sky_prediction)\n",
       "\n",
       "# what's a bad score?\n",
       "print\n",
       "random_guess = np.random.randint(0, 4200, size=(1, 2))\n",
       "print \"Using a random location:\", random_guess\n",
-      "main_score([1], x_true_all, y_true_all, x_ref_all, y_ref_all, random_guess)\n",
-      "print;"
+      "main_score([1], x_true_all, y_true_all,\n",
+      "           x_ref_all, y_ref_all, random_guess)\n",
+      "print"
      ],
      "language": "python",
      "metadata": {},
@@ -1519,7 +1542,7 @@
       "def css_styling():\n",
       "    styles = open(\"../styles/custom.css\", \"r\").read()\n",
       "    return HTML(styles)\n",
-      "css_styling();"
+      "css_styling()"
      ],
      "language": "python",
      "metadata": {},