{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "cae56ed1-f6f4-48f3-ae53-b85d721e8b68", "metadata": { "execution": { "iopub.execute_input": "2025-12-10T19:32:13.782702Z", "iopub.status.busy": "2025-12-10T19:32:13.782510Z", "iopub.status.idle": "2025-12-10T19:32:15.268831Z", "shell.execute_reply": "2025-12-10T19:32:15.268350Z", "shell.execute_reply.started": "2025-12-10T19:32:13.782687Z" } }, "outputs": [], "source": [ "from sklearn.datasets import fetch_openml\n", "dataset = fetch_openml(\"higgs\", version=2)" ] }, { "cell_type": "markdown", "id": "1abade28-4644-4ee2-95fe-7a24cc060294", "metadata": {}, "source": [ "# Examine" ] }, { "cell_type": "code", "execution_count": 2, "id": "c6cce885-516c-4f6b-a4d7-910182c53da4", "metadata": { "execution": { "iopub.execute_input": "2025-12-10T19:32:15.272358Z", "iopub.status.busy": "2025-12-10T19:32:15.272252Z", "iopub.status.idle": "2025-12-10T19:32:15.290262Z", "shell.execute_reply": "2025-12-10T19:32:15.289806Z", "shell.execute_reply.started": "2025-12-10T19:32:15.272345Z" } }, "outputs": [ { "data": { "text/html": [ "
| \n", " | lepton_pT | \n", "lepton_eta | \n", "lepton_phi | \n", "missing_energy_magnitude | \n", "missing_energy_phi | \n", "jet1pt | \n", "jet1eta | \n", "jet1phi | \n", "jet1b-tag | \n", "jet2pt | \n", "... | \n", "jet4eta | \n", "jet4phi | \n", "jet4b-tag | \n", "m_jj | \n", "m_jjj | \n", "m_lv | \n", "m_jlv | \n", "m_bb | \n", "m_wbb | \n", "m_wwbb | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "0.907542 | \n", "0.329147 | \n", "0.359412 | \n", "1.497970 | \n", "-0.313010 | \n", "1.095531 | \n", "-0.557525 | \n", "-1.588230 | \n", "2.173076 | \n", "0.812581 | \n", "... | \n", "-1.138930 | \n", "-0.000819 | \n", "0.000000 | \n", "0.302220 | \n", "0.833048 | \n", "0.985700 | \n", "0.978098 | \n", "0.779732 | \n", "0.992356 | \n", "0.798343 | \n", "
| 1 | \n", "0.798835 | \n", "1.470639 | \n", "-1.635975 | \n", "0.453773 | \n", "0.425629 | \n", "1.104875 | \n", "1.282322 | \n", "1.381664 | \n", "0.000000 | \n", "0.851737 | \n", "... | \n", "1.128848 | \n", "0.900461 | \n", "0.000000 | \n", "0.909753 | \n", "1.108330 | \n", "0.985692 | \n", "0.951331 | \n", "0.803252 | \n", "0.865924 | \n", "0.780118 | \n", "
| 2 | \n", "1.344385 | \n", "-0.876626 | \n", "0.935913 | \n", "1.992050 | \n", "0.882454 | \n", "1.786066 | \n", "-1.646778 | \n", "-0.942383 | \n", "0.000000 | \n", "2.423265 | \n", "... | \n", "-0.678379 | \n", "-1.360356 | \n", "0.000000 | \n", "0.946652 | \n", "1.028704 | \n", "0.998656 | \n", "0.728281 | \n", "0.869200 | \n", "1.026736 | \n", "0.957904 | \n", "
| 3 | \n", "1.105009 | \n", "0.321356 | \n", "1.522401 | \n", "0.882808 | \n", "-1.205349 | \n", "0.681466 | \n", "-1.070464 | \n", "-0.921871 | \n", "0.000000 | \n", "0.800872 | \n", "... | \n", "-0.373566 | \n", "0.113041 | \n", "0.000000 | \n", "0.755856 | \n", "1.361057 | \n", "0.986610 | \n", "0.838085 | \n", "1.133295 | \n", "0.872245 | \n", "0.808487 | \n", "
| 4 | \n", "1.595839 | \n", "-0.607811 | \n", "0.007075 | \n", "1.818450 | \n", "-0.111906 | \n", "0.847550 | \n", "-0.566437 | \n", "1.581239 | \n", "2.173076 | \n", "0.755421 | \n", "... | \n", "-0.654227 | \n", "-1.274345 | \n", "3.101961 | \n", "0.823761 | \n", "0.938191 | \n", "0.971758 | \n", "0.789176 | \n", "0.430553 | \n", "0.961357 | \n", "0.957818 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 98045 | \n", "0.908091 | \n", "-0.825006 | \n", "-0.830871 | \n", "0.736298 | \n", "1.512713 | \n", "0.881811 | \n", "-0.363440 | \n", "0.006813 | \n", "1.086538 | \n", "0.763227 | \n", "... | \n", "-0.187013 | \n", "0.716785 | \n", "0.000000 | \n", "1.317681 | \n", "1.010795 | \n", "0.985962 | \n", "0.957878 | \n", "1.454672 | \n", "0.903937 | \n", "0.786069 | \n", "
| 98046 | \n", "2.512898 | \n", "0.530759 | \n", "-1.470626 | \n", "1.641798 | \n", "1.613386 | \n", "0.934027 | \n", "1.521958 | \n", "-0.049836 | \n", "0.000000 | \n", "1.029891 | \n", "... | \n", "0.053673 | \n", "-0.386483 | \n", "0.000000 | \n", "0.774413 | \n", "0.745263 | \n", "0.997088 | \n", "1.392387 | \n", "0.864681 | \n", "1.179783 | \n", "1.086167 | \n", "
| 98047 | \n", "0.903699 | \n", "0.261943 | \n", "-0.429149 | \n", "1.892855 | \n", "0.313687 | \n", "0.493396 | \n", "-1.494282 | \n", "-1.458506 | \n", "0.000000 | \n", "0.575505 | \n", "... | \n", "-0.283621 | \n", "1.110772 | \n", "3.101961 | \n", "0.527038 | \n", "0.607263 | \n", "1.125286 | \n", "0.634106 | \n", "0.115543 | \n", "0.425828 | \n", "0.692506 | \n", "
| 98048 | \n", "0.566047 | \n", "-0.317568 | \n", "0.062561 | \n", "0.358186 | \n", "-1.315823 | \n", "0.691176 | \n", "1.154583 | \n", "-0.242759 | \n", "2.173076 | \n", "0.680634 | \n", "... | \n", "-0.844943 | \n", "-0.294922 | \n", "0.000000 | \n", "0.747239 | \n", "1.008975 | \n", "0.989497 | \n", "1.203147 | \n", "0.892492 | \n", "1.090807 | \n", "0.888965 | \n", "
| 98049 | \n", "0.708611 | \n", "1.190136 | \n", "0.593008 | \n", "1.899366 | \n", "-0.111872 | \n", "0.871276 | \n", "0.982283 | \n", "-1.684691 | \n", "2.173076 | \n", "0.653187 | \n", "... | \n", "1.797605 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "
98050 rows × 28 columns
\n", "LogisticRegression()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
| \n", " | penalty | \n", "'l2' | \n", "
| \n", " | dual | \n", "False | \n", "
| \n", " | tol | \n", "0.0001 | \n", "
| \n", " | C | \n", "1.0 | \n", "
| \n", " | fit_intercept | \n", "True | \n", "
| \n", " | intercept_scaling | \n", "1 | \n", "
| \n", " | class_weight | \n", "None | \n", "
| \n", " | random_state | \n", "None | \n", "
| \n", " | solver | \n", "'lbfgs' | \n", "
| \n", " | max_iter | \n", "100 | \n", "
| \n", " | multi_class | \n", "'deprecated' | \n", "
| \n", " | verbose | \n", "0 | \n", "
| \n", " | warm_start | \n", "False | \n", "
| \n", " | n_jobs | \n", "None | \n", "
| \n", " | l1_ratio | \n", "None | \n", "