Skip to content

Commit bafa98d

Browse files
Merge pull request #17 from UnravelSports/feat/pressing-intensity
Feat/pressing intensity
2 parents 7359b4a + d37dd4d commit bafa98d

File tree

6 files changed

+253
-117
lines changed

6 files changed

+253
-117
lines changed

README.md

Lines changed: 11 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -30,18 +30,21 @@ This package currently supports:
3030
```python
3131
from unravel.soccer import KloppyPolarsDataset
3232

33-
from kloppy import skillcorner
33+
from kloppy import sportec
3434

35-
kloppy_dataset = skillcorner.load_open_data(
36-
match_id=2068,
37-
include_empty_frames=False,
38-
limit=500,
39-
)
35+
kloppy_dataset = sportec.load_open_tracking_data()
4036
kloppy_polars_dataset = KloppyPolarsDataset(
41-
kloppy_dataset=kloppy_dataset,
42-
ball_carrier_threshold=25.0
37+
kloppy_dataset=kloppy_dataset
4338
)
4439
```
40+
| | period_id | timestamp | frame_id | ball_state | id | x | y | z | team_id | position_name | game_id | vx | vy | vz | v | ax | ay | az | a | ball_owning_team_id | is_ball_carrier |
41+
|---:|------------:|:----------------|-----------:|:-------------|:---------------|-------:|------:|----:|:---------------|:----------------|:---------------|-------:|-------:|-----:|------:|-----:|-----:|-----:|----:|:----------------------|:------------------|
42+
| 0 | 1 | 0 days 00:00:00 | 10000 | alive | DFL-OBJ-00008F | -20.67 | -4.56 | 0 | DFL-CLU-000005 | RCB | DFL-MAT-J03WPY | 0.393 | -0.214 | 0 | 0.447 | 0 | 0 | 0 | 0 | DFL-CLU-00000P | False |
43+
| 1 | 1 | 0 days 00:00:00 | 10000 | alive | DFL-OBJ-0000EJ | -8.86 | -0.94 | 0 | DFL-CLU-000005 | UNK | DFL-MAT-J03WPY | -0.009 | 0.018 | 0 | 0.02 | 0 | 0 | 0 | 0 | DFL-CLU-00000P | False |
44+
| 2 | 1 | 0 days 00:00:00 | 10000 | alive | DFL-OBJ-0000F8 | -2.12 | 9.85 | 0 | DFL-CLU-00000P | RM | DFL-MAT-J03WPY | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | DFL-CLU-00000P | False |
45+
| 3 | 1 | 0 days 00:00:00 | 10000 | alive | DFL-OBJ-0000NZ | 0.57 | 23.23 | 0 | DFL-CLU-00000P | RB | DFL-MAT-J03WPY | 0.179 | -0.134 | 0 | 0.223 | 0 | 0 | 0 | 0 | DFL-CLU-00000P | False |
46+
| 4 | 1 | 0 days 00:00:00 | 10000 | alive | DFL-OBJ-0001HW | -46.26 | 0.08 | 0 | DFL-CLU-000005 | GK | DFL-MAT-J03WPY | 0.357 | 0.071 | 0 | 0.364 | 0 | 0 | 0 | 0 | DFL-CLU-00000P | False |
47+
4548

4649
$^1$ <small>Open data available through kloppy.</small>
4750

@@ -67,8 +70,6 @@ bdb = BigDataBowlDataset(
6770
```python
6871
converter = SoccerGraphConverterPolars(
6972
dataset=kloppy_polars_dataset,
70-
max_player_speed=12.0,
71-
max_ball_speed=28.0,
7273
self_loop_ball=True,
7374
adjacency_matrix_connect_type="ball",
7475
adjacency_matrix_type="split_by_team",

examples/0_quick_start_guide.ipynb

Lines changed: 125 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -36,9 +36,20 @@
3636
},
3737
{
3838
"cell_type": "code",
39-
"execution_count": null,
39+
"execution_count": 1,
4040
"metadata": {},
41-
"outputs": [],
41+
"outputs": [
42+
{
43+
"name": "stdout",
44+
"output_type": "stream",
45+
"text": [
46+
"\n",
47+
"\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m24.2\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m25.0.1\u001b[0m\n",
48+
"\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n",
49+
"Note: you may need to restart the kernel to use updated packages.\n"
50+
]
51+
}
52+
],
4253
"source": [
4354
"%pip install unravelsports --quiet"
4455
]
@@ -51,35 +62,32 @@
5162
"\n",
5263
"1. Load [Kloppy](https://github.com/PySport/kloppy) dataset. \n",
5364
"    See [in-depth Tutorial](1_kloppy_gnn_train.ipynb) on how to process multiple match files, and to see an overview of all possible settings.\n",
54-
"2. Convert to Graph format using `SoccerGraphConverter`\n",
65+
"2. Convert to Graph format using `SoccerGraphConverterPolars`\n",
5566
"3. Create dataset for easy processing with [Spektral](https://graphneural.network/) using `CustomSpektralDataset`"
5667
]
5768
},
5869
{
5970
"cell_type": "code",
60-
"execution_count": null,
71+
"execution_count": 2,
6172
"metadata": {},
6273
"outputs": [],
6374
"source": [
64-
"from unravel.soccer import SoccerGraphConverter\n",
75+
"from unravel.soccer import SoccerGraphConverterPolars, KloppyPolarsDataset\n",
6576
"from unravel.utils import CustomSpektralDataset\n",
6677
"\n",
67-
"from kloppy import skillcorner\n",
68-
"\n",
69-
"from unravel.utils import dummy_labels\n",
78+
"from kloppy import sportec\n",
7079
"\n",
7180
"# Load Kloppy dataset\n",
72-
"kloppy_dataset = skillcorner.load_open_data(\n",
73-
" match_id=4039,\n",
74-
" include_empty_frames=False,\n",
75-
" limit=500, # limit to 500 frames in this example\n",
81+
"kloppy_dataset = sportec.load_open_tracking_data(only_alive=True, limit=500)\n",
82+
"kloppy_polars_dataset = KloppyPolarsDataset(\n",
83+
" kloppy_dataset=kloppy_dataset,\n",
7684
")\n",
85+
"kloppy_polars_dataset.add_dummy_labels()\n",
86+
"kloppy_polars_dataset.add_graph_ids(by=[\"frame_id\"])\n",
7787
"\n",
78-
"# Initialize the Graph Converter, with dataset and labels\n",
88+
"# Initialize the Graph Converter with dataset\n",
7989
"# Here we use the default settings\n",
80-
"converter = SoccerGraphConverter(\n",
81-
" dataset=kloppy_dataset, labels=dummy_labels(kloppy_dataset)\n",
82-
")\n",
90+
"converter = SoccerGraphConverterPolars(dataset=kloppy_polars_dataset)\n",
8391
"\n",
8492
"# Compute the graphs and add them to the CustomSpektralDataset\n",
8593
"dataset = CustomSpektralDataset(graphs=converter.to_spektral_graphs())"
@@ -96,14 +104,14 @@
96104
},
97105
{
98106
"cell_type": "code",
99-
"execution_count": null,
107+
"execution_count": 3,
100108
"metadata": {},
101109
"outputs": [],
102110
"source": [
103111
"from spektral.data import DisjointLoader\n",
104112
"\n",
105113
"train, test, val = dataset.split_test_train_validation(\n",
106-
" split_train=4, split_test=1, split_validation=1, random_seed=42\n",
114+
" split_train=4, split_test=1, split_validation=1, random_seed=43\n",
107115
")"
108116
]
109117
},
@@ -121,9 +129,17 @@
121129
},
122130
{
123131
"cell_type": "code",
124-
"execution_count": null,
132+
"execution_count": 4,
125133
"metadata": {},
126-
"outputs": [],
134+
"outputs": [
135+
{
136+
"name": "stderr",
137+
"output_type": "stream",
138+
"text": [
139+
"WARNING:absl:At this time, the v2.11+ optimizer `tf.keras.optimizers.Adam` runs slowly on M1/M2 Macs, please use the legacy Keras optimizer instead, located at `tf.keras.optimizers.legacy.Adam`.\n"
140+
]
141+
}
142+
],
127143
"source": [
128144
"from unravel.classifiers import CrystalGraphClassifier\n",
129145
"\n",
@@ -150,9 +166,74 @@
150166
},
151167
{
152168
"cell_type": "code",
153-
"execution_count": null,
169+
"execution_count": 5,
154170
"metadata": {},
155-
"outputs": [],
171+
"outputs": [
172+
{
173+
"name": "stdout",
174+
"output_type": "stream",
175+
"text": [
176+
"Epoch 1/10\n"
177+
]
178+
},
179+
{
180+
"name": "stderr",
181+
"output_type": "stream",
182+
"text": [
183+
"/Users/jbekkers/PycharmProjects/unravelsports/.venv311/lib/python3.11/site-packages/keras/src/initializers/initializers.py:120: UserWarning: The initializer GlorotUniform is unseeded and being called multiple times, which will return identical values each time (even if the initializer is unseeded). Please update your code to provide a seed to the initializer, or avoid using the same initializer instance more than once.\n",
184+
" warnings.warn(\n"
185+
]
186+
},
187+
{
188+
"name": "stdout",
189+
"output_type": "stream",
190+
"text": [
191+
"11/11 [==============================] - 1s 16ms/step - loss: 21.7806 - auc: 0.5278 - binary_accuracy: 0.5419 - val_loss: 5.1682 - val_auc: 0.5000 - val_binary_accuracy: 0.5000\n",
192+
"Epoch 2/10\n",
193+
" 1/11 [=>............................] - ETA: 0s - loss: 9.2846 - auc: 0.3651 - binary_accuracy: 0.5000WARNING:tensorflow:Your input ran out of data; interrupting training. Make sure that your dataset or generator can generate at least `steps_per_epoch * epochs` batches (in this case, 3 batches). You may need to use the repeat() function when building your dataset.\n"
194+
]
195+
},
196+
{
197+
"name": "stderr",
198+
"output_type": "stream",
199+
"text": [
200+
"WARNING:tensorflow:Your input ran out of data; interrupting training. Make sure that your dataset or generator can generate at least `steps_per_epoch * epochs` batches (in this case, 3 batches). You may need to use the repeat() function when building your dataset.\n"
201+
]
202+
},
203+
{
204+
"name": "stdout",
205+
"output_type": "stream",
206+
"text": [
207+
"11/11 [==============================] - 0s 6ms/step - loss: 4.5155 - auc: 0.5366 - binary_accuracy: 0.5449\n",
208+
"Epoch 3/10\n",
209+
"11/11 [==============================] - 0s 4ms/step - loss: 2.0773 - auc: 0.4515 - binary_accuracy: 0.4731\n",
210+
"Epoch 4/10\n",
211+
"11/11 [==============================] - 0s 5ms/step - loss: 1.1006 - auc: 0.5205 - binary_accuracy: 0.5150\n",
212+
"Epoch 5/10\n",
213+
"11/11 [==============================] - 0s 4ms/step - loss: 0.9159 - auc: 0.4915 - binary_accuracy: 0.5180\n",
214+
"Epoch 6/10\n",
215+
"11/11 [==============================] - 0s 5ms/step - loss: 0.8020 - auc: 0.4873 - binary_accuracy: 0.5060\n",
216+
"Epoch 7/10\n",
217+
"11/11 [==============================] - 0s 4ms/step - loss: 0.8067 - auc: 0.4960 - binary_accuracy: 0.5299\n",
218+
"Epoch 8/10\n",
219+
"11/11 [==============================] - 0s 6ms/step - loss: 0.7808 - auc: 0.5055 - binary_accuracy: 0.5299\n",
220+
"Epoch 9/10\n",
221+
"11/11 [==============================] - 0s 4ms/step - loss: 0.7661 - auc: 0.4937 - binary_accuracy: 0.5060\n",
222+
"Epoch 10/10\n",
223+
"11/11 [==============================] - 0s 5ms/step - loss: 0.7406 - auc: 0.5098 - binary_accuracy: 0.5329\n"
224+
]
225+
},
226+
{
227+
"data": {
228+
"text/plain": [
229+
"<keras.src.callbacks.History at 0x39fe49d10>"
230+
]
231+
},
232+
"execution_count": 5,
233+
"metadata": {},
234+
"output_type": "execute_result"
235+
}
236+
],
156237
"source": [
157238
"from tensorflow.keras.callbacks import EarlyStopping\n",
158239
"\n",
@@ -186,9 +267,17 @@
186267
},
187268
{
188269
"cell_type": "code",
189-
"execution_count": null,
270+
"execution_count": 6,
190271
"metadata": {},
191-
"outputs": [],
272+
"outputs": [
273+
{
274+
"name": "stdout",
275+
"output_type": "stream",
276+
"text": [
277+
"3/3 [==============================] - 0s 6ms/step - loss: 0.7001 - auc: 0.5000 - binary_accuracy: 0.4819\n"
278+
]
279+
}
280+
],
192281
"source": [
193282
"loader_te = DisjointLoader(test, epochs=1, shuffle=False, batch_size=batch_size)\n",
194283
"results = model.evaluate(loader_te.load())"
@@ -207,9 +296,17 @@
207296
},
208297
{
209298
"cell_type": "code",
210-
"execution_count": null,
299+
"execution_count": 7,
211300
"metadata": {},
212-
"outputs": [],
301+
"outputs": [
302+
{
303+
"name": "stdout",
304+
"output_type": "stream",
305+
"text": [
306+
"3/3 [==============================] - 0s 5ms/step\n"
307+
]
308+
}
309+
],
213310
"source": [
214311
"loader_te = DisjointLoader(test, batch_size=batch_size, epochs=1, shuffle=False)\n",
215312
"loaded_pred = model.predict(loader_te.load(), use_multiprocessing=True)"
@@ -218,7 +315,7 @@
218315
],
219316
"metadata": {
220317
"kernelspec": {
221-
"display_name": "venv",
318+
"display_name": ".venv311",
222319
"language": "python",
223320
"name": "python3"
224321
},
@@ -232,7 +329,7 @@
232329
"name": "python",
233330
"nbconvert_exporter": "python",
234331
"pygments_lexer": "ipython3",
235-
"version": "3.12.2"
332+
"version": "3.11.11"
236333
}
237334
},
238335
"nbformat": 4,

0 commit comments

Comments
 (0)