justinkang221
diff --git a/‎docs/source/notebooks/language_notebooks/language_model_game.ipynb‎
Lines changed: 61 additions & 60 deletions b/‎docs/source/notebooks/language_notebooks/language_model_game.ipynb‎
Lines changed: 61 additions & 60 deletions
@@ -16,33 +16,34 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "96756a5298128aed",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Install the required packages\n",
     "!pip install transformers torch"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "233a68eadd33ade3",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Import the required libraries\n",
-    "from transformers import pipeline\n",
     "import numpy as np\n",
+    "from transformers import pipeline\n",
+    "\n",
     "import shapiq\n",
     "\n",
     "shapiq.__version__"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -59,10 +60,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "50f59cc77301eef0",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Load the model and tokenizer\n",
     "classifier = pipeline(task=\"sentiment-analysis\", model=\"lvwerra/distilbert-imdb\")\n",
@@ -79,9 +82,7 @@
     "\n",
     "mask_toke_id = tokenizer.mask_token_id\n",
     "print(f\"Mask token id: {mask_toke_id}\")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -95,10 +96,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "c3b3b6f4193e7d73",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Test the tokenizer\n",
     "decoded_sentence = tokenizer.decode(tokenized_sentence[\"input_ids\"])\n",
@@ -110,9 +113,7 @@
     "print(\n",
     "    f\"Decoded sentence: {decoded_sentence} - Tokenized input: {tokenized_input} - {len(tokenized_input)} tokens.\"\n",
     ")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -143,10 +144,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "bce879ce457e9a98",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Define the model call function\n",
     "def model_call(input_texts: list[str]) -> np.ndarray[float]:\n",
@@ -170,9 +173,7 @@
     "\n",
     "# Test the model call function\n",
     "print(f\"Model call: {model_call(['I love this movie!', 'I hate this movie!'])}\")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -186,10 +187,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "d176905292347ec1",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Show coalitions\n",
     "n_players = len(tokenized_sentence[\"input_ids\"]) - 2  # remove [CLS] and [SEP]\n",
@@ -199,9 +202,7 @@
     "\n",
     "print(f\"Empty coalition: {empty_coalition}\")\n",
     "print(f\"Full coalition: {full_coalition}\")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -219,10 +220,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "79a5c423622a0904",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Define the value function\n",
     "def value_function(\n",
@@ -253,9 +256,7 @@
     "    normalized_sentiments = sentiments - normalization_value\n",
     "\n",
     "    return normalized_sentiments"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -269,10 +270,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "22b2201ca139c0d0",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Test the value function without normalization\n",
     "print(f\"Output of the classifier: {classifier(test_sentence)}\")\n",
@@ -283,9 +286,7 @@
     "print(\n",
     "    f\"Value function for the empty coalition: {value_function(empty_coalition, tokenized_input=tokenized_input)[0]}\"\n",
     ")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -299,10 +300,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "338e1ae439120652",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Test the value function with normalization\n",
     "normalization_value = float(value_function(empty_coalition, tokenized_input=tokenized_input)[0])\n",
@@ -312,9 +315,7 @@
     "print(\n",
     "    f\"Value function for the empty coalition: {value_function(empty_coalition, tokenized_input=tokenized_input, normalization_value=normalization_value)[0]}\"\n",
     ")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -328,10 +329,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "91e8b195226e1ecb",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Define the game function\n",
     "def game_fun(coalitions: np.ndarray[bool]) -> np.ndarray[float]:\n",
@@ -351,9 +354,7 @@
     "# Test the game function\n",
     "print(f\"Game for the full coalition: {game_fun(full_coalition)[0]}\")\n",
     "print(f\"Game for the empty coalition: {game_fun(empty_coalition)[0]}\")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -367,10 +368,12 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "ea94eb7697abad0d",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "class SentimentClassificationGame(shapiq.Game):\n",
     "    \"\"\"The sentiment analysis classifier modeled as a cooperative game.\n",
@@ -438,9 +441,7 @@
     "game_class = SentimentClassificationGame(classifier, tokenizer, test_sentence)\n",
     "print(f\"Game for the full coalition: {game_class(full_coalition)[0]}\")\n",
     "print(f\"Game for the empty coalition: {game_class(empty_coalition)[0]}\")"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "markdown",
@@ -455,48 +456,51 @@
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "f62adc49538c8a79",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Compute Shapley interactions with the ShapIQ approximator for the game function\n",
     "approximator = shapiq.KernelSHAPIQ(n=n_players, max_order=2, index=\"k-SII\")\n",
     "sii_values = approximator.approximate(budget=2**n_players, game=game_fun)\n",
     "sii_values.dict_values"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "id": "7641d33a850cdd16",
    "metadata": {
     "collapsed": false
    },
+   "outputs": [],
    "source": [
     "# Compute Shapley interactions with the ShapIQ approximator for the game object\n",
     "approximator = shapiq.KernelSHAPIQ(n=game_class.n_players, max_order=2, index=\"k-SII\")\n",
     "sii_values = approximator.approximate(budget=2**game_class.n_players, game=game_class)\n",
     "sii_values.dict_values"
-   ],
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
-   "metadata": {},
    "cell_type": "markdown",
+   "id": "ef3641f671c8616b",
+   "metadata": {},
    "source": [
     "Now let's say we want to do this for much larger inputs. We can use the `shapiq.SPEX` approximator, which is a sparse\n",
     "transform approximator. This approximator is much faster than the KernelSHAPIQ approximator when the number of\n",
     "players is large and can be used for larger inputs. Instead of computing all interactions, it computes only the\n",
     "most important ones."
-   ],
-   "id": "ef3641f671c8616b"
+   ]
   },
   {
-   "metadata": {},
    "cell_type": "code",
+   "execution_count": null,
+   "id": "ce6bc4d47530fa2b",
+   "metadata": {},
+   "outputs": [],
    "source": [
     "text = \\\n",
     "\"\"\"\n",
@@ -505,7 +509,7 @@
     "\"\"\"\n",
     "big_game = SentimentClassificationGame(classifier=classifier,\n",
     "                                       tokenizer=tokenizer,\n",
-    "                                       test_sentence=text,)\n",
+    "                                       test_sentence=text)\n",
     "print(f\"There are a total of {big_game.n_players} players.\")\n",
     "# To speed up inference, run the pipeline with GPU support. Takes ~10 minutes on a Mac M1 with MPS.\n",
     "scalable_approximator = shapiq.SPEX(n=big_game.n_players, index=\"SII\")\n",
@@ -514,31 +518,24 @@
     "print(f\"Game for the empty coalition: {game_class(empty_coalition)[0]}\")\n",
     "interactions = (list(large_sii.dict_values.items()))\n",
     "interactions.sort(key= lambda x : abs(x[1]), reverse=True)"
-   ],
-   "id": "ce6bc4d47530fa2b",
-   "outputs": [],
-   "execution_count": null
+   ]
   },
   {
-   "metadata": {},
    "cell_type": "markdown",
-   "source": "`shapiq.SPEX` identifies interactions between the most sentiment-rich tokens in the paragraph (i.e. *powerful*, *valuable*, *weakness*)",
-   "id": "e81434a652831817"
+   "id": "e81434a652831817",
+   "metadata": {},
+   "source": "`shapiq.SPEX` identifies interactions between the most sentiment-rich tokens in the paragraph (i.e. *powerful*, *valuable*, *weakness*)"
   },
   {
+   "cell_type": "code",
+   "execution_count": 28,
+   "id": "a09121f781d9be77",
    "metadata": {
     "ExecuteTime": {
      "end_time": "2025-04-15T18:41:34.838256Z",
      "start_time": "2025-04-15T18:41:34.829935Z"
     }
    },
-   "cell_type": "code",
-   "source": [
-    "for inter, value in interactions[:10]:\n",
-    "    tokens = [big_game.tokenizer.decode(big_game.tokenized_input[idx]) for idx in inter]\n",
-    "    print(f'Tokens: {tokens}, Value: {value:.3f}')"
-   ],
-   "id": "a09121f781d9be77",
    "outputs": [
     {
      "name": "stdout",
@@ -557,7 +554,11 @@
      ]
     }
    ],
-   "execution_count": 28
+   "source": [
+    "for inter, value in interactions[:10]:\n",
+    "    tokens = [big_game.tokenizer.decode(big_game.tokenized_input[idx]) for idx in inter]\n",
+    "    print(f'Tokens: {tokens}, Value: {value:.3f}')"
+   ]
   }
  ],
  "metadata": {