{ "cells": [ { "cell_type": "markdown", "id": "05b7b43f", "metadata": {}, "source": [ "# Predicting Gene Expression with Decima" ] }, { "cell_type": "markdown", "id": "42034677", "metadata": {}, "source": [ "Decima allows prediction of gene expression at the cell type level, and this tutorial demonstrates how to leverage the prediction API for both genes in the training data and custom genes." ] }, { "cell_type": "markdown", "id": "1898aff7", "metadata": { "vscode": { "languageId": "plaintext" } }, "source": [ "### Precomputed Predictions" ] }, { "cell_type": "markdown", "id": "f4634c23", "metadata": {}, "source": [ "Scores for all genes in the training data are precomputed and saved to the metadata h5ad object for each model replicate, and are available through the `DecimaResult` class. `predicted_expression_matrix` returns the predicted gene expression averaged across the replicates." ] }, { "cell_type": "code", "execution_count": 1, "id": "6b76abce", "metadata": { "execution": { "iopub.execute_input": "2025-11-21T06:24:54.170009Z", "iopub.status.busy": "2025-11-21T06:24:54.169485Z", "iopub.status.idle": "2025-11-21T06:25:32.182146Z", "shell.execute_reply": "2025-11-21T06:25:32.181240Z" } }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/home/celikm5/miniforge3/envs/decima2/lib/python3.11/site-packages/pydantic/_internal/_generate_schema.py:2249: UnsupportedFieldAttributeWarning: The 'repr' attribute with value False was provided to the `Field()` function, which has no effect in the context it was used. 'repr' is field-specific metadata, and can only be attached to a model field using `Annotated` metadata or by assignment. 
This may have happened because an `Annotated` type alias using the `type` statement was used, or if the `Field()` function was attached to a single member of a union type.\n", " warnings.warn(\n", "/home/celikm5/miniforge3/envs/decima2/lib/python3.11/site-packages/pydantic/_internal/_generate_schema.py:2249: UnsupportedFieldAttributeWarning: The 'frozen' attribute with value True was provided to the `Field()` function, which has no effect in the context it was used. 'frozen' is field-specific metadata, and can only be attached to a model field using `Annotated` metadata or by assignment. This may have happened because an `Annotated` type alias using the `type` statement was used, or if the `Field()` function was attached to a single member of a union type.\n", " warnings.warn(\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "\u001b[34m\u001b[1mwandb\u001b[0m: Currently logged in as: \u001b[33mmhcelik\u001b[0m (\u001b[33mmhcw\u001b[0m) to \u001b[32mhttps://api.wandb.ai\u001b[0m. Use \u001b[1m`wandb login --relogin`\u001b[0m to force relogin\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "\u001b[34m\u001b[1mwandb\u001b[0m: Downloading large artifact 'metadata:latest', 3122.32MB. 1 files...\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "\u001b[34m\u001b[1mwandb\u001b[0m: 1 of 1 files downloaded. \n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "Done. 00:00:08.3 (375.3MB/s)\n" ] }, { "data": { "text/html": [ "
| \n", " | STRADA | \n", "ETV4 | \n", "USP25 | \n", "ZSWIM5 | \n", "C21orf58 | \n", "MIR497HG | \n", "CFAP74 | \n", "GSE1 | \n", "LPP | \n", "CLK1 | \n", "... | \n", "STRIP2 | \n", "TNFRSF1A | \n", "RBM14-RBM4 | \n", "C1orf21 | \n", "LINC00639 | \n", "NPDC1 | \n", "ZNF425 | \n", "COL5A1 | \n", "BRD3 | \n", "EVI5L | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| agg_0 | \n", "2.973438 | \n", "1.845565 | \n", "4.592531 | \n", "5.099802 | \n", "1.774879 | \n", "0.356812 | \n", "2.590836 | \n", "4.629774 | \n", "4.897171 | \n", "3.326940 | \n", "... | \n", "2.836060 | \n", "0.297015 | \n", "1.883849 | \n", "4.293593 | \n", "1.463565 | \n", "3.183534 | \n", "2.340202 | \n", "2.374942 | \n", "2.911916 | \n", "3.230072 | \n", "
| agg_1 | \n", "2.954213 | \n", "1.896726 | \n", "4.688557 | \n", "5.510440 | \n", "1.666929 | \n", "0.352725 | \n", "2.292625 | \n", "4.459535 | \n", "4.915286 | \n", "3.192858 | \n", "... | \n", "3.125704 | \n", "0.242543 | \n", "1.908177 | \n", "4.439424 | \n", "1.236739 | \n", "3.494824 | \n", "2.425672 | \n", "2.054568 | \n", "2.713408 | \n", "3.491463 | \n", "
| agg_2 | \n", "2.938851 | \n", "2.197247 | \n", "4.861410 | \n", "5.617520 | \n", "1.773381 | \n", "0.380867 | \n", "2.394917 | \n", "4.415038 | \n", "4.836399 | \n", "3.390717 | \n", "... | \n", "3.082098 | \n", "0.263285 | \n", "2.006456 | \n", "4.383455 | \n", "1.208590 | \n", "4.013819 | \n", "2.408381 | \n", "2.297343 | \n", "2.892222 | \n", "3.695785 | \n", "
| agg_3 | \n", "3.045972 | \n", "2.138573 | \n", "4.863791 | \n", "5.273604 | \n", "1.760097 | \n", "0.463555 | \n", "2.391702 | \n", "3.940975 | \n", "4.857763 | \n", "3.410926 | \n", "... | \n", "2.882890 | \n", "0.290327 | \n", "1.922963 | \n", "4.550189 | \n", "1.430520 | \n", "3.693118 | \n", "2.297103 | \n", "2.121887 | \n", "2.626117 | \n", "3.223912 | \n", "
| agg_4 | \n", "3.025518 | \n", "2.019096 | \n", "4.602948 | \n", "5.257001 | \n", "1.755338 | \n", "0.382190 | \n", "2.432810 | \n", "4.392480 | \n", "4.959488 | \n", "3.250500 | \n", "... | \n", "3.082296 | \n", "0.258540 | \n", "2.038277 | \n", "4.464807 | \n", "1.249043 | \n", "3.665800 | \n", "2.400820 | \n", "2.255862 | \n", "2.925619 | \n", "3.471005 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| agg_9533 | \n", "2.333562 | \n", "0.633322 | \n", "4.675825 | \n", "2.793023 | \n", "0.752030 | \n", "0.692083 | \n", "0.503531 | \n", "4.327948 | \n", "6.903193 | \n", "3.695593 | \n", "... | \n", "0.549795 | \n", "2.270181 | \n", "1.563218 | \n", "4.395422 | \n", "0.550088 | \n", "1.330252 | \n", "1.044471 | \n", "3.759369 | \n", "2.491346 | \n", "1.872717 | \n", "
| agg_9535 | \n", "0.835037 | \n", "0.358773 | \n", "1.964896 | \n", "0.307449 | \n", "0.337240 | \n", "0.834196 | \n", "0.093885 | \n", "1.853794 | \n", "3.700790 | \n", "4.467302 | \n", "... | \n", "0.176885 | \n", "1.370898 | \n", "1.022708 | \n", "3.400267 | \n", "0.052162 | \n", "1.908870 | \n", "0.253417 | \n", "1.448111 | \n", "1.622033 | \n", "1.064292 | \n", "
| agg_9536 | \n", "3.008039 | \n", "1.209324 | \n", "4.798392 | \n", "3.931870 | \n", "1.401328 | \n", "1.638555 | \n", "0.969720 | \n", "4.779201 | \n", "6.631931 | \n", "4.127797 | \n", "... | \n", "1.174298 | \n", "1.870530 | \n", "2.506874 | \n", "5.151776 | \n", "0.967644 | \n", "1.809947 | \n", "2.205356 | \n", "4.244005 | \n", "2.974467 | \n", "2.659873 | \n", "
| agg_9537 | \n", "1.241936 | \n", "0.455059 | \n", "2.919995 | \n", "0.571672 | \n", "0.486448 | \n", "1.175586 | \n", "0.145397 | \n", "2.412148 | \n", "4.759118 | \n", "4.913945 | \n", "... | \n", "0.371035 | \n", "1.361073 | \n", "1.668085 | \n", "4.005738 | \n", "0.078611 | \n", "1.571750 | \n", "0.508187 | \n", "2.067150 | \n", "2.323764 | \n", "1.429850 | \n", "
| agg_9538 | \n", "1.715507 | \n", "0.700955 | \n", "3.044732 | \n", "0.858696 | \n", "0.903406 | \n", "1.763168 | \n", "0.215304 | \n", "2.604478 | \n", "4.549708 | \n", "4.839124 | \n", "... | \n", "0.594310 | \n", "1.801298 | \n", "2.075996 | \n", "3.933860 | \n", "0.165590 | \n", "1.970268 | \n", "0.993521 | \n", "2.232347 | \n", "2.473388 | \n", "1.902884 | \n", "
8856 rows × 18457 columns
\n", "| \n", " | STRADA | \n", "ETV4 | \n", "USP25 | \n", "ZSWIM5 | \n", "C21orf58 | \n", "MIR497HG | \n", "CFAP74 | \n", "GSE1 | \n", "LPP | \n", "CLK1 | \n", "... | \n", "STRIP2 | \n", "TNFRSF1A | \n", "RBM14-RBM4 | \n", "C1orf21 | \n", "LINC00639 | \n", "NPDC1 | \n", "ZNF425 | \n", "COL5A1 | \n", "BRD3 | \n", "EVI5L | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| agg_0 | \n", "2.973438 | \n", "1.845565 | \n", "4.592531 | \n", "5.099802 | \n", "1.774879 | \n", "0.356812 | \n", "2.590836 | \n", "4.629774 | \n", "4.897171 | \n", "3.326940 | \n", "... | \n", "2.836060 | \n", "0.297015 | \n", "1.883849 | \n", "4.293593 | \n", "1.463565 | \n", "3.183534 | \n", "2.340202 | \n", "2.374942 | \n", "2.911916 | \n", "3.230072 | \n", "
| agg_1 | \n", "2.954213 | \n", "1.896726 | \n", "4.688557 | \n", "5.510440 | \n", "1.666929 | \n", "0.352725 | \n", "2.292625 | \n", "4.459535 | \n", "4.915286 | \n", "3.192858 | \n", "... | \n", "3.125704 | \n", "0.242543 | \n", "1.908177 | \n", "4.439424 | \n", "1.236739 | \n", "3.494824 | \n", "2.425672 | \n", "2.054568 | \n", "2.713408 | \n", "3.491463 | \n", "
| agg_2 | \n", "2.938851 | \n", "2.197247 | \n", "4.861410 | \n", "5.617520 | \n", "1.773381 | \n", "0.380867 | \n", "2.394917 | \n", "4.415038 | \n", "4.836399 | \n", "3.390717 | \n", "... | \n", "3.082098 | \n", "0.263285 | \n", "2.006456 | \n", "4.383455 | \n", "1.208590 | \n", "4.013819 | \n", "2.408381 | \n", "2.297343 | \n", "2.892222 | \n", "3.695785 | \n", "
| agg_3 | \n", "3.045972 | \n", "2.138573 | \n", "4.863791 | \n", "5.273604 | \n", "1.760097 | \n", "0.463555 | \n", "2.391702 | \n", "3.940975 | \n", "4.857763 | \n", "3.410926 | \n", "... | \n", "2.882890 | \n", "0.290327 | \n", "1.922963 | \n", "4.550189 | \n", "1.430520 | \n", "3.693118 | \n", "2.297103 | \n", "2.121887 | \n", "2.626117 | \n", "3.223912 | \n", "
| agg_4 | \n", "3.025518 | \n", "2.019096 | \n", "4.602948 | \n", "5.257001 | \n", "1.755338 | \n", "0.382190 | \n", "2.432810 | \n", "4.392480 | \n", "4.959488 | \n", "3.250500 | \n", "... | \n", "3.082296 | \n", "0.258540 | \n", "2.038277 | \n", "4.464807 | \n", "1.249043 | \n", "3.665800 | \n", "2.400820 | \n", "2.255862 | \n", "2.925619 | \n", "3.471005 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| agg_9533 | \n", "2.333562 | \n", "0.633322 | \n", "4.675825 | \n", "2.793023 | \n", "0.752030 | \n", "0.692083 | \n", "0.503531 | \n", "4.327948 | \n", "6.903193 | \n", "3.695593 | \n", "... | \n", "0.549795 | \n", "2.270181 | \n", "1.563218 | \n", "4.395422 | \n", "0.550088 | \n", "1.330252 | \n", "1.044471 | \n", "3.759369 | \n", "2.491346 | \n", "1.872717 | \n", "
| agg_9535 | \n", "0.835037 | \n", "0.358773 | \n", "1.964896 | \n", "0.307449 | \n", "0.337240 | \n", "0.834196 | \n", "0.093885 | \n", "1.853794 | \n", "3.700790 | \n", "4.467302 | \n", "... | \n", "0.176885 | \n", "1.370898 | \n", "1.022708 | \n", "3.400267 | \n", "0.052162 | \n", "1.908870 | \n", "0.253417 | \n", "1.448111 | \n", "1.622033 | \n", "1.064292 | \n", "
| agg_9536 | \n", "3.008039 | \n", "1.209324 | \n", "4.798392 | \n", "3.931870 | \n", "1.401328 | \n", "1.638555 | \n", "0.969720 | \n", "4.779201 | \n", "6.631931 | \n", "4.127797 | \n", "... | \n", "1.174298 | \n", "1.870530 | \n", "2.506874 | \n", "5.151776 | \n", "0.967644 | \n", "1.809947 | \n", "2.205356 | \n", "4.244005 | \n", "2.974467 | \n", "2.659873 | \n", "
| agg_9537 | \n", "1.241936 | \n", "0.455059 | \n", "2.919995 | \n", "0.571672 | \n", "0.486448 | \n", "1.175586 | \n", "0.145397 | \n", "2.412148 | \n", "4.759118 | \n", "4.913945 | \n", "... | \n", "0.371035 | \n", "1.361073 | \n", "1.668085 | \n", "4.005738 | \n", "0.078611 | \n", "1.571750 | \n", "0.508187 | \n", "2.067150 | \n", "2.323764 | \n", "1.429850 | \n", "
| agg_9538 | \n", "1.715507 | \n", "0.700955 | \n", "3.044732 | \n", "0.858696 | \n", "0.903406 | \n", "1.763168 | \n", "0.215304 | \n", "2.604478 | \n", "4.549708 | \n", "4.839124 | \n", "... | \n", "0.594310 | \n", "1.801298 | \n", "2.075996 | \n", "3.933860 | \n", "0.165590 | \n", "1.970268 | \n", "0.993521 | \n", "2.232347 | \n", "2.473388 | \n", "1.902884 | \n", "
8856 rows × 18457 columns
\n", "| \n", " | STRADA | \n", "ETV4 | \n", "USP25 | \n", "ZSWIM5 | \n", "C21orf58 | \n", "MIR497HG | \n", "CFAP74 | \n", "GSE1 | \n", "LPP | \n", "CLK1 | \n", "... | \n", "STRIP2 | \n", "TNFRSF1A | \n", "RBM14-RBM4 | \n", "C1orf21 | \n", "LINC00639 | \n", "NPDC1 | \n", "ZNF425 | \n", "COL5A1 | \n", "BRD3 | \n", "EVI5L | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| agg_0 | \n", "2.973438 | \n", "1.845565 | \n", "4.592531 | \n", "5.099802 | \n", "1.774879 | \n", "0.356812 | \n", "2.590836 | \n", "4.629774 | \n", "4.897171 | \n", "3.326940 | \n", "... | \n", "2.836060 | \n", "0.297015 | \n", "1.883849 | \n", "4.293593 | \n", "1.463565 | \n", "3.183534 | \n", "2.340202 | \n", "2.374942 | \n", "2.911916 | \n", "3.230072 | \n", "
| agg_1 | \n", "2.954213 | \n", "1.896726 | \n", "4.688557 | \n", "5.510440 | \n", "1.666929 | \n", "0.352725 | \n", "2.292625 | \n", "4.459535 | \n", "4.915286 | \n", "3.192858 | \n", "... | \n", "3.125704 | \n", "0.242543 | \n", "1.908177 | \n", "4.439424 | \n", "1.236739 | \n", "3.494824 | \n", "2.425672 | \n", "2.054568 | \n", "2.713408 | \n", "3.491463 | \n", "
| agg_2 | \n", "2.938851 | \n", "2.197247 | \n", "4.861410 | \n", "5.617520 | \n", "1.773381 | \n", "0.380867 | \n", "2.394917 | \n", "4.415038 | \n", "4.836399 | \n", "3.390717 | \n", "... | \n", "3.082098 | \n", "0.263285 | \n", "2.006456 | \n", "4.383455 | \n", "1.208590 | \n", "4.013819 | \n", "2.408381 | \n", "2.297343 | \n", "2.892222 | \n", "3.695785 | \n", "
| agg_3 | \n", "3.045972 | \n", "2.138573 | \n", "4.863791 | \n", "5.273604 | \n", "1.760097 | \n", "0.463555 | \n", "2.391702 | \n", "3.940975 | \n", "4.857763 | \n", "3.410926 | \n", "... | \n", "2.882890 | \n", "0.290327 | \n", "1.922963 | \n", "4.550189 | \n", "1.430520 | \n", "3.693118 | \n", "2.297103 | \n", "2.121887 | \n", "2.626117 | \n", "3.223912 | \n", "
| agg_4 | \n", "3.025518 | \n", "2.019096 | \n", "4.602948 | \n", "5.257001 | \n", "1.755338 | \n", "0.382190 | \n", "2.432810 | \n", "4.392480 | \n", "4.959488 | \n", "3.250500 | \n", "... | \n", "3.082296 | \n", "0.258540 | \n", "2.038277 | \n", "4.464807 | \n", "1.249043 | \n", "3.665800 | \n", "2.400820 | \n", "2.255862 | \n", "2.925619 | \n", "3.471005 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| agg_9533 | \n", "2.333562 | \n", "0.633322 | \n", "4.675825 | \n", "2.793023 | \n", "0.752030 | \n", "0.692083 | \n", "0.503531 | \n", "4.327948 | \n", "6.903193 | \n", "3.695593 | \n", "... | \n", "0.549795 | \n", "2.270181 | \n", "1.563218 | \n", "4.395422 | \n", "0.550088 | \n", "1.330252 | \n", "1.044471 | \n", "3.759369 | \n", "2.491346 | \n", "1.872717 | \n", "
| agg_9535 | \n", "0.835037 | \n", "0.358773 | \n", "1.964896 | \n", "0.307449 | \n", "0.337240 | \n", "0.834196 | \n", "0.093885 | \n", "1.853794 | \n", "3.700790 | \n", "4.467302 | \n", "... | \n", "0.176885 | \n", "1.370898 | \n", "1.022708 | \n", "3.400267 | \n", "0.052162 | \n", "1.908870 | \n", "0.253417 | \n", "1.448111 | \n", "1.622033 | \n", "1.064292 | \n", "
| agg_9536 | \n", "3.008039 | \n", "1.209324 | \n", "4.798392 | \n", "3.931870 | \n", "1.401328 | \n", "1.638555 | \n", "0.969720 | \n", "4.779201 | \n", "6.631931 | \n", "4.127797 | \n", "... | \n", "1.174298 | \n", "1.870530 | \n", "2.506874 | \n", "5.151776 | \n", "0.967644 | \n", "1.809947 | \n", "2.205356 | \n", "4.244005 | \n", "2.974467 | \n", "2.659873 | \n", "
| agg_9537 | \n", "1.241936 | \n", "0.455059 | \n", "2.919995 | \n", "0.571672 | \n", "0.486448 | \n", "1.175586 | \n", "0.145397 | \n", "2.412148 | \n", "4.759118 | \n", "4.913945 | \n", "... | \n", "0.371035 | \n", "1.361073 | \n", "1.668085 | \n", "4.005738 | \n", "0.078611 | \n", "1.571750 | \n", "0.508187 | \n", "2.067150 | \n", "2.323764 | \n", "1.429850 | \n", "
| agg_9538 | \n", "1.715507 | \n", "0.700955 | \n", "3.044732 | \n", "0.858696 | \n", "0.903406 | \n", "1.763168 | \n", "0.215304 | \n", "2.604478 | \n", "4.549708 | \n", "4.839124 | \n", "... | \n", "0.594310 | \n", "1.801298 | \n", "2.075996 | \n", "3.933860 | \n", "0.165590 | \n", "1.970268 | \n", "0.993521 | \n", "2.232347 | \n", "2.473388 | \n", "1.902884 | \n", "
8856 rows × 18457 columns
\n", "| \n", " | STRADA | \n", "ETV4 | \n", "USP25 | \n", "
|---|---|---|---|
| agg_0 | \n", "3.060561 | \n", "2.882100 | \n", "3.469085 | \n", "
| agg_1 | \n", "3.117702 | \n", "2.825738 | \n", "3.596372 | \n", "
| agg_2 | \n", "3.156642 | \n", "3.122381 | \n", "3.718749 | \n", "
| agg_3 | \n", "3.214047 | \n", "3.204670 | \n", "3.629874 | \n", "
| agg_4 | \n", "3.103570 | \n", "3.032028 | \n", "3.512117 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "
| agg_9533 | \n", "2.313220 | \n", "2.173597 | \n", "3.156157 | \n", "
| agg_9535 | \n", "0.952112 | \n", "0.956720 | \n", "1.250005 | \n", "
| agg_9536 | \n", "2.779494 | \n", "2.705945 | \n", "3.530610 | \n", "
| agg_9537 | \n", "1.342694 | \n", "1.407407 | \n", "1.867070 | \n", "
| agg_9538 | \n", "1.745080 | \n", "1.633314 | \n", "2.082985 | \n", "
8856 rows × 3 columns
\n", "| \n", " | STRADA | \n", "ETV4 | \n", "USP25 | \n", "
|---|---|---|---|
| agg_0 | \n", "2.933017 | \n", "2.892934 | \n", "2.858879 | \n", "
| agg_1 | \n", "2.816778 | \n", "2.812964 | \n", "3.058485 | \n", "
| agg_2 | \n", "2.743120 | \n", "2.971366 | \n", "2.950323 | \n", "
| agg_3 | \n", "2.804692 | \n", "3.346689 | \n", "2.837382 | \n", "
| agg_4 | \n", "2.816030 | \n", "3.088620 | \n", "2.973081 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "
| agg_9533 | \n", "2.510605 | \n", "2.760446 | \n", "1.965776 | \n", "
| agg_9535 | \n", "1.246022 | \n", "1.192524 | \n", "0.407104 | \n", "
| agg_9536 | \n", "2.809229 | \n", "3.369957 | \n", "2.927355 | \n", "
| agg_9537 | \n", "1.580334 | \n", "1.533467 | \n", "0.879179 | \n", "
| agg_9538 | \n", "2.014224 | \n", "2.078125 | \n", "1.374325 | \n", "
8856 rows × 3 columns
\n", "