From cc65ae1735f082b09620a611f2137e8c5ed0f69d Mon Sep 17 00:00:00 2001 From: zethson Date: Tue, 8 Oct 2024 09:32:11 +0200 Subject: [PATCH 1/4] Simplify 10ktp Signed-off-by: zethson --- .gitignore | 1 + .../10ktp_make_vitessce.py | 18 ++--- .../10ktp_to_lamin.py | 66 +++++-------------- pyproject.toml | 6 +- 4 files changed, 27 insertions(+), 64 deletions(-) diff --git a/.gitignore b/.gitignore index 9f15966..ccf848b 100644 --- a/.gitignore +++ b/.gitignore @@ -28,3 +28,4 @@ __pycache__/ *.pye Sandbox.ipynb +test.ipynb diff --git a/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_make_vitessce.py b/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_make_vitessce.py index 7f21b41..3dd3a13 100644 --- a/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_make_vitessce.py +++ b/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_make_vitessce.py @@ -1,18 +1,8 @@ -# ADJUST -uid = "10ktp" - -# Setup before running this script for the first time -# 1) Ensure you have a lamin.ai account -# 2) Run `lamin login` to authenticate -# 3) Activate lamin db connection with `lamin load scverse/spatialdata-db` -# 4) Execute script once and replace the stem_uid for this file +theislab_uid = "10ktp" import lamindb as ln -ln.settings.transform.stem_uid = "5PYtTxDE7LvE" -ln.settings.transform.version = "1" - -ln.track() +ln.context.track("5PYtTxDE7LvE") from vitessce import ( VitessceConfig, @@ -31,7 +21,7 @@ from lamindb.integrations import save_vitessce_config -artifact = ln.Artifact.filter(ulabels__name=uid).one() +artifact = ln.Artifact.filter(ulabels__name=theislab_uid).one() vc = VitessceConfig( schema_version="1.0.16", @@ -49,4 +39,4 @@ dataset = vc.add_dataset(name='Visium demo').add_object(wrapper) spatial = vc.add_view("spatialBeta", dataset=dataset) vc.layout(spatial) -view = save_vitessce_config(vc, description="Visium HD demo vitessce config") \ No newline at end of file +view = save_vitessce_config(vc, description="Visium HD demo vitessce config") diff --git a/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_to_lamin.py b/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_to_lamin.py index ec141ce..ccf2425 100644 --- a/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_to_lamin.py +++ b/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp_to_lamin.py @@ -1,42 +1,31 @@ -# ADJUST -uid = "10ktp" - -# Setup before running this script for the first time -# 1) Ensure you have a lamin.ai account -# 2) Run `lamin login` to authenticate -# 3) Activate lamin db connection with `lamin load scverse/spatialdata-db` -# 4) Execute script once and replace the stem_uid for this file +theislab_uid = "10ktp" import lamindb as ln +from spatialdata_db import load_10x_metadata -ln.settings.transform.stem_uid = "KgGzOw8PUYKO" -ln.settings.transform.version = "3" ln.track("KgGzOw8PUYKO7CpM") + try: - artifact = ln.Artifact.filter(ulabels__name=uid).one() + artifact = ln.Artifact.filter(ulabels__name=theislab_uid).one() artifact.delete(permanent=True) except: pass -### From here on we assume Lamin is set up correctly DATASET_PATH = "/lustre/groups/ml01/projects/2024_spatialdata_db/data/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0/10ktp__10X__Visium__Mouse__brain__20200623__v1.1.0.zarr" artifact = ln.Artifact(DATASET_PATH, description="10X, Visium, Mouse, Brain") -artifact.save() # transfers to Lamin +artifact.save() # Associate ID with the artifact so we can retrieve afterwards tuid_parent = ln.ULabel.filter(name="theislab unique ID").one() -tuid = ln.ULabel(name=uid).save() +tuid = ln.ULabel(name=theislab_uid).save() tuid.parents.add(tuid_parent) artifact.labels.add(tuid) # load 10X metadata we have on disk -import pandas as pd -from spatialdata_db import load_10x_metadata - all_metadata_10x = load_10x_metadata() -assert len(all_metadata_10x.query(f"uid == '{uid}'")) == 1 -metadata = all_metadata_10x.query(f"uid == '{uid}'").iloc[0] +assert len(all_metadata_10x.query(f"uid == '{theislab_uid}'")) == 1 +metadata = all_metadata_10x.query(f"uid == '{theislab_uid}'").iloc[0] # Associate metadata as features import bionty as bt @@ -45,39 +34,18 @@ organism_lo = bt.Organism.public().lookup() tissue_lo = bt.Tissue.public().lookup() -# Species -- - -if metadata["Species"].lower() == "mouse": - feature_organism = bt.Organism.from_public(name=organism_lo.mouse.name) -elif metadata["Species"].lower() == "human": - feature_organism = bt.Organism.from_public(name=organism_lo.human.name) -else: - raise NotImplementedError("Unknown species!") - -feature_organism.save() - -# Tissue +# Species (Organism) +organisms = bt.Organism.from_values(metadata["Species"].lower(), field="name") +ln.save(organisms) +# Orgna (Tissue) if metadata["organ"].lower() == "olfactory_bulb": metadata["organ"] = "olfactorybulb" - -if metadata["organ"].lower() == "brain": - feature_tissue = bt.Tissue.from_public(name=tissue_lo.brain.name) -elif metadata["organ"].lower() == "kidney": - feature_tissue = bt.Tissue.from_public(name=tissue_lo.kidney.name) -elif metadata["organ"].lower() == "colon": - feature_tissue = bt.Tissue.from_public(name=tissue_lo.colon.name) -else: - raise NotImplementedError("Unknown tissue!") - -feature_tissue.save() +tissues = bt.Tissue.from_values(metadata["organ"].lower(), field="name") +ln.save(tissues) # Associate bionty terms to artifact +artifact.organism.set(organisms) +artifact.tissue.set(tissues) -artifact.labels.add(feature_organism, feature=feature_lo.organism) -artifact.labels.add(feature_tissue, feature=feature_lo.tissue) - - -# finish for tracing in Lamin - -ln.finish() \ No newline at end of file +ln.context.finish() diff --git a/pyproject.toml b/pyproject.toml index ff7bf63..902e7d6 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -25,7 +25,11 @@ dependencies = [ "anndata", # for debug logging (referenced from the issue template) "session-info", - "lamindb[aws,bionty,jupyter]" + "lamindb[aws,bionty,jupyter]", + "vitessce", + "spatialdata", + "spatialdata-io", + "spatialdata-plot" ] optional-dependencies.dev = [ "pre-commit", From 559c7eba041977ca1dbdff4dbd3328b77426f59d Mon Sep 17 00:00:00 2001 From: zethson Date: Tue, 8 Oct 2024 09:42:01 +0200 Subject: [PATCH 2/4] Restrict to less than Python 3.12 Signed-off-by: zethson --- .github/workflows/build.yaml | 6 +++--- .github/workflows/test.yaml | 8 ++++---- pyproject.toml | 5 +++-- 3 files changed, 10 insertions(+), 9 deletions(-) diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml index 265a95e..8ae322e 100644 --- a/.github/workflows/build.yaml +++ b/.github/workflows/build.yaml @@ -14,11 +14,11 @@ jobs: package: runs-on: ubuntu-latest steps: - - uses: actions/checkout@v3 + - uses: actions/checkout@v4 - name: Set up Python 3.10 - uses: actions/setup-python@v4 + uses: actions/setup-python@v5 with: - python-version: "3.10" + python-version: "3.11" cache: "pip" cache-dependency-path: "**/pyproject.toml" - name: Install build dependencies diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index 2bfe232..9227b0f 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -26,9 +26,9 @@ jobs: - os: ubuntu-latest python: "3.10" - os: ubuntu-latest - python: "3.12" + python: "3.11" - os: ubuntu-latest - python: "3.12" + python: "3.11" pip-flags: "--pre" name: PRE-RELEASE DEPENDENCIES @@ -39,9 +39,9 @@ jobs: PYTHON: ${{ matrix.python }} steps: - - uses: actions/checkout@v3 + - uses: actions/checkout@v4 - name: Set up Python ${{ matrix.python }} - uses: actions/setup-python@v4 + uses: actions/setup-python@v5 with: python-version: ${{ matrix.python }} cache: "pip" diff --git a/pyproject.toml b/pyproject.toml index 902e7d6..ddb1668 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -14,10 +14,11 @@ maintainers = [ authors = [ { name = "Tim Treis" }, ] -requires-python = ">=3.9" +requires-python = ">=3.10, <3.12" +# 3.12 attempts to install an old version of dask-image which isn't 3.12 compatible +# See https://github.com/theislab/spatialdata-db/actions/runs/11230700843/job/31218561107?pr=35 classifiers = [ "Programming Language :: Python :: 3 :: Only", - "Programming Language :: Python :: 3.9", "Programming Language :: Python :: 3.10", "Programming Language :: Python :: 3.11", ] From 6b4430acdfbb6863b747a34e493de870ec33e822 Mon Sep 17 00:00:00 2001 From: zethson Date: Tue, 8 Oct 2024 09:57:48 +0200 Subject: [PATCH 3/4] Move scripts folder Signed-off-by: zethson --- .../utils/scripts => scripts}/create_uids.ipynb | 4 ++-- {src/spatialdata_db/utils => scripts}/data/datasets_10x.csv | 0 {src/spatialdata_db/utils => scripts}/data/uid_master.csv | 0 .../utils/scripts => scripts}/download_10X_data.ipynb | 2 +- .../utils/scripts => scripts}/download_10X_data.py | 2 +- .../utils/scripts => scripts}/parse_10X_ST_table.ipynb | 0 .../utils/scripts => scripts}/rename_on_lustre.ipynb | 2 +- .../utils/scripts => scripts}/update_uid_master.py | 4 ++-- src/spatialdata_db/utils/__init__.py | 0 9 files changed, 7 insertions(+), 7 deletions(-) rename {src/spatialdata_db/utils/scripts => scripts}/create_uids.ipynb (99%) rename {src/spatialdata_db/utils => scripts}/data/datasets_10x.csv (100%) rename {src/spatialdata_db/utils => scripts}/data/uid_master.csv (100%) rename {src/spatialdata_db/utils/scripts => scripts}/download_10X_data.ipynb (99%) rename {src/spatialdata_db/utils/scripts => scripts}/download_10X_data.py (98%) rename {src/spatialdata_db/utils/scripts => scripts}/parse_10X_ST_table.ipynb (100%) rename {src/spatialdata_db/utils/scripts => scripts}/rename_on_lustre.ipynb (99%) rename {src/spatialdata_db/utils/scripts => scripts}/update_uid_master.py (93%) delete mode 100644 src/spatialdata_db/utils/__init__.py diff --git a/src/spatialdata_db/utils/scripts/create_uids.ipynb b/scripts/create_uids.ipynb similarity index 99% rename from src/spatialdata_db/utils/scripts/create_uids.ipynb rename to scripts/create_uids.ipynb index f1d70f0..1058706 100644 --- a/src/spatialdata_db/utils/scripts/create_uids.ipynb +++ b/scripts/create_uids.ipynb @@ -198,7 +198,7 @@ ], "metadata": { "kernelspec": { - "display_name": "lamin", + "display_name": "spatialdatadb", "language": "python", "name": "python3" }, @@ -212,7 +212,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.11.8" + "version": "3.11.10" } }, "nbformat": 4, diff --git a/src/spatialdata_db/utils/data/datasets_10x.csv b/scripts/data/datasets_10x.csv similarity index 100% rename from src/spatialdata_db/utils/data/datasets_10x.csv rename to scripts/data/datasets_10x.csv diff --git a/src/spatialdata_db/utils/data/uid_master.csv b/scripts/data/uid_master.csv similarity index 100% rename from src/spatialdata_db/utils/data/uid_master.csv rename to scripts/data/uid_master.csv diff --git a/src/spatialdata_db/utils/scripts/download_10X_data.ipynb b/scripts/download_10X_data.ipynb similarity index 99% rename from src/spatialdata_db/utils/scripts/download_10X_data.ipynb rename to scripts/download_10X_data.ipynb index b1950e7..f5915c9 100644 --- a/src/spatialdata_db/utils/scripts/download_10X_data.ipynb +++ b/scripts/download_10X_data.ipynb @@ -175,7 +175,7 @@ } ], "source": [ - "data = pd.read_csv(\"/home/icb/tim.treis/projects/spatialdata-db/utils/data/10x_datasets.csv\")[:2]\n", + "data = pd.read_csv(\"/home/icb/tim.treis/projects/spatialdata-db/scripts/data/10x_datasets.csv\")[:2]\n", "data" ] }, diff --git a/src/spatialdata_db/utils/scripts/download_10X_data.py b/scripts/download_10X_data.py similarity index 98% rename from src/spatialdata_db/utils/scripts/download_10X_data.py rename to scripts/download_10X_data.py index 0deb943..5a258b7 100644 --- a/src/spatialdata_db/utils/scripts/download_10X_data.py +++ b/scripts/download_10X_data.py @@ -22,7 +22,7 @@ # In[2]: -data = pd.read_csv("/home/icb/tim.treis/projects/spatialdata-db/utils/data/10x_datasets.csv")[:2] +data = pd.read_csv("/home/icb/tim.treis/projects/spatialdata-db/scripts/data/10x_datasets.csv")[:2] data diff --git a/src/spatialdata_db/utils/scripts/parse_10X_ST_table.ipynb b/scripts/parse_10X_ST_table.ipynb similarity index 100% rename from src/spatialdata_db/utils/scripts/parse_10X_ST_table.ipynb rename to scripts/parse_10X_ST_table.ipynb diff --git a/src/spatialdata_db/utils/scripts/rename_on_lustre.ipynb b/scripts/rename_on_lustre.ipynb similarity index 99% rename from src/spatialdata_db/utils/scripts/rename_on_lustre.ipynb rename to scripts/rename_on_lustre.ipynb index 0f9d3dd..7898776 100644 --- a/src/spatialdata_db/utils/scripts/rename_on_lustre.ipynb +++ b/scripts/rename_on_lustre.ipynb @@ -18,7 +18,7 @@ "import os\n", "from concurrent.futures import ProcessPoolExecutor, as_completed\n", "\n", - "tenx = pd.read_csv(\"../data/datasets_10x.csv\", sep=\";\")" + "tenx = pd.read_csv(\"data/datasets_10x.csv\", sep=\";\")" ] }, { diff --git a/src/spatialdata_db/utils/scripts/update_uid_master.py b/scripts/update_uid_master.py similarity index 93% rename from src/spatialdata_db/utils/scripts/update_uid_master.py rename to scripts/update_uid_master.py index fe60ef7..b841e5e 100644 --- a/src/spatialdata_db/utils/scripts/update_uid_master.py +++ b/scripts/update_uid_master.py @@ -30,9 +30,9 @@ def update_master_with_ids(uid_master_csv_path, file_paths): if __name__ == "__main__": - master_csv_path = "../data/uid_master.csv" + master_csv_path = "data/uid_master.csv" dataset_paths = [ - "../data/datasets_10x.csv", + "data/datasets_10x.csv", # tbd ] diff --git a/src/spatialdata_db/utils/__init__.py b/src/spatialdata_db/utils/__init__.py deleted file mode 100644 index e69de29..0000000 From 24399b8457ffff63a9290d81f4c4df8c703ae991 Mon Sep 17 00:00:00 2001 From: zethson Date: Tue, 8 Oct 2024 09:58:45 +0200 Subject: [PATCH 4/4] Use uv Signed-off-by: zethson --- .github/workflows/build.yaml | 2 +- .github/workflows/test.yaml | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml index 8ae322e..ddfbe96 100644 --- a/.github/workflows/build.yaml +++ b/.github/workflows/build.yaml @@ -15,7 +15,7 @@ jobs: runs-on: ubuntu-latest steps: - uses: actions/checkout@v4 - - name: Set up Python 3.10 + - name: Set up Python 3.11 uses: actions/setup-python@v5 with: python-version: "3.11" diff --git a/.github/workflows/test.yaml b/.github/workflows/test.yaml index 9227b0f..0af16b0 100644 --- a/.github/workflows/test.yaml +++ b/.github/workflows/test.yaml @@ -49,10 +49,10 @@ jobs: - name: Install test dependencies run: | - python -m pip install --upgrade pip wheel + python -m pip install --upgrade uv wheel - name: Install dependencies run: | - pip install ${{ matrix.pip-flags }} ".[dev,test]" + uv pip install --system ${{ matrix.pip-flags }} ".[dev,test]" - name: Test env: MPLBACKEND: agg