Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
30 commits
Select commit Hold shift + click to select a range
08c0bc9
integrate new dataloaders
selmanozleyen Aug 8, 2025
14dda75
put working state
selmanozleyen Aug 8, 2025
e40e575
add new files
selmanozleyen Aug 8, 2025
691e941
fix
selmanozleyen Aug 8, 2025
a2a8ab1
fix this
selmanozleyen Aug 8, 2025
4a2cb76
format
selmanozleyen Aug 8, 2025
73900f6
remove extra test files
selmanozleyen Aug 19, 2025
245b595
update the write function
selmanozleyen Aug 25, 2025
2a0d870
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Aug 25, 2025
6e34cc7
remove compat test
selmanozleyen Aug 25, 2025
1b78a05
Merge branch 'feature/zarr-data' of https://github.com/theislab/cellf…
selmanozleyen Aug 25, 2025
cc2d53b
fix import problems and rename function to write_zarr
selmanozleyen Aug 25, 2025
297a83c
hide explicit torch imports
selmanozleyen Aug 25, 2025
2be2bd6
add read and write zarr tests
selmanozleyen Aug 25, 2025
a1f974c
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Aug 25, 2025
f4062bb
push working state
selmanozleyen Aug 25, 2025
93c66a7
Merge branch 'feature/zarr-data' of https://github.com/theislab/cellf…
selmanozleyen Aug 25, 2025
7ac0f8f
remove torch test for cellflow workflow
selmanozleyen Aug 26, 2025
8abe9b1
Merge branch 'main' into feature/zarr-data
selmanozleyen Aug 26, 2025
042e07a
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Aug 26, 2025
d454e34
Delete tests/test_optional.py
selmanozleyen Aug 26, 2025
9e56b37
fix unintentionally removed line
selmanozleyen Aug 26, 2025
e67de7d
ability to add names and tests
selmanozleyen Aug 26, 2025
feae2dd
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Aug 26, 2025
5c611f9
bug fix
selmanozleyen Sep 17, 2025
3423c39
add trainsampler with pool
selmanozleyen Sep 19, 2025
8291b7a
save current state
selmanozleyen Sep 20, 2025
2a26de9
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] Sep 20, 2025
00b678d
Merge pull request #1 from theislab/feature/zarr-data
selmanozleyen Sep 20, 2025
4e89f50
name change to avoid conflicts
AlejandroTL Sep 29, 2025
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
470 changes: 470 additions & 0 deletions docs/notebooks/600_trainsampler.ipynb

Large diffs are not rendered by default.

6 changes: 3 additions & 3 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ build-backend = "hatchling.build"
requires = [ "hatch-vcs", "hatchling" ]

[project]
name = "cellflow-tools"
name = "scaleflow-tools"
description = "Modeling complex perturbations with flow matching at single-cell resolution"
readme = "README.md"
license = "PolyForm-Noncommercial-1.0.0"
Expand Down Expand Up @@ -103,7 +103,7 @@ urls.Home-page = "https://github.com/theislab/cellflow"
urls.Source = "https://github.com/theislab/cellflow"

[tool.hatch.build.targets.wheel]
packages = [ 'src/cellflow' ]
packages = [ 'src/scaleflow' ]

[tool.hatch.version]
source = "vcs"
Expand Down Expand Up @@ -201,7 +201,7 @@ extras = test,pp,external,embedding
pass_env = PYTEST_*,CI
commands =
coverage run -m pytest {tty:--color=yes} {posargs: \
--cov={env_site_packages_dir}{/}cellflow --cov-config={tox_root}{/}pyproject.toml \
--cov={env_site_packages_dir}{/}scaleflow --cov-config={tox_root}{/}pyproject.toml \
--no-cov-on-fail --cov-report=xml --cov-report=term-missing:skip-covered}

[testenv:lint-code]
Expand Down
32 changes: 32 additions & 0 deletions scripts/create_tahoe.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
from sc_exp_design.models import CellFlow
import anndata as ad
import h5py

from anndata.experimental import read_lazy

# Build the training data from the integer-indexed 100M-cell AnnData file and
# write the result to a zarr store.

# Input .h5ad file and output zarr store (absolute paths on the cluster filesystem).
INPUT_H5AD = "/lustre/groups/ml01/workspace/100mil/100m_int_indices.h5ad"
OUTPUT_ZARR = "/lustre/groups/ml01/workspace/100mil/tahoe_train_data.zarr"

print("loading data")
with h5py.File(INPUT_H5AD, "r") as f:
    # `obs` is read eagerly with `read_elem`; `var`, `uns` and `obsm` go
    # through `read_lazy`.
    adata_all = ad.AnnData(
        obs=ad.io.read_elem(f["obs"]),
        var=read_lazy(f["var"]),
        uns=read_lazy(f["uns"]),
        obsm=read_lazy(f["obsm"]),
    )

    # NOTE(review): everything that consumes `adata_all` is kept inside the
    # `with` block because the lazily-read elements presumably still reference
    # the open HDF5 handle -- confirm against the anndata `read_lazy` docs.
    cf = CellFlow()

    print(" preparing train data ")
    cf.prepare_train_data(
        adata_all,
        sample_rep="X_pca",
        control_key="control",
        perturbation_covariates={"drugs": ("drug",), "dosage": ("dosage",)},
        perturbation_covariate_reps={"drugs": "drug_embeddings"},
        sample_covariates=["cell_line"],
        sample_covariate_reps={"cell_line": "cell_line_embeddings"},
        split_covariates=["cell_line"],
    )

    print("writing zarr")
    # Plain string: the original used an f-string with no placeholders.
    cf.train_data.write_zarr(OUTPUT_ZARR)
    print("zarr written")
4 changes: 0 additions & 4 deletions src/cellflow/__init__.py

This file was deleted.

15 changes: 0 additions & 15 deletions src/cellflow/data/__init__.py

This file was deleted.

303 changes: 0 additions & 303 deletions src/cellflow/data/_dataloader.py

This file was deleted.

14 changes: 0 additions & 14 deletions src/cellflow/data/_utils.py

This file was deleted.

Loading
Loading