From 4d2cda90ab0fe6f1ac067bd93c2397a6ac6fac39 Mon Sep 17 00:00:00 2001
From: nojhan <nojhan@nojhan.net>
Date: Sat, 8 Apr 2023 07:56:23 +0200
Subject: [PATCH] refactor preproc around anndata

---
 scripts/paris/ranks_tsv_to_h5an.py | 14 ++++++++++++++
 scripts/paris/signatures.py        |  1 +
 2 files changed, 15 insertions(+)
 create mode 100644 scripts/paris/ranks_tsv_to_h5an.py

diff --git a/scripts/paris/ranks_tsv_to_h5an.py b/scripts/paris/ranks_tsv_to_h5an.py
new file mode 100644
index 0000000..8f45829
--- /dev/null
+++ b/scripts/paris/ranks_tsv_to_h5an.py
@@ -0,0 +1,14 @@
+import anndata as ad
+import signatures
+
+if __name__ == "__main__":
+    # Attach the ranks table (argv[1]) to the AnnData file argv[2] as layer "ranks", save to argv[3].
+    import sys
+    if len(sys.argv) != 4:  # explicit check: an assert would be stripped under -O
+        sys.exit("Usage: ranks_tsv_to_h5an.py <ranks.tsv> <in.h5ad> <out.h5ad>")
+    # NOTE(review): assumes load_ranks_csv returns one array shaped like adata.X -- confirm.
+    ranks = signatures.load_ranks_csv(sys.argv[1])
+    adata = ad.read_h5ad(sys.argv[2])
+    adata.layers["ranks"] = ranks
+    adata.write(sys.argv[3], compression="gzip")  # the keyword is `compression`
+    print(adata, file=sys.stderr, flush=True)  # print() takes `file=`, not `out=`
diff --git a/scripts/paris/signatures.py b/scripts/paris/signatures.py
index 16a51da..8bab335 100644
--- a/scripts/paris/signatures.py
+++ b/scripts/paris/signatures.py
@@ -272,6 +272,7 @@ def load_ranks_csv(rankfile):
             print("\r", n, end=" ", file=sys.stderr, flush=True)
             ranks_row = numpy.array([float(r) for r in row[1:]])
             ranks_l.append(ranks_row)
+
     assert(len(ranks_l) > 0)
     assert(len(ranks_l) == len(genes))
     ngenes = len(genes)
-- 
GitLab