Skip to content

Commit 3b8a54d

Browse files
committed
server/queue/task/plot: Move t-SNE transformer to core
1 parent b1be793 commit 3b8a54d

File tree

7 files changed

+29
-27
lines changed

7 files changed

+29
-27
lines changed

Cargo.lock

+1-1
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

atlas-core/Cargo.toml

+1
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@ version = "0.1.0"
44
edition.workspace = true
55

66
[dependencies]
7+
bhtsne = { version = "0.5.2", default-features = false }
78
indexmap.workspace = true
89
ndarray = "0.16.1"
910
noodles = { workspace = true, features = ["core", "gff"] }

atlas-core/src/counts.rs

+1
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,3 @@
1+
pub mod dimension_reduction;
12
pub mod normalization;
23
pub mod reader;
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
pub mod tsne;
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,23 @@
1+
pub fn transform(perplexity: f64, theta: f64, counts: Vec<i32>, feature_count: usize) -> Vec<f64> {
2+
fn euclidean_distance(a: &&[f64], b: &&[f64]) -> f64 {
3+
a.iter()
4+
.zip(b.iter())
5+
.map(|(p, q)| (p - q).powi(2))
6+
.sum::<f64>()
7+
.sqrt()
8+
}
9+
10+
let sum: u64 = counts.iter().map(|n| *n as u64).sum();
11+
12+
let normalized_counts: Vec<_> = counts
13+
.into_iter()
14+
.map(|count| (count as f64) / (sum as f64))
15+
.collect();
16+
17+
let data: Vec<_> = normalized_counts.chunks(feature_count).collect();
18+
19+
bhtsne::tSNE::new(&data)
20+
.perplexity(perplexity)
21+
.barnes_hut(theta, euclidean_distance)
22+
.embedding()
23+
}

atlas-server/Cargo.toml

-1
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,6 @@ edition.workspace = true
77
anyhow.workspace = true
88
atlas-core = { path = "../atlas-core", version = "0.1.0" }
99
axum = "0.7.1"
10-
bhtsne = { version = "0.5.2", default-features = false }
1110
clap = { workspace = true, features = ["derive", "env"] }
1211
dotenvy = "0.15.0"
1312
futures = { version = "0.3.21", default-features = false, features = ["std"] }

atlas-server/src/queue/task/plot.rs

+2-25
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@ mod options;
33

44
use std::collections::HashMap;
55

6+
use atlas_core::counts::dimension_reduction::tsne;
67
use sqlx::PgPool;
78

89
pub use self::{error::Error, options::Options};
@@ -84,7 +85,7 @@ pub async fn plot(
8485
});
8586
}
8687

87-
let embedding = transform(options.perplexity, options.theta, raw_counts, feature_count);
88+
let embedding = tsne::transform(options.perplexity, options.theta, raw_counts, feature_count);
8889

8990
let mut xs = Vec::with_capacity(sample_count);
9091
let mut ys = Vec::with_capacity(sample_count);
@@ -103,30 +104,6 @@ fn is_perplexity_too_large(perplexity: f64, sample_count: usize) -> bool {
103104
sample_count > 0 && (n - 1.0 < 3.0 * perplexity)
104105
}
105106

106-
fn transform(perplexity: f64, theta: f64, counts: Vec<i32>, feature_count: usize) -> Vec<f64> {
107-
fn euclidean_distance(a: &&[f64], b: &&[f64]) -> f64 {
108-
a.iter()
109-
.zip(b.iter())
110-
.map(|(p, q)| (p - q).powi(2))
111-
.sum::<f64>()
112-
.sqrt()
113-
}
114-
115-
let sum: u64 = counts.iter().map(|n| *n as u64).sum();
116-
117-
let normalized_counts: Vec<_> = counts
118-
.into_iter()
119-
.map(|count| (count as f64) / (sum as f64))
120-
.collect();
121-
122-
let data: Vec<_> = normalized_counts.chunks(feature_count).collect();
123-
124-
bhtsne::tSNE::new(&data)
125-
.perplexity(perplexity)
126-
.barnes_hut(theta, euclidean_distance)
127-
.embedding()
128-
}
129-
130107
#[cfg(test)]
131108
mod tests {
132109
use super::*;

0 commit comments

Comments
 (0)