1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
extern crate flate2;
extern crate io_utils;
extern crate string_utils;
use flate2::read::MultiGzDecoder;
use io_utils::*;
use std::*;
use std::{
fs::File,
io::{BufRead, BufReader},
};
use string_utils::*;
pub fn load_feature_bc_matrix(
outs: &String,
features: &mut Vec<String>,
barcodes: &mut Vec<String>,
gex_sparse_matrix: &mut Vec<Vec<(i32, i32)>>,
) {
let mut dir = format!("{}/raw_feature_bc_matrix", outs);
if !path_exists(&dir) {
dir = format!("{}/raw_gene_bc_matrices_mex", outs);
}
let mut matrix_file = format!("{}/matrix.mtx.gz", dir);
if path_exists(&format!("{}/GRCh38", dir)) {
read_maybe_unzipped(&format!("{}/GRCh38/genes.tsv.gz", dir), features);
read_maybe_unzipped(&format!("{}/GRCh38/barcodes.tsv.gz", dir), barcodes);
matrix_file = format!("{}/GRCh38/matrix.mtx.gz", dir);
} else {
read_maybe_unzipped(&format!("{}/features.tsv.gz", dir), features);
read_maybe_unzipped(&format!("{}/barcodes.tsv.gz", dir), barcodes);
}
if path_exists(&matrix_file) {
let gz = MultiGzDecoder::new(File::open(&matrix_file).unwrap());
let f = BufReader::new(gz);
for _i in 0..barcodes.len() {
gex_sparse_matrix.push(Vec::<(i32, i32)>::new());
}
let mut line_count = 1;
for line in f.lines() {
let s = line.unwrap();
if line_count > 3 {
let fields = s.split(' ').collect::<Vec<&str>>();
let feature = fields[0].force_i32() - 1;
let bc = fields[1].force_i32() - 1;
let count = fields[2].force_i32();
gex_sparse_matrix[bc as usize].push((feature, count));
}
line_count += 1;
}
} else {
let f = open_for_read![matrix_file.before(".gz")];
for _i in 0..barcodes.len() {
gex_sparse_matrix.push(Vec::<(i32, i32)>::new());
}
let mut line_count = 1;
for line in f.lines() {
let s = line.unwrap();
if line_count > 3 {
let fields = s.split(' ').collect::<Vec<&str>>();
let feature = fields[0].force_i32() - 1;
let bc = fields[1].force_i32() - 1;
let count = fields[2].force_i32();
gex_sparse_matrix[bc as usize].push((feature, count));
}
line_count += 1;
}
}
}