-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathrun.py
executable file
·108 lines (94 loc) · 4.33 KB
/
run.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
import spatrio
import pandas as pd
import argparse
def str2bool(v):
if isinstance(v, bool):
return v
if v.lower() in ('yes', 'true', 't', 'y', '1'):
return True
elif v.lower() in ('no', 'false', 'f', 'n', '0'):
return False
else:
raise argparse.ArgumentTypeError('Boolean value expected.')
parser = argparse.ArgumentParser(description='Spatrio argparse')
# load_data
parser.add_argument('--input_path', default=None, help='Path to read in input data')
parser.add_argument('--expected_num_path', default=None, help='Path to read in expected cell number')
# process_input
parser.add_argument('--marker_use', default=True, type=str2bool)
parser.add_argument('--top_marker_num', default=100, type=int)
parser.add_argument('--hvg_use', default=False, type=str2bool)
# ot_alignment
parser.add_argument('--alpha', default=0.1, type=float)
parser.add_argument('--dissimilarity', default='scaled_euc', type=str)
parser.add_argument('--k', default=10, type=int)
parser.add_argument('--graph_mode', default='connectivity', type=str)
parser.add_argument('--aware_spatial', default=True, type=str2bool)
parser.add_argument('--aware_multi', default=True, type=str2bool)
parser.add_argument('--aware_power', default=2, type=int)
# assign_coord
parser.add_argument('--top_num', default=5, type=int)
parser.add_argument('--random', default=False, type=str2bool)
# save output
parser.add_argument('--output_path', default=None, help='Path to save output data')
args = parser.parse_args()
path = args.input_path
expected_num_path = args.expected_num_path
top_num = args.top_num
print('\n','***Spatrio is running***','\n')
print('\n','***STEP1 LOAD DATA***','\n')
print('Loading data...')
spot_ann = spatrio.load_data(path+'/spatial_rna.csv' )
single_ann = spatrio.load_data( path+'/multi_rna.csv' )
spot_meta = pd.read_csv(path+'/spatial_meta.csv', index_col=0)
spot_meta['type'] = spot_meta['type'].apply(lambda x: str(x))
single_meta = pd.read_csv(path+'/multi_meta.csv', index_col=0)
single_meta['type'] = single_meta['type'].apply(lambda x: str(x))
spot_meta[['sample']] = 'spot'
single_meta[['sample']] = 'single'
spot_ann.obs['type'] = spot_meta['type']
spot_ann.obs['type'] = spot_ann.obs['type'].astype(object)
single_ann.obs['type'] = single_meta['type']
single_ann.obs['type'] = single_ann.obs['type'].astype(object)
print('Done!')
pos = pd.read_csv(path+'/pos.csv', index_col=0)
emb = pd.read_csv(path+'/emb.csv', index_col=0)
spot_ann.obsm['spatial'] = pos
single_ann.obsm['reduction'] = emb
if expected_num_path is not None:
expected_num = pd.read_csv(expected_num_path,index_col=0)
elif top_num is not None:
expected_num = None
print('\n','***STEP2 PROCESS DATA***','\n')
print('Processing data...')
data1,data2 = spatrio.process_input(spot_ann,single_ann,
marker_use = args.marker_use,
top_marker_num = args.top_marker_num,
hvg_use = args.hvg_use)
print('Done!')
print('\n','***STEP3 OT ALIGNMENT***','\n')
if expected_num is not None:
expected_num = expected_num.loc[data1.obs_names]
tmp_num = expected_num['cell_num'].values
p_distribution = tmp_num/sum(tmp_num)
else:
p_distribution = None
spatrio_decon = spatrio.ot_alignment(adata1 = data1,
adata2 = data2,
dissimilarity = args.dissimilarity,
alpha = args.alpha,
k = args.k,
graph_mode = args.graph_mode,
aware_spatial = args.aware_spatial,
aware_multi = args.aware_multi,
aware_power = args.aware_power,
p_distribution = p_distribution)
print('\n','***STEP4 ASSIGN COORD***','\n')
spatrio_map = spatrio.assign_coord(adata1 = data1,
adata2 = data2,
out_data = spatrio_decon,
top_num = args.top_num,
random = args.random,
expected_num = expected_num)
print('\n','The output was saved as '+str(args.output_path)+'/output.csv')
spatrio_map.to_csv(args.output_path+'/'+'output.csv')