You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
"for category, values in zip(sample_category, sample_list):\n",
28
+
" print(category+\" : \"+str(len(values)) + \", List number : \" + str(count))\n",
29
+
" count+=1"
30
+
],
31
+
"outputs": [
32
+
{
33
+
"output_type": "stream",
34
+
"name": "stdout",
35
+
"text": [
36
+
"Sample Count\n",
37
+
"RR : 82, List number : 0\n",
38
+
"PP : 14, List number : 1\n",
39
+
"SP : 1, List number : 2\n",
40
+
"RIS : 2, List number : 3\n",
41
+
"CIS : 40, List number : 4\n",
42
+
"Unknown : 1, List number : 5\n",
43
+
"Healthy : 22, List number : 6\n"
44
+
]
45
+
}
46
+
],
47
+
"metadata": {}
48
+
},
49
+
{
50
+
"cell_type": "code",
51
+
"execution_count": 2,
52
+
"source": [
53
+
"duration_df = meta_data.dropna(subset=['DiseaseDuration']) # data for patient's duration set\n",
54
+
"duration_df['DiseaseDuration'] = duration_df['DiseaseDuration'].astype(float) # make float\n",
55
+
"\n",
56
+
"## Long DD\n",
57
+
"longDD_samples = duration_df.loc[ duration_df['DiseaseDuration'] >= duration_df['DiseaseDuration'].median(), 'HCVB_ID'] # Get sampleData which has longDD from metadata\n",
58
+
"longDD_sampleList = list(set(gene_tpm.columns.tolist()).intersection(longDD_samples.values.tolist())) # Get intersected sampleID between expr and longDD\n",
59
+
"longDD_meta = duration_df[duration_df['HCVB_ID'].isin(longDD_sampleList)] # Get meta with sampleNames\n",
60
+
"longDD_gene_expr = gene_tpm[longDD_sampleList] # Get expr with sampleNames\n",
0 commit comments