diff --git a/00/00_Data_Overview_and_Preparation_Sample_Data.ipynb b/00/00_Data_Overview_and_Preparation_Sample_Data.ipynb
index 146dee0..1ec3bea 100644
--- a/00/00_Data_Overview_and_Preparation_Sample_Data.ipynb
+++ b/00/00_Data_Overview_and_Preparation_Sample_Data.ipynb
@@ -1065,67 +1065,6 @@
"nrow(sample_data) # more because some samples measured twice"
]
},
- {
- "cell_type": "code",
- "execution_count": 47,
- "id": "ff9f0251-8536-47a1-a446-81f0ed509fc9",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "
\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "\t | id | sample | measurement | sample_id | library | id.y | name | read | pattern | sequence | feature_type | X | in_sample | measurement_tp | sc_rna_seq_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <lgl> | <int> | <chr> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | 1 | K1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 |
\n",
- "\t2 | 1.1 | M1 | TP1 | m1.1 | L1 | HTO_B0251 | 1.1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 1 | TP1 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 15\n",
- "\\begin{tabular}{r|lllllllllllllll}\n",
- " & id & sample & measurement & sample\\_id & library & id.y & name & read & pattern & sequence & feature\\_type & X & in\\_sample & measurement\\_tp & sc\\_rna\\_seq\\_data\\\\\n",
- " & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & 1 & K1 & TP0 & k1 & L13 & HTO\\_B0251 & No-CCS-1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & Antibody Capture & NA & 0 & No-CCS & 1\\\\\n",
- "\t2 & 1.1 & M1 & TP1 & m1.1 & L1 & HTO\\_B0251 & 1.1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & Antibody Capture & NA & 1 & TP1 & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "| | id <chr> | sample <chr> | measurement <chr> | sample_id <chr> | library <chr> | id.y <chr> | name <chr> | read <chr> | pattern <chr> | sequence <chr> | feature_type <chr> | X <lgl> | in_sample <int> | measurement_tp <chr> | sc_rna_seq_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | 1 | K1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 |\n",
- "| 2 | 1.1 | M1 | TP1 | m1.1 | L1 | HTO_B0251 | 1.1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 1 | TP1 | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " id sample measurement sample_id library id.y name read\n",
- "1 1 K1 TP0 k1 L13 HTO_B0251 No-CCS-1 R2 \n",
- "2 1.1 M1 TP1 m1.1 L1 HTO_B0251 1.1 R2 \n",
- " pattern sequence feature_type X in_sample measurement_tp\n",
- "1 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG Antibody Capture NA 0 No-CCS \n",
- "2 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG Antibody Capture NA 1 TP1 \n",
- " sc_rna_seq_data\n",
- "1 1 \n",
- "2 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(sample_data,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 48,
@@ -1380,64 +1319,6 @@
"group_classification$library = paste0('L', str_replace(group_classification$library.hashtag, '\\\\..*', ''))"
]
},
- {
- "cell_type": "code",
- "execution_count": 57,
- "id": "cb5d2fd2-bf11-4580-b9c1-e716cfb9cc7c",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 9\n",
- "\n",
- "\t | library.hashtag | age | sex | m | classification | group | measurement | sample | library |
\n",
- "\t | <dbl> | <int> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> |
\n",
- "\n",
- "\n",
- "\t1 | NA | 55 | f | K1 | vollstaendiger_ausschluss | no_ccs | TP0 | 1 | LNA |
\n",
- "\t2 | 1.2 | 62 | m | M2 | acs_w_o_infection | acs | TP1 | 2.1 | L1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 9\n",
- "\\begin{tabular}{r|lllllllll}\n",
- " & library.hashtag & age & sex & m & classification & group & measurement & sample & library\\\\\n",
- " & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & NA & 55 & f & K1 & vollstaendiger\\_ausschluss & no\\_ccs & TP0 & 1 & LNA\\\\\n",
- "\t2 & 1.2 & 62 & m & M2 & acs\\_w\\_o\\_infection & acs & TP1 & 2.1 & L1 \\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 9\n",
- "\n",
- "| | library.hashtag <dbl> | age <int> | sex <chr> | m <chr> | classification <chr> | group <chr> | measurement <chr> | sample <chr> | library <chr> |\n",
- "|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | NA | 55 | f | K1 | vollstaendiger_ausschluss | no_ccs | TP0 | 1 | LNA |\n",
- "| 2 | 1.2 | 62 | m | M2 | acs_w_o_infection | acs | TP1 | 2.1 | L1 |\n",
- "\n"
- ],
- "text/plain": [
- " library.hashtag age sex m classification group measurement\n",
- "1 NA 55 f K1 vollstaendiger_ausschluss no_ccs TP0 \n",
- "2 1.2 62 m M2 acs_w_o_infection acs TP1 \n",
- " sample library\n",
- "1 1 LNA \n",
- "2 2.1 L1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(group_classification,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 58,
@@ -1477,61 +1358,6 @@
"classification_data = unique(group_classification[,c('age', 'sex', 'm', 'classification', 'group')])"
]
},
- {
- "cell_type": "code",
- "execution_count": 60,
- "id": "3f8b2843-0fbf-44d6-bae0-e5453deb82f9",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 5\n",
- "\n",
- "\t | age | sex | m | classification | group |
\n",
- "\t | <int> | <chr> | <chr> | <chr> | <chr> |
\n",
- "\n",
- "\n",
- "\t1 | 55 | f | K1 | vollstaendiger_ausschluss | no_ccs |
\n",
- "\t2 | 62 | m | M2 | acs_w_o_infection | acs |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 5\n",
- "\\begin{tabular}{r|lllll}\n",
- " & age & sex & m & classification & group\\\\\n",
- " & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & 55 & f & K1 & vollstaendiger\\_ausschluss & no\\_ccs\\\\\n",
- "\t2 & 62 & m & M2 & acs\\_w\\_o\\_infection & acs \\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 5\n",
- "\n",
- "| | age <int> | sex <chr> | m <chr> | classification <chr> | group <chr> |\n",
- "|---|---|---|---|---|---|\n",
- "| 1 | 55 | f | K1 | vollstaendiger_ausschluss | no_ccs |\n",
- "| 2 | 62 | m | M2 | acs_w_o_infection | acs |\n",
- "\n"
- ],
- "text/plain": [
- " age sex m classification group \n",
- "1 55 f K1 vollstaendiger_ausschluss no_ccs\n",
- "2 62 m M2 acs_w_o_infection acs "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(classification_data,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 61,
@@ -1691,64 +1517,6 @@
"all_samples_info = merge(all_samples_info, classification_data, by.x = 'sample', by.y = 'm', all.x = TRUE)"
]
},
- {
- "cell_type": "code",
- "execution_count": 70,
- "id": "1b53aee8-3997-49e0-8c6c-e45bedf27566",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 10\n",
- "\n",
- "\t | sample | id | measurement | sample_id | sc_rna_seq_data | age | sex | classification | group | meta_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | K1 | 1 | TP0 | k1 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 |
\n",
- "\t2 | K10 | 10 | TP0 | k10 | 1 | 57 | m | ccs | ccs | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 10\n",
- "\\begin{tabular}{r|llllllllll}\n",
- " & sample & id & measurement & sample\\_id & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data\\\\\n",
- " & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & K1 & 1 & TP0 & k1 & 0 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1\\\\\n",
- "\t2 & K10 & 10 & TP0 & k10 & 1 & 57 & m & ccs & ccs & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 10\n",
- "\n",
- "| | sample <chr> | id <chr> | measurement <chr> | sample_id <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | K1 | 1 | TP0 | k1 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 |\n",
- "| 2 | K10 | 10 | TP0 | k10 | 1 | 57 | m | ccs | ccs | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample id measurement sample_id sc_rna_seq_data age sex\n",
- "1 K1 1 TP0 k1 0 55 f \n",
- "2 K10 10 TP0 k10 1 57 m \n",
- " classification group meta_data\n",
- "1 vollstaendiger_ausschluss no_ccs 1 \n",
- "2 ccs ccs 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(all_samples_info,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 71,
@@ -1856,67 +1624,6 @@
"nrow(sample_data)"
]
},
- {
- "cell_type": "code",
- "execution_count": 76,
- "id": "802aee1e-fa1e-4d74-9f8d-189ca3828847",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "\t | id | sample | measurement | sample_id | library | id.y | name | read | pattern | sequence | feature_type | X | in_sample | measurement_tp | sc_rna_seq_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <lgl> | <int> | <chr> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | 1 | K1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 |
\n",
- "\t2 | 1.1 | M1 | TP1 | m1.1 | L1 | HTO_B0251 | 1.1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 1 | TP1 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 15\n",
- "\\begin{tabular}{r|lllllllllllllll}\n",
- " & id & sample & measurement & sample\\_id & library & id.y & name & read & pattern & sequence & feature\\_type & X & in\\_sample & measurement\\_tp & sc\\_rna\\_seq\\_data\\\\\n",
- " & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & 1 & K1 & TP0 & k1 & L13 & HTO\\_B0251 & No-CCS-1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & Antibody Capture & NA & 0 & No-CCS & 1\\\\\n",
- "\t2 & 1.1 & M1 & TP1 & m1.1 & L1 & HTO\\_B0251 & 1.1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & Antibody Capture & NA & 1 & TP1 & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "| | id <chr> | sample <chr> | measurement <chr> | sample_id <chr> | library <chr> | id.y <chr> | name <chr> | read <chr> | pattern <chr> | sequence <chr> | feature_type <chr> | X <lgl> | in_sample <int> | measurement_tp <chr> | sc_rna_seq_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | 1 | K1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 |\n",
- "| 2 | 1.1 | M1 | TP1 | m1.1 | L1 | HTO_B0251 | 1.1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 1 | TP1 | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " id sample measurement sample_id library id.y name read\n",
- "1 1 K1 TP0 k1 L13 HTO_B0251 No-CCS-1 R2 \n",
- "2 1.1 M1 TP1 m1.1 L1 HTO_B0251 1.1 R2 \n",
- " pattern sequence feature_type X in_sample measurement_tp\n",
- "1 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG Antibody Capture NA 0 No-CCS \n",
- "2 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG Antibody Capture NA 1 TP1 \n",
- " sc_rna_seq_data\n",
- "1 1 \n",
- "2 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(sample_data,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 77,
@@ -1956,69 +1663,6 @@
"nrow(sample_data)"
]
},
- {
- "cell_type": "code",
- "execution_count": 79,
- "id": "068aa3a6-d2f4-43ca-973c-225781fe3328",
- "metadata": {
- "tags": []
- },
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 20\n",
- "\n",
- "\t | sample | id | measurement | sample_id | library | id.y | name | read | pattern | sequence | feature_type | X | in_sample | measurement_tp | sc_rna_seq_data | age | sex | classification | group | meta_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <lgl> | <int> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 |
\n",
- "\t2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | Antibody Capture | NA | 1 | Chronic-CCS | 1 | 57 | m | ccs | ccs | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 20\n",
- "\\begin{tabular}{r|llllllllllllllllllll}\n",
- " & sample & id & measurement & sample\\_id & library & id.y & name & read & pattern & sequence & feature\\_type & X & in\\_sample & measurement\\_tp & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data\\\\\n",
- " & & & & & & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & K1 & 1 & TP0 & k1 & L13 & HTO\\_B0251 & No-CCS-1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & Antibody Capture & NA & 0 & No-CCS & 1 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1\\\\\n",
- "\t2 & K10 & 10 & TP0 & k10 & L11 & HTO\\_B0256 & Ch-CCS-10 & R2 & 5PNNNNNNNNNN(BC) & GGTTGCCAGATGTCA & Antibody Capture & NA & 1 & Chronic-CCS & 1 & 57 & m & ccs & ccs & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 20\n",
- "\n",
- "| | sample <chr> | id <chr> | measurement <chr> | sample_id <chr> | library <chr> | id.y <chr> | name <chr> | read <chr> | pattern <chr> | sequence <chr> | feature_type <chr> | X <lgl> | in_sample <int> | measurement_tp <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 |\n",
- "| 2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | Antibody Capture | NA | 1 | Chronic-CCS | 1 | 57 | m | ccs | ccs | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample id measurement sample_id library id.y name read\n",
- "1 K1 1 TP0 k1 L13 HTO_B0251 No-CCS-1 R2 \n",
- "2 K10 10 TP0 k10 L11 HTO_B0256 Ch-CCS-10 R2 \n",
- " pattern sequence feature_type X in_sample measurement_tp\n",
- "1 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG Antibody Capture NA 0 No-CCS \n",
- "2 5PNNNNNNNNNN(BC) GGTTGCCAGATGTCA Antibody Capture NA 1 Chronic-CCS \n",
- " sc_rna_seq_data age sex classification group meta_data\n",
- "1 1 55 f vollstaendiger_ausschluss no_ccs 1 \n",
- "2 1 57 m ccs ccs 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(sample_data,2)"
- ]
- },
{
"cell_type": "raw",
"id": "6dad6bc9-91f0-4bae-82ba-58e1668490ff",
@@ -2067,54 +1711,38 @@
},
{
"cell_type": "code",
- "execution_count": 82,
- "id": "ecda4595-82df-427d-be5c-1de2a0baacf8",
- "metadata": {
- "tags": []
- },
+ "execution_count": 83,
+ "id": "1180f3c3-6a12-44ec-b32a-1a9af5e69748",
+ "metadata": {},
"outputs": [
{
"data": {
"text/html": [
- "\n",
- "A data.frame: 2 × 7\n",
- "\n",
- "\t | X | library.hashtag | m | measurement | delta_ef_value_group | delta_ef_value | sample |
\n",
- "\t | <int> | <chr> | <chr> | <chr> | <chr> | <dbl> | <chr> |
\n",
- "\n",
- "\n",
- "\t1 | 1 | 1.2 | M2 (1,15) | TP1 | x_greater_1 | 1.15 | 2.1 |
\n",
- "\t2 | 2 | 1.4 | M4 (3,1) | TP1 | x_greater_1 | 3.10 | 4.1 |
\n",
- "\n",
- "
\n"
+ "\n",
+ "- 'x_greater_1'
- 'x_smaller_1'
- 'x_smaller_0'
- NA
\n"
],
"text/latex": [
- "A data.frame: 2 × 7\n",
- "\\begin{tabular}{r|lllllll}\n",
- " & X & library.hashtag & m & measurement & delta\\_ef\\_value\\_group & delta\\_ef\\_value & sample\\\\\n",
- " & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & 1 & 1.2 & M2 (1,15) & TP1 & x\\_greater\\_1 & 1.15 & 2.1\\\\\n",
- "\t2 & 2 & 1.4 & M4 (3,1) & TP1 & x\\_greater\\_1 & 3.10 & 4.1\\\\\n",
- "\\end{tabular}\n"
+ "\\begin{enumerate*}\n",
+ "\\item 'x\\_greater\\_1'\n",
+ "\\item 'x\\_smaller\\_1'\n",
+ "\\item 'x\\_smaller\\_0'\n",
+ "\\item NA\n",
+ "\\end{enumerate*}\n"
],
"text/markdown": [
+ "1. 'x_greater_1'\n",
+ "2. 'x_smaller_1'\n",
+ "3. 'x_smaller_0'\n",
+ "4. NA\n",
"\n",
- "A data.frame: 2 × 7\n",
- "\n",
- "| | X <int> | library.hashtag <chr> | m <chr> | measurement <chr> | delta_ef_value_group <chr> | delta_ef_value <dbl> | sample <chr> |\n",
- "|---|---|---|---|---|---|---|---|\n",
- "| 1 | 1 | 1.2 | M2 (1,15) | TP1 | x_greater_1 | 1.15 | 2.1 |\n",
- "| 2 | 2 | 1.4 | M4 (3,1) | TP1 | x_greater_1 | 3.10 | 4.1 |\n",
"\n"
],
"text/plain": [
- " X library.hashtag m measurement delta_ef_value_group delta_ef_value\n",
- "1 1 1.2 M2 (1,15) TP1 x_greater_1 1.15 \n",
- "2 2 1.4 M4 (3,1) TP1 x_greater_1 3.10 \n",
- " sample\n",
- "1 2.1 \n",
- "2 4.1 "
+ "[1] \"x_greater_1\" \"x_smaller_1\" \"x_smaller_0\" NA "
]
},
"metadata": {},
@@ -2122,51 +1750,7 @@
}
],
"source": [
- "head(ef_classification,2)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 83,
- "id": "1180f3c3-6a12-44ec-b32a-1a9af5e69748",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "- 'x_greater_1'
- 'x_smaller_1'
- 'x_smaller_0'
- NA
\n"
- ],
- "text/latex": [
- "\\begin{enumerate*}\n",
- "\\item 'x\\_greater\\_1'\n",
- "\\item 'x\\_smaller\\_1'\n",
- "\\item 'x\\_smaller\\_0'\n",
- "\\item NA\n",
- "\\end{enumerate*}\n"
- ],
- "text/markdown": [
- "1. 'x_greater_1'\n",
- "2. 'x_smaller_1'\n",
- "3. 'x_smaller_0'\n",
- "4. NA\n",
- "\n",
- "\n"
- ],
- "text/plain": [
- "[1] \"x_greater_1\" \"x_smaller_1\" \"x_smaller_0\" NA "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "unique(ef_classification$delta_ef_value_group)"
+ "unique(ef_classification$delta_ef_value_group)"
]
},
{
@@ -2454,67 +2038,6 @@
"all_samples_info = merge(all_samples_info, ef_classification_data[,c('sample', 'delta_ef_value_class')], by.x = 'sample', by.y = 'sample', all.x = TRUE)"
]
},
- {
- "cell_type": "code",
- "execution_count": 101,
- "id": "06c4632a-92d9-4cdc-a73d-3a193387b69b",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 12\n",
- "\n",
- "\t | sample | id | measurement | sample_id | sc_rna_seq_data | age | sex | classification | group | meta_data | ef_classification_data | delta_ef_value_class |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <dbl> | <chr> |
\n",
- "\n",
- "\n",
- "\t1 | K1 | 1 | TP0 | k1 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | NA | NA |
\n",
- "\t2 | K10 | 10 | TP0 | k10 | 1 | 57 | m | ccs | ccs | 1 | NA | NA |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 12\n",
- "\\begin{tabular}{r|llllllllllll}\n",
- " & sample & id & measurement & sample\\_id & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & ef\\_classification\\_data & delta\\_ef\\_value\\_class\\\\\n",
- " & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & K1 & 1 & TP0 & k1 & 0 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1 & NA & NA\\\\\n",
- "\t2 & K10 & 10 & TP0 & k10 & 1 & 57 & m & ccs & ccs & 1 & NA & NA\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 12\n",
- "\n",
- "| | sample <chr> | id <chr> | measurement <chr> | sample_id <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> | ef_classification_data <dbl> | delta_ef_value_class <chr> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | K1 | 1 | TP0 | k1 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | NA | NA |\n",
- "| 2 | K10 | 10 | TP0 | k10 | 1 | 57 | m | ccs | ccs | 1 | NA | NA |\n",
- "\n"
- ],
- "text/plain": [
- " sample id measurement sample_id sc_rna_seq_data age sex\n",
- "1 K1 1 TP0 k1 0 55 f \n",
- "2 K10 10 TP0 k10 1 57 m \n",
- " classification group meta_data ef_classification_data\n",
- "1 vollstaendiger_ausschluss no_ccs 1 NA \n",
- "2 ccs ccs 1 NA \n",
- " delta_ef_value_class\n",
- "1 NA \n",
- "2 NA "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(all_samples_info,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 102,
@@ -2622,67 +2145,6 @@
"nrow(sample_data)"
]
},
- {
- "cell_type": "code",
- "execution_count": 107,
- "id": "570c488d-cdb8-4049-91fd-ec48889aaf13",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 20\n",
- "\n",
- "\t | sample | id | measurement | sample_id | library | id.y | name | read | pattern | sequence | feature_type | X | in_sample | measurement_tp | sc_rna_seq_data | age | sex | classification | group | meta_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <lgl> | <int> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 |
\n",
- "\t2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | Antibody Capture | NA | 1 | Chronic-CCS | 1 | 57 | m | ccs | ccs | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 20\n",
- "\\begin{tabular}{r|llllllllllllllllllll}\n",
- " & sample & id & measurement & sample\\_id & library & id.y & name & read & pattern & sequence & feature\\_type & X & in\\_sample & measurement\\_tp & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data\\\\\n",
- " & & & & & & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & K1 & 1 & TP0 & k1 & L13 & HTO\\_B0251 & No-CCS-1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & Antibody Capture & NA & 0 & No-CCS & 1 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1\\\\\n",
- "\t2 & K10 & 10 & TP0 & k10 & L11 & HTO\\_B0256 & Ch-CCS-10 & R2 & 5PNNNNNNNNNN(BC) & GGTTGCCAGATGTCA & Antibody Capture & NA & 1 & Chronic-CCS & 1 & 57 & m & ccs & ccs & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 20\n",
- "\n",
- "| | sample <chr> | id <chr> | measurement <chr> | sample_id <chr> | library <chr> | id.y <chr> | name <chr> | read <chr> | pattern <chr> | sequence <chr> | feature_type <chr> | X <lgl> | in_sample <int> | measurement_tp <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | Antibody Capture | NA | 0 | No-CCS | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 |\n",
- "| 2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | Antibody Capture | NA | 1 | Chronic-CCS | 1 | 57 | m | ccs | ccs | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample id measurement sample_id library id.y name read\n",
- "1 K1 1 TP0 k1 L13 HTO_B0251 No-CCS-1 R2 \n",
- "2 K10 10 TP0 k10 L11 HTO_B0256 Ch-CCS-10 R2 \n",
- " pattern sequence feature_type X in_sample measurement_tp\n",
- "1 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG Antibody Capture NA 0 No-CCS \n",
- "2 5PNNNNNNNNNN(BC) GGTTGCCAGATGTCA Antibody Capture NA 1 Chronic-CCS \n",
- " sc_rna_seq_data age sex classification group meta_data\n",
- "1 1 55 f vollstaendiger_ausschluss no_ccs 1 \n",
- "2 1 57 m ccs ccs 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(sample_data,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 108,
@@ -2722,72 +2184,6 @@
"nrow(sample_data)"
]
},
- {
- "cell_type": "code",
- "execution_count": 110,
- "id": "8baf7cf5-a7a1-4e0a-ac9e-927534634583",
- "metadata": {
- "tags": []
- },
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 24\n",
- "\n",
- "\t | sample | id | measurement | sample_id | library | id.y | name | read | pattern | sequence | ⋯ | sc_rna_seq_data | age | sex | classification | group | meta_data | delta_ef_value_group | delta_ef_value | delta_ef_value_class | ef_classification_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | ⋯ | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <chr> | <dbl> | <chr> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | ⋯ | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | NA | NA | NA | NA |
\n",
- "\t2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | ⋯ | 1 | 57 | m | ccs | ccs | 1 | NA | NA | NA | NA |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 24\n",
- "\\begin{tabular}{r|lllllllllllllllllllll}\n",
- " & sample & id & measurement & sample\\_id & library & id.y & name & read & pattern & sequence & ⋯ & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & delta\\_ef\\_value\\_group & delta\\_ef\\_value & delta\\_ef\\_value\\_class & ef\\_classification\\_data\\\\\n",
- " & & & & & & & & & & & ⋯ & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & K1 & 1 & TP0 & k1 & L13 & HTO\\_B0251 & No-CCS-1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & ⋯ & 1 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1 & NA & NA & NA & NA\\\\\n",
- "\t2 & K10 & 10 & TP0 & k10 & L11 & HTO\\_B0256 & Ch-CCS-10 & R2 & 5PNNNNNNNNNN(BC) & GGTTGCCAGATGTCA & ⋯ & 1 & 57 & m & ccs & ccs & 1 & NA & NA & NA & NA\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 24\n",
- "\n",
- "| | sample <chr> | id <chr> | measurement <chr> | sample_id <chr> | library <chr> | id.y <chr> | name <chr> | read <chr> | pattern <chr> | sequence <chr> | ⋯ ⋯ | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> | delta_ef_value_group <chr> | delta_ef_value <dbl> | delta_ef_value_class <chr> | ef_classification_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | ⋯ | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | NA | NA | NA | NA |\n",
- "| 2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | ⋯ | 1 | 57 | m | ccs | ccs | 1 | NA | NA | NA | NA |\n",
- "\n"
- ],
- "text/plain": [
- " sample id measurement sample_id library id.y name read\n",
- "1 K1 1 TP0 k1 L13 HTO_B0251 No-CCS-1 R2 \n",
- "2 K10 10 TP0 k10 L11 HTO_B0256 Ch-CCS-10 R2 \n",
- " pattern sequence ⋯ sc_rna_seq_data age sex\n",
- "1 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG ⋯ 1 55 f \n",
- "2 5PNNNNNNNNNN(BC) GGTTGCCAGATGTCA ⋯ 1 57 m \n",
- " classification group meta_data delta_ef_value_group\n",
- "1 vollstaendiger_ausschluss no_ccs 1 NA \n",
- "2 ccs ccs 1 NA \n",
- " delta_ef_value delta_ef_value_class ef_classification_data\n",
- "1 NA NA NA \n",
- "2 NA NA NA "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(sample_data,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 111,
@@ -2893,374 +2289,6 @@
"print(file.info(path)$mtime)"
]
},
- {
- "cell_type": "code",
- "execution_count": 116,
- "id": "12eedde4-8726-49a0-b46c-c4b8df40858c",
- "metadata": {
- "tags": []
- },
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 4\n",
- "\n",
- "\t | CK | CK_MB | Troponin | sample_id |
\n",
- "\t | <int> | <chr> | <dbl> | <chr> |
\n",
- "\n",
- "\n",
- "\t1 | 128 | | 0.169 | m2.1 |
\n",
- "\t2 | NA | | NA | m3.1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 4\n",
- "\\begin{tabular}{r|llll}\n",
- " & CK & CK\\_MB & Troponin & sample\\_id\\\\\n",
- " & & & & \\\\\n",
- "\\hline\n",
- "\t1 & 128 & & 0.169 & m2.1\\\\\n",
- "\t2 & NA & & NA & m3.1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 4\n",
- "\n",
- "| | CK <int> | CK_MB <chr> | Troponin <dbl> | sample_id <chr> |\n",
- "|---|---|---|---|---|\n",
- "| 1 | 128 | | 0.169 | m2.1 |\n",
- "| 2 | NA | | NA | m3.1 |\n",
- "\n"
- ],
- "text/plain": [
- " CK CK_MB Troponin sample_id\n",
- "1 128 0.169 m2.1 \n",
- "2 NA NA m3.1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(clinical,2)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 117,
- "id": "4fc6b00b-fa39-4885-9ee9-9eb1dcbc8a37",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 2\n",
- "\n",
- "\t | sample_id | CRP |
\n",
- "\t | <chr> | <chr> |
\n",
- "\n",
- "\n",
- "\t1 | k2 | 0.1 |
\n",
- "\t2 | k4 | 0.3 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 2\n",
- "\\begin{tabular}{r|ll}\n",
- " & sample\\_id & CRP\\\\\n",
- " & & \\\\\n",
- "\\hline\n",
- "\t1 & k2 & 0.1\\\\\n",
- "\t2 & k4 & 0.3\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 2\n",
- "\n",
- "| | sample_id <chr> | CRP <chr> |\n",
- "|---|---|---|\n",
- "| 1 | k2 | 0.1 |\n",
- "| 2 | k4 | 0.3 |\n",
- "\n"
- ],
- "text/plain": [
- " sample_id CRP\n",
- "1 k2 0.1\n",
- "2 k4 0.3"
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(clinical_crp,2)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 118,
- "id": "b188beb4-5353-40e4-976c-092c99c432ca",
- "metadata": {},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "Warning message in unique(as.numeric(clinical_crp$CRP)):\n",
- "“NAs introduced by coercion”\n"
- ]
- },
- {
- "data": {
- "text/html": [
- "\n",
- "- 0.1
- 0.2
- 0.3
- 0.4
- 0.6
- 0.7
- 0.8
- 0.9
- 1
- 1.1
- 1.3
- 1.4
- 1.8
- 1.9
- 2.3
- 2.5
- 2.8
- 3.2
- 3.4
- 4.2
- 4.4
- 5.6
- 5.7
- 5.9
- 6.2
- 6.3
- 6.5
- 6.8
- 7.1
- 7.3
- 7.8
- 7.9
- 8.1
- 12.4
- 12.5
- 15.1
- 16.9
- 17.4
\n"
- ],
- "text/latex": [
- "\\begin{enumerate*}\n",
- "\\item 0.1\n",
- "\\item 0.2\n",
- "\\item 0.3\n",
- "\\item 0.4\n",
- "\\item 0.6\n",
- "\\item 0.7\n",
- "\\item 0.8\n",
- "\\item 0.9\n",
- "\\item 1\n",
- "\\item 1.1\n",
- "\\item 1.3\n",
- "\\item 1.4\n",
- "\\item 1.8\n",
- "\\item 1.9\n",
- "\\item 2.3\n",
- "\\item 2.5\n",
- "\\item 2.8\n",
- "\\item 3.2\n",
- "\\item 3.4\n",
- "\\item 4.2\n",
- "\\item 4.4\n",
- "\\item 5.6\n",
- "\\item 5.7\n",
- "\\item 5.9\n",
- "\\item 6.2\n",
- "\\item 6.3\n",
- "\\item 6.5\n",
- "\\item 6.8\n",
- "\\item 7.1\n",
- "\\item 7.3\n",
- "\\item 7.8\n",
- "\\item 7.9\n",
- "\\item 8.1\n",
- "\\item 12.4\n",
- "\\item 12.5\n",
- "\\item 15.1\n",
- "\\item 16.9\n",
- "\\item 17.4\n",
- "\\end{enumerate*}\n"
- ],
- "text/markdown": [
- "1. 0.1\n",
- "2. 0.2\n",
- "3. 0.3\n",
- "4. 0.4\n",
- "5. 0.6\n",
- "6. 0.7\n",
- "7. 0.8\n",
- "8. 0.9\n",
- "9. 1\n",
- "10. 1.1\n",
- "11. 1.3\n",
- "12. 1.4\n",
- "13. 1.8\n",
- "14. 1.9\n",
- "15. 2.3\n",
- "16. 2.5\n",
- "17. 2.8\n",
- "18. 3.2\n",
- "19. 3.4\n",
- "20. 4.2\n",
- "21. 4.4\n",
- "22. 5.6\n",
- "23. 5.7\n",
- "24. 5.9\n",
- "25. 6.2\n",
- "26. 6.3\n",
- "27. 6.5\n",
- "28. 6.8\n",
- "29. 7.1\n",
- "30. 7.3\n",
- "31. 7.8\n",
- "32. 7.9\n",
- "33. 8.1\n",
- "34. 12.4\n",
- "35. 12.5\n",
- "36. 15.1\n",
- "37. 16.9\n",
- "38. 17.4\n",
- "\n",
- "\n"
- ],
- "text/plain": [
- " [1] 0.1 0.2 0.3 0.4 0.6 0.7 0.8 0.9 1.0 1.1 1.3 1.4 1.8 1.9 2.3\n",
- "[16] 2.5 2.8 3.2 3.4 4.2 4.4 5.6 5.7 5.9 6.2 6.3 6.5 6.8 7.1 7.3\n",
- "[31] 7.8 7.9 8.1 12.4 12.5 15.1 16.9 17.4"
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "sort(unique(as.numeric(clinical_crp$CRP)))"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 119,
- "id": "969c39f1-3e69-4af6-822f-082171681353",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "- ''
- '-'
- '<0,1'
- '0,2 (-1d) '
- '0,3 (-2d) '
- '0,5 (-1d) '
- '0.1'
- '0.2'
- '0.3'
- '0.4'
- '0.6'
- '0.7'
- '0.8'
- '0.9'
- '1'
- '1.1'
- '1.3'
- '1.4'
- '1.8'
- '1.9'
- '12.4'
- '12.5'
- '15.1'
- '16.9'
- '17.4'
- '2.3'
- '2.5'
- '2.8'
- '3,8 (-1d) '
- '3.2'
- '3.4'
- '4.2'
- '4.4'
- '5.6'
- '5.7'
- '5.9'
- '6.2'
- '6.3'
- '6.5'
- '6.8'
- '7.1'
- '7.3'
- '7.8'
- '7.9'
- '8.1'
\n"
- ],
- "text/latex": [
- "\\begin{enumerate*}\n",
- "\\item ''\n",
- "\\item '-'\n",
- "\\item '<0,1'\n",
- "\\item '0,2 (-1d) '\n",
- "\\item '0,3 (-2d) '\n",
- "\\item '0,5 (-1d) '\n",
- "\\item '0.1'\n",
- "\\item '0.2'\n",
- "\\item '0.3'\n",
- "\\item '0.4'\n",
- "\\item '0.6'\n",
- "\\item '0.7'\n",
- "\\item '0.8'\n",
- "\\item '0.9'\n",
- "\\item '1'\n",
- "\\item '1.1'\n",
- "\\item '1.3'\n",
- "\\item '1.4'\n",
- "\\item '1.8'\n",
- "\\item '1.9'\n",
- "\\item '12.4'\n",
- "\\item '12.5'\n",
- "\\item '15.1'\n",
- "\\item '16.9'\n",
- "\\item '17.4'\n",
- "\\item '2.3'\n",
- "\\item '2.5'\n",
- "\\item '2.8'\n",
- "\\item '3,8 (-1d) '\n",
- "\\item '3.2'\n",
- "\\item '3.4'\n",
- "\\item '4.2'\n",
- "\\item '4.4'\n",
- "\\item '5.6'\n",
- "\\item '5.7'\n",
- "\\item '5.9'\n",
- "\\item '6.2'\n",
- "\\item '6.3'\n",
- "\\item '6.5'\n",
- "\\item '6.8'\n",
- "\\item '7.1'\n",
- "\\item '7.3'\n",
- "\\item '7.8'\n",
- "\\item '7.9'\n",
- "\\item '8.1'\n",
- "\\end{enumerate*}\n"
- ],
- "text/markdown": [
- "1. ''\n",
- "2. '-'\n",
- "3. '<0,1'\n",
- "4. '0,2 (-1d) '\n",
- "5. '0,3 (-2d) '\n",
- "6. '0,5 (-1d) '\n",
- "7. '0.1'\n",
- "8. '0.2'\n",
- "9. '0.3'\n",
- "10. '0.4'\n",
- "11. '0.6'\n",
- "12. '0.7'\n",
- "13. '0.8'\n",
- "14. '0.9'\n",
- "15. '1'\n",
- "16. '1.1'\n",
- "17. '1.3'\n",
- "18. '1.4'\n",
- "19. '1.8'\n",
- "20. '1.9'\n",
- "21. '12.4'\n",
- "22. '12.5'\n",
- "23. '15.1'\n",
- "24. '16.9'\n",
- "25. '17.4'\n",
- "26. '2.3'\n",
- "27. '2.5'\n",
- "28. '2.8'\n",
- "29. '3,8 (-1d) '\n",
- "30. '3.2'\n",
- "31. '3.4'\n",
- "32. '4.2'\n",
- "33. '4.4'\n",
- "34. '5.6'\n",
- "35. '5.7'\n",
- "36. '5.9'\n",
- "37. '6.2'\n",
- "38. '6.3'\n",
- "39. '6.5'\n",
- "40. '6.8'\n",
- "41. '7.1'\n",
- "42. '7.3'\n",
- "43. '7.8'\n",
- "44. '7.9'\n",
- "45. '8.1'\n",
- "\n",
- "\n"
- ],
- "text/plain": [
- " [1] \"\" \"-\" \"<0,1\" \"0,2 (-1d) \" \"0,3 (-2d) \"\n",
- " [6] \"0,5 (-1d) \" \"0.1\" \"0.2\" \"0.3\" \"0.4\" \n",
- "[11] \"0.6\" \"0.7\" \"0.8\" \"0.9\" \"1\" \n",
- "[16] \"1.1\" \"1.3\" \"1.4\" \"1.8\" \"1.9\" \n",
- "[21] \"12.4\" \"12.5\" \"15.1\" \"16.9\" \"17.4\" \n",
- "[26] \"2.3\" \"2.5\" \"2.8\" \"3,8 (-1d) \" \"3.2\" \n",
- "[31] \"3.4\" \"4.2\" \"4.4\" \"5.6\" \"5.7\" \n",
- "[36] \"5.9\" \"6.2\" \"6.3\" \"6.5\" \"6.8\" \n",
- "[41] \"7.1\" \"7.3\" \"7.8\" \"7.9\" \"8.1\" "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "sort(unique(clinical_crp$CRP))"
- ]
- },
{
"cell_type": "code",
"execution_count": 120,
@@ -3407,61 +2435,6 @@
"nrow(clinical) # all samples kept after merging"
]
},
- {
- "cell_type": "code",
- "execution_count": 127,
- "id": "0d48f696-5a1f-46f0-a1fc-e60303df1bc5",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 5\n",
- "\n",
- "\t | sample_id | CK | CK_MB | Troponin | CRP |
\n",
- "\t | <chr> | <int> | <chr> | <dbl> | <chr> |
\n",
- "\n",
- "\n",
- "\t1 | k1 | 43 | | 0.013 | 0.4 |
\n",
- "\t2 | k10 | NA | | NA | 0.2 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 5\n",
- "\\begin{tabular}{r|lllll}\n",
- " & sample\\_id & CK & CK\\_MB & Troponin & CRP\\\\\n",
- " & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & k1 & 43 & & 0.013 & 0.4\\\\\n",
- "\t2 & k10 & NA & & NA & 0.2\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 5\n",
- "\n",
- "| | sample_id <chr> | CK <int> | CK_MB <chr> | Troponin <dbl> | CRP <chr> |\n",
- "|---|---|---|---|---|---|\n",
- "| 1 | k1 | 43 | | 0.013 | 0.4 |\n",
- "| 2 | k10 | NA | | NA | 0.2 |\n",
- "\n"
- ],
- "text/plain": [
- " sample_id CK CK_MB Troponin CRP\n",
- "1 k1 43 0.013 0.4\n",
- "2 k10 NA NA 0.2"
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(clinical,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 128,
@@ -3584,79 +2557,15 @@
"source": [
"nrow(all_samples_info)"
]
- },
- {
- "cell_type": "code",
- "execution_count": 136,
- "id": "542b84d0-a474-420e-94c9-e356d0633cec",
- "metadata": {},
- "outputs": [],
- "source": [
- "all_samples_info = merge(all_samples_info, clinical[,c('sample_id', 'clinical_data', 'complete_clinical_data', 'min_1_clinical_value')], by.x = 'sample_id', by.y = 'sample_id')"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 137,
- "id": "91d71ba0-689b-4fc0-bbf0-8eaf5d63e829",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "\t | sample_id | sample | id | measurement | sc_rna_seq_data | age | sex | classification | group | meta_data | ef_classification_data | delta_ef_value_class | clinical_data | complete_clinical_data | min_1_clinical_value |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <dbl> | <chr> | <dbl> | <dbl> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 |
\n",
- "\t2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 15\n",
- "\\begin{tabular}{r|lllllllllllllll}\n",
- " & sample\\_id & sample & id & measurement & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & ef\\_classification\\_data & delta\\_ef\\_value\\_class & clinical\\_data & complete\\_clinical\\_data & min\\_1\\_clinical\\_value\\\\\n",
- " & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & k1 & K1 & 1 & TP0 & 0 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1 & 0 & NA & 1 & 0 & 1\\\\\n",
- "\t2 & k10 & K10 & 10 & TP0 & 1 & 57 & m & ccs & ccs & 1 & 0 & NA & 1 & 0 & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "| | sample_id <chr> | sample <chr> | id <chr> | measurement <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> | ef_classification_data <dbl> | delta_ef_value_class <chr> | clinical_data <dbl> | complete_clinical_data <dbl> | min_1_clinical_value <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 |\n",
- "| 2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample_id sample id measurement sc_rna_seq_data age sex\n",
- "1 k1 K1 1 TP0 0 55 f \n",
- "2 k10 K10 10 TP0 1 57 m \n",
- " classification group meta_data ef_classification_data\n",
- "1 vollstaendiger_ausschluss no_ccs 1 0 \n",
- "2 ccs ccs 1 0 \n",
- " delta_ef_value_class clinical_data complete_clinical_data\n",
- "1 NA 1 0 \n",
- "2 NA 1 0 \n",
- " min_1_clinical_value\n",
- "1 1 \n",
- "2 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 136,
+ "id": "542b84d0-a474-420e-94c9-e356d0633cec",
+ "metadata": {},
+ "outputs": [],
"source": [
- "head(all_samples_info,2)"
+ "all_samples_info = merge(all_samples_info, clinical[,c('sample_id', 'clinical_data', 'complete_clinical_data', 'min_1_clinical_value')], by.x = 'sample_id', by.y = 'sample_id')"
]
},
{
@@ -3756,70 +2665,6 @@
"nrow(sample_data)"
]
},
- {
- "cell_type": "code",
- "execution_count": 142,
- "id": "85dc0cd0-a3c8-426b-91fb-b300d4c5ba9e",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 24\n",
- "\n",
- "\t | sample | id | measurement | sample_id | library | id.y | name | read | pattern | sequence | ⋯ | sc_rna_seq_data | age | sex | classification | group | meta_data | delta_ef_value_group | delta_ef_value | delta_ef_value_class | ef_classification_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | ⋯ | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <chr> | <dbl> | <chr> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | ⋯ | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | NA | NA | NA | 0 |
\n",
- "\t2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | ⋯ | 1 | 57 | m | ccs | ccs | 1 | NA | NA | NA | 0 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 24\n",
- "\\begin{tabular}{r|lllllllllllllllllllll}\n",
- " & sample & id & measurement & sample\\_id & library & id.y & name & read & pattern & sequence & ⋯ & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & delta\\_ef\\_value\\_group & delta\\_ef\\_value & delta\\_ef\\_value\\_class & ef\\_classification\\_data\\\\\n",
- " & & & & & & & & & & & ⋯ & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & K1 & 1 & TP0 & k1 & L13 & HTO\\_B0251 & No-CCS-1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & ⋯ & 1 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1 & NA & NA & NA & 0\\\\\n",
- "\t2 & K10 & 10 & TP0 & k10 & L11 & HTO\\_B0256 & Ch-CCS-10 & R2 & 5PNNNNNNNNNN(BC) & GGTTGCCAGATGTCA & ⋯ & 1 & 57 & m & ccs & ccs & 1 & NA & NA & NA & 0\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 24\n",
- "\n",
- "| | sample <chr> | id <chr> | measurement <chr> | sample_id <chr> | library <chr> | id.y <chr> | name <chr> | read <chr> | pattern <chr> | sequence <chr> | ⋯ ⋯ | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> | delta_ef_value_group <chr> | delta_ef_value <dbl> | delta_ef_value_class <chr> | ef_classification_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | K1 | 1 | TP0 | k1 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | ⋯ | 1 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | NA | NA | NA | 0 |\n",
- "| 2 | K10 | 10 | TP0 | k10 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | ⋯ | 1 | 57 | m | ccs | ccs | 1 | NA | NA | NA | 0 |\n",
- "\n"
- ],
- "text/plain": [
- " sample id measurement sample_id library id.y name read\n",
- "1 K1 1 TP0 k1 L13 HTO_B0251 No-CCS-1 R2 \n",
- "2 K10 10 TP0 k10 L11 HTO_B0256 Ch-CCS-10 R2 \n",
- " pattern sequence ⋯ sc_rna_seq_data age sex\n",
- "1 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG ⋯ 1 55 f \n",
- "2 5PNNNNNNNNNN(BC) GGTTGCCAGATGTCA ⋯ 1 57 m \n",
- " classification group meta_data delta_ef_value_group\n",
- "1 vollstaendiger_ausschluss no_ccs 1 NA \n",
- "2 ccs ccs 1 NA \n",
- " delta_ef_value delta_ef_value_class ef_classification_data\n",
- "1 NA NA 0 \n",
- "2 NA NA 0 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(sample_data,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 143,
@@ -3859,72 +2704,6 @@
"nrow(sample_data)"
]
},
- {
- "cell_type": "code",
- "execution_count": 145,
- "id": "41278fbc-209f-426f-ad7d-d9d3b3fbf2e4",
- "metadata": {
- "tags": []
- },
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 31\n",
- "\n",
- "\t | sample_id | sample | id | measurement | library | id.y | name | read | pattern | sequence | ⋯ | delta_ef_value | delta_ef_value_class | ef_classification_data | CK | CK_MB | Troponin | CRP | clinical_data | complete_clinical_data | min_1_clinical_value |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | <chr> | ⋯ | <dbl> | <chr> | <dbl> | <int> | <chr> | <dbl> | <chr> | <dbl> | <dbl> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | k1 | K1 | 1 | TP0 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | ⋯ | NA | NA | 0 | 43 | | 0.013 | 0.4 | 1 | 0 | 1 |
\n",
- "\t2 | k10 | K10 | 10 | TP0 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | ⋯ | NA | NA | 0 | NA | | NA | 0.2 | 1 | 0 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 31\n",
- "\\begin{tabular}{r|lllllllllllllllllllll}\n",
- " & sample\\_id & sample & id & measurement & library & id.y & name & read & pattern & sequence & ⋯ & delta\\_ef\\_value & delta\\_ef\\_value\\_class & ef\\_classification\\_data & CK & CK\\_MB & Troponin & CRP & clinical\\_data & complete\\_clinical\\_data & min\\_1\\_clinical\\_value\\\\\n",
- " & & & & & & & & & & & ⋯ & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & k1 & K1 & 1 & TP0 & L13 & HTO\\_B0251 & No-CCS-1 & R2 & 5PNNNNNNNNNN(BC) & GTCAACTCTTTAGCG & ⋯ & NA & NA & 0 & 43 & & 0.013 & 0.4 & 1 & 0 & 1\\\\\n",
- "\t2 & k10 & K10 & 10 & TP0 & L11 & HTO\\_B0256 & Ch-CCS-10 & R2 & 5PNNNNNNNNNN(BC) & GGTTGCCAGATGTCA & ⋯ & NA & NA & 0 & NA & & NA & 0.2 & 1 & 0 & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 31\n",
- "\n",
- "| | sample_id <chr> | sample <chr> | id <chr> | measurement <chr> | library <chr> | id.y <chr> | name <chr> | read <chr> | pattern <chr> | sequence <chr> | ⋯ ⋯ | delta_ef_value <dbl> | delta_ef_value_class <chr> | ef_classification_data <dbl> | CK <int> | CK_MB <chr> | Troponin <dbl> | CRP <chr> | clinical_data <dbl> | complete_clinical_data <dbl> | min_1_clinical_value <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | k1 | K1 | 1 | TP0 | L13 | HTO_B0251 | No-CCS-1 | R2 | 5PNNNNNNNNNN(BC) | GTCAACTCTTTAGCG | ⋯ | NA | NA | 0 | 43 | | 0.013 | 0.4 | 1 | 0 | 1 |\n",
- "| 2 | k10 | K10 | 10 | TP0 | L11 | HTO_B0256 | Ch-CCS-10 | R2 | 5PNNNNNNNNNN(BC) | GGTTGCCAGATGTCA | ⋯ | NA | NA | 0 | NA | | NA | 0.2 | 1 | 0 | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample_id sample id measurement library id.y name read\n",
- "1 k1 K1 1 TP0 L13 HTO_B0251 No-CCS-1 R2 \n",
- "2 k10 K10 10 TP0 L11 HTO_B0256 Ch-CCS-10 R2 \n",
- " pattern sequence ⋯ delta_ef_value delta_ef_value_class\n",
- "1 5PNNNNNNNNNN(BC) GTCAACTCTTTAGCG ⋯ NA NA \n",
- "2 5PNNNNNNNNNN(BC) GGTTGCCAGATGTCA ⋯ NA NA \n",
- " ef_classification_data CK CK_MB Troponin CRP clinical_data\n",
- "1 0 43 0.013 0.4 1 \n",
- "2 0 NA NA 0.2 1 \n",
- " complete_clinical_data min_1_clinical_value\n",
- "1 0 1 \n",
- "2 0 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(sample_data,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 146,
@@ -4259,70 +3038,6 @@
"### Add information about available cytokine data"
]
},
- {
- "cell_type": "code",
- "execution_count": 159,
- "id": "63398678-189f-42b2-bea9-7347212b415b",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "\t | sample_id | sample | id | measurement | sc_rna_seq_data | age | sex | classification | group | meta_data | ef_classification_data | delta_ef_value_class | clinical_data | complete_clinical_data | min_1_clinical_value |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <dbl> | <chr> | <dbl> | <dbl> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 |
\n",
- "\t2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 15\n",
- "\\begin{tabular}{r|lllllllllllllll}\n",
- " & sample\\_id & sample & id & measurement & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & ef\\_classification\\_data & delta\\_ef\\_value\\_class & clinical\\_data & complete\\_clinical\\_data & min\\_1\\_clinical\\_value\\\\\n",
- " & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & k1 & K1 & 1 & TP0 & 0 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1 & 0 & NA & 1 & 0 & 1\\\\\n",
- "\t2 & k10 & K10 & 10 & TP0 & 1 & 57 & m & ccs & ccs & 1 & 0 & NA & 1 & 0 & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 15\n",
- "\n",
- "| | sample_id <chr> | sample <chr> | id <chr> | measurement <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> | ef_classification_data <dbl> | delta_ef_value_class <chr> | clinical_data <dbl> | complete_clinical_data <dbl> | min_1_clinical_value <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 |\n",
- "| 2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample_id sample id measurement sc_rna_seq_data age sex\n",
- "1 k1 K1 1 TP0 0 55 f \n",
- "2 k10 K10 10 TP0 1 57 m \n",
- " classification group meta_data ef_classification_data\n",
- "1 vollstaendiger_ausschluss no_ccs 1 0 \n",
- "2 ccs ccs 1 0 \n",
- " delta_ef_value_class clinical_data complete_clinical_data\n",
- "1 NA 1 0 \n",
- "2 NA 1 0 \n",
- " min_1_clinical_value\n",
- "1 1 \n",
- "2 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(all_samples_info,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 160,
@@ -4395,70 +3110,6 @@
"nrow(all_samples_info)"
]
},
- {
- "cell_type": "code",
- "execution_count": 164,
- "id": "188fbff7-4621-41b6-a743-c609725dffed",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 16\n",
- "\n",
- "\t | sample_id | sample | id | measurement | sc_rna_seq_data | age | sex | classification | group | meta_data | ef_classification_data | delta_ef_value_class | clinical_data | complete_clinical_data | min_1_clinical_value | cytokine_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <dbl> | <chr> | <dbl> | <dbl> | <dbl> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |
\n",
- "\t2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 16\n",
- "\\begin{tabular}{r|llllllllllllllll}\n",
- " & sample\\_id & sample & id & measurement & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & ef\\_classification\\_data & delta\\_ef\\_value\\_class & clinical\\_data & complete\\_clinical\\_data & min\\_1\\_clinical\\_value & cytokine\\_data\\\\\n",
- " & & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & k1 & K1 & 1 & TP0 & 0 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1 & 0 & NA & 1 & 0 & 1 & 1\\\\\n",
- "\t2 & k10 & K10 & 10 & TP0 & 1 & 57 & m & ccs & ccs & 1 & 0 & NA & 1 & 0 & 1 & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 16\n",
- "\n",
- "| | sample_id <chr> | sample <chr> | id <chr> | measurement <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> | ef_classification_data <dbl> | delta_ef_value_class <chr> | clinical_data <dbl> | complete_clinical_data <dbl> | min_1_clinical_value <dbl> | cytokine_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |\n",
- "| 2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample_id sample id measurement sc_rna_seq_data age sex\n",
- "1 k1 K1 1 TP0 0 55 f \n",
- "2 k10 K10 10 TP0 1 57 m \n",
- " classification group meta_data ef_classification_data\n",
- "1 vollstaendiger_ausschluss no_ccs 1 0 \n",
- "2 ccs ccs 1 0 \n",
- " delta_ef_value_class clinical_data complete_clinical_data\n",
- "1 NA 1 0 \n",
- "2 NA 1 0 \n",
- " min_1_clinical_value cytokine_data\n",
- "1 1 1 \n",
- "2 1 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(all_samples_info,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 165,
@@ -5582,16 +4233,6 @@
"check_similarity3[check_similarity3$sample_id == 'k4',]"
]
},
- {
- "cell_type": "code",
- "execution_count": 198,
- "id": "5774f067-6d55-467a-8cf2-4375a21f3fbb",
- "metadata": {},
- "outputs": [],
- "source": [
- "### Not sure with which file to continue? - To discuss with Victoria"
- ]
- },
{
"cell_type": "code",
"execution_count": 199,
@@ -5661,70 +4302,6 @@
"### Investigate sample IDs + compare with remaining data"
]
},
- {
- "cell_type": "code",
- "execution_count": 204,
- "id": "c78ab9ea-7a4c-44f9-aeb9-62466add3ab9",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 16\n",
- "\n",
- "\t | sample_id | sample | id | measurement | sc_rna_seq_data | age | sex | classification | group | meta_data | ef_classification_data | delta_ef_value_class | clinical_data | complete_clinical_data | min_1_clinical_value | cytokine_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <dbl> | <chr> | <dbl> | <dbl> | <dbl> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |
\n",
- "\t2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 16\n",
- "\\begin{tabular}{r|llllllllllllllll}\n",
- " & sample\\_id & sample & id & measurement & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & ef\\_classification\\_data & delta\\_ef\\_value\\_class & clinical\\_data & complete\\_clinical\\_data & min\\_1\\_clinical\\_value & cytokine\\_data\\\\\n",
- " & & & & & & & & & & & & & & & & \\\\\n",
- "\\hline\n",
- "\t1 & k1 & K1 & 1 & TP0 & 0 & 55 & f & vollstaendiger\\_ausschluss & no\\_ccs & 1 & 0 & NA & 1 & 0 & 1 & 1\\\\\n",
- "\t2 & k10 & K10 & 10 & TP0 & 1 & 57 & m & ccs & ccs & 1 & 0 & NA & 1 & 0 & 1 & 1\\\\\n",
- "\\end{tabular}\n"
- ],
- "text/markdown": [
- "\n",
- "A data.frame: 2 × 16\n",
- "\n",
- "| | sample_id <chr> | sample <chr> | id <chr> | measurement <chr> | sc_rna_seq_data <dbl> | age <int> | sex <chr> | classification <chr> | group <chr> | meta_data <dbl> | ef_classification_data <dbl> | delta_ef_value_class <chr> | clinical_data <dbl> | complete_clinical_data <dbl> | min_1_clinical_value <dbl> | cytokine_data <dbl> |\n",
- "|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n",
- "| 1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |\n",
- "| 2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 |\n",
- "\n"
- ],
- "text/plain": [
- " sample_id sample id measurement sc_rna_seq_data age sex\n",
- "1 k1 K1 1 TP0 0 55 f \n",
- "2 k10 K10 10 TP0 1 57 m \n",
- " classification group meta_data ef_classification_data\n",
- "1 vollstaendiger_ausschluss no_ccs 1 0 \n",
- "2 ccs ccs 1 0 \n",
- " delta_ef_value_class clinical_data complete_clinical_data\n",
- "1 NA 1 0 \n",
- "2 NA 1 0 \n",
- " min_1_clinical_value cytokine_data\n",
- "1 1 1 \n",
- "2 1 1 "
- ]
- },
- "metadata": {},
- "output_type": "display_data"
- }
- ],
- "source": [
- "head(all_samples_info,2)"
- ]
- },
{
"cell_type": "code",
"execution_count": 205,
@@ -5764,70 +4341,6 @@
"nrow(all_samples_info)"
]
},
- {
- "cell_type": "code",
- "execution_count": 207,
- "id": "70eec507-b66e-4bea-bde7-2ea57a2db845",
- "metadata": {},
- "outputs": [
- {
- "data": {
- "text/html": [
- "\n",
- "A data.frame: 2 × 17\n",
- "\n",
- "\t | sample_id | sample | id | measurement | sc_rna_seq_data | age | sex | classification | group | meta_data | ef_classification_data | delta_ef_value_class | clinical_data | complete_clinical_data | min_1_clinical_value | cytokine_data | neutrophil_data |
\n",
- "\t | <chr> | <chr> | <chr> | <chr> | <dbl> | <int> | <chr> | <chr> | <chr> | <dbl> | <dbl> | <chr> | <dbl> | <dbl> | <dbl> | <dbl> | <dbl> |
\n",
- "\n",
- "\n",
- "\t1 | k1 | K1 | 1 | TP0 | 0 | 55 | f | vollstaendiger_ausschluss | no_ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 | 1 |
\n",
- "\t2 | k10 | K10 | 10 | TP0 | 1 | 57 | m | ccs | ccs | 1 | 0 | NA | 1 | 0 | 1 | 1 | 1 |
\n",
- "\n",
- "
\n"
- ],
- "text/latex": [
- "A data.frame: 2 × 17\n",
- "\\begin{tabular}{r|lllllllllllllllll}\n",
- " & sample\\_id & sample & id & measurement & sc\\_rna\\_seq\\_data & age & sex & classification & group & meta\\_data & ef\\_classification\\_data & delta\\_ef\\_value\\_class & clinical\\_data & complete\\_clinical\\_data & min\\_1\\_clinical\\_value & cytokine\\_data & neutrophil\\_data\\\\\n",
- " & & & & & & & &