NIGMS
diff --git a/‎AWS/01-RNA-Seq/RNA-seq.ipynb
+107-23 b/‎AWS/01-RNA-Seq/RNA-seq.ipynb
+107-23
diff --git a/‎AWS/01-RNA-Seq/rnaseq-aws.config
+4-4 b/‎AWS/01-RNA-Seq/rnaseq-aws.config
+4-4
@@ -20,7 +20,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "f0e9ac26-e308-471a-83a4-113f767524b0",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "IRdisplay::display_html('<iframe src = \"../../docs/quiz_files/rna-pre_module.html\" width=95% height=600></iframe>')"
@@ -218,7 +222,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "6da16610-a83f-42b5-be52-f8116db3fb03",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "#Install Nextflow, make it executable, and update it\n",
@@ -232,7 +240,7 @@
    "id": "3852204f-a42a-40a2-8b3f-4c153a9b0416",
    "metadata": {},
    "source": [
-    "**The size of the output data generated by Nextflow is quite large we can mitigate that by storing the temporary and output files to a bucket by setting the 'workDir' and 'params.outdir' to an existing bucket. Make sure you modify the file called rnaseq-aws.config**\n",
+    "The output data generated by Nextflow is quite large. We can mitigate that by storing the temporary and output files in a bucket: set 'workDir' and 'params.outdir' to paths in an existing bucket. Make sure you modify the file called rnaseq-aws.config.\n",
     " \n",
     "`workDir = 's3://your_bucket_name/rna-tmp'`  \n",
     "`params.outdir = 's3://your_bucket_name/rna-outputs'`"
@@ -250,7 +258,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "bb2e1f61-eea1-4464-9842-76fabae4c39a",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "system('./nextflow run nf-core/rnaseq -c rnaseq-aws.config -profile test,aws', intern=TRUE)"
@@ -295,7 +307,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "d888aacf-8f6d-427e-8646-f33a33203fd9",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "system('chmod +x install_rna_seq_packages.sh' , intern=TRUE)\n",
@@ -307,14 +323,18 @@
    "id": "8ad88e67",
    "metadata": {},
    "source": [
-    "**Important**: Choose \"R-RNA-Seq\" kernel for the rest of the notebook."
+    "**Important: Choose \"R-RNA-Seq\" kernel for the rest of the notebook.**"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
    "id": "a5ea70df-98ba-4a69-aeec-2baed34a72fc",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "library(DESeq2)\n",
@@ -337,7 +357,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "e49c7007-61b3-4057-89de-3f3fb1085800",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "# download data files from storage bucket\n",
@@ -372,7 +396,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "5fce0d5b-740b-4f9c-8479-fa60a0566532",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "DESeq.ds <- DESeqDataSetFromMatrix(countData = round(readcounts), colData = sample_info, design = ~condition)\n"
@@ -392,7 +420,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "cb7c8095-8d5c-4165-a0bf-9acfec7d97fe",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "colData(DESeq.ds) %>% head\n",
@@ -417,7 +449,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "4fc2ab39-8608-435b-a8f9-fb6f379be65a",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "DESeq.ds <- DESeq.ds[ rowSums(counts(DESeq.ds)) > 0, ]\n",
@@ -441,7 +477,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "40aa5366-4c12-4443-99a9-39ac707639d3",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "# Get the size factor using estimateSizeFactors from DESeq.\n",
@@ -466,7 +506,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "38523c0a-b9af-49ca-b7e8-2dbb4604fe5c",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "# transform size-factor normalized read counts to log2 scale using pseudocount of 1\n",
@@ -495,7 +539,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "a283f6d7-3370-41e7-a85c-c54c695f721f",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "# mean-sd plot\n",
@@ -523,7 +571,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "8f444ca6-b525-4e2e-9f9e-4363663b45fc",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "# Regularized log-transformed values\n",
@@ -551,7 +603,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "8ca292e8-27a2-4336-b047-07751cef499d",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "# cor() calculates the correlation between columns of a matrix\n",
@@ -579,7 +635,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "b38f5fab-4b48-4e74-9e23-793e202312dc",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "P <- plotPCA(DESeq.rlog)\n",
@@ -602,7 +662,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "f36513db-22f6-417f-aaa8-39ba1837ca35",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "# DESeq2 uses the levels of the condition to determine the order of the comparison\n",
@@ -625,7 +689,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "17827bd4-0938-49e8-9f3a-b4e979fedb3a",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "#Check the results of deseq analysis\n",
@@ -646,7 +714,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "39a986b0-3ee2-436a-927b-37f539e7c627",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "#Histogram\n",
@@ -668,7 +740,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "079404d0-d179-4bdf-8a2a-63e135b68c45",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "#MA plot\n",
@@ -692,7 +768,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "5bdda266-08e2-47fd-bdd8-f06cd4dd7f0c",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "#HEATMAP\n",
@@ -736,7 +816,11 @@
    "cell_type": "code",
    "execution_count": null,
    "id": "38f62bcf-3150-417e-bebb-787763db04aa",
-   "metadata": {},
+   "metadata": {
+    "vscode": {
+     "languageId": "r"
+    }
+   },
    "outputs": [],
    "source": [
     "write.table(DGE.results.sorted, file=\"rna-seq_dge-results.txt\", sep = \"\\t\")"
 
@@ -5,13 +5,13 @@ plugins {
 profiles {
     aws {
         process {
-            executor = 'awsbatch'    
-            queue = 'nextflow-batch-job-queue'
+            executor = 'awsbatch'    // Nextflow executor: run processes on AWS Batch
+            queue = 'nextflow-batch-job-queue'  // replace with the name of your AWS Batch job queue
             container = 'nf-core/rnaseq'
 
         }
-        workDir = 's3://your_bucket_name/rna-tmp/'
-        params.outdir = 's3://your_bucket_name/rna-outputs/' 
+        workDir = 's3://your_bucket_name/rna-tmp/'    // S3 path where Nextflow stores its temporary work files
+        params.outdir = 's3://your_bucket_name/rna-outputs/'   // S3 path where the pipeline writes its final outputs
 
         fusion.enabled = true
         wave.enabled = true