|
20 | 20 | "cell_type": "code",
|
21 | 21 | "execution_count": null,
|
22 | 22 | "id": "1c2d28e0",
|
23 |
| - "metadata": { |
24 |
| - "vscode": { |
25 |
| - "languageId": "r" |
26 |
| - } |
27 |
| - }, |
| 23 | + "metadata": {}, |
28 | 24 | "outputs": [],
|
29 | 25 | "source": [
|
30 | 26 | "IRdisplay::display_html('<iframe src = \"../../quiz_files/rna-pre_module.html\" width=95% height=600></iframe>')"
|
|
205 | 201 | "cell_type": "code",
|
206 | 202 | "execution_count": null,
|
207 | 203 | "id": "95cda0d2",
|
208 |
| - "metadata": { |
209 |
| - "vscode": { |
210 |
| - "languageId": "r" |
211 |
| - } |
212 |
| - }, |
| 204 | + "metadata": {}, |
213 | 205 | "outputs": [],
|
214 | 206 | "source": [
|
215 | 207 | "system('chmod +x install_rna_seq_packages.sh' , intern=TRUE)\n",
|
|
253 | 245 | "cell_type": "code",
|
254 | 246 | "execution_count": null,
|
255 | 247 | "id": "6da16610-a83f-42b5-be52-f8116db3fb03",
|
256 |
| - "metadata": { |
257 |
| - "vscode": { |
258 |
| - "languageId": "r" |
259 |
| - } |
260 |
| - }, |
| 248 | + "metadata": {}, |
261 | 249 | "outputs": [],
|
262 | 250 | "source": [
|
263 | 251 | "#Install nextflow, make it executable, and update it\n",
|
|
292 | 280 | "cell_type": "code",
|
293 | 281 | "execution_count": null,
|
294 | 282 | "id": "bb2e1f61-eea1-4464-9842-76fabae4c39a",
|
295 |
| - "metadata": { |
296 |
| - "vscode": { |
297 |
| - "languageId": "r" |
298 |
| - } |
299 |
| - }, |
| 283 | + "metadata": {}, |
300 | 284 | "outputs": [],
|
301 | 285 | "source": [
|
302 | 286 | "system('./nextflow run nf-core/rnaseq -c rnaseq-aws.config -profile test,aws', intern=TRUE)"
|
|
333 | 317 | "cell_type": "code",
|
334 | 318 | "execution_count": null,
|
335 | 319 | "id": "a5ea70df-98ba-4a69-aeec-2baed34a72fc",
|
336 |
| - "metadata": { |
337 |
| - "vscode": { |
338 |
| - "languageId": "r" |
339 |
| - } |
340 |
| - }, |
| 320 | + "metadata": {}, |
341 | 321 | "outputs": [],
|
342 | 322 | "source": [
|
343 | 323 | "library(DESeq2)\n",
|
|
360 | 340 | "cell_type": "code",
|
361 | 341 | "execution_count": null,
|
362 | 342 | "id": "e49c7007-61b3-4057-89de-3f3fb1085800",
|
363 |
| - "metadata": { |
364 |
| - "vscode": { |
365 |
| - "languageId": "r" |
366 |
| - } |
367 |
| - }, |
| 343 | + "metadata": {}, |
368 | 344 | "outputs": [],
|
369 | 345 | "source": [
|
370 | 346 | "# download data files from storage bucket\n",
|
|
399 | 375 | "cell_type": "code",
|
400 | 376 | "execution_count": null,
|
401 | 377 | "id": "5fce0d5b-740b-4f9c-8479-fa60a0566532",
|
402 |
| - "metadata": { |
403 |
| - "vscode": { |
404 |
| - "languageId": "r" |
405 |
| - } |
406 |
| - }, |
| 378 | + "metadata": {}, |
407 | 379 | "outputs": [],
|
408 | 380 | "source": [
|
409 | 381 | "DESeq.ds <- DESeqDataSetFromMatrix(countData = round(readcounts), colData = sample_info, design = ~condition)\n"
|
|
423 | 395 | "cell_type": "code",
|
424 | 396 | "execution_count": null,
|
425 | 397 | "id": "cb7c8095-8d5c-4165-a0bf-9acfec7d97fe",
|
426 |
| - "metadata": { |
427 |
| - "vscode": { |
428 |
| - "languageId": "r" |
429 |
| - } |
430 |
| - }, |
| 398 | + "metadata": {}, |
431 | 399 | "outputs": [],
|
432 | 400 | "source": [
|
433 | 401 | "colData(DESeq.ds) %>% head\n",
|
|
452 | 420 | "cell_type": "code",
|
453 | 421 | "execution_count": null,
|
454 | 422 | "id": "4fc2ab39-8608-435b-a8f9-fb6f379be65a",
|
455 |
| - "metadata": { |
456 |
| - "vscode": { |
457 |
| - "languageId": "r" |
458 |
| - } |
459 |
| - }, |
| 423 | + "metadata": {}, |
460 | 424 | "outputs": [],
|
461 | 425 | "source": [
|
462 | 426 | "DESeq.ds <- DESeq.ds[ rowSums(counts(DESeq.ds)) > 0, ]\n",
|
|
480 | 444 | "cell_type": "code",
|
481 | 445 | "execution_count": null,
|
482 | 446 | "id": "40aa5366-4c12-4443-99a9-39ac707639d3",
|
483 |
| - "metadata": { |
484 |
| - "vscode": { |
485 |
| - "languageId": "r" |
486 |
| - } |
487 |
| - }, |
| 447 | + "metadata": {}, |
488 | 448 | "outputs": [],
|
489 | 449 | "source": [
|
490 | 450 | "# Get the size factor using estimateSizeFactors from DESeq.\n",
|
|
509 | 469 | "cell_type": "code",
|
510 | 470 | "execution_count": null,
|
511 | 471 | "id": "38523c0a-b9af-49ca-b7e8-2dbb4604fe5c",
|
512 |
| - "metadata": { |
513 |
| - "vscode": { |
514 |
| - "languageId": "r" |
515 |
| - } |
516 |
| - }, |
| 472 | + "metadata": {}, |
517 | 473 | "outputs": [],
|
518 | 474 | "source": [
|
519 | 475 | "# transform size-factor normalized read counts to log2 scale using pseudocount of 1\n",
|
|
542 | 498 | "cell_type": "code",
|
543 | 499 | "execution_count": null,
|
544 | 500 | "id": "a283f6d7-3370-41e7-a85c-c54c695f721f",
|
545 |
| - "metadata": { |
546 |
| - "vscode": { |
547 |
| - "languageId": "r" |
548 |
| - } |
549 |
| - }, |
| 501 | + "metadata": {}, |
550 | 502 | "outputs": [],
|
551 | 503 | "source": [
|
552 | 504 | "# mean-sd plot\n",
|
|
574 | 526 | "cell_type": "code",
|
575 | 527 | "execution_count": null,
|
576 | 528 | "id": "8f444ca6-b525-4e2e-9f9e-4363663b45fc",
|
577 |
| - "metadata": { |
578 |
| - "vscode": { |
579 |
| - "languageId": "r" |
580 |
| - } |
581 |
| - }, |
| 529 | + "metadata": {}, |
582 | 530 | "outputs": [],
|
583 | 531 | "source": [
|
584 | 532 | "# Regularized log-transformed values\n",
|
|
606 | 554 | "cell_type": "code",
|
607 | 555 | "execution_count": null,
|
608 | 556 | "id": "8ca292e8-27a2-4336-b047-07751cef499d",
|
609 |
| - "metadata": { |
610 |
| - "vscode": { |
611 |
| - "languageId": "r" |
612 |
| - } |
613 |
| - }, |
| 557 | + "metadata": {}, |
614 | 558 | "outputs": [],
|
615 | 559 | "source": [
|
616 | 560 | "# cor() calculates the correlation between columns of a matrix\n",
|
|
638 | 582 | "cell_type": "code",
|
639 | 583 | "execution_count": null,
|
640 | 584 | "id": "b38f5fab-4b48-4e74-9e23-793e202312dc",
|
641 |
| - "metadata": { |
642 |
| - "vscode": { |
643 |
| - "languageId": "r" |
644 |
| - } |
645 |
| - }, |
| 585 | + "metadata": {}, |
646 | 586 | "outputs": [],
|
647 | 587 | "source": [
|
648 | 588 | "P <- plotPCA(DESeq.rlog)\n",
|
|
665 | 605 | "cell_type": "code",
|
666 | 606 | "execution_count": null,
|
667 | 607 | "id": "f36513db-22f6-417f-aaa8-39ba1837ca35",
|
668 |
| - "metadata": { |
669 |
| - "vscode": { |
670 |
| - "languageId": "r" |
671 |
| - } |
672 |
| - }, |
| 608 | + "metadata": {}, |
673 | 609 | "outputs": [],
|
674 | 610 | "source": [
|
675 | 611 | "# DESeq2 uses the levels of the condition to determine the order of the comparison\n",
|
|
692 | 628 | "cell_type": "code",
|
693 | 629 | "execution_count": null,
|
694 | 630 | "id": "17827bd4-0938-49e8-9f3a-b4e979fedb3a",
|
695 |
| - "metadata": { |
696 |
| - "vscode": { |
697 |
| - "languageId": "r" |
698 |
| - } |
699 |
| - }, |
| 631 | + "metadata": {}, |
700 | 632 | "outputs": [],
|
701 | 633 | "source": [
|
702 | 634 | "#Check the results of deseq analysis\n",
|
|
717 | 649 | "cell_type": "code",
|
718 | 650 | "execution_count": null,
|
719 | 651 | "id": "39a986b0-3ee2-436a-927b-37f539e7c627",
|
720 |
| - "metadata": { |
721 |
| - "vscode": { |
722 |
| - "languageId": "r" |
723 |
| - } |
724 |
| - }, |
| 652 | + "metadata": {}, |
725 | 653 | "outputs": [],
|
726 | 654 | "source": [
|
727 | 655 | "#Histogram\n",
|
|
743 | 671 | "cell_type": "code",
|
744 | 672 | "execution_count": null,
|
745 | 673 | "id": "079404d0-d179-4bdf-8a2a-63e135b68c45",
|
746 |
| - "metadata": { |
747 |
| - "vscode": { |
748 |
| - "languageId": "r" |
749 |
| - } |
750 |
| - }, |
| 674 | + "metadata": {}, |
751 | 675 | "outputs": [],
|
752 | 676 | "source": [
|
753 | 677 | "#MA plot\n",
|
|
771 | 695 | "cell_type": "code",
|
772 | 696 | "execution_count": null,
|
773 | 697 | "id": "5bdda266-08e2-47fd-bdd8-f06cd4dd7f0c",
|
774 |
| - "metadata": { |
775 |
| - "vscode": { |
776 |
| - "languageId": "r" |
777 |
| - } |
778 |
| - }, |
| 698 | + "metadata": {}, |
779 | 699 | "outputs": [],
|
780 | 700 | "source": [
|
781 | 701 | "#HEATMAP\n",
|
|
819 | 739 | "cell_type": "code",
|
820 | 740 | "execution_count": null,
|
821 | 741 | "id": "38f62bcf-3150-417e-bebb-787763db04aa",
|
822 |
| - "metadata": { |
823 |
| - "vscode": { |
824 |
| - "languageId": "r" |
825 |
| - } |
826 |
| - }, |
| 742 | + "metadata": {}, |
827 | 743 | "outputs": [],
|
828 | 744 | "source": [
|
829 | 745 | "write.table(DGE.results.sorted, file=\"rna-seq_dge-results.txt\", sep = \"\\t\")"
|
|
0 commit comments