mirror of
http://43.156.76.180:8026/YuuMJ/EukPhylo.git
synced 2025-12-27 05:10:28 +08:00
Fixed typo by changing geom_line(data = enc_null, aes(GC3, ENc)) to geom_line(data = enc_null, aes(GC3S, ENc))
39 lines
1.7 KiB
R
39 lines
1.7 KiB
R
'''
|
|
#Author, date: Auden Cote-L'Heureux, last updated in September 2023 by Adri
|
|
#Intent: To make a simple jellyfish plot from a dataset like the one produced by the CUB_v2.1.py script, also in the Github Utilities folder.
|
|
#Input: CompTrans.ENc.Raw.tsv and ENc.Null.tsv
|
|
#Output: Jellyfish plots
|
|
'''
|
|
|
|
#load necessary packages
|
|
library(tidyverse)
|
|
|
|
#Change to the path of the directory you're working from
|
|
#Use "getwd()" in console below to get path
|
|
setwd("/Users/agrow/Desktop/NewCUB_meta/CUBOutput/SpreadSheets")
|
|
|
|
#You may need to change name of data frame below
|
|
#if you used the CUB_v2.1.py script from Github, it should be in the
|
|
#CUBOutput folder and then inside the SpreadSheets folder
|
|
#you are looking for the CompTrans.ENc.Raw.tsv
|
|
gc3 <- data.frame(read_tsv('CompTrans.ENc.Raw.tsv'))%>%
|
|
mutate(taxon = paste(substr(SequenceID, 1, 4), substr(SequenceID,6,10), sep = '')) #this line reads in your 10-digit codes to a column in the data frame called taxon
|
|
|
|
#This .tsv is generated by the CUB script and will be in the same folder as the .tsv above
|
|
#This generates the null expectation line
|
|
enc_null <- data.frame(read_tsv('ENc.Null.tsv'))
|
|
|
|
#change data in first line here to what you want plotted
|
|
#you need as.numeric to ensure R is reading the variable correctly
|
|
gc3_plot <- ggplot(gc3, aes(as.numeric(GC3.Degen), as.numeric(ObsWrightENc_No6Fold)))+
|
|
geom_point(size = 0.1)+
|
|
geom_line(data = enc_null, aes(GC3S, ENc))+
|
|
theme_classic()+
|
|
labs(x = 'GC3 Degen', y = 'ObsWrightENc_No6fold')+
|
|
theme(legend.position = 'none')+
|
|
ggtitle("Metatranscriptomics R2G NTD files")+
|
|
theme(axis.text.x=element_text(colour="black"))+
|
|
theme(axis.text.y=element_text(colour="black"))+
|
|
facet_wrap(vars(taxon), scales = 'free_x')
|
|
gc3_plot
|