# script to run phyloscanner: https://github.com/BDI-pathogens/phyloscanner
# this script run the second part of phyloscanner:
# it will analyze trees generated with script 7.Estimate_trees_read_alignments_v2.R
# phyloscanner dependencies
# https://github.com/BDI-pathogens/phyloscanner/blob/master/InfoAndInputs/InstallationNotesForMakingTrees.sh
#start of script
start_time <- Sys.time()
library(DescTools)
#location of phyloscanner make analyse_trees R program
phyloscanner <- paste(getwd(), "phyloscanner", sep = "/")
analyse_trees <- paste(phyloscanner, "phyloscanner_analyse_trees.R", sep = "/")
# phyloscanner analyse_trees parameters that does not depend on location
# of results of running run_phyloscanner_part1.R
#label to name output results
output_label <- "results"
#splits rule
splitsRule <- "s,20"
# outgroup name
outgroup <- "--outgroupName C.BR.92.BR025_d.U52953"
# multifurcation threshold as g = "guess"
multifurcation <- "--multifurcationThreshold g"
#allow multi transmission
multtrans <- "--allowMultiTrans"
#allow all classifications
classification <- "--allClassifications"
#distance threshold
#summarize all pairwise relationships in csv summary file
# I did not used the value for distance threshold and phyloscanner then assumes
#it is Inf (shows all transmission pairs)
distance <- "--distanceThreshold 0.05"
#normRefFileName: using
#update this later using the 2019 reference genome sequences I used with shiver
#check manual on how to create this normalization file
norm_file_location <- paste(getwd(),"output_all_ByPosition.csv", sep ="/")
#norm_file_location <- "/Users/user/Desktop/Imperial/newHIVproject-01Aug2020/shiver/HIV_REF_alignment/norm_resultscanner_ByPosition.csv"
norm <- paste("--normRefFileName", norm_file_location, sep = " ")
# list directories
tree_files <- list.files(path = "iqtree",
pattern = "treefile")
#directory phyloscanner used to save results of make_trees
iqtree_dir <- paste(getwd(), "iqtree", sep = "/")
#location of iqtree tree files
iqtree_trees <- paste(iqtree_dir, "*.treefile", sep = "/")
treefile_extension <- "--treeFileExtension .treefile"
parameters <- paste(iqtree_dir, treefile_extension, output_label, splitsRule, outgroup,
multifurcation, multtrans, classification, distance, norm, sep = " ")
command_analyse_trees <- paste("cd", iqtree_dir, "&&", analyse_trees, sep = " ")
analyseTrees_and_args <- paste(command_analyse_trees, parameters, sep = " ")
system(analyseTrees_and_args)
#end of script
end_time <- Sys.time()
print("Simulation took:")
end_time - start_time
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.