repeseq_scripts is a collection of scripts used for:
- Artificial generation of sequencing reads replicating a capture experiment using a 4-repeat “GGCCCC” probe within the human genome.
- Alignment and repeat expansion quantification from repeSeq capture data.
# Root directory that holds every script referenced in this file. This is an
# absolute path on the original author's machine; edit it to point at your
# own copy of the scripts before running anything.
code_location=/Users/zacc/USyd/UMI_repeatexpansions/manuscript_scripts
# Pipeline stages, listed in the order they appear here.
# NOTE(review): the stage descriptions are inferred from the file names only;
# confirm against each script.
# PBS launcher; presumably generates the artificial reads and aligns them.
# NOTE(review): a .pbs file is normally submitted to a scheduler (e.g. qsub)
# rather than executed directly - confirm the intended invocation.
${code_location}/launch_read_generator_align.pbs
# NOTE - artificial reads can be generated independently by ${code_location}/bash/read_generator_1.2.sh
# Presumably collapses and trims the reads.
${code_location}/collapse_trim.sh
# Presumably the STRetch-based repeat quantification for repeSeq data.
${code_location}/repeSeq_STRetch.sh
# Presumably the BED intersection analysis. The spelling "interesect" has to
# match the file name on disk, so it is deliberately left untouched here.
${code_location}/bed_interesect_analysis.sh
#######################################
# For each collapsed/trimmed R1 FASTQ file, print three lines:
#   1. the file name
#   2. the number of reads whose sequence contains "CCGGGG"
#   3. the number of reads whose sequence contains "CCGGGGCCGGGG"
# Only the sequence line of each 4-line FASTQ record (NR % 4 == 2) is
# inspected, so motifs appearing in headers or quality strings are ignored.
# Arguments: optional list of gzip-compressed FASTQ files; with no arguments
#            every *collapsed_trimmed_R1.fastq.gz in the current directory
#            is processed.
# Outputs:   the three lines described above, per file, on stdout.
#######################################
count_repeat_reads() {
  local fastq

  # No explicit files given: fall back to the glob in the current directory.
  if [ "$#" -eq 0 ]; then
    set -- *collapsed_trimmed_R1.fastq.gz
  fi

  for fastq in "$@"; do
    # An unmatched glob is left as the literal pattern; skip it instead of
    # handing a non-existent file name to the decompressor.
    [ -e "$fastq" ] || continue

    printf '%s\n' "$fastq"

    # gzip -dc is used instead of zcat because some macOS/BSD zcat builds
    # only accept a .Z suffix. The file is decompressed once and both motifs
    # are counted in the same awk pass; "+ 0" forces a numeric 0 when a
    # counter was never incremented.
    gzip -dc -- "$fastq" | awk '
      NR % 4 == 2 {
        if (index($0, "CCGGGG")) single++
        if (index($0, "CCGGGGCCGGGG")) tandem++
      }
      END {
        print single + 0
        print tandem + 0
      }
    '
  done
}

count_repeat_reads
# Downstream R scripts, resolved relative to the code_location variable.
# NOTE(review): judging by the file names these do general plotting and a
# LOLA analysis of the repeSeq results - confirm against the scripts. They
# are invoked directly here, which needs an executable bit and an R shebang;
# otherwise run them through Rscript.
${code_location}/general_plotting.R
${code_location}/lola_analysis_repeseq.R