# We investigated how INDEL length relates to pi and to Tajima's D.
# Summarise INDEL lengths per genomic region, then run the R follow-up script.
#
# For each region (CDS, noncoding) the INDEL VCF is intersected with that
# region's BED file and streamed into ./length_summary_stats.py, once without
# and once with -correct_sfs, giving four CSV files in the current directory:
#   gt_cds_indels_length_sum_raw.csv   gt_nc_indels_length_sum_raw.csv
#   gt_cds_indels_length_sum.csv       gt_nc_indels_length_sum.csv
#
# Everything runs in a subshell so the strict-mode options below do not leak
# into (or terminate) an interactive shell if this snippet is pasted.
(
  # Abort on the first failing step. pipefail makes a bedtools failure fail the
  # whole pipeline, so the R script never runs on a truncated or empty CSV.
  set -e -o pipefail

  indel_vcf=/fastdata/bop15hjb/h_j_b/GT_data/BGI_BWA_GATK/Analysis_ready_data/final/bgi_10birds.filtered_indels.pol.anno.recomb.line.vcf.gz
  ref_dir=/fastdata/bop15hjb/h_j_b/GT_ref

  # Usage: summarise_region REGION BED OUT_CSV [length_summary_stats.py options...]
  # Intersects the INDEL VCF with BED (keeping the VCF header) and writes the
  # summary produced by length_summary_stats.py for REGION to OUT_CSV.
  summarise_region() {
    local region=$1 bed=$2 out_csv=$3
    shift 3
    bedtools intersect -header -a "$indel_vcf" -b "$bed" \
      | ./length_summary_stats.py -region "$region" "$@" > "$out_csv"
  }

  # Runs without -correct_sfs (the "_raw" outputs).
  summarise_region CDS "$ref_dir/gt_cds.bed.gz" gt_cds_indels_length_sum_raw.csv
  summarise_region noncoding "$ref_dir/gt_noncoding.bed.gz" gt_nc_indels_length_sum_raw.csv

  # Same inputs with -correct_sfs enabled.
  summarise_region CDS "$ref_dir/gt_cds.bed.gz" gt_cds_indels_length_sum.csv -correct_sfs
  summarise_region noncoding "$ref_dir/gt_noncoding.bed.gz" gt_nc_indels_length_sum.csv -correct_sfs

  # NOTE(review): presumably consumes the CSVs written above -- confirm in length_sum_stats.R.
  Rscript length_sum_stats.R
)