Skip to content

Commit

Permalink
Asymmetrical cut point (pinellolab#457)
Browse files Browse the repository at this point in the history
* add cut_point_ind to plot_alleles_heatmap for asymmetrical plotting

* Cole asymmetrical cut point (pinellolab#453)

* Pin versions of numpy and matplotlib in CI environment (#84) (pinellolab#452)

* Reduce duplication and implement cut_point_ind in plot_alleles_heatmap_hist

---------

Co-authored-by: Cole Lyman <[email protected]>
  • Loading branch information
2 people authored and mbowcut2 committed Jul 22, 2024
1 parent be9831e commit c1fc5ef
Show file tree
Hide file tree
Showing 2 changed files with 101 additions and 215 deletions.
78 changes: 69 additions & 9 deletions CRISPResso2/CRISPRessoPlot.py
Original file line number Diff line number Diff line change
Expand Up @@ -3061,6 +3061,7 @@ def plot_alleles_heatmap(
custom_colors,
SAVE_ALSO_PNG=False,
plot_cut_point=True,
cut_point_ind=None,
sgRNA_intervals=None,
sgRNA_names=None,
sgRNA_mismatches=None,
Expand All @@ -3077,6 +3078,7 @@ def plot_alleles_heatmap(
-per_element_annot_kws: annotations for each cell (e.g. bold for substitutions, etc.)
-SAVE_ALSO_PNG: whether to write png file as well
-plot_cut_point: if false, won't draw 'predicted cleavage' line
-cut_point_ind: index of cut point (if None, will be plot in the middle calculated as len(reference_seq)/2)
-sgRNA_intervals: locations where sgRNA is located
-sgRNA_mismatches: array (for each sgRNA_interval) of locations in sgRNA where there are mismatches
-sgRNA_names: array (for each sgRNA_interval) of names of sgRNAs (otherwise empty)
Expand Down Expand Up @@ -3198,7 +3200,9 @@ def plot_alleles_heatmap(

#cut point vertical line
if plot_cut_point:
ax_hm.vlines([plot_nuc_len/2], *ax_hm.get_ylim(), linestyles='dashed')
if cut_point_ind is None:
cut_point_ind = [plot_nuc_len / 2]
ax_hm.vlines(cut_point_ind,*ax_hm.get_ylim(),linestyles='dashed')


ax_hm_ref.yaxis.tick_right()
Expand Down Expand Up @@ -3233,7 +3237,7 @@ def plot_alleles_heatmap(
fig.savefig(fig_filename_root+'.png', bbox_inches='tight', bbox_extra_artists=(lgd,))
plt.close(fig)

def plot_alleles_heatmap_hist(reference_seq,fig_filename_root,X,annot,y_labels,insertion_dict,per_element_annot_kws,count_values,custom_colors,SAVE_ALSO_PNG=False,plot_cut_point=True,sgRNA_intervals=None,sgRNA_names=None,sgRNA_mismatches=None,**kwargs):
def plot_alleles_heatmap_hist(reference_seq,fig_filename_root,X,annot,y_labels,insertion_dict,per_element_annot_kws,count_values,custom_colors,SAVE_ALSO_PNG=False,plot_cut_point=True,cut_point_ind=None,sgRNA_intervals=None,sgRNA_names=None,sgRNA_mismatches=None,**kwargs):
"""
Plots alleles in a heatmap (nucleotides color-coded for easy visualization)
input:
Expand All @@ -3246,6 +3250,7 @@ def plot_alleles_heatmap_hist(reference_seq,fig_filename_root,X,annot,y_labels,i
-per_element_annot_kws: annotations for each cell (e.g. bold for substitutions, etc.)
-SAVE_ALSO_PNG: whether to write png file as well
-plot_cut_point: if false, won't draw 'predicted cleavage' line
-cut_point_ind: index of cut point (if None, will be plot in the middle calculated as len(reference_seq)/2)
-sgRNA_intervals: locations where sgRNA is located
-sgRNA_mismatches: array (for each sgRNA_interval) of locations in sgRNA where there are mismatches
-sgRNA_names: array (for each sgRNA_interval) of names of sgRNAs (otherwise empty)
Expand Down Expand Up @@ -3328,7 +3333,9 @@ def plot_alleles_heatmap_hist(reference_seq,fig_filename_root,X,annot,y_labels,i

#cut point vertical line
if plot_cut_point:
ax_hm.vlines([plot_nuc_len/2], *ax_hm.get_ylim(), linestyles='dashed')
if cut_point_ind is None:
cut_point_ind = [plot_nuc_len / 2]
ax_hm.vlines(cut_point_ind, *ax_hm.get_ylim(), linestyles='dashed')

#create boxes for ins
for idx, lss in insertion_dict.items():
Expand Down Expand Up @@ -3368,7 +3375,7 @@ def plot_alleles_heatmap_hist(reference_seq,fig_filename_root,X,annot,y_labels,i
plt.savefig(fig_filename_root+'.png', bbox_inches='tight', bbox_extra_artists=(lgd,), pad_inches=0.1)
plt.close()

def plot_alleles_table(reference_seq,df_alleles,fig_filename_root,custom_colors,MIN_FREQUENCY=0.5,MAX_N_ROWS=100,SAVE_ALSO_PNG=False,plot_cut_point=True,sgRNA_intervals=None,sgRNA_names=None,sgRNA_mismatches=None,annotate_wildtype_allele='****',**kwargs):
def plot_alleles_table(reference_seq,df_alleles,fig_filename_root,custom_colors,MIN_FREQUENCY=0.5,MAX_N_ROWS=100,SAVE_ALSO_PNG=False,plot_cut_point=True,cut_point_ind=None,sgRNA_intervals=None,sgRNA_names=None,sgRNA_mismatches=None,annotate_wildtype_allele='****',**kwargs):
"""
plots an allele table for a dataframe with allele frequencies
input:
Expand All @@ -3379,6 +3386,7 @@ def plot_alleles_table(reference_seq,df_alleles,fig_filename_root,custom_colors,
MAX_N_ROWS: max rows to plot
SAVE_ALSO_PNG: whether to write png file as well
plot_cut_point: if false, won't draw 'predicted cleavage' line
cut_point_ind: index of cut point (if None, will be plot in the middle calculated as len(reference_seq)/2)
sgRNA_intervals: locations where sgRNA is located
sgRNA_mismatches: array (for each sgRNA_interval) of locations in sgRNA where there are mismatches
sgRNA_names: array (for each sgRNA_interval) of names of sgRNAs (otherwise empty)
Expand All @@ -3390,9 +3398,23 @@ def plot_alleles_table(reference_seq,df_alleles,fig_filename_root,custom_colors,
for ix, is_ref in enumerate(is_reference):
if is_ref:
y_labels[ix] += annotate_wildtype_allele
plot_alleles_heatmap(reference_seq, fig_filename_root, X, annot, y_labels, insertion_dict, per_element_annot_kws, custom_colors, SAVE_ALSO_PNG, plot_cut_point, sgRNA_intervals, sgRNA_names, sgRNA_mismatches)

def plot_alleles_table_from_file(alleles_file_name,fig_filename_root,custom_colors,MIN_FREQUENCY=0.5,MAX_N_ROWS=100,SAVE_ALSO_PNG=False,plot_cut_point=True,sgRNA_intervals=None,sgRNA_names=None,sgRNA_mismatches=None,annotate_wildtype_allele='',**kwargs):
plot_alleles_heatmap(reference_seq=reference_seq,
fig_filename_root=fig_filename_root,
X=X,
annot=annot,
y_labels=y_labels,
insertion_dict=insertion_dict,
per_element_annot_kws=per_element_annot_kws,
custom_colors=custom_colors,
SAVE_ALSO_PNG=SAVE_ALSO_PNG,
plot_cut_point=plot_cut_point,
cut_point_ind=cut_point_ind,
sgRNA_intervals=sgRNA_intervals,
sgRNA_names=sgRNA_names,
sgRNA_mismatches=sgRNA_mismatches)

def plot_alleles_table_from_file(alleles_file_name,fig_filename_root,custom_colors,MIN_FREQUENCY=0.5,MAX_N_ROWS=100,SAVE_ALSO_PNG=False,plot_cut_point=True,cut_point_ind=None,sgRNA_intervals=None,sgRNA_names=None,sgRNA_mismatches=None,annotate_wildtype_allele='',**kwargs):
"""
plots an allele table for a dataframe with allele frequencies
infers the reference sequence by finding reference sequences without gaps (-)
Expand All @@ -3405,6 +3427,7 @@ def plot_alleles_table_from_file(alleles_file_name,fig_filename_root,custom_colo
MAX_N_ROWS: max rows to plot
SAVE_ALSO_PNG: whether to write png file as well
plot_cut_point: if false, won't draw 'predicted cleavage' line
cut_point_ind: index of cut point (if None, will be plot in the middle calculated as len(reference_seq)/2)
sgRNA_intervals: locations where sgRNA is located
sgRNA_mismatches: array (for each sgRNA_interval) of locations in sgRNA where there are mismatches
sgRNA_names: array (for each sgRNA_interval) of names of sgRNAs (otherwise empty)
Expand All @@ -3426,7 +3449,20 @@ def plot_alleles_table_from_file(alleles_file_name,fig_filename_root,custom_colo
for ix, is_ref in enumerate(is_reference):
if is_ref:
y_labels[ix] += annotate_wildtype_allele
plot_alleles_heatmap(reference_seq, fig_filename_root, X, annot, y_labels, insertion_dict, per_element_annot_kws, custom_colors, SAVE_ALSO_PNG, plot_cut_point, sgRNA_intervals, sgRNA_names, sgRNA_mismatches)
plot_alleles_heatmap(reference_seq=reference_seq,
fig_filename_root=fig_filename_root,
X=X,
annot=annot,
y_labels=y_labels,
insertion_dict=insertion_dict,
per_element_annot_kws=per_element_annot_kws,
custom_colors=custom_colors,
SAVE_ALSO_PNG=SAVE_ALSO_PNG,
plot_cut_point=plot_cut_point,
cut_point_ind=cut_point_ind,
sgRNA_intervals=sgRNA_intervals,
sgRNA_names=sgRNA_names,
sgRNA_mismatches=sgRNA_mismatches)

def plot_alleles_tables_from_folder(crispresso_output_folder,fig_filename_root,custom_colors,MIN_FREQUENCY=None,MAX_N_ROWS=None,SAVE_ALSO_PNG=False,plot_cut_point=True,sgRNA_intervals=None,sgRNA_names=None,sgRNA_mismatches=None,**kwargs):
"""
Expand Down Expand Up @@ -3495,7 +3531,19 @@ def plot_alleles_tables_from_folder(crispresso_output_folder,fig_filename_root,c
new_sgRNA_intervals += [(int_start - new_sel_cols_start - 1, int_end - new_sel_cols_start - 1)]

X, annot, y_labels, insertion_dict, per_element_annot_kws, is_reference = prep_alleles_table(df_alleles, ref_seq_around_cut, MAX_N_ROWS, MIN_FREQUENCY)
plot_alleles_heatmap(ref_seq_around_cut, fig_filename_root+"_"+ref_name+"_"+sgRNA_label, X, annot, y_labels, insertion_dict, per_element_annot_kws, custom_colors, SAVE_ALSO_PNG, plot_cut_point, new_sgRNA_intervals, sgRNA_names, sgRNA_mismatches)
plot_alleles_heatmap(reference_seq=ref_seq_around_cut,
fig_filename_root=fig_filename_root+"_"+ref_name+"_"+sgRNA_label,
X=X,
annot=annot,
y_labels=y_labels,
insertion_dict=insertion_dict,
per_element_annot_kws=per_element_annot_kws,
custom_colors=custom_colors,
SAVE_ALSO_PNG=SAVE_ALSO_PNG,
plot_cut_point=plot_cut_point,
sgRNA_intervals=new_sgRNA_intervals,
sgRNA_names=sgRNA_names,
sgRNA_mismatches=sgRNA_mismatches)
plot_count += 1
print('Plotted ' + str(plot_count) + ' plots')

Expand All @@ -3517,7 +3565,19 @@ def plot_alleles_table_compare(reference_seq,df_alleles,sample_name_1,sample_nam
custom_colors: dict of colors to plot (e.g. colors['A'] = (1,0,0,0.4) # red,blue,green,alpha )
"""
X, annot, y_labels, insertion_dict, per_element_annot_kws = prep_alleles_table_compare(df_alleles, sample_name_1, sample_name_2, MAX_N_ROWS, MIN_FREQUENCY)
plot_alleles_heatmap(reference_seq, fig_filename_root, X, annot, y_labels, insertion_dict, per_element_annot_kws, custom_colors, SAVE_ALSO_PNG, plot_cut_point, sgRNA_intervals, sgRNA_names, sgRNA_mismatches)
plot_alleles_heatmap(reference_seq=reference_seq,
fig_filename_root=fig_filename_root,
X=X,
annot=annot,
y_labels=y_labels,
insertion_dict=insertion_dict,
per_element_annot_kws=per_element_annot_kws,
custom_colors=custom_colors,
SAVE_ALSO_PNG=SAVE_ALSO_PNG,
plot_cut_point=plot_cut_point,
sgRNA_intervals=sgRNA_intervals,
sgRNA_names=sgRNA_names,
sgRNA_mismatches=sgRNA_mismatches)

def plot_nucleotide_quilt_from_folder(crispresso_output_folder,fig_filename_root,save_also_png=False,sgRNA_intervals=None,min_text_pct=0.5,max_text_pct=0.95,quantification_window_idxs=None,sgRNA_names=None,sgRNA_mismatches=None,shade_unchanged=True,**kwargs):
"""
Expand Down
Loading

0 comments on commit c1fc5ef

Please sign in to comment.