Spaces:
Sleeping
Sleeping
Update utils.py
Browse files
utils.py
CHANGED
@@ -68,6 +68,24 @@ def plot_2d_comparison(dna_sequences_grouped, labels, mapping=mapping_easy):
|
|
68 |
ax.legend(by_label.values(), by_label.keys())
|
69 |
return fig
|
70 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
71 |
|
72 |
############################################################# Virus Dataset ########################################################
|
73 |
#ds = load_dataset('Hack90/virus_tiny')
|
|
|
68 |
ax.legend(by_label.values(), by_label.keys())
|
69 |
return fig
|
70 |
|
71 |
+
# Function to plot a comparison of DNA sequences
|
72 |
+
def plot_distrobutions(dna_sequences_grouped, labels, basepair, mapping=mapping_easy):
|
73 |
+
fig, ax = plt.subplots()
|
74 |
+
colors = plt.cm.rainbow(np.linspace(0, 1, len(dna_sequences_grouped)))
|
75 |
+
for count, (dna_sequences, color) in enumerate(zip(dna_sequences_grouped, colors)):
|
76 |
+
virus_y = []
|
77 |
+
for dna_sequence in dna_sequences:
|
78 |
+
mapped_coords = _dna_to_coordinates(dna_sequence, mapping)
|
79 |
+
cumulative_coords = _get_cumulative_coords(mapped_coords)
|
80 |
+
y = cumulative_coords[:, 1][basepair]
|
81 |
+
virus_y.append(y)
|
82 |
+
count_bins, bins = np.histogram(virus_y)
|
83 |
+
ax.stairs(count_bins, bins , color= color, label[count])
|
84 |
+
# Only show unique labels in the legend
|
85 |
+
handles, labels = ax.get_legend_handles_labels()
|
86 |
+
by_label = dict(zip(labels, handles))
|
87 |
+
ax.legend(by_label.values(), by_label.keys())
|
88 |
+
return fig
|
89 |
|
90 |
############################################################# Virus Dataset ########################################################
|
91 |
#ds = load_dataset('Hack90/virus_tiny')
|