from encoder.data_objects.speaker_verification_dataset import SpeakerVerificationDataset from datetime import datetime from time import perf_counter as clock import matplotlib.pyplot as plt import numpy as np import webbrowser import visdom import umap colormap = np.array([ [76, 255, 0], [0, 127, 70], [255, 0, 0], [255, 217, 38], [0, 135, 255], [165, 0, 165], [255, 167, 255], [0, 255, 255], [255, 96, 38], [142, 76, 0], [33, 0, 127], [0, 0, 0], [183, 183, 183], ], dtype=np.float) / 255 class Visualizations: def __init__(self, env_name=None, device_name=None, server="http://localhost", disabled=False): self.last_update_timestamp = clock() self.mean_time_per_step = -1 self.loss_exp = None self.eer_exp = None self.disabled = disabled # TODO: use a better paradigm for that if self.disabled: return now = str(datetime.now().strftime("%d-%m %Hh%M")) if env_name is None: self.env_name = now else: self.env_name = "%s (%s)" % (env_name, now) try: self.vis = visdom.Visdom(server, env=self.env_name, raise_exceptions=True) except ConnectionError: raise Exception("No visdom server detected. Run the command \"visdom\" in your CLI to " "start it.") # webbrowser.open("http://localhost:8097/env/" + self.env_name) self.loss_win = None self.eer_win = None self.lr_win = None self.implementation_win = None self.projection_win = None self.implementation_string = "" self.log_params() if device_name is not None: self.log_implementation({"Device": device_name}) def log_params(self): if self.disabled: return from encoder import params_data from encoder import params_model param_string = "Model parameters:
" for param_name in (p for p in dir(params_model) if not p.startswith("__")): value = getattr(params_model, param_name) param_string += "\t%s: %s
" % (param_name, value) param_string += "Data parameters:
" for param_name in (p for p in dir(params_data) if not p.startswith("__")): value = getattr(params_data, param_name) param_string += "\t%s: %s
" % (param_name, value) self.vis.text(param_string, opts={"title": "Parameters"}) def log_dataset(self, dataset: SpeakerVerificationDataset): if self.disabled: return dataset_string = "" dataset_string += "Speakers: %s\n" % len(dataset.speakers) dataset_string += "\n" + dataset.get_logs() dataset_string = dataset_string.replace("\n", "
") self.vis.text(dataset_string, opts={"title": "Dataset"}) def log_implementation(self, params): if self.disabled: return implementation_string = "" for param, value in params.items(): implementation_string += "%s: %s\n" % (param, value) implementation_string = implementation_string.replace("\n", "
") self.implementation_string = implementation_string self.implementation_win = self.vis.text( implementation_string, opts={"title": "Training implementation"} ) def update(self, loss, eer, lr, step): self.loss_exp = loss if self.loss_exp is None else 0.985 * self.loss_exp + 0.015 * loss self.eer_exp = eer if self.eer_exp is None else 0.985 * self.eer_exp + 0.015 * eer if not self.disabled: self.loss_win = self.vis.line( [[loss, self.loss_exp]], [[step, step]], win=self.loss_win, update="append" if self.loss_win else None, opts=dict( legend=["Loss", "Avg. loss"], xlabel="Step", ylabel="Loss", title="Loss", ) ) self.eer_win = self.vis.line( [[eer, self.eer_exp]], [[step, step]], win=self.eer_win, update="append" if self.eer_win else None, opts=dict( legend=["EER", "Avg. EER"], xlabel="Step", ylabel="EER", title="Equal error rate" ) ) self.lr_win = self.vis.line( [lr], [step], win=self.lr_win, update="append" if self.lr_win else None, opts=dict( xlabel="Step", ylabel="Learning rate", ytype="log", title="Learning rate" ) ) now = clock() time_per_step = (now - self.last_update_timestamp) self.last_update_timestamp = now if self.mean_time_per_step == -1: self.mean_time_per_step = time_per_step else: self.mean_time_per_step = self.mean_time_per_step * 0.9 + time_per_step * 0.1 if not self.disabled and self.implementation_win is not None: time_string = "Mean time per step: %dms" % int(1000 * self.mean_time_per_step) time_string += "
Last step time: %dms" % int(1000 * time_per_step) self.vis.text( self.implementation_string + time_string, win=self.implementation_win, opts={"title": "Training implementation"}, ) print("Step %6d Loss: %.4f EER: %.4f LR: %g Mean step time: %5dms " "Last step time: %5dms" % (step, self.loss_exp, self.eer_exp, lr, int(1000 * self.mean_time_per_step), int(1000 * time_per_step))) def draw_projections(self, embeds, utterances_per_speaker, step, out_fpath=None, max_speakers=10): max_speakers = min(max_speakers, len(colormap)) embeds = embeds[:max_speakers * utterances_per_speaker] n_speakers = len(embeds) // utterances_per_speaker ground_truth = np.repeat(np.arange(n_speakers), utterances_per_speaker) colors = [colormap[i] for i in ground_truth] reducer = umap.UMAP() projected = reducer.fit_transform(embeds) plt.scatter(projected[:, 0], projected[:, 1], c=colors) plt.gca().set_aspect("equal", "datalim") plt.title("UMAP projection (step %d)" % step) if not self.disabled: self.projection_win = self.vis.matplot(plt, win=self.projection_win) if out_fpath is not None: plt.savefig(out_fpath) plt.clf() def save(self): if not self.disabled: self.vis.save([self.env_name])