From a1d310649ca743aa41cf9834c8c7e91b09715207 Mon Sep 17 00:00:00 2001 From: Ayush Chaurasia Date: Mon, 21 Jun 2021 19:37:11 +0000 Subject: [PATCH 1/2] Update tables API and windows path fix --- utils/wandb_logging/wandb_utils.py | 17 +++++++++++------ 1 file changed, 11 insertions(+), 6 deletions(-) diff --git a/utils/wandb_logging/wandb_utils.py b/utils/wandb_logging/wandb_utils.py index d82633c7e2f6..402305f6fd5b 100644 --- a/utils/wandb_logging/wandb_utils.py +++ b/utils/wandb_logging/wandb_utils.py @@ -171,9 +171,11 @@ def setup_training(self, opt, data_dict): data_dict['val'] = str(val_path) self.val_table = self.val_artifact.get("val") self.map_val_table_path() + wandb.log({"validation dataset": self.val_table}) + if self.val_artifact is not None: self.result_artifact = wandb.Artifact("run_" + wandb.run.id + "_progress", "evaluation") - self.result_table = wandb.Table(["epoch", "id", "prediction", "avg_confidence"]) + self.result_table = wandb.Table(["epoch", "id", "ground truth", "prediction", "avg_confidence"]) if opt.bbox_interval == -1: self.bbox_interval = opt.bbox_interval = (opt.epochs // 10) if opt.epochs > 10 else 1 return data_dict @@ -181,7 +183,7 @@ def setup_training(self, opt, data_dict): def download_dataset_artifact(self, path, alias): if isinstance(path, str) and path.startswith(WANDB_ARTIFACT_PREFIX): artifact_path = Path(remove_prefix(path, WANDB_ARTIFACT_PREFIX) + ":" + alias) - dataset_artifact = wandb.use_artifact(artifact_path.as_posix()) + dataset_artifact = wandb.use_artifact(artifact_path.as_posix().replace("\\","/")) assert dataset_artifact is not None, "'Error: W&B dataset artifact doesn\'t exist'" datadir = dataset_artifact.download() return datadir, dataset_artifact @@ -213,7 +215,7 @@ def log_model(self, path, opt, epoch, fitness_score, best_model=False): aliases=['latest', 'last', 'epoch ' + str(self.current_epoch), 'best' if best_model else '']) print("Saving model artifact on epoch ", epoch + 1) - def log_dataset_artifact(self, data_file, single_cls, project, overwrite_config=False): + def log_dataset_artifact(self, data_file, single_cls, project, overwrite_config=False, ): with open(data_file) as f: data = yaml.safe_load(f) # data dict nc, names = (1, ['item']) if single_cls else (int(data['nc']), data['names']) @@ -297,6 +299,7 @@ def log_training_progress(self, predn, path, names): id = self.val_table_map[Path(path).name] self.result_table.add_data(self.current_epoch, id, + self.val_table.data[id][1], wandb.Image(self.val_table.data[id][1], boxes=boxes, classes=class_set), total_conf / max(1, len(box_data)) ) @@ -312,11 +315,13 @@ def end_epoch(self, best_result=False): wandb.log(self.log_dict) self.log_dict = {} if self.result_artifact: - train_results = wandb.JoinedTable(self.val_table, self.result_table, "id") - self.result_artifact.add(train_results, 'result') + #train_results = wandb.JoinedTable(self.val_table, self.result_table, "id") + self.result_artifact.add(self.result_table, 'result') wandb.log_artifact(self.result_artifact, aliases=['latest', 'last', 'epoch ' + str(self.current_epoch), ('best' if best_result else '')]) - self.result_table = wandb.Table(["epoch", "id", "prediction", "avg_confidence"]) + + wandb.log({"evaluation": self.result_table}) + self.result_table = wandb.Table(["epoch", "id", "ground truth", "prediction", "avg_confidence"]) self.result_artifact = wandb.Artifact("run_" + wandb.run.id + "_progress", "evaluation") def finish_run(self): From a013a2ff3335957ddc1e4e9e3bb08f1d10ec5338 Mon Sep 17 00:00:00 2001 From: Ayush Chaurasia Date: Fri, 25 Jun 2021 14:29:55 +0000 Subject: [PATCH 2/2] update dataset check --- utils/wandb_logging/wandb_utils.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/utils/wandb_logging/wandb_utils.py b/utils/wandb_logging/wandb_utils.py index 402305f6fd5b..f031a819b977 100644 --- a/utils/wandb_logging/wandb_utils.py +++ b/utils/wandb_logging/wandb_utils.py @@ -136,7 +136,6 @@ def __init__(self, opt, name, run_id, data_dict, job_type='Training'): def check_and_upload_dataset(self, opt): assert wandb, 'Install wandb to upload dataset' - check_dataset(self.data_dict) config_path = self.log_dataset_artifact(check_file(opt.data), opt.single_cls, 'YOLOv5' if opt.project == 'runs/train' else Path(opt.project).stem) @@ -215,9 +214,10 @@ def log_model(self, path, opt, epoch, fitness_score, best_model=False): aliases=['latest', 'last', 'epoch ' + str(self.current_epoch), 'best' if best_model else '']) print("Saving model artifact on epoch ", epoch + 1) - def log_dataset_artifact(self, data_file, single_cls, project, overwrite_config=False, ): + def log_dataset_artifact(self, data_file, single_cls, project, overwrite_config=False): with open(data_file) as f: data = yaml.safe_load(f) # data dict + check_dataset(data) nc, names = (1, ['item']) if single_cls else (int(data['nc']), data['names']) names = {k: v for k, v in enumerate(names)} # to index dictionary self.train_artifact = self.create_dataset_table(LoadImagesAndLabels( @@ -230,6 +230,7 @@ def log_dataset_artifact(self, data_file, single_cls, project, overwrite_config= data['val'] = WANDB_ARTIFACT_PREFIX + str(Path(project) / 'val') path = data_file if overwrite_config else '_wandb.'.join(data_file.rsplit('.', 1)) # updated data.yaml path data.pop('download', None) + data.pop('path', None) with open(path, 'w') as f: yaml.safe_dump(data, f) @@ -315,7 +316,6 @@ def end_epoch(self, best_result=False): wandb.log(self.log_dict) self.log_dict = {} if self.result_artifact: - #train_results = wandb.JoinedTable(self.val_table, self.result_table, "id") self.result_artifact.add(self.result_table, 'result') wandb.log_artifact(self.result_artifact, aliases=['latest', 'last', 'epoch ' + str(self.current_epoch), ('best' if best_result else '')])