From 650057f96946d4766e7a5dfbb958058e38bd73fb Mon Sep 17 00:00:00 2001 From: Labbeti Date: Mon, 4 Mar 2024 18:43:32 +0100 Subject: [PATCH] Version 0.5.1 --- .pre-commit-config.yaml | 36 +++++ CHANGELOG.md | 7 +- CITATION.cff | 6 +- README.md | 14 +- docs/conf.py | 3 +- docs/data_subsets.rst | 14 +- docs/usage.rst | 9 -- examples/dataloader.ipynb | 8 +- requirements-dev.txt | 9 +- src/aac_datasets/__init__.py | 5 +- src/aac_datasets/check.py | 9 +- src/aac_datasets/datasets/audiocaps.py | 33 ++-- src/aac_datasets/datasets/base.py | 142 +++++++++--------- src/aac_datasets/datasets/clotho.py | 18 +-- .../datasets/functional/audiocaps.py | 47 +++--- .../datasets/functional/clotho.py | 20 +-- src/aac_datasets/datasets/functional/macs.py | 15 +- .../datasets/functional/wavcaps.py | 131 +++++++++++----- src/aac_datasets/datasets/macs.py | 21 +-- src/aac_datasets/datasets/wavcaps.py | 25 ++- src/aac_datasets/utils/collections.py | 7 +- src/aac_datasets/utils/download.py | 31 ++-- tests/test_datasets_base.py | 5 +- 23 files changed, 332 insertions(+), 283 deletions(-) create mode 100644 .pre-commit-config.yaml diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml new file mode 100644 index 0000000..15b5d0f --- /dev/null +++ b/.pre-commit-config.yaml @@ -0,0 +1,36 @@ +# exclude: "" + +repos: + # Format Code + - repo: https://github.com/ambv/black + rev: 22.10.0 + hooks: + - id: black + + # Sort imports + - repo: https://github.com/PyCQA/isort + rev: 5.12.0 + hooks: + - id: isort + args: ["--profile", "black"] + + # Formatting, Whitespace, etc + - repo: https://github.com/pre-commit/pre-commit-hooks + rev: v2.2.3 + hooks: + - id: trailing-whitespace + - id: check-added-large-files + args: ['--maxkb=1000'] + - id: check-ast + - id: check-json + - id: check-merge-conflict + - id: check-xml + - id: check-yaml + - id: debug-statements + - id: end-of-file-fixer + - id: requirements-txt-fixer + - id: mixed-line-ending + args: ['--fix=no'] + - id: flake8 + # args: ['--ignore=E203,E501,F811,E712,W503'] + args: ['--config=.flake8'] diff --git a/CHANGELOG.md b/CHANGELOG.md index 0194f92..c5a0040 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -2,6 +2,11 @@ All notable changes to this project will be documented in this file. +## [0.5.1] 2024-03-04 +### Fixed +- WavCaps download preparation (#3). +- `safe_rmdir` function when sub-directories are deleted. + ## [0.5.0] 2024-01-05 ### Changed - Update typing for paths with python class `Path`. @@ -83,7 +88,7 @@ All notable changes to this project will be documented in this file. - Weak private methods are now strongly private in datasets. - Rename `item_transform` to `transform` in datasets. - Rename `load_tags` to `with_tags` in `AudioCaps`. - + ### Fixed - AudioCaps loading when `with_tags` is False. - Clotho files download. diff --git a/CITATION.cff b/CITATION.cff index db5dd24..edde21f 100644 --- a/CITATION.cff +++ b/CITATION.cff @@ -11,7 +11,7 @@ authors: affiliation: IRIT orcid: 'https://orcid.org/0000-0002-7219-5463' repository-code: 'https://github.com/Labbeti/aac-datasets/' -abstract: Audio Captioning datasets for Pytorch. +abstract: Audio Captioning datasets for PyTorch. keywords: - audio - deep-learning @@ -22,5 +22,5 @@ keywords: - captioning - audio-captioning license: MIT -version: 0.5.0 -date-released: '2024-01-05' +version: 0.5.1 +date-released: '2024-03-04' diff --git a/README.md b/README.md index 1143565..5bc8739 100644 --- a/README.md +++ b/README.md @@ -67,7 +67,7 @@ aac-datasets-download --root "." clotho --subsets "dev" ``` ## Datasets information -Here is the statistics for each dataset : +`aac-datasets` package contains 4 different datasets :