dataset-format-benchmark
========================
This package benchmarks different image storage formats for machine-learning dataset workloads.
Installation
------------
Make sure the required system dependencies are installed:
.. code:: bash
sudo apt install pkg-config libhdf5-dev
.. code:: bash
python3.13 -m venv venv --upgrade-deps
source venv/bin/activate
python -m pip install -U -r requirements_dev.txt
# For running on Nvidia GPU:
python -m pip install -U torch torchvision
# For running on CPU:
python -m pip install -U torch torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/cpu
# h5py needs Cython but fails to install it automatically, so install it explicitly
python -m pip install -U Cython
python setup.py develop
Running dataset format benchmark
--------------------------------
.. code:: bash
python -m dataset_format_benchmark --data-root /path/to/datasets/
Raw data
{
"_id": null,
"home_page": "https://github.com/kamikaze/dataset-format-benchmark",
"name": "dataset-format-benchmark",
"maintainer": null,
"docs_url": null,
"requires_python": ">=3.13",
"maintainer_email": null,
"keywords": null,
"author": "Oleg Korsak",
"author_email": "kamikaze.is.waiting.you@gmail.com",
"download_url": "https://files.pythonhosted.org/packages/f8/09/9ae5307a87c6b74c87f0d397f0a38029a7332e5b33e079dc56f9f1fe6776/dataset_format_benchmark-0.2.2.tar.gz",
"platform": "any",
"description": "dataset-format-benchmark\n========================\n\nThis package runs different image format benchmarks for dataset ML tasks\n\nInstallation\n------------\n\nMake sure you have some system deps installed:\n\n.. code:: bash\n\n sudo apt install pkg-config libhdf5-dev\n\n.. code:: bash\n\n python3.11 -m venv venv --upgrade-deps\n source venv/bin/activate\n python -m pip install -U -r requirements_dev.txt\n\n # For running on Nvidia GPU:\n python -m pip install -U torch torchvision\n\n # For running on CPU:\n python -m pip install -U torch torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/cpu\n\n # For some reason h5py fails to install Cython while it needs it\n python -m pip install -U Cython\n\n python setup.py develop\n\nRunning dataset format benchmark\n--------------------------------\n\n.. code:: bash\n\n python -m dataset_format_benchmark --data-root /path/to/datasets/\n",
"bugtrack_url": null,
"license": "gpl-3",
"summary": "Image dataset format benchmark",
"version": "0.2.2",
"project_urls": {
"Documentation": "https://github.com/kamikaze/dataset-format-benchmark/wiki",
"Homepage": "https://github.com/kamikaze/dataset-format-benchmark"
},
"split_keywords": [],
"urls": [
{
"comment_text": null,
"digests": {
"blake2b_256": "79be0bfb02f7f0d8ad385e789ab02124d6741b8a32af93e635b9c70b17f9dbac",
"md5": "345177dd52c02a6cd8120f6fe56ad7ce",
"sha256": "f5ef17e7a5489eed51e3d59fb67012fef1957aeffcaf926a61bcadda2bd6ad3b"
},
"downloads": -1,
"filename": "dataset_format_benchmark-0.2.2-py2.py3-none-any.whl",
"has_sig": false,
"md5_digest": "345177dd52c02a6cd8120f6fe56ad7ce",
"packagetype": "bdist_wheel",
"python_version": "py2.py3",
"requires_python": ">=3.13",
"size": 45749,
"upload_time": "2025-01-30T14:17:07",
"upload_time_iso_8601": "2025-01-30T14:17:07.589099Z",
"url": "https://files.pythonhosted.org/packages/79/be/0bfb02f7f0d8ad385e789ab02124d6741b8a32af93e635b9c70b17f9dbac/dataset_format_benchmark-0.2.2-py2.py3-none-any.whl",
"yanked": false,
"yanked_reason": null
},
{
"comment_text": null,
"digests": {
"blake2b_256": "f8099ae5307a87c6b74c87f0d397f0a38029a7332e5b33e079dc56f9f1fe6776",
"md5": "b08fa6eddc35a5011c6f265efdd77d05",
"sha256": "8a3f5adf8d183d64ee93a286e99bd4f77265cd2908e949afde2f6fccafc24d27"
},
"downloads": -1,
"filename": "dataset_format_benchmark-0.2.2.tar.gz",
"has_sig": false,
"md5_digest": "b08fa6eddc35a5011c6f265efdd77d05",
"packagetype": "sdist",
"python_version": "source",
"requires_python": ">=3.13",
"size": 47905,
"upload_time": "2025-01-30T14:17:11",
"upload_time_iso_8601": "2025-01-30T14:17:11.018371Z",
"url": "https://files.pythonhosted.org/packages/f8/09/9ae5307a87c6b74c87f0d397f0a38029a7332e5b33e079dc56f9f1fe6776/dataset_format_benchmark-0.2.2.tar.gz",
"yanked": false,
"yanked_reason": null
}
],
"upload_time": "2025-01-30 14:17:11",
"github": true,
"gitlab": false,
"bitbucket": false,
"codeberg": false,
"github_user": "kamikaze",
"github_project": "dataset-format-benchmark",
"travis_ci": false,
"coveralls": true,
"github_actions": true,
"requirements": [
{
"name": "Cython",
"specs": [
[
"==",
"3.0.11"
]
]
},
{
"name": "h5py",
"specs": [
[
"==",
"3.12.1"
]
]
},
{
"name": "imageio",
"specs": [
[
"==",
"2.37.0"
]
]
},
{
"name": "kaggle",
"specs": [
[
"==",
"1.6.17"
]
]
},
{
"name": "lightning",
"specs": [
[
"==",
"2.5.0.post0"
]
]
},
{
"name": "matplotlib",
"specs": [
[
"==",
"3.10.0"
]
]
},
{
"name": "numpy",
"specs": [
[
"==",
"2.2.2"
]
]
},
{
"name": "Pillow",
"specs": [
[
"==",
"11.1.0"
]
]
},
{
"name": "pkgconfig",
"specs": [
[
"==",
"1.5.5"
]
]
},
{
"name": "rawpy",
"specs": [
[
"==",
"0.24.0"
]
]
},
{
"name": "scikit-learn",
"specs": [
[
"==",
"1.6.1"
]
]
},
{
"name": "scipy",
"specs": [
[
"==",
"1.15.1"
]
]
},
{
"name": "seaborn",
"specs": [
[
"==",
"0.13.2"
]
]
},
{
"name": "torch",
"specs": []
},
{
"name": "torchvision",
"specs": []
},
{
"name": "tqdm",
"specs": [
[
"==",
"4.67.1"
]
]
},
{
"name": "zarr",
"specs": [
[
"==",
"3.0.1"
]
]
},
{
"name": "requests",
"specs": [
[
"==",
"2.32.3"
]
]
}
],
"lcname": "dataset-format-benchmark"
}