dataset-format-benchmark

Name	dataset-format-benchmark JSON
Version	0.2.2 JSON
	download
home_page	https://github.com/kamikaze/dataset-format-benchmark
Summary	Image dataset format benchmark
upload_time	2025-01-30 14:17:11
maintainer	None
docs_url	None
author	Oleg Korsak
requires_python	>=3.13
license	gpl-3
keywords
VCS
bugtrack_url
requirements	Cython h5py imageio kaggle lightning matplotlib numpy Pillow pkgconfig rawpy scikit-learn scipy seaborn torch torchvision tqdm zarr requests
Travis-CI	No Travis.
coveralls test coverage

dataset-format-benchmark
========================

This package benchmarks different image storage formats for machine-learning dataset tasks.

Installation
------------

Make sure the required system dependencies are installed:

.. code:: bash

   sudo apt install pkg-config libhdf5-dev

.. code:: bash

   python3.13 -m venv venv --upgrade-deps
   source venv/bin/activate
   python -m pip install -U -r requirements_dev.txt

   # For running on Nvidia GPU:
   python -m pip install -U torch torchvision

   # For running on CPU:
   python -m pip install -U torch torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/cpu

   # h5py needs Cython but does not install it on its own, so install it explicitly
   python -m pip install -U Cython

   python setup.py develop

Running dataset format benchmark
--------------------------------

.. code:: bash

   python -m dataset_format_benchmark --data-root /path/to/datasets/

Raw data

            {
    "_id": null,
    "home_page": "https://github.com/kamikaze/dataset-format-benchmark",
    "name": "dataset-format-benchmark",
    "maintainer": null,
    "docs_url": null,
    "requires_python": ">=3.13",
    "maintainer_email": null,
    "keywords": null,
    "author": "Oleg Korsak",
    "author_email": "kamikaze.is.waiting.you@gmail.com",
    "download_url": "https://files.pythonhosted.org/packages/f8/09/9ae5307a87c6b74c87f0d397f0a38029a7332e5b33e079dc56f9f1fe6776/dataset_format_benchmark-0.2.2.tar.gz",
    "platform": "any",
    "description": "dataset-format-benchmark\n========================\n\nThis package runs different image format benchmarks for dataset ML tasks\n\nInstallation\n------------\n\nMake sure you have some system deps installed:\n\n.. code:: bash\n\n   sudo apt install pkg-config libhdf5-dev\n\n.. code:: bash\n\n   python3.11 -m venv venv --upgrade-deps\n   source venv/bin/activate\n   python -m pip install -U -r requirements_dev.txt\n\n   # For running on Nvidia GPU:\n   python -m pip install -U torch torchvision\n\n   # For running on CPU:\n   python -m pip install -U torch torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/cpu\n\n   # For some reason h5py fails to install Cython while it needs it\n   python -m pip install -U Cython\n\n   python setup.py develop\n\nRunning dataset format benchmark\n--------------------------------\n\n.. code:: bash\n\n   python -m dataset_format_benchmark --data-root /path/to/datasets/\n",
    "bugtrack_url": null,
    "license": "gpl-3",
    "summary": "Image dataset format benchmark",
    "version": "0.2.2",
    "project_urls": {
        "Documentation": "https://github.com/kamikaze/dataset-format-benchmark/wiki",
        "Homepage": "https://github.com/kamikaze/dataset-format-benchmark"
    },
    "split_keywords": [],
    "urls": [
        {
            "comment_text": null,
            "digests": {
                "blake2b_256": "79be0bfb02f7f0d8ad385e789ab02124d6741b8a32af93e635b9c70b17f9dbac",
                "md5": "345177dd52c02a6cd8120f6fe56ad7ce",
                "sha256": "f5ef17e7a5489eed51e3d59fb67012fef1957aeffcaf926a61bcadda2bd6ad3b"
            },
            "downloads": -1,
            "filename": "dataset_format_benchmark-0.2.2-py2.py3-none-any.whl",
            "has_sig": false,
            "md5_digest": "345177dd52c02a6cd8120f6fe56ad7ce",
            "packagetype": "bdist_wheel",
            "python_version": "py2.py3",
            "requires_python": ">=3.13",
            "size": 45749,
            "upload_time": "2025-01-30T14:17:07",
            "upload_time_iso_8601": "2025-01-30T14:17:07.589099Z",
            "url": "https://files.pythonhosted.org/packages/79/be/0bfb02f7f0d8ad385e789ab02124d6741b8a32af93e635b9c70b17f9dbac/dataset_format_benchmark-0.2.2-py2.py3-none-any.whl",
            "yanked": false,
            "yanked_reason": null
        },
        {
            "comment_text": null,
            "digests": {
                "blake2b_256": "f8099ae5307a87c6b74c87f0d397f0a38029a7332e5b33e079dc56f9f1fe6776",
                "md5": "b08fa6eddc35a5011c6f265efdd77d05",
                "sha256": "8a3f5adf8d183d64ee93a286e99bd4f77265cd2908e949afde2f6fccafc24d27"
            },
            "downloads": -1,
            "filename": "dataset_format_benchmark-0.2.2.tar.gz",
            "has_sig": false,
            "md5_digest": "b08fa6eddc35a5011c6f265efdd77d05",
            "packagetype": "sdist",
            "python_version": "source",
            "requires_python": ">=3.13",
            "size": 47905,
            "upload_time": "2025-01-30T14:17:11",
            "upload_time_iso_8601": "2025-01-30T14:17:11.018371Z",
            "url": "https://files.pythonhosted.org/packages/f8/09/9ae5307a87c6b74c87f0d397f0a38029a7332e5b33e079dc56f9f1fe6776/dataset_format_benchmark-0.2.2.tar.gz",
            "yanked": false,
            "yanked_reason": null
        }
    ],
    "upload_time": "2025-01-30 14:17:11",
    "github": true,
    "gitlab": false,
    "bitbucket": false,
    "codeberg": false,
    "github_user": "kamikaze",
    "github_project": "dataset-format-benchmark",
    "travis_ci": false,
    "coveralls": true,
    "github_actions": true,
    "requirements": [
        {
            "name": "Cython",
            "specs": [
                [
                    "==",
                    "3.0.11"
                ]
            ]
        },
        {
            "name": "h5py",
            "specs": [
                [
                    "==",
                    "3.12.1"
                ]
            ]
        },
        {
            "name": "imageio",
            "specs": [
                [
                    "==",
                    "2.37.0"
                ]
            ]
        },
        {
            "name": "kaggle",
            "specs": [
                [
                    "==",
                    "1.6.17"
                ]
            ]
        },
        {
            "name": "lightning",
            "specs": [
                [
                    "==",
                    "2.5.0.post0"
                ]
            ]
        },
        {
            "name": "matplotlib",
            "specs": [
                [
                    "==",
                    "3.10.0"
                ]
            ]
        },
        {
            "name": "numpy",
            "specs": [
                [
                    "==",
                    "2.2.2"
                ]
            ]
        },
        {
            "name": "Pillow",
            "specs": [
                [
                    "==",
                    "11.1.0"
                ]
            ]
        },
        {
            "name": "pkgconfig",
            "specs": [
                [
                    "==",
                    "1.5.5"
                ]
            ]
        },
        {
            "name": "rawpy",
            "specs": [
                [
                    "==",
                    "0.24.0"
                ]
            ]
        },
        {
            "name": "scikit-learn",
            "specs": [
                [
                    "==",
                    "1.6.1"
                ]
            ]
        },
        {
            "name": "scipy",
            "specs": [
                [
                    "==",
                    "1.15.1"
                ]
            ]
        },
        {
            "name": "seaborn",
            "specs": [
                [
                    "==",
                    "0.13.2"
                ]
            ]
        },
        {
            "name": "torch",
            "specs": []
        },
        {
            "name": "torchvision",
            "specs": []
        },
        {
            "name": "tqdm",
            "specs": [
                [
                    "==",
                    "4.67.1"
                ]
            ]
        },
        {
            "name": "zarr",
            "specs": [
                [
                    "==",
                    "3.0.1"
                ]
            ]
        },
        {
            "name": "requests",
            "specs": [
                [
                    "==",
                    "2.32.3"
                ]
            ]
        }
    ],
    "lcname": "dataset-format-benchmark"
}

Oleg Korsak