|
- from typing import Callable, Dict, Optional, Tuple
- from .. import datasets as sjds
- from torchvision.datasets.utils import extract_archive
- import os
- import multiprocessing
- from concurrent.futures import ThreadPoolExecutor
- import time
- from .. import configure
- from ..datasets import np_savez
-
- class NCaltech101(sjds.NeuromorphicDatasetFolder):
- def __init__(
- self,
- root: str,
- data_type: str = 'event',
- frames_number: int = None,
- split_by: str = None,
- duration: int = None,
- custom_integrate_function: Callable = None,
- custom_integrated_frames_dir_name: str = None,
- transform: Optional[Callable] = None,
- target_transform: Optional[Callable] = None,
- ) -> None:
- """
- The N-Caltech101 dataset, which is proposed by `Converting Static Image Datasets to Spiking Neuromorphic Datasets Using Saccades <https://www.frontiersin.org/articles/10.3389/fnins.2015.00437/full>`_.
-
- Refer to :class:`spikingjelly.datasets.NeuromorphicDatasetFolder` for more details about params information.
- """
- super().__init__(root, None, data_type, frames_number, split_by, duration, custom_integrate_function, custom_integrated_frames_dir_name, transform, target_transform)
- @staticmethod
- def resource_url_md5() -> list:
- '''
- :return: A list ``url`` that ``url[i]`` is a tuple, which contains the i-th file's name, download link, and MD5
- :rtype: list
- '''
- url = 'https://www.garrickorchard.com/datasets/n-caltech101'
- return [
- ('Caltech101.zip', url, '66201824eabb0239c7ab992480b50ba3'),
- ('Caltech101_annotations.zip', url, '25e64cea645291e368db1e70f214988e'),
- ('ReadMe(Caltech101)-SINAPSE-G.txt', url, 'd464b81684e0af3b5773555eb1d5b95c'),
- ('ReadMe(Caltech101).txt', url, '33632a7a5c46074c70509f960d0dd5e5')
- ]
-
- @staticmethod
- def downloadable() -> bool:
- '''
- :return: Whether the dataset can be directly downloaded by python codes. If not, the user have to download it manually
- :rtype: bool
- '''
- return False
-
- @staticmethod
- def extract_downloaded_files(download_root: str, extract_root: str):
- '''
- :param download_root: Root directory path which saves downloaded dataset files
- :type download_root: str
- :param extract_root: Root directory path which saves extracted files from downloaded files
- :type extract_root: str
- :return: None
-
- This function defines how to extract download files.
- '''
- zip_file = os.path.join(download_root, 'Caltech101.zip')
- print(f'Extract [{zip_file}] to [{extract_root}].')
- extract_archive(zip_file, extract_root)
-
-
- @staticmethod
- def load_origin_data(file_name: str) -> Dict:
- '''
- :param file_name: path of the events file
- :type file_name: str
- :return: a dict whose keys are ``['t', 'x', 'y', 'p']`` and values are ``numpy.ndarray``
- :rtype: Dict
-
- This function defines how to read the origin binary data.
- '''
-
- return sjds.load_ATIS_bin(file_name)
-
- @staticmethod
- def get_H_W() -> Tuple:
- '''
- :return: A tuple ``(H, W)``, where ``H`` is the height of the data and ``W` is the weight of the data.
- For example, this function returns ``(128, 128)`` for the DVS128 Gesture dataset.
- :rtype: tuple
- '''
- return 180, 240
-
- @staticmethod
- def read_bin_save_to_np(bin_file: str, np_file: str):
- events = NCaltech101.load_origin_data(bin_file)
- np_savez(np_file,
- t=events['t'],
- x=events['x'],
- y=events['y'],
- p=events['p']
- )
- print(f'Save [{bin_file}] to [{np_file}].')
-
-
- @staticmethod
- def create_events_np_files(extract_root: str, events_np_root: str):
- '''
- :param extract_root: Root directory path which saves extracted files from downloaded files
- :type extract_root: str
- :param events_np_root: Root directory path which saves events files in the ``npz`` format
- :type events_np_root:
- :return: None
-
- This function defines how to convert the origin binary data in ``extract_root`` to ``npz`` format and save converted files in ``events_np_root``.
- '''
- t_ckp = time.time()
- extract_root = os.path.join(extract_root, 'Caltech101')
- with ThreadPoolExecutor(max_workers=min(multiprocessing.cpu_count(), configure.max_threads_number_for_datasets_preprocess)) as tpe:
- sub_threads = []
- # too many threads will make the disk overload
- for class_name in os.listdir(extract_root):
- bin_dir = os.path.join(extract_root, class_name)
- np_dir = os.path.join(events_np_root, class_name)
- os.mkdir(np_dir)
- print(f'Mkdir [{np_dir}].')
- for bin_file in os.listdir(bin_dir):
- source_file = os.path.join(bin_dir, bin_file)
- target_file = os.path.join(np_dir, os.path.splitext(bin_file)[0] + '.npz')
- print(f'Start to convert [{source_file}] to [{target_file}].')
- sub_threads.append(tpe.submit(NCaltech101.read_bin_save_to_np, source_file,
- target_file))
- for sub_thread in sub_threads:
- if sub_thread.exception():
- print(sub_thread.exception())
- exit(-1)
-
-
- print(f'Used time = [{round(time.time() - t_ckp, 2)}s].')
|