Struct burn::data::dataset::HuggingfaceDatasetLoader

pub struct HuggingfaceDatasetLoader { /* private fields */ }
Expand description

Load a dataset from huggingface datasets.

The dataset with all splits is stored in a single sqlite database (see SqliteDataset).

§Example

 use burn_dataset::HuggingfaceDatasetLoader;
 use burn_dataset::SqliteDataset;
 use serde::{Deserialize, Serialize};

#[derive(Deserialize, Debug, Clone)]
struct MnistItemRaw {
    pub image_bytes: Vec<u8>,
    pub label: usize,
}

 let train_ds:SqliteDataset<MnistItemRaw> = HuggingfaceDatasetLoader::new("mnist")
      .dataset("train")
      .unwrap();

Implementations§

§

impl HuggingfaceDatasetLoader

pub fn new(name: &str) -> HuggingfaceDatasetLoader

Create a huggingface dataset loader.

pub fn with_subset(self, subset: &str) -> HuggingfaceDatasetLoader

Create a huggingface dataset loader for a subset of the dataset.

The subset name must be one of the subsets listed in the dataset page.

If no subset names are listed, then do not use this method.

pub fn with_base_dir(self, base_dir: &str) -> HuggingfaceDatasetLoader

Specify a base directory to store the dataset.

If not specified, the dataset will be stored in ~/.cache/burn-dataset.

pub fn with_huggingface_token( self, huggingface_token: &str, ) -> HuggingfaceDatasetLoader

Specify a huggingface token to download datasets behind authentication.

You can get a token from the Hugging Face access tokens settings page (https://huggingface.co/settings/tokens).

pub fn with_huggingface_cache_dir( self, huggingface_cache_dir: &str, ) -> HuggingfaceDatasetLoader

Specify a huggingface cache directory to store the downloaded datasets.

If not specified, the dataset will be stored in ~/.cache/huggingface/datasets.

pub fn with_trust_remote_code( self, trust_remote_code: bool, ) -> HuggingfaceDatasetLoader

Specify whether or not to trust remote code.

If not specified, trust_remote_code defaults to true.

pub fn dataset<I>(self, split: &str) -> Result<SqliteDataset<I>, ImporterError>

Load the given split of the dataset as a SqliteDataset.

pub fn db_file(self) -> Result<PathBuf, ImporterError>

Get the path to the sqlite database file.

If the database file does not exist, it will be downloaded and imported.

Auto Trait Implementations§

Blanket Implementations§

source§

impl<T> Any for T
where T: 'static + ?Sized,

source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
source§

impl<T> Borrow<T> for T
where T: ?Sized,

source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
§

impl<T> Downcast<T> for T

§

fn downcast(&self) -> &T

source§

impl<T> From<T> for T

source§

fn from(t: T) -> T

Returns the argument unchanged.

§

impl<T> Instrument for T

§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
source§

impl<T, U> Into<U> for T
where U: From<T>,

source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

source§

impl<T> IntoEither for T

source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
§

impl<T> Pointable for T

§

const ALIGN: usize = _

The alignment of the pointer.
§

type Init = T

The type for initializers.
§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more
§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
source§

impl<T> Same for T

§

type Output = T

Should always be Self.
source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

§

type Error = Infallible

The type returned in the event of a conversion error.
source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
§

impl<T> Upcast<T> for T

§

fn upcast(&self) -> Option<&T>

§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

§

fn vzip(self) -> V

§

impl<T> WithSubscriber for T

§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more
§

impl<T> ErasedDestructor for T
where T: 'static,

§

impl<T> WasmNotSend for T
where T: Send,

§

impl<T> WasmNotSendSync for T
where T: WasmNotSend + WasmNotSync,

§

impl<T> WasmNotSync for T
where T: Sync,