hasktorch-gradually-typed-0.2.0.0: experimental project for hasktorch
Safe HaskellSafe-Inferred
LanguageHaskell2010

Torch.GraduallyTyped.NN.Transformer.T5.Base

Synopsis

Documentation

type T5BaseNumLayers = 12 Source #

T5-Base number of layers. 'num_layers = 12'

t5BaseNumLayers :: SNat T5BaseNumLayers Source #

Singleton value for the T5-Base number of layers.

type T5BaseHeadDim = 'Dim ('Name "*") ('Size 12) Source #

T5-Base number of attention heads. 'n_heads = 12'

type T5BaseHeadEmbedDim = 'Dim ('Name "*") ('Size 64) Source #

T5-Base head embedding dimension. 'd_kv = 64'

type T5BaseEmbedDim = 'Dim ('Name "*") ('Size 768) Source #

T5-Base embedding dimension. 'inner_dim = n_heads * d_kv = 768'

type T5BaseInputEmbedDim = 'Dim ('Name "*") ('Size 768) Source #

T5-Base model dimension. 'd_model = 768'

type T5BaseFFNDim = 'Dim ('Name "*") ('Size 3072) Source #

T5-Base feed-forward network dimension. 'd_ff = 3072'

type T5BaseVocabDim = 'Dim ('Name "*") ('Size 32128) Source #

T5-Base vocabulary dimension. 'vocab_size = 32128'

type T5Base (transformerHead :: TransformerHead) (gradient :: Gradient RequiresGradient) (device :: Device (DeviceType Nat)) (hasDropout :: HasDropout) = T5ModelF 'T5 transformerHead T5BaseNumLayers T5BaseNumLayers gradient device T5BaseHeadDim T5BaseHeadEmbedDim T5BaseEmbedDim T5BaseInputEmbedDim T5BaseFFNDim T5BaseVocabDim hasDropout Source #

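T5-Base model type, parameterized by the transformer head, gradient, device, and dropout setting. 'T5BaseNumLayers' is supplied for both layer-count arguments of 'T5ModelF'.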

t5BaseSpec :: STransformerHead transformerHead -> SGradient gradient -> SDevice device -> SHasDropout hasDropout -> ModelSpec (T5Base transformerHead gradient device hasDropout) Source #

T5-Base model specification, built from singletons for the transformer head, gradient, device, and dropout setting.