Safe Haskell | Safe-Inferred |
---|---|
Language | Haskell2010 |
Synopsis
- type T5BaseNumLayers = 12
- t5BaseNumLayers :: SNat T5BaseNumLayers
- type T5BaseHeadDim = 'Dim ('Name "*") ('Size 12)
- type T5BaseHeadEmbedDim = 'Dim ('Name "*") ('Size 64)
- type T5BaseEmbedDim = 'Dim ('Name "*") ('Size 768)
- type T5BaseInputEmbedDim = 'Dim ('Name "*") ('Size 768)
- type T5BaseFFNDim = 'Dim ('Name "*") ('Size 3072)
- type T5BaseVocabDim = 'Dim ('Name "*") ('Size 32128)
- type T5Base (transformerHead :: TransformerHead) (gradient :: Gradient RequiresGradient) (device :: Device (DeviceType Nat)) (hasDropout :: HasDropout) = T5ModelF 'T5 transformerHead T5BaseNumLayers T5BaseNumLayers gradient device T5BaseHeadDim T5BaseHeadEmbedDim T5BaseEmbedDim T5BaseInputEmbedDim T5BaseFFNDim T5BaseVocabDim hasDropout
- t5BaseSpec :: STransformerHead transformerHead -> SGradient gradient -> SDevice device -> SHasDropout hasDropout -> ModelSpec (T5Base transformerHead gradient device hasDropout)
Documentation
type T5BaseNumLayers = 12 Source #
T5-Base number of layers. 'num_layers = 12'
t5BaseNumLayers :: SNat T5BaseNumLayers Source #
Singleton value for the T5-Base number of layers ('T5BaseNumLayers').
type T5BaseHeadDim = 'Dim ('Name "*") ('Size 12) Source #
T5-Base number of attention heads. 'n_heads = 12'
type T5BaseHeadEmbedDim = 'Dim ('Name "*") ('Size 64) Source #
T5-Base head embedding dimension. 'd_kv = 64'
type T5BaseEmbedDim = 'Dim ('Name "*") ('Size 768) Source #
T5-Base embedding dimension. 'inner_dim = n_heads * d_kv = 12 * 64 = 768'
type T5BaseInputEmbedDim = 'Dim ('Name "*") ('Size 768) Source #
T5-Base model dimension. 'd_model = 768'
type T5BaseFFNDim = 'Dim ('Name "*") ('Size 3072) Source #
T5-Base feed-forward network dimension. 'd_ff = 3072'
type T5BaseVocabDim = 'Dim ('Name "*") ('Size 32128) Source #
T5-Base vocabulary dimension. 'vocab_size = 32128'
type T5Base (transformerHead :: TransformerHead) (gradient :: Gradient RequiresGradient) (device :: Device (DeviceType Nat)) (hasDropout :: HasDropout) = T5ModelF 'T5 transformerHead T5BaseNumLayers T5BaseNumLayers gradient device T5BaseHeadDim T5BaseHeadEmbedDim T5BaseEmbedDim T5BaseInputEmbedDim T5BaseFFNDim T5BaseVocabDim hasDropout Source #
T5-Base model.
t5BaseSpec :: STransformerHead transformerHead -> SGradient gradient -> SDevice device -> SHasDropout hasDropout -> ModelSpec (T5Base transformerHead gradient device hasDropout) Source #
T5-Base model specification, built from singletons for the transformer head, gradient requirement, device, and dropout setting.