Safe Haskell | Safe-Inferred |
---|---|
Language | Haskell2010 |
Synopsis
- type T5ElevenBNumLayers = 24
- t5ElevenBNumLayers :: SNat T5ElevenBNumLayers
- type T5ElevenBHeadDim = 'Dim ('Name "*") ('Size 128)
- type T5ElevenBHeadEmbedDim = 'Dim ('Name "*") ('Size 128)
- type T5ElevenBEmbedDim = 'Dim ('Name "*") ('Size 16384)
- type T5ElevenBInputEmbedDim = 'Dim ('Name "*") ('Size 1024)
- type T5ElevenBFFNDim = 'Dim ('Name "*") ('Size 65536)
- type T5ElevenBVocabDim = 'Dim ('Name "*") ('Size 32128)
- type T5ElevenB (transformerHead :: TransformerHead) (gradient :: Gradient RequiresGradient) (device :: Device (DeviceType Nat)) (hasDropout :: HasDropout) = T5ModelF 'T5 transformerHead T5ElevenBNumLayers T5ElevenBNumLayers gradient device T5ElevenBHeadDim T5ElevenBHeadEmbedDim T5ElevenBEmbedDim T5ElevenBInputEmbedDim T5ElevenBFFNDim T5ElevenBVocabDim hasDropout
- t5ElevenBSpec :: STransformerHead transformerHead -> SGradient gradient -> SDevice device -> SHasDropout hasDropout -> ModelSpec (T5ElevenB transformerHead gradient device hasDropout)
Documentation
type T5ElevenBNumLayers = 24 Source #
T5-11B number of layers. 'num_layers = 24'
t5ElevenBNumLayers :: SNat T5ElevenBNumLayers Source #
Singleton value for the T5-11B number of layers.
type T5ElevenBHeadDim = 'Dim ('Name "*") ('Size 128) Source #
T5-11B head dimension, i.e. the number of attention heads. 'n_heads = 128'
type T5ElevenBHeadEmbedDim = 'Dim ('Name "*") ('Size 128) Source #
T5-11B head embedding dimension. 'd_kv = 128'
type T5ElevenBEmbedDim = 'Dim ('Name "*") ('Size 16384) Source #
T5-11B embedding dimension. 'inner_dim = n_heads * d_kv = 128 * 128 = 16384'
type T5ElevenBInputEmbedDim = 'Dim ('Name "*") ('Size 1024) Source #
T5-11B input embedding dimension, i.e. the model dimension. 'd_model = 1024'
type T5ElevenBFFNDim = 'Dim ('Name "*") ('Size 65536) Source #
T5-11B feed-forward network dimension. 'd_ff = 65536'
type T5ElevenBVocabDim = 'Dim ('Name "*") ('Size 32128) Source #
T5-11B vocabulary dimension. 'vocab_size = 32128'
type T5ElevenB (transformerHead :: TransformerHead) (gradient :: Gradient RequiresGradient) (device :: Device (DeviceType Nat)) (hasDropout :: HasDropout) = T5ModelF 'T5 transformerHead T5ElevenBNumLayers T5ElevenBNumLayers gradient device T5ElevenBHeadDim T5ElevenBHeadEmbedDim T5ElevenBEmbedDim T5ElevenBInputEmbedDim T5ElevenBFFNDim T5ElevenBVocabDim hasDropout Source #
T5-11B model.
t5ElevenBSpec :: STransformerHead transformerHead -> SGradient gradient -> SDevice device -> SHasDropout hasDropout -> ModelSpec (T5ElevenB transformerHead gradient device hasDropout) Source #
T5-11B model specification.