Safe Haskell | Safe-Inferred |
---|---|
Language | Haskell2010 |
Synopsis
- type BARTBaseNumLayers = 6
- bartBaseNumLayers :: SNat BARTBaseNumLayers
- type BARTBaseHeadDim = 'Dim ('Name "*") ('Size 12)
- bartBaseHeadDim :: SDim BARTBaseHeadDim
- type BARTBaseHeadEmbedDim = 'Dim ('Name "*") ('Size 64)
- bartBaseHeadEmbedDim :: SDim BARTBaseHeadEmbedDim
- type BARTBaseEmbedDim = 'Dim ('Name "*") ('Size 768)
- bartBaseEmbedDim :: SDim BARTBaseEmbedDim
- type BARTBaseInputEmbedDim = 'Dim ('Name "*") ('Size 768)
- bartBaseInputEmbedDim :: SDim BARTBaseInputEmbedDim
- type BARTBaseFFNDim = 'Dim ('Name "*") ('Size 3072)
- bartBaseFFNDim :: SDim BARTBaseFFNDim
- type BARTBaseVocabDim = 'Dim ('Name "*") ('Size 50265)
- bartBaseVocabDim :: SDim BARTBaseVocabDim
- type BARTBase (transformerHead :: TransformerHead) (gradient :: Gradient RequiresGradient) (device :: Device (DeviceType Nat)) (hasDropout :: HasDropout) = BARTModelF transformerHead BARTBaseNumLayers gradient device BARTBaseHeadDim BARTBaseHeadEmbedDim BARTBaseEmbedDim BARTBaseInputEmbedDim BARTBaseFFNDim BARTBaseVocabDim hasDropout
- bartBaseSpec :: STransformerHead transformerHead -> SGradient gradient -> SDevice device -> SHasDropout hasDropout -> ModelSpec (BARTBase transformerHead gradient device hasDropout)
Documentation
type BARTBaseNumLayers = 6 Source #
BART-Base number of layers, used for both the encoder and the decoder: 'encoder_layers = 6', 'decoder_layers = 6'.
bartBaseNumLayers :: SNat BARTBaseNumLayers Source #
BART-Base number of layers singleton.
type BARTBaseHeadDim = 'Dim ('Name "*") ('Size 12) Source #
BART-Base number of attention heads, used for both the encoder and the decoder: 'encoder_attention_heads = 12', 'decoder_attention_heads = 12'.
bartBaseHeadDim :: SDim BARTBaseHeadDim Source #
BART-Base number of attention heads singleton.
type BARTBaseHeadEmbedDim = 'Dim ('Name "*") ('Size 64) Source #
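BART-Base head embedding dimension, i.e. the size of each attention head. 'd_kv = 64' (the model dimension divided by the number of attention heads, 768 / 12 = 64; note that 'd_kv' is T5-style naming and may not appear as a key in BART configurations).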
bartBaseHeadEmbedDim :: SDim BARTBaseHeadEmbedDim Source #
BART-Base head embedding dimension singleton.
type BARTBaseEmbedDim = 'Dim ('Name "*") ('Size 768) Source #
BART-Base embedding dimension, the product of the number of attention heads and the head embedding dimension. 'hidden_size = n_heads * d_kv = 12 * 64 = 768'
bartBaseEmbedDim :: SDim BARTBaseEmbedDim Source #
BART-Base embedding dimension singleton.
type BARTBaseInputEmbedDim = 'Dim ('Name "*") ('Size 768) Source #
BART-Base model dimension. 'd_model = 768'
bartBaseInputEmbedDim :: SDim BARTBaseInputEmbedDim Source #
BART-Base model dimension singleton.
type BARTBaseFFNDim = 'Dim ('Name "*") ('Size 3072) Source #
BART-Base feed-forward network dimension, used for both the encoder and the decoder: 'encoder_ffn_dim = 3072', 'decoder_ffn_dim = 3072'.
bartBaseFFNDim :: SDim BARTBaseFFNDim Source #
BART-Base feed-forward network dimension singleton.
type BARTBaseVocabDim = 'Dim ('Name "*") ('Size 50265) Source #
BART-Base vocabulary dimension. 'vocab_size = 50265'
bartBaseVocabDim :: SDim BARTBaseVocabDim Source #
BART-Base vocabulary dimension singleton.
type BARTBase (transformerHead :: TransformerHead) (gradient :: Gradient RequiresGradient) (device :: Device (DeviceType Nat)) (hasDropout :: HasDropout) = BARTModelF transformerHead BARTBaseNumLayers gradient device BARTBaseHeadDim BARTBaseHeadEmbedDim BARTBaseEmbedDim BARTBaseInputEmbedDim BARTBaseFFNDim BARTBaseVocabDim hasDropout Source #
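BART-Base model: 'BARTModelF' instantiated with the BART-Base number of layers and dimensions defined in this module. The transformer head, gradient, device, and dropout setting remain type parameters.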
bartBaseSpec :: STransformerHead transformerHead -> SGradient gradient -> SDevice device -> SHasDropout hasDropout -> ModelSpec (BARTBase transformerHead gradient device hasDropout) Source #
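BART-Base model specification. Takes singletons for the transformer head, gradient, device, and dropout setting, and returns the 'ModelSpec' for the corresponding 'BARTBase' model type.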