hezar.models.mask_filling.distilbert.distilbert_mask_filling_config module

class hezar.models.mask_filling.distilbert.distilbert_mask_filling_config.DistilBertMaskFillingConfig(task: str = <TaskType.MASK_FILLING: 'mask_filling'>, activation: str = 'gelu', attention_dropout: float = 0.1, dim: int = 768, dropout: float = 0.1, hidden_dim: int = 3072, initializer_range: float = 0.02, max_position_embeddings: int = 512, n_heads: int = 12, n_layers: int = 6, output_past: bool = True, pad_token_id: int = 0, qa_dropout: float = 0.1, tie_weights_: bool = True, vocab_size: int = 42000)

Bases: ModelConfig

activation: str = 'gelu'
attention_dropout: float = 0.1
dim: int = 768
dropout: float = 0.1
hidden_dim: int = 3072
initializer_range: float = 0.02
max_position_embeddings: int = 512
n_heads: int = 12
n_layers: int = 6
name: str = 'distilbert_mask_filling'
output_past: bool = True
pad_token_id: int = 0
qa_dropout: float = 0.1
task: str = 'mask_filling'
tie_weights_: bool = True
vocab_size: int = 42000