hezar.models.mask_filling.bert.bert_mask_filling_config module

class hezar.models.mask_filling.bert.bert_mask_filling_config.BertMaskFillingConfig(task: str = 'mask_filling', vocab_size: int = 42000, hidden_size: int = 768, num_hidden_layers: int = 12, num_attention_heads: int = 12, intermediate_size: int = 3072, hidden_act: str = 'gelu', hidden_dropout_prob: float = 0.1, attention_probs_dropout_prob: float = 0.1, max_position_embeddings: int = 512, type_vocab_size: int = 2, initializer_range: float = 0.02, layer_norm_eps: float = 1e-12, pad_token_id: int = 0, position_embedding_type: str = 'absolute', use_cache: bool = True, classifier_dropout: float = None)

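Bases: ModelConfig

Configuration class for the BERT mask-filling model. The attributes below list each field with its default value; all of them except name are also accepted as constructor parameters.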

attention_probs_dropout_prob: float = 0.1
classifier_dropout: float = None
hidden_act: str = 'gelu'
hidden_dropout_prob: float = 0.1
hidden_size: int = 768
initializer_range: float = 0.02
intermediate_size: int = 3072
layer_norm_eps: float = 1e-12
max_position_embeddings: int = 512
name: str = 'bert_mask_filling'
num_attention_heads: int = 12
num_hidden_layers: int = 12
pad_token_id: int = 0
position_embedding_type: str = 'absolute'
task: str = 'mask_filling'
type_vocab_size: int = 2
use_cache: bool = True
vocab_size: int = 42000