def __init__(self, hidden_size, eps=1e-5): def __init__(self, hidden_size, eps=1e-6): self.gate_proj = nn.Linear(config.hidden_size, config.intermediate_size, bias ...
Some results have been hidden because they may be inaccessible to you
Show inaccessible results