|
attention
|
ugh
|
2024-08-30 14:39:07 -05:00 |
|
__init__.py
|
cleanup
|
2024-11-21 23:08:43 -06:00 |
|
llama.py
|
fixed training tqdm being stubborn
|
2024-11-23 09:45:23 -06:00 |
|
mamba.py
|
touch ups in docs
|
2024-12-02 19:10:42 -06:00 |
|
mixtral.py
|
fixed attentions for MoE
|
2024-08-27 17:02:42 -05:00 |
|
retnet.py
|
cleanup
|
2024-06-05 20:30:43 -05:00 |
|
transformer.py
|
cleanup
|
2024-06-05 20:30:43 -05:00 |