__init__.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
attention.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
blocks.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
embedding.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
feedforward.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
flash_triton.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
layernorm.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
linear.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
position_embedding.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |
transformer.py
|
add training coda and total model
|
2024-02-27 14:33:33 +08:00 |