CPM-9G-8B/9G-Train/cpm/layers
anrongqiao dfbc3be0dc add training coda and total model 2024-02-27 14:33:33 +08:00
..
__init__.py add training coda and total model 2024-02-27 14:33:33 +08:00
attention.py add training coda and total model 2024-02-27 14:33:33 +08:00
blocks.py add training coda and total model 2024-02-27 14:33:33 +08:00
embedding.py add training coda and total model 2024-02-27 14:33:33 +08:00
feedforward.py add training coda and total model 2024-02-27 14:33:33 +08:00
flash_triton.py add training coda and total model 2024-02-27 14:33:33 +08:00
layernorm.py add training coda and total model 2024-02-27 14:33:33 +08:00
linear.py add training coda and total model 2024-02-27 14:33:33 +08:00
position_embedding.py add training coda and total model 2024-02-27 14:33:33 +08:00
transformer.py add training coda and total model 2024-02-27 14:33:33 +08:00