awq
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
gptq
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
__init__.py
|
MLPSpeculator. (#1865)
|
2024-05-14 12:33:18 +02:00 |
conv.py
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
eetq.py
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
fp8.py
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
layernorm.py
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
linear.py
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
medusa.py
|
MLPSpeculator. (#1865)
|
2024-05-14 12:33:18 +02:00 |
mlp.py
|
MLPSpeculator. (#1865)
|
2024-05-14 12:33:18 +02:00 |
rotary.py
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |
speculative.py
|
MLPSpeculator. (#1865)
|
2024-05-14 12:33:18 +02:00 |
tensor_parallel.py
|
Refactor layers. (#1866)
|
2024-05-13 12:44:30 +02:00 |