Spaces:
Running
on
T4
Running
on
T4
Update app.py
Browse files
app.py
CHANGED
@@ -18,7 +18,7 @@ os.environ["RWKV_CUDA_ON"] = '1' # if '1' then use CUDA kernel for seq mode (muc
|
|
18 |
|
19 |
from rwkv.model import RWKV
|
20 |
model_path = hf_hub_download(repo_id="BlinkDL/rwkv-4-pile-14b", filename="RWKV-4-Pile-14B-20230228-ctx4096-test663.pth")
|
21 |
-
model = RWKV(model=model_path, strategy='cuda fp16i8 *
|
22 |
from rwkv.utils import PIPELINE, PIPELINE_ARGS
|
23 |
pipeline = PIPELINE(model, "20B_tokenizer.json")
|
24 |
|
|
|
18 |
|
19 |
from rwkv.model import RWKV
|
20 |
model_path = hf_hub_download(repo_id="BlinkDL/rwkv-4-pile-14b", filename="RWKV-4-Pile-14B-20230228-ctx4096-test663.pth")
|
21 |
+
model = RWKV(model=model_path, strategy='cuda fp16i8 *20 -> cuda fp16')
|
22 |
from rwkv.utils import PIPELINE, PIPELINE_ARGS
|
23 |
pipeline = PIPELINE(model, "20B_tokenizer.json")
|
24 |
|