Spaces:

RWKV-Red-Team
/

RWKV-LatestSpace

Running on T4

sparkleman committed on Mar 20

Commit

6b82cc0

1 Parent(s): 43cae0b

UPDATE

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,7 +5,7 @@ if os.environ.get("MODELSCOPE_ENVIRONMENT") == "studio":
     patch_hub()
-os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:128"
 from config import CONFIG, ModelConfig
@@ -247,7 +247,7 @@ def generate(
         if token == 0 and token in request.stop_tokens:
             yield {
                 "content": "".join(cache_word_list),
-                "tokens": out_tokens[out_last :],
                 "finish_reason": "stop:token:0",
                 "state": model_state,
             }
@@ -266,7 +266,7 @@ def generate(
         if token in request.stop_tokens:
             yield {
                 "content": "".join(cache_word_list),
-                "tokens": out_tokens[out_last :],
                 "finish_reason": f"stop:token:{token}",
                 "state": model_state,
             }

     patch_hub()
+os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:256"
 from config import CONFIG, ModelConfig
         if token == 0 and token in request.stop_tokens:
             yield {
                 "content": "".join(cache_word_list),
+                "tokens": out_tokens[out_last:],
                 "finish_reason": "stop:token:0",
                 "state": model_state,
             }
         if token in request.stop_tokens:
             yield {
                 "content": "".join(cache_word_list),
+                "tokens": out_tokens[out_last:],
                 "finish_reason": f"stop:token:{token}",
                 "state": model_state,
             }