Mirror of https://github.com/KoboldAI/KoboldAI-Client.git (synced 2025-06-05 21:59:24 +02:00)
Output Streaming on by Default
This commit enables token output streaming by default, changing the default value of vars.output_streaming from False to True:
```diff
@@ -364,7 +364,7 @@ class vars:
     lazy_load    = True   # Whether or not to use torch_lazy_loader.py for transformers models in order to reduce CPU memory usage
     use_colab_tpu = os.environ.get("COLAB_TPU_ADDR", "") != "" or os.environ.get("TPU_NAME", "") != ""  # Whether or not we're in a Colab TPU instance or Kaggle TPU instance and are going to use the TPU rather than the CPU
     revision     = None
-    output_streaming = False
+    output_streaming = True
     token_stream_queue = TokenStreamQueue()  # Queue for the token streaming
     show_probs = False  # Whether or not to show token probabilities
```
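The diff references a TokenStreamQueue that is defined elsewhere in the codebase and not shown here. As a rough illustration of the pattern this flag enables, below is a minimal sketch of such a queue, assuming a producer/consumer split where the generation loop pushes decoded tokens from a worker thread and the UI layer periodically drains them. The method names (add_text, pop_all) are illustrative assumptions, not the project's actual API.

```python
import queue


class TokenStreamQueue:
    """Thread-safe FIFO that buffers decoded tokens as they are generated.

    A minimal sketch, not KoboldAI's implementation: the real class may
    expose different methods and carry extra state.
    """

    def __init__(self):
        self._queue = queue.Queue()

    def add_text(self, text):
        # Called from the generation loop each time a new token is decoded.
        self._queue.put(text)

    def pop_all(self):
        # Called by the consumer (e.g. the web layer on a polling timer)
        # to drain everything buffered since the last poll.
        chunks = []
        while True:
            try:
                chunks.append(self._queue.get_nowait())
            except queue.Empty:
                break
        return chunks
```

Under this reading, flipping the default to True means the generation loop streams each token into the queue as it is produced and the UI shows text appearing incrementally, without the user having to opt in through the settings.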