Temporary fix for qwenvl2 queue error (#688)
To get the best performance from Qwen2-VL, we temporarily add this piece of code, which drains the qwenvl input queue so that inference always runs on the newest data.

This is directly linked to #652: nodes with `queue_size: 1` currently have a queue issue where the queue ends up holding older pending data instead of the newest.
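
For reference, a minimal sketch of the workaround in isolation, assuming dora's Python `Node` API as used in the diff below (`node.next(timeout=...)` returns `None` when nothing is queued): on each `INPUT` event, any `INPUT` events already waiting in the queue are drained and only the newest one is kept before running inference.

from dora import Node


def main():
    node = Node()

    for event in node:
        if event["type"] == "INPUT":
            # Drain INPUT events that piled up while the model was busy,
            # keeping only the most recent one.
            while True:
                next_event = node.next(timeout=0.001)
                if next_event is not None and next_event["type"] == "INPUT":
                    event = next_event
                else:
                    break

            # ... run Qwen2-VL inference on the freshest `event` here ...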
haixuanTao authored Oct 13, 2024
2 parents 015208a + 309b40a commit a90221d
Showing 3 changed files with 25 additions and 5 deletions.
2 changes: 1 addition & 1 deletion examples/vlm/dataflow.yml
@@ -18,7 +18,7 @@ nodes:
       image:
         source: camera/image
         queue_size: 1
-      tick: dora/timer/millis/300
+      tick: dora/timer/millis/100
     outputs:
       - text
       - tick
27 changes: 23 additions & 4 deletions node-hub/dora-qwenvl/dora_qwenvl/main.py
@@ -5,10 +5,19 @@
 import numpy as np
 import pyarrow as pa
 from PIL import Image
+from pathlib import Path
 import cv2
 
 DEFAULT_PATH = "Qwen/Qwen2-VL-2B-Instruct"
-CUSTOM_MODEL_PATH = os.getenv("CUSTOM_MODEL_PATH", DEFAULT_PATH)
+
+MODEL_NAME_OR_PATH = os.getenv("MODEL_NAME_OR_PATH", DEFAULT_PATH)
+
+if bool(os.getenv("MODELSCOPE")) is True:
+    from modelscope import snapshot_download
+
+    if not Path(MODEL_NAME_OR_PATH).exists():
+        MODEL_NAME_OR_PATH = snapshot_download(MODEL_NAME_OR_PATH)
+
 DEFAULT_QUESTION = os.getenv(
     "DEFAULT_QUESTION",
     "Describe this image",
@@ -20,14 +29,14 @@
     import flash_attn as _
 
     model = Qwen2VLForConditionalGeneration.from_pretrained(
-        CUSTOM_MODEL_PATH,
+        MODEL_NAME_OR_PATH,
         torch_dtype="auto",
         device_map="auto",
         attn_implementation="flash_attention_2",
     )
 except (ImportError, ModuleNotFoundError):
     model = Qwen2VLForConditionalGeneration.from_pretrained(
-        CUSTOM_MODEL_PATH,
+        MODEL_NAME_OR_PATH,
         torch_dtype="auto",
         device_map="auto",
     )
@@ -38,7 +47,7 @@
 
 
 # default processor
-processor = AutoProcessor.from_pretrained(CUSTOM_MODEL_PATH)
+processor = AutoProcessor.from_pretrained(MODEL_NAME_OR_PATH)
 
 
 def generate(frames: dict, question):
@@ -101,6 +110,16 @@ def main():
         event_type = event["type"]
 
         if event_type == "INPUT":
+
+            # pylint: disable=fixme
+            # TODO: Remove this after https://github.com/dora-rs/dora/pull/652
+            while True:
+                next_event = node.next(timeout=0.001)
+                if next_event is not None and next_event["type"] == "INPUT":
+                    event = next_event
+                else:
+                    break
+
             event_id = event["id"]
 
             if "image" in event_id:
1 change: 1 addition & 0 deletions node-hub/dora-qwenvl/pyproject.toml
@@ -20,6 +20,7 @@ transformers = "^4.45"
 qwen-vl-utils = "^0.0.2"
 accelerate = "^0.33"
 opencv-python = ">= 4.1.1"
+modelscope = "^1.18.1"
 # flash_attn = "^2.6.1" # Install using: pip install -U flash-attn --no-build-isolation
 
 
