diff --git a/node-hub/dora-qwen2-5-vl/README.md b/node-hub/dora-qwen2-5-vl/README.md index 535ff3c3..c22e2999 100644 --- a/node-hub/dora-qwen2-5-vl/README.md +++ b/node-hub/dora-qwen2-5-vl/README.md @@ -1,4 +1,4 @@ -# Dora QwenVL2 node +# Dora QwenVL2.5 node Experimental node for using a VLM within dora. @@ -8,8 +8,8 @@ This node is supposed to be used as follows: ```yaml - id: dora-qwenvl - build: pip install dora-qwenvl - path: dora-qwenvl + build: pip install dora-qwen2-5-vl + path: dora-qwen2-5-vl inputs: image: source: camera/image diff --git a/node-hub/dora-qwen2-5-vl/dora_qwenvl/__init__.py b/node-hub/dora-qwen2-5-vl/dora_qwen2_5_vl/__init__.py similarity index 100% rename from node-hub/dora-qwen2-5-vl/dora_qwenvl/__init__.py rename to node-hub/dora-qwen2-5-vl/dora_qwen2_5_vl/__init__.py diff --git a/node-hub/dora-qwen2-5-vl/dora_qwenvl/main.py b/node-hub/dora-qwen2-5-vl/dora_qwen2_5_vl/main.py similarity index 97% rename from node-hub/dora-qwen2-5-vl/dora_qwenvl/main.py rename to node-hub/dora-qwen2-5-vl/dora_qwen2_5_vl/main.py index 9bcd32f5..b5f8f05b 100644 --- a/node-hub/dora-qwen2-5-vl/dora_qwenvl/main.py +++ b/node-hub/dora-qwen2-5-vl/dora_qwen2_5_vl/main.py @@ -152,6 +152,7 @@ def main(): ], }, ] + cached_text = DEFAULT_QUESTION for event in node: event_type = event["type"] @@ -198,17 +199,19 @@ def main(): image = Image.fromarray(frame) frames[event_id] = image.resize((IMAGE_HEIGHT, IMAGE_WIDTH)) - elif event_id == "text": + elif "text" in event_id: if len(event["value"]) > 0: text = event["value"][0].as_py() else: - text = "" + text = cached_text words = text.split() if len(ACTIVATION_WORDS) > 0 and all( word not in ACTIVATION_WORDS for word in words ): continue + cached_text = text + if len(frames.keys()) == 0: continue # set the max number of tiles in `max_num` diff --git a/node-hub/dora-qwen2-5-vl/pyproject.toml b/node-hub/dora-qwen2-5-vl/pyproject.toml index 2074a7d5..29dd857f 100644 --- a/node-hub/dora-qwen2-5-vl/pyproject.toml +++ b/node-hub/dora-qwen2-5-vl/pyproject.toml @@ -43,8 +43,8 @@ dev = ["pytest >=8.1.1", "ruff >=0.9.1"] transformers = { git = "https://github.com/huggingface/transformers" } [project.scripts] -dora-qwenvl = "dora_qwenvl.main:main" +dora-qwen2-5-vl = "dora_qwen2_5_vl.main:main" [build-system] -requires = ["setuptools", "setuptools-scm", "torch"] +requires = ["setuptools", "setuptools-scm"] build-backend = "setuptools.build_meta" diff --git a/node-hub/llama-factory-recorder/README.md b/node-hub/llama-factory-recorder/README.md index 4603b7a2..b0ee6c14 100644 --- a/node-hub/llama-factory-recorder/README.md +++ b/node-hub/llama-factory-recorder/README.md @@ -40,7 +40,7 @@ Example: ```yaml,diff - model_name_or_path: Qwen/Qwen2-VL-7B-Instruct -+ model_name_or_path: Qwen/Qwen2-VL-2B-Instruct ++ model_name_or_path: Qwen/Qwen2.5-VL-3B-Instruct ``` - Then