Commit 2ed89c25 authored by YaningGao's avatar YaningGao
Browse files

minor

parent 7eecc7a0
Loading
Loading
Loading
Loading
+12 −4
Original line number Diff line number Diff line
@@ -2,15 +2,23 @@ models:
  # qwen_vl_3b:
  #   provider: vllm
  #   model_name: Qwen/Qwen2.5-VL-3B-Instruct
  #   max_tokens: 150
  #   max_tokens: 200
  #   temperature: 0.7
  #   tensor_parallel_size: 2
  #   gpu_memory_utilization: 0.9

  # Qwen2.5-VL 7B Instruct served through the "vllm" provider. This is the
  # only uncommented model entry in the visible part of this config.
  qwen_vl_7b:
    provider: vllm
    model_name: Qwen/Qwen2.5-VL-7B-Instruct
    max_tokens: 200
    temperature: 0.7
    # NOTE(review): presumably the number of GPUs the model is sharded
    # across (vLLM tensor parallelism) -- confirm against the vllm provider.
    tensor_parallel_size: 1
    # NOTE(review): presumably the fraction of each GPU's memory the engine
    # may reserve -- confirm against the vllm provider.
    gpu_memory_utilization: 0.9

  # gpt4o:
  #   provider: openai
  #   model_name: gpt-4o
  #   max_tokens: 150
  #   max_tokens: 200
  #   temperature: 0.7
  #   presence_penalty: 0.0
  #   frequency_penalty: 0.0
@@ -26,14 +34,14 @@ models:
  # Gemini_2.5_flash:
  #     provider: gemini
  #     model_name: gemini-2.0-flash
  #     max_tokens: 150
  #     max_tokens: 200
  #     temperature: 0.7
  
  # # Batch processing configuration example
  # claude_3_haiku_batch:
  #   provider: claude
  #   model_name: claude-3-haiku-20240307
  #   max_tokens: 150
  #   max_tokens: 200
  #   temperature: 0.7
  #   use_batch_api: true  # Use batch API for cost optimization
  #   batch_poll_interval: 10  # Poll every 10 seconds
+20 −20
Original line number Diff line number Diff line
from .vllm import VLLMModelInterface, VLLMModelConfig
from .openai import OpenAIModelInterface, OpenAIModelConfig
from .claude import ClaudeModelInterface, ClaudeModelConfig
from .gemini import GeminiModelInterface, GeminiModelConfig
from .routerapi import RouterAPIModelInterface, RouterAPIModelConfig
# from .openai import OpenAIModelInterface, OpenAIModelConfig
# from .claude import ClaudeModelInterface, ClaudeModelConfig
# from .gemini import GeminiModelInterface, GeminiModelConfig
# from .routerapi import RouterAPIModelInterface, RouterAPIModelConfig

# Registry of model backends. Each key is a backend name and each value holds
# the interface class ("model_cls") and the configuration class ("config_cls")
# imported for that backend.
# NOTE(review): the keys look like the `provider` values used in the model
# config YAML -- confirm against the code that performs the lookup.
# NOTE(review): the commented-out entries at the bottom duplicate the live
# "openai", "claude", "gemini" and "routerapi" entries; keep only one copy of
# each once it is decided whether those backends should stay registered.
REGISTERED_MODEL = {
    "vllm": {
        "model_cls": VLLMModelInterface,
        "config_cls": VLLMModelConfig,
    },
    "openai": {
        "model_cls": OpenAIModelInterface,
        "config_cls": OpenAIModelConfig
    },
    "claude": {
        "model_cls": ClaudeModelInterface,
        "config_cls": ClaudeModelConfig
    },
    "gemini": {
        "model_cls": GeminiModelInterface,
        "config_cls": GeminiModelConfig
    },
    "routerapi": {
        "model_cls": RouterAPIModelInterface,
        "config_cls": RouterAPIModelConfig
    }
    # "openai": {
    #     "model_cls": OpenAIModelInterface,
    #     "config_cls": OpenAIModelConfig
    # },
    # "claude": {
    #     "model_cls": ClaudeModelInterface,
    #     "config_cls": ClaudeModelConfig
    # },
    # "gemini": {
    #     "model_cls": GeminiModelInterface,
    #     "config_cls": GeminiModelConfig
    # },
    # "routerapi": {
    #     "model_cls": RouterAPIModelInterface,
    #     "config_cls": RouterAPIModelConfig
    # }
}
 No newline at end of file
+1 −0
Original line number Diff line number Diff line
@@ -50,6 +50,7 @@ class VLLMModelConfig(BaseModelConfig):
            "supported_models": [
                "Qwen/Qwen2.5-0.5B-Instruct",
                "Qwen/Qwen2.5-VL-3B-Instruct",
                "Qwen/Qwen2.5-VL-7B-Instruct",
                "omlab/VLM-R1-Qwen2.5VL-3B-OVD-0321",
                "omlab/VLM-R1-Qwen2.5VL-3B-Math-0305",
                "omlab/Qwen2.5VL-3B-VLM-R1-REC-500steps"
+2 −2
Original line number Diff line number Diff line
@@ -2,7 +2,7 @@ defaults:
  - _self_

server:
  host: 127.0.0.1
  host: 0.0.0.0
  port: 5000
  debug: false

@@ -13,7 +13,7 @@ svg:
  model_size: "small"
navigation:
  max_workers: 48
  devices: [0,1,2,3]
  devices: [0]
primitive_skill:
  max_workers: 48