From 294a9f40927b6cb4ddd77b956f785c4e53ebc083 Mon Sep 17 00:00:00 2001 From: Brad Hilton Date: Thu, 18 Sep 2025 00:23:04 +0000 Subject: [PATCH] fix: Update model configuration and server logic - Changed the base model in `yes-no-maybe.ipynb` to `Qwen/Qwen3-30B-A3B-Instruct`. - Disabled loading in 4-bit mode in `get_model_config.py` for better compatibility. - Adjusted target modules for Qwen3 MoE models to avoid unsupported LoRA weights. - Enhanced the `openai_server_task` in `server.py` to ensure missing fields in LoRA requests are handled gracefully. --- dev/yes-no-maybe.ipynb | 284 ++++++++++++++++++++++++++++---- src/art/dev/get_model_config.py | 20 ++- src/art/vllm/server.py | 26 +-- 3 files changed, 281 insertions(+), 49 deletions(-) diff --git a/dev/yes-no-maybe.ipynb b/dev/yes-no-maybe.ipynb index f9d7a6d8..4b4df24f 100644 --- a/dev/yes-no-maybe.ipynb +++ b/dev/yes-no-maybe.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ @@ -12,9 +12,30 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 2, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "\n" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], "source": [ "%%html\n", "