Skip to content

Commit

Permalink
fix(core): fix remote http api model name dispaly (#2047)
Browse files Browse the repository at this point in the history
  • Loading branch information
wsxiaoys committed May 4, 2024
1 parent e8d44bf commit 6367e2f
Show file tree
Hide file tree
Showing 4 changed files with 47 additions and 18 deletions.
10 changes: 8 additions & 2 deletions crates/tabby/src/serve.rs
Original file line number Diff line number Diff line change
Expand Up @@ -222,8 +222,11 @@ async fn api_router(

let health_state = Arc::new(health::HealthState::new(
args.model.as_deref(),
args.chat_model.as_deref(),
&args.device,
args.chat_model.as_deref(),
args.chat_model
.as_deref()
.map(|_| args.chat_device.as_ref().unwrap_or(&args.device)),
webserver,
));

Expand Down Expand Up @@ -322,8 +325,11 @@ async fn api_router(
fn start_heartbeat(args: &ServeArgs, webserver: Option<bool>) {
let state = health::HealthState::new(
args.model.as_deref(),
args.chat_model.as_deref(),
&args.device,
args.chat_model.as_deref(),
args.chat_model
.as_deref()
.map(|_| args.chat_device.as_ref().unwrap_or(&args.device)),
webserver,
);
tokio::spawn(async move {
Expand Down
23 changes: 21 additions & 2 deletions crates/tabby/src/services/health.rs
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,8 @@ pub struct HealthState {
model: Option<String>,
#[serde(skip_serializing_if = "Option::is_none")]
chat_model: Option<String>,
#[serde(skip_serializing_if = "Option::is_none")]
chat_device: Option<String>,
device: String,
arch: String,
cpu_info: String,
Expand All @@ -26,8 +28,9 @@ pub struct HealthState {
impl HealthState {
pub fn new(
model: Option<&str>,
chat_model: Option<&str>,
device: &Device,
chat_model: Option<&str>,
chat_device: Option<&Device>,
webserver: Option<bool>,
) -> Self {
let (cpu_info, cpu_count) = read_cpu_info();
Expand All @@ -37,9 +40,25 @@ impl HealthState {
Err(_) => vec![],
};

let http_model_name = Some("Remote");
let is_model_http = device == &Device::ExperimentalHttp;
let model = if is_model_http {
http_model_name
} else {
model
};

let is_chat_model_http = chat_device == Some(&Device::ExperimentalHttp);
let chat_model = if is_chat_model_http {
http_model_name
} else {
chat_model
};

Self {
model: model.map(|x| x.to_owned()),
model: model.map(|x| x.to_string()),
chat_model: chat_model.map(|x| x.to_owned()),
chat_device: chat_device.map(|x| x.to_string()),
device: device.to_string(),
arch: ARCH.to_string(),
cpu_info,
Expand Down
1 change: 1 addition & 0 deletions ee/tabby-ui/lib/hooks/use-health.tsx
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@ export interface HealthInfo {
device: 'metal' | 'cpu' | 'cuda'
model?: string
chat_model?: string
chat_device?: string
cpu_info: string
cpu_count: number
cuda_devices: string[]
Expand Down
31 changes: 17 additions & 14 deletions ee/tabby-ui/lib/hooks/use-workers.ts
Original file line number Diff line number Diff line change
Expand Up @@ -7,22 +7,27 @@ import { Worker, WorkerKind } from '@/lib/gql/generates/graphql'

import { useHealth, type HealthInfo } from './use-health'

const modelNameMap: Record<WorkerKind, 'chat_model' | 'model'> = {
[WorkerKind.Chat]: 'chat_model',
[WorkerKind.Completion]: 'model'
function transformHealthInfoToCompletionWorker(healthInfo: HealthInfo): Worker {
return {
kind: WorkerKind.Completion,
device: healthInfo.device,
addr: 'localhost',
arch: '',
cpuInfo: healthInfo.cpu_info,
name: healthInfo.model!,
cpuCount: healthInfo.cpu_count,
cudaDevices: healthInfo.cuda_devices
}
}

function transformHealthInfoToWorker(
healthInfo: HealthInfo,
kind: WorkerKind
): Worker {
function transformHealthInfoToChatWorker(healthInfo: HealthInfo): Worker {
return {
kind,
device: healthInfo.device,
kind: WorkerKind.Chat,
device: healthInfo.chat_device!,
addr: 'localhost',
arch: '',
cpuInfo: healthInfo.cpu_info,
name: healthInfo?.[modelNameMap[kind]] ?? '',
name: healthInfo.chat_model!,
cpuCount: healthInfo.cpu_count,
cudaDevices: healthInfo.cuda_devices
}
Expand Down Expand Up @@ -56,12 +61,10 @@ function useWorkers() {
findIndex(_workers, { kind: WorkerKind.Chat }) > -1

if (!haveRemoteCompletionWorkers && healthInfo?.model) {
_workers.push(
transformHealthInfoToWorker(healthInfo, WorkerKind.Completion)
)
_workers.push(transformHealthInfoToCompletionWorker(healthInfo))
}
if (!haveRemoteChatWorkers && healthInfo?.chat_model) {
_workers.push(transformHealthInfoToWorker(healthInfo, WorkerKind.Chat))
_workers.push(transformHealthInfoToChatWorker(healthInfo))
}
return groupBy(_workers, 'kind')
}, [healthInfo, workers])
Expand Down

0 comments on commit 6367e2f

Please sign in to comment.