| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262 |
- import { activeProcessingState } from '$lib/stores/chat.svelte';
- import { config } from '$lib/stores/settings.svelte';
- export interface LiveProcessingStats {
- tokensProcessed: number;
- totalTokens: number;
- timeMs: number;
- tokensPerSecond: number;
- etaSecs?: number;
- }
- export interface LiveGenerationStats {
- tokensGenerated: number;
- timeMs: number;
- tokensPerSecond: number;
- }
- export interface UseProcessingStateReturn {
- readonly processingState: ApiProcessingState | null;
- getProcessingDetails(): string[];
- getProcessingMessage(): string;
- getPromptProgressText(): string | null;
- getLiveProcessingStats(): LiveProcessingStats | null;
- getLiveGenerationStats(): LiveGenerationStats | null;
- shouldShowDetails(): boolean;
- startMonitoring(): void;
- stopMonitoring(): void;
- }
- /**
- * useProcessingState - Reactive processing state hook
- *
- * This hook provides reactive access to the processing state of the server.
- * It directly reads from chatStore's reactive state and provides
- * formatted processing details for UI display.
- *
- * **Features:**
- * - Real-time processing state via direct reactive state binding
- * - Context and output token tracking
- * - Tokens per second calculation
- * - Automatic updates when streaming data arrives
- * - Supports multiple concurrent conversations
- *
- * @returns Hook interface with processing state and control methods
- */
- export function useProcessingState(): UseProcessingStateReturn {
- let isMonitoring = $state(false);
- let lastKnownState = $state<ApiProcessingState | null>(null);
- let lastKnownProcessingStats = $state<LiveProcessingStats | null>(null);
- // Derive processing state reactively from chatStore's direct state
- const processingState = $derived.by(() => {
- if (!isMonitoring) {
- return lastKnownState;
- }
- // Read directly from the reactive state export
- return activeProcessingState();
- });
- // Track last known state for keepStatsVisible functionality
- $effect(() => {
- if (processingState && isMonitoring) {
- lastKnownState = processingState;
- }
- });
- // Track last known processing stats for when promptProgress disappears
- $effect(() => {
- if (processingState?.promptProgress) {
- const { processed, total, time_ms, cache } = processingState.promptProgress;
- const actualProcessed = processed - cache;
- const actualTotal = total - cache;
- if (actualProcessed > 0 && time_ms > 0) {
- const tokensPerSecond = actualProcessed / (time_ms / 1000);
- lastKnownProcessingStats = {
- tokensProcessed: actualProcessed,
- totalTokens: actualTotal,
- timeMs: time_ms,
- tokensPerSecond
- };
- }
- }
- });
- function getETASecs(done: number, total: number, elapsedMs: number): number | undefined {
- const elapsedSecs = elapsedMs / 1000;
- const progressETASecs =
- done === 0 || elapsedSecs < 0.5
- ? undefined // can be the case for the 0% progress report
- : elapsedSecs * (total / done - 1);
- return progressETASecs;
- }
- function startMonitoring(): void {
- if (isMonitoring) return;
- isMonitoring = true;
- }
- function stopMonitoring(): void {
- if (!isMonitoring) return;
- isMonitoring = false;
- // Only clear last known state if keepStatsVisible is disabled
- const currentConfig = config();
- if (!currentConfig.keepStatsVisible) {
- lastKnownState = null;
- lastKnownProcessingStats = null;
- }
- }
- function getProcessingMessage(): string {
- if (!processingState) {
- return 'Processing...';
- }
- switch (processingState.status) {
- case 'initializing':
- return 'Initializing...';
- case 'preparing':
- if (processingState.progressPercent !== undefined) {
- return `Processing (${processingState.progressPercent}%)`;
- }
- return 'Preparing response...';
- case 'generating':
- return '';
- default:
- return 'Processing...';
- }
- }
- function getProcessingDetails(): string[] {
- // Use current processing state or fall back to last known state
- const stateToUse = processingState || lastKnownState;
- if (!stateToUse) {
- return [];
- }
- const details: string[] = [];
- // Always show context info when we have valid data
- if (stateToUse.contextUsed >= 0 && stateToUse.contextTotal > 0) {
- const contextPercent = Math.round((stateToUse.contextUsed / stateToUse.contextTotal) * 100);
- details.push(
- `Context: ${stateToUse.contextUsed}/${stateToUse.contextTotal} (${contextPercent}%)`
- );
- }
- if (stateToUse.outputTokensUsed > 0) {
- // Handle infinite max_tokens (-1) case
- if (stateToUse.outputTokensMax <= 0) {
- details.push(`Output: ${stateToUse.outputTokensUsed}/∞`);
- } else {
- const outputPercent = Math.round(
- (stateToUse.outputTokensUsed / stateToUse.outputTokensMax) * 100
- );
- details.push(
- `Output: ${stateToUse.outputTokensUsed}/${stateToUse.outputTokensMax} (${outputPercent}%)`
- );
- }
- }
- if (stateToUse.tokensPerSecond && stateToUse.tokensPerSecond > 0) {
- details.push(`${stateToUse.tokensPerSecond.toFixed(1)} tokens/sec`);
- }
- if (stateToUse.speculative) {
- details.push('Speculative decoding enabled');
- }
- return details;
- }
- function shouldShowDetails(): boolean {
- return processingState !== null && processingState.status !== 'idle';
- }
- /**
- * Returns a short progress message with percent
- */
- function getPromptProgressText(): string | null {
- if (!processingState?.promptProgress) return null;
- const { processed, total, cache } = processingState.promptProgress;
- const actualProcessed = processed - cache;
- const actualTotal = total - cache;
- const percent = Math.round((actualProcessed / actualTotal) * 100);
- const eta = getETASecs(actualProcessed, actualTotal, processingState.promptProgress.time_ms);
- if (eta !== undefined) {
- const etaSecs = Math.ceil(eta);
- return `Processing ${percent}% (ETA: ${etaSecs}s)`;
- }
- return `Processing ${percent}%`;
- }
- /**
- * Returns live processing statistics for display (prompt processing phase)
- * Returns last known stats when promptProgress becomes unavailable
- */
- function getLiveProcessingStats(): LiveProcessingStats | null {
- if (processingState?.promptProgress) {
- const { processed, total, time_ms, cache } = processingState.promptProgress;
- const actualProcessed = processed - cache;
- const actualTotal = total - cache;
- if (actualProcessed > 0 && time_ms > 0) {
- const tokensPerSecond = actualProcessed / (time_ms / 1000);
- return {
- tokensProcessed: actualProcessed,
- totalTokens: actualTotal,
- timeMs: time_ms,
- tokensPerSecond
- };
- }
- }
- // Return last known stats if promptProgress is no longer available
- return lastKnownProcessingStats;
- }
- /**
- * Returns live generation statistics for display (token generation phase)
- */
- function getLiveGenerationStats(): LiveGenerationStats | null {
- if (!processingState) return null;
- const { tokensDecoded, tokensPerSecond } = processingState;
- if (tokensDecoded <= 0) return null;
- // Calculate time from tokens and speed
- const timeMs =
- tokensPerSecond && tokensPerSecond > 0 ? (tokensDecoded / tokensPerSecond) * 1000 : 0;
- return {
- tokensGenerated: tokensDecoded,
- timeMs,
- tokensPerSecond: tokensPerSecond || 0
- };
- }
- return {
- get processingState() {
- return processingState;
- },
- getProcessingDetails,
- getProcessingMessage,
- getPromptProgressText,
- getLiveProcessingStats,
- getLiveGenerationStats,
- shouldShowDetails,
- startMonitoring,
- stopMonitoring
- };
- }
|