Spaces:

akhaliq
/

MiniCPM-V-4.6

Running on Zero

App Files Community

akhaliq HF Staff committed on 9 days ago

Commit

288b222

1 Parent(s): f009ec7

fix: update device mapping and GPU duration, and add thinking UI state to chat interface

Browse files

Files changed (2) hide show

app.py +2 -2
index.html +24 -2

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ model = AutoModelForImageTextToText.from_pretrained(
     model_id,
     torch_dtype=torch.bfloat16,
     trust_remote_code=True,
-    device_map="auto"
 )
 # Utility for response normalization
@@ -33,8 +33,8 @@ def normalize_response_text(text: str) -> str:
 app = Server()
-@spaces.GPU
 @app.api()
 def predict(message: str, file: FileData = None, downsample_mode: str = "16x"):
     """
     General inference endpoint for both image and video.

     model_id,
     torch_dtype=torch.bfloat16,
     trust_remote_code=True,
+    device_map="cuda"
 )
 # Utility for response normalization
 app = Server()
 @app.api()
+@spaces.GPU(duration=120)
 def predict(message: str, file: FileData = None, downsample_mode: str = "16x"):
     """
     General inference endpoint for both image and video.

index.html CHANGED Viewed

@@ -294,27 +294,49 @@
             addMessage('user', currentText, fileUrl, fileType);
-            // Show loading
             sendIcon.classList.add('hidden');
             loadingSpinner.classList.remove('hidden');
             sendBtn.disabled = true;
             try {
                 let fileData = null;
                 if (currentFile) {
                     fileData = handle_file(currentFile);
                 }
                 const result = await client.predict("/predict", {
                     message: currentText,
                     file: fileData,
                     downsample_mode: currentMode
                 });
                 addMessage('assistant', result.data);
             } catch (error) {
                 console.error("Prediction failed:", error);
-                addMessage('assistant', "Sorry, I encountered an error while processing your request.");
             } finally {
                 sendIcon.classList.remove('hidden');
                 loadingSpinner.classList.add('hidden');

             addMessage('user', currentText, fileUrl, fileType);
+            // Show loading state
             sendIcon.classList.add('hidden');
             loadingSpinner.classList.remove('hidden');
             sendBtn.disabled = true;
+            // Add thinking placeholder
+            const thinkingDiv = document.createElement('div');
+            thinkingDiv.className = 'flex gap-4 max-w-3xl mx-auto items-start message-anim';
+            thinkingDiv.id = 'thinking-placeholder';
+            thinkingDiv.innerHTML = `
+                <div class="w-8 h-8 rounded-full bg-indigo-500/20 flex items-center justify-center shrink-0 border border-indigo-500/30">
+                    <i data-lucide="bot" class="w-4 h-4 text-indigo-400"></i>
+                </div>
+                <div class="glass p-5 rounded-2xl rounded-tl-none border border-white/5">
+                    <div class="flex items-center gap-2 text-gray-400 italic">
+                        <i data-lucide="loader-2" class="w-3 h-3 animate-spin"></i> MiniCPM is thinking...
+                    </div>
+                </div>
+            `;
+            chatMessages.appendChild(thinkingDiv);
+            lucide.createIcons();
+            chatMessages.scrollTop = chatMessages.scrollHeight;
             try {
                 let fileData = null;
                 if (currentFile) {
                     fileData = handle_file(currentFile);
                 }
+                console.log("Sending request to MiniCPM-V 4.6 backend...");
                 const result = await client.predict("/predict", {
                     message: currentText,
                     file: fileData,
                     downsample_mode: currentMode
                 });
+                // Remove placeholder and add actual message
+                document.getElementById('thinking-placeholder')?.remove();
                 addMessage('assistant', result.data);
             } catch (error) {
                 console.error("Prediction failed:", error);
+                document.getElementById('thinking-placeholder')?.remove();
+                addMessage('assistant', "Sorry, I encountered an error while processing your request. Please check the Space logs.");
             } finally {
                 sendIcon.classList.remove('hidden');
                 loadingSpinner.classList.add('hidden');