Spaces:

Smilyai-labs
/

Sam-X-series-chat

Sleeping

App Files Files Community

Keeby-smilyai committed on Oct 21

Commit

d79a8f4

verified ·

1 Parent(s): 254043f

Update app.py

Browse files

Files changed (1) hide show

app.py +395 -0

app.py CHANGED Viewed

@@ -778,3 +778,398 @@ def generate_response_stream(prompt, temperature=0.7, backend=None, max_tokens=2
     final_tokens_per_sec = tokens_generated / elapsed if elapsed > 0 else 0
     yield "", False, final_tokens_per_sec, final_tokens_per_sec, False

     final_tokens_per_sec = tokens_generated / elapsed if elapsed > 0 else 0
     yield "", False, final_tokens_per_sec, final_tokens_per_sec, False
+# PART 3 - Continue from Part 2
+if __name__ == "__main__":
+    import gradio as gr
+    # Stylesheet handed to gr.Blocks(css=...). The class names defined here are
+    # the ones emitted by the HTML-building helpers (message, thinking, plan
+    # badge and limits markup) and attached through elem_classes to the chat
+    # container and the circular send/stop buttons.
+    custom_css = """
+    .chat-container { height: 500px; overflow-y: auto; padding: 20px; background: #ffffff; border: 1px solid #e5e7eb; border-radius: 8px; }
+    .user-message { background: #f7f7f8; padding: 16px; margin: 12px 0; border-radius: 8px; }
+    .assistant-message { background: #ffffff; padding: 16px; margin: 12px 0; border-radius: 8px; border-left: 3px solid #10a37f; }
+    .message-content { color: #353740; line-height: 1.6; font-size: 15px; }
+    .message-header { font-weight: 600; margin-bottom: 8px; color: #353740; font-size: 14px; }
+    .thinking-content { color: #6b7280; font-style: italic; border-left: 3px solid #d1d5db; padding-left: 12px; margin: 8px 0; background: #f9fafb; padding: 8px 12px; border-radius: 4px; }
+    .plan-badge { display: inline-block; padding: 4px 12px; border-radius: 12px; font-size: 12px; font-weight: 600; margin-left: 8px; }
+    .plan-free { background: #e0e7ff; color: #3730a3; }
+    .plan-plus { background: #dbeafe; color: #1e40af; }
+    .plan-pro { background: #fef3c7; color: #92400e; }
+    .limits-panel { background: #f9fafb; border: 1px solid #e5e7eb; border-radius: 8px; padding: 16px; margin: 12px 0; }
+    .limit-item { display: flex; justify-content: space-between; padding: 8px 0; border-bottom: 1px solid #e5e7eb; }
+    .limit-item:last-child { border-bottom: none; }
+    .limit-exceeded { color: #dc2626; font-weight: 600; }
+    .limit-ok { color: #059669; }
+    .circular-btn { width: 48px !important; height: 48px !important; min-width: 48px !important; border-radius: 50% !important; padding: 0 !important; display: flex !important; align-items: center !important; justify-content: center !important; font-size: 20px !important; box-shadow: 0 2px 8px rgba(0,0,0,0.15) !important; transition: all 0.2s ease !important; }
+    .circular-btn:hover:not(:disabled) { transform: scale(1.05) !important; box-shadow: 0 4px 12px rgba(0,0,0,0.2) !important; }
+    .send-btn { background: linear-gradient(135deg, #10a37f 0%, #0d8c6c 100%) !important; border: none !important; }
+    .stop-btn { background: linear-gradient(135deg, #ef4444 0%, #dc2626 100%) !important; border: none !important; }
+    .announcement-banner { background: linear-gradient(135deg, #667eea 0%, #764ba2 100%); color: white; padding: 20px 28px; border-radius: 12px; margin-bottom: 20px; box-shadow: 0 4px 6px rgba(0,0,0,0.1); text-align: center; font-size: 16px; font-weight: 500; line-height: 1.6; }
+    """
+    def format_message_html(role, content, show_thinking=True):
+        role_class = "user-message" if role == "user" else "assistant-message"
+        role_name = "You" if role == "user" else "SAM-X-1"
+        thinking = ""
+        answer = ""
+        if "<think>" in content:
+            parts = content.split("<think>", 1)
+            before_think = parts[0].strip()
+            if len(parts) > 1:
+                after_think = parts[1]
+                if "</think>" in after_think:
+                    think_parts = after_think.split("</think>", 1)
+                    thinking = think_parts[0].strip()
+                    answer = (before_think + " " + think_parts[1]).strip()
+                elif "<think/>" in after_think:
+                    think_parts = after_think.split("<think/>", 1)
+                    thinking = think_parts[0].strip()
+                    answer = (before_think + " " + think_parts[1]).strip()
+                else:
+                    thinking = after_think.strip()
+                    answer = before_think
+            else:
+                answer = before_think
+        else:
+            answer = content
+        html = f'<div class="{role_class}"><div class="message-header">{role_name}</div><div class="message-content">'
+        if thinking and show_thinking:
+            html += f'<div class="thinking-content">💭 {thinking}</div>'
+        if answer:
+            html += f'<div>{answer}</div>'
+        html += '</div></div>'
+        return html
+    def render_history(history, show_thinking):
+        html = ""
+        for msg in history:
+            html += format_message_html(msg["role"], msg["content"], show_thinking)
+        return html
+    def render_limits_panel(user_session):
+        if not user_session or 'user_id' not in user_session:
+            return ""
+        info = get_user_limits_info(user_session['user_id'])
+        if not info:
+            return ""
+        plan_badge_class = f"plan-{info['plan']}"
+        html = f'<div class="limits-panel"><div style="font-weight: 600; margin-bottom: 12px; font-size: 16px;">Your Plan: <span class="plan-badge {plan_badge_class}">{info["plan"].upper()}</span></div><div style="font-size: 13px; color: #6b7280; margin-bottom: 12px;">⏰ Limits reset in: <strong>{info["reset_in"]}</strong></div>'
+        models_info = [('NANO ⚡⚡', info['nano_used'], info['nano_limit']), ('MINI 🚀', info['mini_used'], info['mini_limit']), ('FAST ⚡', info['fast_used'], info['fast_limit']), ('LARGE 💎', info['large_used'], info['large_limit'])]
+        for model_name, used, limit in models_info:
+            if limit == -1:
+                status = f'<span class="limit-ok">{used} messages (Unlimited)</span>'
+            else:
+                remaining = limit - used
+                if remaining <= 0:
+                    status = f'<span class="limit-exceeded">{used}/{limit} (LIMIT REACHED)</span>'
+                elif remaining <= 2:
+                    status = f'<span style="color: #f59e0b; font-weight: 600;">{used}/{limit} ({remaining} left)</span>'
+                else:
+                    status = f'<span class="limit-ok">{used}/{limit} ({remaining} left)</span>'
+            html += f'<div class="limit-item"><span style="font-weight: 500;">{model_name}</span><span>{status}</span></div>'
+        html += '</div>'
+        return html
+    user_session = gr.State({})
+    with gr.Blocks(css=custom_css, theme=gr.themes.Soft(primary_hue="slate")) as demo:
+        gr.HTML('<div class="announcement-banner">🔐 <strong>SAM-X-1 V3.0 - SECURE ACCESS</strong> 🔐<br>✨ Sign in to unlock AI-powered conversations!<br>🆓 FREE: Nano & Mini unlimited, Fast 10/3h, Large 8/3h<br>⭐ PLUS: Nano/Mini/Fast unlimited, Large 20/3h<br>💎 PRO: Everything unlimited!</div>')
+        with gr.Tabs() as main_tabs:
+            with gr.Tab("🔐 Sign In"):
+                with gr.Column():
+                    login_username = gr.Textbox(label="Username", placeholder="Enter username")
+                    login_password = gr.Textbox(label="Password", type="password", placeholder="Enter password")
+                    login_btn = gr.Button("Sign In", variant="primary")
+                    login_msg = gr.Markdown("")
+            with gr.Tab("📝 Sign Up"):
+                with gr.Column():
+                    signup_username = gr.Textbox(label="Username", placeholder="Choose a username")
+                    signup_email = gr.Textbox(label="Email (optional)", placeholder="your@email.com")
+                    signup_password = gr.Textbox(label="Password", type="password", placeholder="Choose a password")
+                    signup_btn = gr.Button("Create Account", variant="primary")
+                    signup_msg = gr.Markdown("")
+            with gr.Tab("💬 Chat") as chat_tab:
+                with gr.Row():
+                    with gr.Column(scale=4):
+                        user_info = gr.Markdown("Please sign in first")
+                    with gr.Column(scale=1):
+                        logout_btn = gr.Button("🚪 Logout", size="sm")
+                limits_display = gr.HTML("")
+                with gr.Accordion("⚙️ Settings", open=False):
+                    with gr.Row():
+                        model_selector = gr.Dropdown(choices=["🤖 Auto (Recommended)"], value="🤖 Auto (Recommended)", label="Model Selection", info="FREE users: Auto only. PLUS/PRO: Choose manually")
+                        max_tokens_slider = gr.Slider(minimum=64, maximum=512, value=256, step=64, label="Max Tokens")
+                    with gr.Row():
+                        temperature_slider = gr.Slider(minimum=0.0, maximum=2.0, value=0.7, step=0.1, label="Temperature")
+                        show_thinking_checkbox = gr.Checkbox(label="Show Thinking", value=True)
+                speed_display = gr.Textbox(label="Generation Speed", value="⚡ Ready", interactive=False)
+                chat_html = gr.HTML(value="", elem_classes=["chat-container"])
+                with gr.Row():
+                    msg_input = gr.Textbox(placeholder="Ask me anything...", show_label=False, scale=8)
+                    with gr.Column(scale=1, min_width=120):
+                        with gr.Row():
+                            send_btn = gr.Button("▶", variant="primary", elem_classes=["circular-btn", "send-btn"])
+                            stop_btn = gr.Button("⏹", variant="stop", elem_classes=["circular-btn", "stop-btn"], interactive=False)
+                with gr.Row():
+                    clear_btn = gr.Button("🗑️ Clear", size="sm")
+                    upgrade_btn = gr.Button("⭐ Request Upgrade", size="sm", variant="primary")
+                with gr.Accordion("🔐 Admin Panel", visible=False, open=False) as admin_panel:
+                    gr.Markdown("### User Management")
+                    with gr.Tabs():
+                        with gr.Tab("All Users"):
+                            users_table = gr.Dataframe(headers=["ID", "Username", "Email", "Plan", "Created", "Admin"])
+                            refresh_users_btn = gr.Button("🔄 Refresh")
+                            with gr.Row():
+                                admin_username = gr.Textbox(label="Username")
+                                admin_new_plan = gr.Dropdown(choices=["free", "plus", "pro"], label="New Plan")
+                                update_plan_btn = gr.Button("Update Plan")
+                            admin_msg = gr.Markdown("")
+                        with gr.Tab("Upgrade Requests"):
+                            requests_table = gr.Dataframe(headers=["ID", "Username", "Requested Plan", "Reason", "Date"])
+                            refresh_requests_btn = gr.Button("🔄 Refresh")
+                            with gr.Row():
+                                request_id_input = gr.Number(label="Request ID", precision=0)
+                                approve_req_btn = gr.Button("✅ Approve", variant="primary")
+                                deny_req_btn = gr.Button("❌ Deny", variant="stop")
+                            request_msg = gr.Markdown("")
+                with gr.Accordion("⭐ Request Plan Upgrade", visible=False, open=False) as upgrade_panel:
+                    upgrade_plan_choice = gr.Radio(choices=["plus", "pro"], label="Select Plan", value="plus")
+                    upgrade_reason = gr.Textbox(label="Reason for Upgrade", placeholder="Why do you need this upgrade?", lines=3)
+                    submit_upgrade_btn = gr.Button("Submit Request", variant="primary")
+                    upgrade_msg = gr.Markdown("")
+        def handle_login(username, password):
+            success, user_data = authenticate_user(username, password)
+            if success:
+                return user_data, f"✅ Welcome back, {username}!", "", gr.update(selected=2)
+            return {}, "❌ Invalid credentials!", "", gr.update()
+        def handle_signup(username, email, password):
+            if len(username) < 3:
+                return "❌ Username must be at least 3 characters!"
+            if len(password) < 6:
+                return "❌ Password must be at least 6 characters!"
+            success, message = create_user(username, password, email)
+            return f"{'✅' if success else '❌'} {message}"
+        def load_user_interface(session):
+            if not session or 'user_id' not in session:
+                return "❌ Not logged in", "", gr.update(visible=False), gr.update(choices=["🤖 Auto (Recommended)"], value="🤖 Auto (Recommended)"), gr.update()
+            info = get_user_limits_info(session['user_id'])
+            plan_badge = f'<span class="plan-badge plan-{info["plan"]}">{info["plan"].upper()}</span>'
+            user_info_text = f"👤 **{session['username']}** {plan_badge}"
+            limits_html = render_limits_panel(session)
+            if info['can_choose_model']:
+                available_model_names = list(available_models.keys())
+                choices = ["🤖 Auto (Recommended)"] + available_model_names
+            else:
+                choices = ["🤖 Auto (Recommended)"]
+            return user_info_text, limits_html, gr.update(visible=session.get('is_admin', False)), gr.update(choices=choices, value="🤖 Auto (Recommended)"), gr.update(maximum=info['max_tokens'], value=min(256, info['max_tokens']))
+        def send_message_handler(message, show_thinking, temperature, model_choice, max_tokens, session):
+            global stop_generation
+            stop_generation.clear()
+            if not session or 'user_id' not in session:
+                return "", "", "❌ Not logged in", gr.update(), gr.update()
+            if not message.strip():
+                return "", "", "⚡ Ready", gr.update(interactive=True), gr.update(interactive=False)
+            info = get_user_limits_info(session['user_id'])
+            if model_choice == "🤖 Auto (Recommended)" or not info['can_choose_model']:
+                user_available = get_available_models_for_user(session['user_id'])
+                if not user_available:
+                    return "", "", "❌ No models available (limits reached)", gr.update(interactive=True), gr.update(interactive=False)
+                backend = select_model_auto(message, available_models, user_available)
+                if not backend:
+                    return "", "", "❌ Could not select model", gr.update(interactive=True), gr.update(interactive=False)
+                model_name = backend.get_name()
+            else:
+                model_name = model_choice
+                can_use, msg = can_use_model(session['user_id'], model_name)
+                if not can_use:
+                    return "", "", f"❌ {msg}", gr.update(interactive=True), gr.update(interactive=False)
+                backend = available_models[model_name]
+            can_use, msg = can_use_model(session['user_id'], model_name)
+            if not can_use:
+                return "", "", f"❌ {msg}", gr.update(interactive=True), gr.update(interactive=False)
+            increment_model_usage(session['user_id'], model_name)
+            yield "", "", f"⚡ Using {model_name}...", gr.update(interactive=False), gr.update(interactive=True)
+            history = [{"role": "user", "content": message}]
+            yield "", render_history(history, show_thinking), f"⚡ Generating...", gr.update(interactive=False), gr.update(interactive=True)
+            prompt = f"User: {message}\nSam: <think>"
+            history.append({"role": "assistant", "content": "<think>"})
+            actual_max_tokens = min(max_tokens, info['max_tokens'])
+            last_speed = 0
+            was_stopped = False
+            for chunk_data in generate_response_stream(prompt, temperature, backend, actual_max_tokens):
+                if len(chunk_data) == 5:
+                    new_chunk, in_thinking, tokens_per_sec, avg_speed, stopped = chunk_data
+                    if stopped:
+                        was_stopped = True
+                        break
+                    if new_chunk:
+                        history[-1]["content"] += new_chunk
+                    last_speed = avg_speed
+                    yield "", render_history(history, show_thinking), f"⚡ {tokens_per_sec:.1f} tok/s", gr.update(interactive=False), gr.update(interactive=True)
+            final = f"{'🛑 Stopped' if was_stopped else '✅ Done'} - {last_speed:.1f} tok/s"
+            yield "", render_history(history, show_thinking), final, gr.update(interactive=True), gr.update(interactive=False)
+        def stop_generation_handler():
+            global stop_generation
+            stop_generation.set()
+            return "🛑 Stopping...", gr.update(interactive=False), gr.update(interactive=False)
+        def clear_chat():
+            return "", "⚡ Ready", gr.update(interactive=True), gr.update(interactive=False)
+        def show_upgrade_panel():
+            return gr.update(visible=True, open=True)
+        def submit_upgrade_request(plan, reason, session):
+            if not session or 'user_id' not in session:
+                return "❌ Not logged in"
+            if not reason.strip():
+                return "❌ Please provide a reason"
+            success, msg = request_upgrade(session['user_id'], plan, reason)
+            return f"{'✅' if success else '❌'} {msg}"
+        def load_all_users():
+            users = get_all_users()
+            formatted = []
+            for user in users:
+                formatted.append([user[0], user[1], user[2] or "N/A", user[3], user[4][:10] if user[4] else "N/A", "Yes" if user[5] else "No"])
+            return formatted
+        def load_pending_requests():
+            requests = get_pending_requests()
+            formatted = []
+            for req in requests:
+                formatted.append([req[0], req[1], req[2], req[3], req[4][:10] if req[4] else "N/A"])
+            return formatted
+        def admin_update_plan(username, new_plan):
+            if not username or not new_plan:
+                return "❌ Please fill all fields"
+            success, msg = update_user_plan(username, new_plan)
+            return f"{'✅' if success else '❌'} {msg}"
+        def admin_approve_request(request_id):
+            if not request_id:
+                return "❌ Please enter request ID"
+            success, msg = approve_request(int(request_id))
+            return f"{'✅' if success else '❌'} {msg}"
+        def admin_deny_request(request_id):
+            if not request_id:
+                return "❌ Please enter request ID"
+            success, msg = deny_request(int(request_id))
+            return f"{'✅' if success else '❌'} {msg}"
+        def handle_logout():
+            return {}, "Please sign in", "", gr.update(selected=0)
+        login_btn.click(handle_login, [login_username, login_password], [user_session, login_msg, chat_html, main_tabs])
+        signup_btn.click(handle_signup, [signup_username, signup_email, signup_password], [signup_msg])
+        chat_tab.select(load_user_interface, [user_session], [user_info, limits_display, admin_panel, model_selector, max_tokens_slider])
+        send_outputs = [msg_input, chat_html, speed_display, send_btn, stop_btn]
+        send_btn.click(send_message_handler, [msg_input, show_thinking_checkbox, temperature_slider, model_selector, max_tokens_slider, user_session], send_outputs)
+        msg_input.submit(send_message_handler, [msg_input, show_thinking_checkbox, temperature_slider, model_selector, max_tokens_slider, user_session], send_outputs)
+        stop_btn.click(stop_generation_handler, outputs=[speed_display, send_btn, stop_btn])
+        clear_btn.click(clear_chat, outputs=[chat_html, speed_display, send_btn, stop_btn])
+        upgrade_btn.click(show_upgrade_panel, outputs=[upgrade_panel])
+        submit_upgrade_btn.click(submit_upgrade_request, [upgrade_plan_choice, upgrade_reason, user_session], [upgrade_msg])
+        logout_btn.click(handle_logout, outputs=[user_session, user_info, chat_html, main_tabs])
+        refresh_users_btn.click(load_all_users, outputs=[users_table])
+        refresh_requests_btn.click(load_pending_requests, outputs=[requests_table])
+        update_plan_btn.click(admin_update_plan, [admin_username, admin_new_plan], [admin_msg])
+        approve_req_btn.click(admin_approve_request, [request_id_input], [request_msg])
+        deny_req_btn.click(admin_deny_request, [request_id_input], [request_msg])
+        gr.Markdown("""
+        ---
+        ### 📊 Plan Comparison
+        | Feature | FREE | PLUS ⭐ | PRO 💎 |
+        |---------|------|---------|--------|
+        | **Nano Model** | ✅ Unlimited | ✅ Unlimited | ✅ Unlimited |
+        | **Mini Model** | ✅ Unlimited | ✅ Unlimited | ✅ Unlimited |
+        | **Fast Model** | 10 msgs/3h | ✅ Unlimited | ✅ Unlimited |
+        | **Large Model** | 8 msgs/3h | 20 msgs/3h | ✅ Unlimited |
+        | **Model Selection** | 🤖 Auto only | ✅ Manual choice | ✅ Manual choice |
+        | **Max Tokens** | 256 | 384 | 512 |
+        | **Reset Period** | 3 hours | 3 hours | 3 hours |
+        ### 🎯 How It Works
+        1. **Rolling 3-Hour Window**: Your limits reset 3 hours after you start using the service
+        2. **Australia Timezone**: All times are in Australian Eastern Time (Sydney)
+        3. **Smart Auto-Selection**: FREE users get optimal model selection based on query complexity
+        4. **Flexible Limits**: Nano & Mini are always available for quick questions
+        5. **Upgrade Requests**: Request PLUS or PRO access through the chat interface
+        ### 💡 Tips for FREE Users
+        - **Use Nano & Mini freely** - Perfect for most questions and coding tasks (30-40 tok/s!)
+        - **Save Fast/Large for complex tasks** - You get 10 Fast and 8 Large messages per 3h window
+        - **Let Auto mode decide** - It intelligently picks the right model for your question
+        - **Watch your reset timer** - Plan your usage around the 3-hour window
+        ### 🔐 Admin Access
+        - **Username**: `admin`
+        - **Password**: `admin123`
+        - Admin can manage users, approve upgrades, and reset limits
+        ### 🚀 V3.0 Features
+        - ✅ **User Authentication** - Secure sign in/sign up system
+        - ✅ **Three-Tier Plans** - FREE, PLUS, PRO with different limits
+        - ✅ **Rolling 3-Hour Limits** - Fair usage based on activity
+        - ✅ **Admin Panel** - Full user management and upgrade approval
+        - ✅ **Smart Model Selection** - Auto mode for FREE, manual for PLUS/PRO
+        - ✅ **Usage Tracking** - Monitor your message limits in real-time
+        - ✅ **Australia Timezone** - All times displayed in AEST/AEDT
+        - ✅ **Upgrade Requests** - In-app upgrade request system
+        - ✅ **Per-Model Limits** - Separate counters for Nano, Mini, Fast, Large
+        - ✅ **Dynamic Batching** - Faster UI updates (2-8 token batching)
+        ### 📝 How to Use
+        **Step 1**: Create an account (Sign Up tab)
+        **Step 2**: Sign in with your credentials
+        **Step 3**: Go to Chat tab and start chatting!
+        **Step 4**: Monitor your limits in the limits panel
+        **Step 5**: Request upgrade if you need more access
+        ### 🎓 Example Queries by Plan
+        **FREE Plan (Auto Mode):**
+        - "What is Python?" → Nano (instant, unlimited)
+        - "Write a hello world function" → Mini (fast, unlimited)
+        - "Explain object-oriented programming" → Fast (uses 1 of 10)
+        - "Prove the Pythagorean theorem" → Large (uses 1 of 8)
+        **PLUS/PRO (Manual Selection):**
+        - Choose any model based on your needs
+        - PLUS gets 20 Large messages per 3h
+        - PRO gets unlimited everything!
+        ### 📧 Support
+        For questions or issues, contact the admin through the upgrade request system!
+        ---
+        **Made with ❤️ using SAM-X-1 Models**
+        """)
+    demo.launch(debug=True, share=True)