Spaces:

4therapy
/

BOXTRON-AI

Sleeping

App Files Files Community

4therapy committed 6 days ago

Commit

fcf4fcb

verified ·

1 Parent(s): 9e353f5

Update app.py

Browse files

Files changed (1) hide show

app.py +92 -95

app.py CHANGED Viewed

@@ -1,102 +1,99 @@
 import gradio as gr
-from transformers import pipeline, AutoTokenizer, AutoModelForCausalLM
-import torch
-# --- 1. Model Configuration ---
-# Mistral-7B-Instruct-v0.2 is an excellent model for analytical, instruction-following tasks.
-# Using 'Auto' classes is robust, and 'device_map="auto"' ensures maximum GPU utilization.
-MODEL_ID = "mistralai/Mistral-7B-Instruct-v0.2"
-try:
-    # Load Model and Tokenizer
-    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
-    model = AutoModelForCausalLM.from_pretrained(
-        MODEL_ID,
-        # Load in 8-bit or 4-bit to save VRAM, crucial for a free/small GPU Space
-        load_in_8bit=True,
-        # If 8-bit fails, try using torch.bfloat16 or torch.float16 if your GPU supports it
-        torch_dtype=torch.float16,
-        device_map="auto"
-    )
-    # Create the text generation pipeline for ease of use
-    generator = pipeline(
-        "text-generation",
-        model=model,
-        tokenizer=tokenizer,
-        device_map="auto"
-    )
-except Exception as e:
-    # Fallback for local testing or very limited CPU-only environments
-    print(f"Error loading large model: {e}. Falling back to 'gpt2' for basic functionality.")
-    generator = pipeline("text-generation", model="gpt2")
-    # For a boxing analyst, a small model is highly inaccurate, so deployment in a GPU Space is critical.
-# --- 2. System Prompt for Persona and Accuracy (CRITICAL) ---
-# A highly specific and authoritative system prompt forces the model into the desired persona.
-SYSTEM_PROMPT = (
-    "You are BOXTRON-AI, a world-class professional boxing analyst with decades of experience. "
-    "Your analysis must be objective, highly detailed, and use correct boxing terminology (e.g., in-fighter, outside fighter, high guard, check hook, weight division, KO ratio). "
-    "Analyze fighter styles, physical attributes, recent performance, and matchup dynamics. "
-    "Be concise, insightful, and offer a clear, reasoned prediction for the outcome."
-)
-# --- 3. Optimized Prediction Function ---
-def analyze_fight(user_message, history):
-    # Construct the full conversation history including the system prompt
-    messages = [{"role": "system", "content": SYSTEM_PROMPT}]
-    # Add previous conversation history
-    for human, bot in history:
-        messages.append({"role": "user", "content": human})
-        messages.append({"role": "assistant", "content": bot})
-    # Add the current user message
-    messages.append({"role": "user", "content": user_message})
-    # Apply the model's specific chat template (crucial for instruct models like Mistral)
-    prompt = generator.tokenizer.apply_chat_template(
-        messages,
-        tokenize=False,
-        add_generation_prompt=True
-    )
-    # Generate the response with optimized parameters for factual, analytical output
-    # temperature=0.1: Low temperature reduces randomness (hallucination) and increases factual consistency.
-    # top_p=0.9: Limits sampling to the most probable tokens for coherent, focused analysis.
-    response = generator(
-        prompt,
-        max_new_tokens=512,
-        do_sample=True,
-        temperature=0.1,
-        top_p=0.9,
-        return_full_text=False # Ensures only the model's response is returned
-    )
-    # Extract the generated text.
-    # The output format for the pipeline with return_full_text=False is a list of dicts.
-    bot_response = response[0]['generated_text'].strip()
-    return bot_response
-# --- 4. Gradio Interface ---
-# The gr.ChatInterface is the standard and simplest way to build a chat UI.
-demo = gr.ChatInterface(
-    fn=analyze_fight,
-    title="🥊 BOXTRON-AI: Elite Boxing Analyst Chatbot",
-    description="Ask me to break down an upcoming fight, analyze a fighter's legacy, or detail specific boxing techniques.",
-    # Set the history to be visible, and optionally customize the appearance
-    chatbot=gr.Chatbot(height=500),
-    theme="soft", # A modern theme
-    examples=[
-        ["Analyze the potential fight between Terence Crawford and Errol Spence Jr."],
-        ["What are the strengths and weaknesses of Canelo Alvarez's fighting style?"],
-        ["Predict the outcome of the next Heavyweight title fight."],
-    ]
 )
-# Launch the app
 if __name__ == "__main__":
     demo.launch()

 import gradio as gr
+from huggingface_hub import InferenceClient
+def _normalize_history(history):
+    """Reduce chat history entries to plain ``{"role", "content"}`` text messages.
+
+    Entries that carry a ``role`` of ``"user"`` or ``"assistant"`` keep that role.
+    Entries without a role fall back to the legacy ``"user"`` / ``"message"`` keys.
+    Anything with empty or non-string content is skipped.
+    """
+    normalized = []
+    for entry in history or []:
+        role = entry.get("role")
+        content = entry.get("content")
+        if role in ("user", "assistant"):
+            # Keep the speaker the entry actually declares; re-labelling the same
+            # content as both user and assistant would duplicate every past turn.
+            if isinstance(content, str) and content:
+                normalized.append({"role": role, "content": content})
+            continue
+        # Legacy shape: one dict per exchange with "user" / "message" keys.
+        user_msg = entry.get("user")
+        bot_msg = entry.get("message")
+        if isinstance(user_msg, str) and user_msg:
+            normalized.append({"role": "user", "content": user_msg})
+        if isinstance(bot_msg, str) and bot_msg:
+            normalized.append({"role": "assistant", "content": bot_msg})
+    return normalized
+def respond(
+    message,
+    history: list[dict[str, str]],
+    system_message,
+    max_tokens,
+    temperature,
+    top_p,
+    hf_token: gr.OAuthToken,
+):
+    """
+    Stream a chat completion for `message`, yielding the reply text accumulated so far.
+
+    Args:
+        message: The new user message.
+        history: Previous conversation entries; normalized to role/content pairs before sending.
+        system_message: Text sent as the leading system message.
+        max_tokens: Forwarded to `chat_completion` as `max_tokens`.
+        temperature: Forwarded to `chat_completion` as `temperature`.
+        top_p: Forwarded to `chat_completion` as `top_p`.
+        hf_token: OAuth token object; its `.token` authenticates the `InferenceClient`.
+
+    Yields:
+        The response string built up so far, once per received stream chunk.
+
+    For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
+    """
+    client = InferenceClient(token=hf_token.token, model="moonshotai/Kimi-K2-Thinking")
+    # --- BUILD MESSAGES LIST ---
+    messages = [{"role": "system", "content": system_message}]
+    messages.extend(_normalize_history(history))
+    messages.append({"role": "user", "content": message})
+    response = ""
+    for chunk in client.chat_completion(
+        messages,
+        max_tokens=max_tokens,
+        stream=True,
+        temperature=temperature,
+        top_p=top_p,
+    ):
+        choices = chunk.choices
+        # A chunk may have no choices or an empty delta; it then adds no text,
+        # but the current response is still yielded for every chunk.
+        if choices and choices[0].delta.content:
+            response += choices[0].delta.content
+        yield response
+"""
+For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
+"""
+# Default BOXTRON-AI persona and instructions. This text is the initial value of the
+# "System message" textbox, and the textbox value is what `respond` sends as the
+# system message of each request.
+system_prompt="""
+You are BOXTRON-AI, a highly skilled boxing analyst and professional-level fight judge. Your purpose is to provide objective, deeply informed evaluations of fighters, styles, strategies, and matchups. You score rounds using the official 10-point must system, always basing your judgments on clean and effective punching, effective aggression, ring generalship, and defense. When a round is close, you explain why; when a round is one-sided, you justify the margin. Knockdowns are reflected in the score unless extraordinary circumstances warrant otherwise, and you clearly explain those cases.
+Your analysis of fighters must be technical, comprehensive, and grounded in real boxing principles. This includes breaking down fighting styles, strengths, weaknesses, physical attributes, tendencies, and historical performances. You discuss strategy, game plans, match-up dynamics, pace, footwork, punch selection, defense, adaptability, stamina, and the overall ebb and flow of a bout. Whenever you give predictions, you do so logically and without bias, making your reasoning transparent and acknowledging uncertainties.
+You maintain strict objectivity at all times. You do not favor particular fighters, trainers, or promotions. You avoid hype and keep your focus on evidence and technical detail. If uncertainty exists, you state that clearly and use probabilities instead of definitive claims.
+When asked to predict a fight, you describe multiple plausible scenarios and identify the factors that make each possible. You consider momentum, recent performances, stylistic interactions, weight changes, injury history when reliably documented, defensive responsibility, punch resistance, pace, and likely adjustments. All conclusions are based on established boxing knowledge rather than speculation.
+If you are asked to simulate a fight, you proceed round by round, offering realistic and technically grounded descriptions of the action as it unfolds. At the end of each simulated round, you provide an official score and a concise explanation of why the round was scored that way.
+You avoid unfounded medical claims, do not present rumors as facts, and label speculation clearly when you use it. Your tone is clear, professional, and analytical, resembling a hybrid of an experienced boxing judge and a seasoned ringside analyst. You use accurate boxing terminology and can provide slow-motion-style breakdowns of exchanges when useful.
+You can also find weaknesses in opponents and tell the user how to capitalize on them and defeat their opponent
+"""
+# Extra controls for the chat UI, listed in the same order as the parameters
+# `respond` takes after (message, history): system_message, max_tokens,
+# temperature, top_p.
+system_message_box = gr.Textbox(value=system_prompt, label="System message")
+max_tokens_slider = gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens")
+temperature_slider = gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature")
+top_p_slider = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)")
+chatbot = gr.ChatInterface(
+    fn=respond,
+    type="messages",
+    additional_inputs=[
+        system_message_box,
+        max_tokens_slider,
+        temperature_slider,
+        top_p_slider,
+    ],
 )
+# Page layout: a sidebar holding the login button, with the chat interface rendered
+# in the main area. NOTE(review): `respond` takes a `gr.OAuthToken`, so the user
+# presumably has to sign in through this button before chatting — confirm against
+# the Gradio OAuth documentation.
+with gr.Blocks() as demo:
+    with gr.Sidebar():
+        gr.LoginButton()
+    # `chatbot` was built at module level; render() places it inside this Blocks layout.
+    chatbot.render()
+# Start the app only when this file is run as a script.
 if __name__ == "__main__":
     demo.launch()