Spaces:

tasal9
/

pashto-base-bloom-space

Runtime error

File size: 7,401 Bytes

1e0b125
bcc64df
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2b667ef
bcc64df
 
 
44d33c3
 
 
 
 
 
 
 
bcc64df
 
 
 
 
 
 
 
 
 
 
1e0b125
f4a690e
d5f3038
f4a690e
bcc64df
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1e0b125
f4a690e
d5f3038
bcc64df
 
2b667ef
bcc64df
 
 
 
 
 
 
d5f3038
f4a690e
c207d87
bcc64df
 
2b667ef
bcc64df
 
 
 
 
 
 
 
 
2b667ef
 
 
 
 
 
 
 
 
 
 
 
 
 
bcc64df
 
 
2b667ef
bcc64df
 
1e0b125
f4a690e
bcc64df
 
 
d5f3038
bcc64df
 
f4a690e
bcc64df
 
 
 
f4a690e
 
bcc64df
 
 
 
 
 
 
f4a690e
 
bcc64df
 
 
 
 
 
 
f4a690e
bcc64df
 
 
 
 
 
5787f73
bcc64df
 
 
 
 
 
1e0b125
 
c65f526

import gradio as gr
import time
import threading
import random
from datetime import datetime

# Global state to track training/fine-tuning status
class TrainingState:
    def __init__(self):
        self.status = "idle"
        self.progress = 0
        self.logs = []
        self.start_time = None
        self.model_name = "tasal9/pashto-base-bloom"
        self.active_process = None

    def start_training(self, data_size):
        self.status = "training"
        self.progress = 0
        self.logs = [f"Training started at {datetime.now().strftime('%H:%M:%S')}"]
        self.logs.append(f"Training data size: {data_size} characters")
        self.start_time = time.time()
        
    def start_finetuning(self, data_size):
        self.status = "fine-tuning"
        self.progress = 0
        self.logs = [f"Fine-tuning started at {datetime.now().strftime('%H:%M:%S')}"]
        self.logs.append(f"Fine-tuning data size: {data_size} characters")
        self.start_time = time.time()
        
    def update_progress(self, progress):
        self.progress = min(100, max(0, progress))
        if progress >= 100 and self.status != "idle":
            self.complete_process()
            
    def add_log(self, message):
        self.logs.append(f"[{datetime.now().strftime('%H:%M:%S')}] {message}")
        if len(self.logs) > 10:
            self.logs.pop(0)
            
    def complete_process(self):
    current_status = self.status  # save before setting to idle
    if self.start_time is not None:
        elapsed = time.time() - self.start_time
        self.add_log(f"{current_status.capitalize()} completed in {elapsed:.1f} seconds!")
    else:
        self.add_log(f"{current_status.capitalize()} completed!")
    self.status = "idle"
    self.progress = 100
        
    def get_status(self):
        status_map = {
            "idle": "✅ Ready",
            "training": "🔄 Training in progress",
            "fine-tuning": "🔄 Fine-tuning in progress"
        }
        return status_map.get(self.status, "❓ Unknown status")

# Create global state
state = TrainingState()

def test_model(input_text):
    if not input_text.strip():
        return "Please enter some text to test."
    responses = [
        f"Processed: '{input_text}'",
        f"Model response to: {input_text}",
        f"Analysis: This appears to be Pashto text with {len(input_text)} characters",
        f"✅ Received: {input_text}",
        f"Generated continuation: {input_text}... [simulated output]"
    ]
    return random.choice(responses)

def simulate_process(duration, process_type, data_size):
    if process_type == "train":
        state.start_training(data_size)
    else:
        state.start_finetuning(data_size)
    
    steps = 10
    for i in range(steps + 1):
        time.sleep(duration / steps)
        progress = int((i / steps) * 100)
        state.update_progress(progress)
        if i % 3 == 0:
            messages = [
                f"Processing batch {i*5}/{steps*5}",
                f"Loss: {random.uniform(0.1, 1.0):.4f}",
                f"Accuracy: {random.uniform(80, 95):.1f}%",
                f"Learning rate: {random.uniform(1e-5, 1e-3):.6f}"
            ]
            state.add_log(random.choice(messages))
    state.complete_process()

def train_model(dataset_text):
    if not dataset_text.strip():
        return "Please provide training data.", ""
    data_size = len(dataset_text)
    if getattr(state, 'status', 'idle') != "idle":
        return "Another process is already running. Please wait.", ""
    threading.Thread(
        target=simulate_process,
        args=(15, "train", data_size),
        daemon=True
    ).start()
    return "Training started successfully! Check status in the Status tab.", ""

def finetune_model(dataset_text):
    if not dataset_text.strip():
        return "Please provide fine-tuning data.", ""
    data_size = len(dataset_text)
    if getattr(state, 'status', 'idle') != "idle":
        return "Another process is already running. Please wait.", ""
    threading.Thread(
        target=simulate_process,
        args=(10, "fine-tune", data_size),
        daemon=True
    ).start()
    return "Fine-tuning started successfully! Check status in the Status tab.", ""

def get_current_status():
    try:
        status_text = state.get_status()
    except Exception as e:
        status_text = f"❌ Error: {str(e)}"
    
    try:
        progress = state.progress
    except:
        progress = 0

    try:
        logs = "\n".join(state.logs[-10:]) if hasattr(state, 'logs') else "No logs available"
    except:
        logs = "❌ Failed to retrieve logs."
    
    return {
        status_box: status_text,
        progress_bar: progress,
        log_output: logs
    }

# Create interface
with gr.Blocks(title="Pashto-Base-Bloom Trainer", theme="soft") as demo:
    gr.Markdown("# 🌸 Pashto-Base-Bloom Training Space")
    gr.Markdown("Train and fine-tune Pashto language model tasal9/pashto-base-bloom")
    
    with gr.Tab("Test Model"):
        gr.Markdown("### Test Model with Sample Text")
        with gr.Row():
            with gr.Column():
                test_input = gr.Textbox(label="Input Text", lines=3, placeholder="Enter Pashto text here...")
                test_btn = gr.Button("Run Test", variant="primary")
            test_output = gr.Textbox(label="Model Output", lines=4, interactive=False)
        test_btn.click(test_model, inputs=test_input, outputs=test_output)
    
    with gr.Tab("Train Model"):
        gr.Markdown("### Train Model with New Data")
        with gr.Row():
            with gr.Column():
                train_input = gr.Textbox(label="Training Data", lines=8, placeholder="Paste training dataset here...")
                train_btn = gr.Button("Start Training", variant="primary")
            train_output = gr.Textbox(label="Training Status", lines=2, interactive=False)
        train_btn.click(train_model, inputs=train_input, outputs=train_output)
    
    with gr.Tab("Fine-tune Model"):
        gr.Markdown("### Fine-tune Model with Specialized Data")
        with gr.Row():
            with gr.Column():
                finetune_input = gr.Textbox(label="Fine-tuning Data", lines=8, placeholder="Paste fine-tuning dataset here...")
                finetune_btn = gr.Button("Start Fine-tuning", variant="primary")
            finetune_output = gr.Textbox(label="Fine-tuning Status", lines=2, interactive=False)
        finetune_btn.click(finetune_model, inputs=finetune_input, outputs=finetune_output)
    
    with gr.Tab("Status"):
        gr.Markdown("### System Status")
        with gr.Row():
            with gr.Column():
                status_box = gr.Textbox(label="Current Status", interactive=False)
                progress_bar = gr.Slider(label="Progress", minimum=0, maximum=100, value=0, interactive=False)
                refresh_btn = gr.Button("Refresh Status", variant="secondary")
                auto_refresh = gr.Checkbox(label="Auto-refresh every 5 seconds", value=True)
            log_output = gr.Textbox(label="Process Logs", lines=8, interactive=False)
        
        refresh_btn.click(get_current_status, outputs=[status_box, progress_bar, log_output])
        demo.load(get_current_status, outputs=[status_box, progress_bar, log_output])

if __name__ == "__main__":
    demo.launch(server_port=7860, ssr_mode=False, share=False)