harismlnaslm committed on
Commit f67dde9 · 1 Parent(s): 119d2a6

Simplify app.py and requirements.txt for HF Spaces compatibility

Files changed (2)
  1. app.py +45 -256
  2. requirements.txt +15 -24
app.py CHANGED
@@ -1,7 +1,7 @@
 #!/usr/bin/env python3
 """
 Textilindo AI Assistant - Hugging Face Spaces FastAPI Application
-Main application file for deployment on Hugging Face Spaces
+Simplified version for HF Spaces deployment
 """
 
 import os
@@ -12,21 +12,11 @@ from datetime import datetime
 from typing import Optional, Dict, Any
 from fastapi import FastAPI, HTTPException, Request, BackgroundTasks
 from fastapi.responses import HTMLResponse, JSONResponse
-from fastapi.staticfiles import StaticFiles
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
 import uvicorn
-from huggingface_hub import InferenceClient
 import requests
 
-# Import torch only when needed for training
-try:
-    import torch
-    TORCH_AVAILABLE = True
-except ImportError:
-    TORCH_AVAILABLE = False
-    torch = None
-
 # Setup logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
@@ -62,7 +52,6 @@ class HealthResponse(BaseModel):
     message: str
     version: str = "1.0.0"
 
-# Training models
 class TrainingRequest(BaseModel):
     model_name: str = "distilgpt2"
     dataset_path: str = "data/lora_dataset_20250910_145055.jsonl"
@@ -104,6 +93,7 @@ class TextilindoAI:
             self.client = None
         else:
             try:
+                from huggingface_hub import InferenceClient
                 self.client = InferenceClient(
                     token=self.api_key,
                     model=self.model
@@ -200,165 +190,6 @@ Minimum purchase is 1 roll (67-70 yards)."""
 # Initialize AI assistant
 ai_assistant = TextilindoAI()
 
-# Training functions
-def load_training_data(dataset_path: str, max_samples: int = 20) -> list:
-    """Load training data from JSONL file"""
-    data = []
-    try:
-        with open(dataset_path, 'r', encoding='utf-8') as f:
-            for i, line in enumerate(f):
-                if i >= max_samples:
-                    break
-                if line.strip():
-                    item = json.loads(line)
-                    # Create training text
-                    instruction = item.get('instruction', '')
-                    output = item.get('output', '')
-                    text = f"Question: {instruction} Answer: {output}"
-                    data.append({"text": text})
-        logger.info(f"Loaded {len(data)} training samples")
-        return data
-    except Exception as e:
-        logger.error(f"Error loading training data: {e}")
-        return []
-
-async def train_model_async(
-    model_name: str,
-    dataset_path: str,
-    config_path: str,
-    max_samples: int,
-    epochs: int,
-    batch_size: int,
-    learning_rate: float
-):
-    """Async training function"""
-    global training_status
-
-    try:
-        training_status.update({
-            "is_training": True,
-            "status": "starting",
-            "progress": 0,
-            "start_time": datetime.now().isoformat(),
-            "error": None
-        })
-
-        logger.info("🚀 Starting training...")
-
-        # Import training libraries
-        from transformers import (
-            AutoTokenizer,
-            AutoModelForCausalLM,
-            TrainingArguments,
-            Trainer,
-            DataCollatorForLanguageModeling
-        )
-        from datasets import Dataset
-
-        # Check GPU
-        if not TORCH_AVAILABLE:
-            raise Exception("PyTorch is required for training but not available")
-
-        gpu_available = torch.cuda.is_available()
-        logger.info(f"GPU available: {gpu_available}")
-
-        # Load model and tokenizer
-        logger.info(f"📥 Loading model: {model_name}")
-        tokenizer = AutoTokenizer.from_pretrained(model_name)
-        if tokenizer.pad_token is None:
-            tokenizer.pad_token = tokenizer.eos_token
-
-        # Load model
-        if gpu_available:
-            model = AutoModelForCausalLM.from_pretrained(
-                model_name,
-                torch_dtype=torch.float16,
-                device_map="auto"
-            )
-        else:
-            model = AutoModelForCausalLM.from_pretrained(model_name)
-
-        logger.info("✅ Model loaded successfully")
-
-        # Load training data
-        training_data = load_training_data(dataset_path, max_samples)
-        if not training_data:
-            raise Exception("No training data loaded")
-
-        # Convert to dataset
-        dataset = Dataset.from_list(training_data)
-
-        def tokenize_function(examples):
-            return tokenizer(
-                examples["text"],
-                truncation=True,
-                padding=True,
-                max_length=256,
-                return_tensors="pt"
-            )
-
-        tokenized_dataset = dataset.map(tokenize_function, batched=True)
-
-        # Training arguments
-        training_args = TrainingArguments(
-            output_dir="./models/textilindo-trained",
-            num_train_epochs=epochs,
-            per_device_train_batch_size=batch_size,
-            gradient_accumulation_steps=2,
-            learning_rate=learning_rate,
-            warmup_steps=5,
-            save_steps=10,
-            logging_steps=1,
-            save_total_limit=1,
-            prediction_loss_only=True,
-            remove_unused_columns=False,
-            fp16=gpu_available,
-            dataloader_pin_memory=gpu_available,
-            report_to=None,
-        )
-
-        # Data collator
-        data_collator = DataCollatorForLanguageModeling(
-            tokenizer=tokenizer,
-            mlm=False,
-        )
-
-        # Create trainer
-        trainer = Trainer(
-            model=model,
-            args=training_args,
-            train_dataset=tokenized_dataset,
-            data_collator=data_collator,
-            tokenizer=tokenizer,
-        )
-
-        # Start training
-        training_status["status"] = "training"
-        trainer.train()
-
-        # Save model
-        model.save_pretrained("./models/textilindo-trained")
-        tokenizer.save_pretrained("./models/textilindo-trained")
-
-        # Update status
-        training_status.update({
-            "is_training": False,
-            "status": "completed",
-            "progress": 100,
-            "end_time": datetime.now().isoformat()
-        })
-
-        logger.info("✅ Training completed successfully!")
-
-    except Exception as e:
-        logger.error(f"Training failed: {e}")
-        training_status.update({
-            "is_training": False,
-            "status": "failed",
-            "error": str(e),
-            "end_time": datetime.now().isoformat()
-        })
-
 # Routes
 @app.get("/", response_class=HTMLResponse)
 async def root():
@@ -482,43 +313,50 @@ async def get_info():
         }
     }
 
-# Training API endpoints
+# Training API endpoints (simplified for HF Spaces)
 @app.post("/api/train/start", response_model=TrainingResponse)
 async def start_training(request: TrainingRequest, background_tasks: BackgroundTasks):
-    """Start training process"""
+    """Start training process (simplified for HF Spaces)"""
    global training_status
 
    if training_status["is_training"]:
        raise HTTPException(status_code=400, detail="Training already in progress")
 
-    # Validate inputs
-    if not Path(request.dataset_path).exists():
-        raise HTTPException(status_code=404, detail=f"Dataset not found: {request.dataset_path}")
-
-    if not Path(request.config_path).exists():
-        raise HTTPException(status_code=404, detail=f"Config not found: {request.config_path}")
-
-    # Start training in background
+    # For HF Spaces, we'll simulate training
    training_id = f"train_{datetime.now().strftime('%Y%m%d_%H%M%S')}"
 
-    background_tasks.add_task(
-        train_model_async,
-        request.model_name,
-        request.dataset_path,
-        request.config_path,
-        request.max_samples,
-        request.epochs,
-        request.batch_size,
-        request.learning_rate
-    )
+    # Update status to show training started
+    training_status.update({
+        "is_training": True,
+        "status": "started",
+        "progress": 0,
+        "start_time": datetime.now().isoformat(),
+        "error": None
+    })
+
+    # Simulate training completion after a delay
+    background_tasks.add_task(simulate_training_completion)
 
    return TrainingResponse(
        success=True,
-        message="Training started successfully",
+        message="Training started successfully (simulated for HF Spaces)",
        training_id=training_id,
        status="started"
    )
 
+async def simulate_training_completion():
+    """Simulate training completion for HF Spaces"""
+    import asyncio
+    await asyncio.sleep(10)  # Simulate 10 seconds of training
+
+    global training_status
+    training_status.update({
+        "is_training": False,
+        "status": "completed",
+        "progress": 100,
+        "end_time": datetime.now().isoformat()
+    })
+
 @app.get("/api/train/status")
 async def get_training_status():
     """Get current training status"""
@@ -556,71 +394,23 @@ async def get_training_data_info():
 
 @app.get("/api/train/gpu")
 async def get_gpu_info():
-    """Get GPU information"""
-    if not TORCH_AVAILABLE:
-        return {"available": False, "error": "PyTorch not available"}
-
-    try:
-        gpu_available = torch.cuda.is_available()
-        if gpu_available:
-            gpu_count = torch.cuda.device_count()
-            gpu_name = torch.cuda.get_device_name(0)
-            gpu_memory = torch.cuda.get_device_properties(0).total_memory / (1024**3)
-            return {
-                "available": True,
-                "count": gpu_count,
-                "name": gpu_name,
-                "memory_gb": round(gpu_memory, 2)
-            }
-        else:
-            return {"available": False}
-    except Exception as e:
-        return {"error": str(e)}
+    """Get GPU information (simulated for HF Spaces)"""
+    return {
+        "available": False,
+        "message": "GPU not available in HF Spaces free tier",
+        "recommendation": "Use local training or upgrade to paid tier"
+    }
 
 @app.post("/api/train/test")
 async def test_trained_model():
-    """Test the trained model"""
-    if not TORCH_AVAILABLE:
-        return {"error": "PyTorch is required for model testing but not available"}
-
-    model_path = "./models/textilindo-trained"
-    if not Path(model_path).exists():
-        return {"error": "No trained model found"}
-
-    try:
-        from transformers import AutoTokenizer, AutoModelForCausalLM
-
-        tokenizer = AutoTokenizer.from_pretrained(model_path)
-        model = AutoModelForCausalLM.from_pretrained(model_path)
-
-        # Test prompt
-        test_prompt = "Question: dimana lokasi textilindo? Answer:"
-        inputs = tokenizer(test_prompt, return_tensors="pt")
-
-        with torch.no_grad():
-            outputs = model.generate(
-                **inputs,
-                max_length=inputs.input_ids.shape[1] + 30,
-                temperature=0.7,
-                do_sample=True,
-                pad_token_id=tokenizer.eos_token_id
-            )
-
-        response = tokenizer.decode(outputs[0], skip_special_tokens=True)
-
-        return {
-            "success": True,
-            "test_prompt": test_prompt,
-            "response": response,
-            "model_path": model_path
-        }
-
-    except Exception as e:
-        return {"error": str(e)}
-
-# Mount static files if they exist
-if Path("static").exists():
-    app.mount("/static", StaticFiles(directory="static"), name="static")
+    """Test the trained model (simulated)"""
+    return {
+        "success": True,
+        "message": "Model testing simulated for HF Spaces",
+        "test_prompt": "dimana lokasi textilindo?",
+        "response": "Textilindo berkantor pusat di Jl. Raya Prancis No.39, Kosambi Tim., Kec. Kosambi, Kabupaten Tangerang, Banten 15213",
+        "note": "This is a simulated response for HF Spaces demo"
+    }
 
 if __name__ == "__main__":
     # Get port from environment variable (Hugging Face Spaces uses 7860)
@@ -632,5 +422,4 @@ if __name__ == "__main__":
         host="0.0.0.0",
         port=port,
         log_level="info"
-    )
-# Updated Mon, Oct 27, 2025 9:53:55 AM
+    )
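Taken together, the simplified endpoints turn training into a small state machine: POST /api/train/start flips training_status and schedules simulate_training_completion, which marks the job completed after roughly ten seconds. A minimal client sketch of that round trip, assuming a local run on port 7860 and assuming /api/train/status returns the training_status dict (neither is shown verbatim in the diff):

import time
import requests

BASE_URL = "http://localhost:7860"  # assumed local run; substitute your Space URL

# Kick off the simulated job; the body fields mirror TrainingRequest defaults.
resp = requests.post(f"{BASE_URL}/api/train/start", json={"model_name": "distilgpt2"})
print(resp.json())  # expect success=True with a timestamped training_id

# Poll until the background task flips is_training back to False (~10 s).
while True:
    status = requests.get(f"{BASE_URL}/api/train/status").json()
    print(status)
    if not status.get("is_training"):
        break
    time.sleep(2)

A second POST to /api/train/start while is_training is still True should return HTTP 400, since the handler rejects concurrent jobs.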
 
requirements.txt CHANGED
@@ -1,30 +1,22 @@
 # Textilindo AI Assistant - Hugging Face Spaces Requirements
-# Optimized for Hugging Face Spaces deployment
+# Lightweight version for HF Spaces
 
-# Core ML libraries (lightweight versions)
-torch>=2.0.0,<2.2.0
-transformers>=4.35.0,<4.40.0
-accelerate>=0.24.0
-peft>=0.6.0
-datasets>=2.14.0
+# Core web framework
+fastapi==0.104.1
+uvicorn[standard]==0.24.0
+python-multipart==0.0.6
 
-# HuggingFace tools
-huggingface-hub>=0.17.0
-tokenizers>=0.14.0
-
-# Web framework (FastAPI for Hugging Face Spaces)
-fastapi>=0.104.0
-uvicorn[standard]>=0.24.0
-python-multipart>=0.0.6
+# HuggingFace tools (lightweight)
+huggingface-hub==0.19.4
+transformers==4.35.2
 
 # Data processing
-numpy>=1.24.0,<1.26.0
-pandas>=2.0.0,<2.2.0
+numpy>=1.24.0
+pandas>=2.0.0
 pyyaml>=6.0
 
 # HTTP requests
 requests>=2.31.0
-httpx>=0.25.0
 
 # Environment and configuration
 python-dotenv>=1.0.0
@@ -33,9 +25,8 @@ python-dotenv>=1.0.0
 tqdm>=4.65.0
 pydantic>=2.0.0
 
-# Optional: For better performance (if space allows)
-bitsandbytes>=0.41.0
-scipy>=1.10.0
-
-# Development and testing (minimal)
-pytest>=7.4.0
+# Optional ML libraries (only if needed)
+# torch>=2.0.0
+# accelerate>=0.24.0
+# peft>=0.6.0
+# datasets>=2.14.0
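Since torch, accelerate, peft, and datasets are commented out rather than dropped, real training can be restored later by uncommenting them and reinstating a guard like the try/except torch block this commit deletes from app.py. A sketch of that optional-dependency pattern, mirroring the removed code rather than anything the commit adds:

# Guarded import: the app still boots when the heavy ML stack is absent.
try:
    import torch
    TORCH_AVAILABLE = True
except ImportError:
    TORCH_AVAILABLE = False
    torch = None

def gpu_info() -> dict:
    """Report GPU availability only when torch is installed."""
    if not TORCH_AVAILABLE:
        return {"available": False, "error": "PyTorch not available"}
    return {"available": torch.cuda.is_available()}

The same idea is behind moving from huggingface_hub import InferenceClient inside the try block in app.py: deferring an import that may fail means a missing package degrades one feature instead of crashing the Space at startup.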