Spaces:

Vishwas1
/

LLMTrainingPro

Sleeping

App Files Files Community

Vishwas1 committed on Sep 17, 2024

Commit

2de0e9b

verified ·

1 Parent(s): a61270e

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -11

app.py CHANGED Viewed

@@ -38,7 +38,8 @@ class TrainingRequest(BaseModel):
     task: str  # 'generation' or 'classification'
     model_params: dict
     model_name: str
-    dataset_content: str  # The actual content of the dataset
 # Root Endpoint
 @app.get("/")
@@ -59,28 +60,27 @@ def train_model(request: TrainingRequest):
         session_dir = f"./training_sessions/{session_id}"
         os.makedirs(session_dir, exist_ok=True)
-        # Save the dataset content to a file
-        dataset_path = os.path.join(session_dir, "dataset.txt")
-        with open(dataset_path, "w", encoding="utf-8") as f:
-            f.write(request.dataset_content)
-        # Define the path to train_model.py (assuming it's in the root directory)
         TRAIN_MODEL_PATH = os.path.join(os.path.dirname(__file__), "train_model.py")
         cmd = [
             "python", TRAIN_MODEL_PATH,
             "--task", request.task,
             "--model_name", request.model_name,
-            "--dataset", os.path.abspath(dataset_path),
             "--num_layers", str(request.model_params.get('num_layers', 12)),
             "--attention_heads", str(request.model_params.get('attention_heads', 1)),
             "--hidden_size", str(request.model_params.get('hidden_size', 64)),
             "--vocab_size", str(request.model_params.get('vocab_size', 30000)),
             "--sequence_length", str(request.model_params.get('sequence_length', 512))
         ]
-        # Start the training process as a background task
-        subprocess.Popen(cmd, cwd=session_dir)
         logging.info(f"Training started for model: {request.model_name}, Session ID: {session_id}")
@@ -90,6 +90,11 @@ def train_model(request: TrainingRequest):
         logging.error(f"Error during training request: {str(e)}")
         raise HTTPException(status_code=500, detail=str(e))
 # Optional: Status Endpoint
 @app.get("/status/{session_id}")
 def get_status(session_id: str):

     task: str  # 'generation' or 'classification'
     model_params: dict
     model_name: str
+    dataset_name: str  # The name of the existing Hugging Face dataset
 # Root Endpoint
 @app.get("/")
         session_dir = f"./training_sessions/{session_id}"
         os.makedirs(session_dir, exist_ok=True)
+        # No need to save dataset content; use dataset_name directly
+        dataset_name = request.dataset_name
+        # Define the absolute path to train_model.py
         TRAIN_MODEL_PATH = os.path.join(os.path.dirname(__file__), "train_model.py")
+        # Prepare the command to run the training script with dataset_name
         cmd = [
             "python", TRAIN_MODEL_PATH,
             "--task", request.task,
             "--model_name", request.model_name,
+            "--dataset_name", dataset_name,  # Pass dataset_name instead of dataset file path
             "--num_layers", str(request.model_params.get('num_layers', 12)),
             "--attention_heads", str(request.model_params.get('attention_heads', 1)),
             "--hidden_size", str(request.model_params.get('hidden_size', 64)),
             "--vocab_size", str(request.model_params.get('vocab_size', 30000)),
             "--sequence_length", str(request.model_params.get('sequence_length', 512))
         ]
+        # Start the training process as a background task in the root directory
+        subprocess.Popen(cmd, cwd=os.path.dirname(__file__))
         logging.info(f"Training started for model: {request.model_name}, Session ID: {session_id}")
         logging.error(f"Error during training request: {str(e)}")
         raise HTTPException(status_code=500, detail=str(e))
+    except Exception as e:
+        logging.error(f"Error during training request: {str(e)}")
+        raise HTTPException(status_code=500, detail=str(e))
 # Optional: Status Endpoint
 @app.get("/status/{session_id}")
 def get_status(session_id: str):