wuhp committed on
Commit c54a7a8 · verified · 1 Parent(s): a68cd78

Update app.py

Files changed (1)
  1. app.py +440 -208
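The updated loader accepts either full Roboflow URLs or bare workspace/project identifiers, one per line in the uploaded .txt file (see the reworked parse_roboflow_url in the diff below). A minimal example file, using made-up workspace and project names, could look like:

    https://universe.roboflow.com/acme-vision/widgets/3
    https://app.roboflow.com/acme-vision/gadgets
    acme-vision/sprockets/v2

Lines without an explicit version fall back to the project's latest version via get_latest_version.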
app.py CHANGED
@@ -3,7 +3,7 @@ import shutil
3
  import stat
4
  import yaml
5
  import gradio as gr
6
- from ultralytics import YOLO # Note: This is the training engine for RT-DETR in this library.
7
  from roboflow import Roboflow
8
  import re
9
  from urllib.parse import urlparse
@@ -40,22 +40,87 @@ RTDETR_MODELS = {
40
  }
41
  DEFAULT_MODEL = "rtdetr-l.pt"
42
 
43
- # --- Helper & Core Logic Functions ---
 
 
 
44
 
45
  def handle_remove_readonly(func, path, exc_info):
46
  """Error handler for shutil.rmtree."""
47
- os.chmod(path, stat.S_IWRITE)
 
 
 
48
  func(path)
49
 
50
- def parse_roboflow_url(url):
51
- """Parses Roboflow URL to get workspace, project, and version."""
52
- parsed = urlparse(url.strip())
53
- path_parts = parsed.path.strip('/').split('/')
54
- if len(path_parts) >= 3 and 'roboflow.com' in parsed.netloc:
55
- # Format: /workspace/project-id/version
56
- return path_parts[1], path_parts[2], path_parts[3] if len(path_parts) > 3 else None
57
  return None, None, None
58
 
 
59
  def get_latest_version(api_key, workspace, project):
60
  """Gets the latest version number of a Roboflow project."""
61
  try:
@@ -67,246 +132,348 @@ def get_latest_version(api_key, workspace, project):
67
  logging.error(f"Could not get latest version for {workspace}/{project}: {e}")
68
  return None
69
 
 
70
  def download_dataset(api_key, workspace, project, version):
71
- """Downloads a single dataset from Roboflow."""
72
  try:
73
  rf = Roboflow(api_key=api_key)
74
  proj = rf.workspace(workspace).project(project)
75
- # RT-DETR trains perfectly with the yolov8 format.
76
- dataset = proj.version(int(version)).download("yolov8")
77
-
78
- with open(os.path.join(dataset.location, 'data.yaml'), 'r') as f:
 
79
  data_yaml = yaml.safe_load(f)
80
-
81
  class_names = data_yaml.get('names', [])
82
- splits = [s for s in ['train', 'valid', 'test'] if os.path.exists(os.path.join(dataset.location, s))]
83
-
 
84
  return dataset.location, class_names, splits, f"{project}-v{version}"
85
  except Exception as e:
86
  logging.error(f"Failed to download {workspace}/{project}/v{version}: {e}")
87
  return None, [], [], None
88
89
  def gather_class_counts(dataset_info, class_mapping):
90
- """Calculates image counts for each final class based on the mapping."""
91
- unified_names = set(class_mapping.values())
92
- counts = {name: 0 for name in unified_names}
93
- if not dataset_info: return counts
94
 
95
  for loc, names, splits, _ in dataset_info:
96
  for split in splits:
97
  labels_dir = os.path.join(loc, split, 'labels')
98
- if not os.path.exists(labels_dir): continue
 
99
  for label_file in os.listdir(labels_dir):
100
- found_in_file = set()
 
 
101
  with open(os.path.join(labels_dir, label_file), 'r') as f:
102
  for line in f:
 
 
 
103
  try:
104
- class_id = int(line.split()[0])
105
- original_name = names[class_id]
106
- mapped_name = class_mapping.get(original_name, original_name)
107
- if mapped_name in unified_names:
108
- found_in_file.add(mapped_name)
109
- except (ValueError, IndexError):
110
  continue
111
- for cls in found_in_file:
112
- counts[cls] += 1
 
113
  return counts
114
 
 
115
  def finalize_merged_dataset(dataset_info, class_mapping, class_limits, progress=gr.Progress()):
116
- """The core function to merge datasets based on user rules."""
117
  merged_dir = 'rolo_merged_dataset'
118
  if os.path.exists(merged_dir):
119
  shutil.rmtree(merged_dir, onerror=handle_remove_readonly)
120
-
121
  progress(0, desc="Creating directories...")
122
  for split in ['train', 'valid', 'test']:
123
  os.makedirs(os.path.join(merged_dir, split, 'images'), exist_ok=True)
124
  os.makedirs(os.path.join(merged_dir, split, 'labels'), exist_ok=True)
125
 
126
- active_classes = sorted([cls for cls, limit in class_limits.items() if limit > 0])
 
 
127
  final_class_map = {name: i for i, name in enumerate(active_classes)}
128
 
 
129
  all_images = []
130
  for loc, _, splits, _ in dataset_info:
131
  for split in splits:
132
  img_dir = os.path.join(loc, split, 'images')
133
- if not os.path.exists(img_dir): continue
 
134
  for img_file in os.listdir(img_dir):
135
  if img_file.lower().endswith(('.jpg', '.jpeg', '.png')):
136
  all_images.append((os.path.join(img_dir, img_file), split, loc))
137
  random.shuffle(all_images)
138
-
139
  progress(0.2, desc="Selecting images based on limits...")
140
- selected_images = set()
141
  current_counts = {cls: 0 for cls in active_classes}
142
 
143
- for img_path, original_split, source_loc in progress.tqdm(all_images, desc="Analyzing images"):
144
- lbl_path = img_path.replace('/images/', '/labels/').rsplit('.', 1)[0] + '.txt'
145
- if not os.path.exists(lbl_path): continue
146
-
147
  image_classes = set()
148
  with open(lbl_path, 'r') as f:
149
  for line in f:
 
 
 
150
  try:
151
- source_names = next(info[1] for info in dataset_info if info[0] == source_loc)
152
- original_name = source_names[int(line.split()[0])]
153
- mapped_name = class_mapping.get(original_name, original_name)
154
- if mapped_name in active_classes:
155
- image_classes.add(mapped_name)
156
- except (ValueError, IndexError, StopIteration): continue
157
-
158
- can_add = True
159
- for cls in image_classes:
160
- if current_counts[cls] >= class_limits[cls]:
161
- can_add = False
162
- break
163
-
164
- if can_add and image_classes:
165
- selected_images.add((img_path, original_split))
166
- for cls in image_classes:
167
- current_counts[cls] += 1
168
-
 
169
  progress(0.6, desc=f"Copying {len(selected_images)} files...")
170
  for img_path, split in progress.tqdm(selected_images, desc="Finalizing files"):
171
- lbl_path = img_path.replace('/images/', '/labels/').rsplit('.', 1)[0] + '.txt'
172
- shutil.copy(img_path, os.path.join(merged_dir, split, 'images'))
173
-
174
- with open(lbl_path, 'r') as f_in, open(os.path.join(merged_dir, split, 'labels', os.path.basename(lbl_path)), 'w') as f_out:
175
  for line in f_in:
176
- parts = line.split()
 
 
177
  try:
178
- source_loc = next(info[0] for info in dataset_info if img_path.startswith(info[0]))
179
- source_names = next(info[1] for info in dataset_info if info[0] == source_loc)
180
- original_name = source_names[int(parts[0])]
181
  mapped_name = class_mapping.get(original_name, original_name)
182
  if mapped_name in final_class_map:
183
  new_id = final_class_map[mapped_name]
184
  f_out.write(f"{new_id} {' '.join(parts[1:])}\n")
185
- except (ValueError, IndexError, StopIteration): continue
 
186
 
187
  progress(0.95, desc="Creating data.yaml...")
188
  with open(os.path.join(merged_dir, 'data.yaml'), 'w') as f:
189
  yaml.dump({
190
- 'path': os.path.abspath(merged_dir), 'train': 'train/images', 'val': 'valid/images', 'test': 'test/images',
191
- 'nc': len(active_classes), 'names': active_classes
 
 
 
 
192
  }, f)
193
-
194
  return f"Dataset finalized with {len(selected_images)} images.", os.path.abspath(merged_dir)
195
 
196
 
197
- # --- Gradio UI Event Handlers ---
 
 
198
 
199
  def load_datasets_handler(api_key, url_file, progress=gr.Progress()):
200
  """Handles the 'Load Datasets' button click."""
201
- if not api_key: raise gr.Error("Roboflow API Key is required.")
202
- if not url_file: raise gr.Error("Please upload a .txt file with Roboflow URLs.")
 
 
 
203
 
204
- with open(url_file.name, 'r') as f:
205
  urls = [line.strip() for line in f if line.strip()]
206
-
207
  dataset_info = []
208
- for i, url in enumerate(urls):
209
- progress((i+1)/len(urls), desc=f"Processing URL {i+1}/{len(urls)}")
210
- workspace, project, version = parse_roboflow_url(url)
211
- if not all([workspace, project]):
212
- logging.warning(f"Invalid URL skipped: {url}")
 
 
213
  continue
214
- if not version:
215
- version = get_latest_version(api_key, workspace, project)
216
- if not version:
217
- logging.warning(f"Could not find version for {project}. Skipping.")
 
218
  continue
219
-
220
- loc, names, splits, name_str = download_dataset(api_key, workspace, project, str(version))
221
  if loc:
222
  dataset_info.append((loc, names, splits, name_str))
223
-
224
- if not dataset_info: raise gr.Error("No datasets were loaded successfully.")
 
 
 
 
 
225
 
226
  all_names = sorted(list(set(n for _, names, _, _ in dataset_info for n in names)))
227
  class_map = {name: name for name in all_names}
 
 
228
  initial_counts = gather_class_counts(dataset_info, class_map)
229
  df_data = [[name, name, initial_counts.get(name, 0), False] for name in all_names]
230
-
231
- return "Datasets loaded successfully. Proceed to the next tab to manage classes.", dataset_info, gr.DataFrame.update(value=pd.DataFrame(df_data, columns=["Original Name", "Rename To", "Max Images", "Remove"]))
232
 
233
  def update_class_counts_handler(class_df, dataset_info):
234
- """Provides live feedback on class counts as the user edits the DataFrame."""
235
- if class_df is None or not dataset_info: return None
236
- class_mapping = dict(zip(class_df["Original Name"], class_df["Rename To"]))
237
- updated_counts = gather_class_counts(dataset_info, class_mapping)
238
-
239
- merged_summary = {}
240
  for _, row in class_df.iterrows():
241
- if not row["Remove"]:
242
- rename_to = row["Rename To"]
243
- # This logic needs to be careful: sum counts of all original classes that map to the same `rename_to`
244
- # Let's recalculate based on mapping
245
- merged_summary[rename_to] = 0 # reset
246
-
247
- for original_name, rename_to in class_mapping.items():
248
- if rename_to in merged_summary:
249
- # find count for original name in its original mapped state
250
- original_count = gather_class_counts(dataset_info, {k:k for k in class_mapping.keys()}).get(original_name,0)
251
- is_removed = class_df.loc[class_df['Original Name'] == original_name, 'Remove'].iloc[0]
252
- if not is_removed:
253
- merged_summary[rename_to] += original_count
254
-
255
- final_summary = {}
256
- # Recalculate from scratch for simplicity and accuracy
257
- class_map_for_summary = dict(zip(class_df["Original Name"], class_df["Rename To"]))
258
- all_final_names = set(class_df[~class_df['Remove']]['Rename To'])
259
-
260
- final_counts = {name: 0 for name in all_final_names}
261
 
262
  for loc, names, splits, _ in dataset_info:
 
 
 
 
263
  for split in splits:
264
  labels_dir = os.path.join(loc, split, 'labels')
265
- if not os.path.exists(labels_dir): continue
 
266
  for label_file in os.listdir(labels_dir):
267
- found_in_file = set()
 
 
268
  with open(os.path.join(labels_dir, label_file), 'r') as f:
269
  for line in f:
 
 
 
270
  try:
271
- class_id = int(line.split()[0])
272
- original_name = names[class_id]
273
- is_removed = class_df.loc[class_df['Original Name'] == original_name, 'Remove'].iloc[0]
274
- if not is_removed:
275
- mapped_name = class_map_for_summary.get(original_name)
276
- if mapped_name:
277
- found_in_file.add(mapped_name)
278
- except (ValueError, IndexError, KeyError): continue
279
- for cls in found_in_file:
280
- final_counts[cls] += 1
281
-
282
- summary_df = pd.DataFrame(list(final_counts.items()), columns=["Final Class Name", "Est. Total Images"])
283
  return summary_df
284
 
 
285
  def finalize_handler(dataset_info, class_df, progress=gr.Progress()):
286
  """Handles the 'Finalize' button click."""
287
- if not dataset_info: raise gr.Error("Load datasets first in Tab 1.")
288
- if class_df is None: raise gr.Error("Class data is missing.")
289
-
290
- class_mapping = dict(zip(class_df["Original Name"], class_df["Rename To"]))
 
 
 
 
291
  class_limits = {}
292
  for _, row in class_df.iterrows():
293
- if not row["Remove"]:
294
- rename_to = row["Rename To"]
295
- class_limits[rename_to] = class_limits.get(rename_to, 0) + int(row["Max Images"])
296
-
297
  status, path = finalize_merged_dataset(dataset_info, class_mapping, class_limits, progress)
298
  return status, path
299
 
 
300
  def training_handler(dataset_path, model_filename, run_name, epochs, batch, imgsz, lr, opt, progress=gr.Progress()):
301
- """Handles the training process with real-time feedback."""
302
- if not dataset_path: raise gr.Error("Finalize a dataset in Tab 2 before training.")
 
 
 
 
303
 
304
  metrics_queue = Queue()
 
305
  def on_epoch_end(trainer):
 
 
306
  metrics_queue.put({
307
- 'epoch': trainer.epoch + 1, 'train_loss': trainer.metrics.get('train/loss'),
308
- 'val_loss': trainer.metrics.get('val/loss'), 'mAP50': trainer.metrics.get('metrics/mAP50(B)'),
309
- 'mAP50_95': trainer.metrics.get('metrics/mAP50-95(B)')
 
 
310
  })
311
 
312
  def train_thread_func():
@@ -315,22 +482,30 @@ def training_handler(dataset_path, model_filename, run_name, epochs, batch, imgs
315
  weights_path = os.path.join('pretrained_models', model_filename)
316
  if not os.path.exists(weights_path):
317
  os.makedirs('pretrained_models', exist_ok=True)
318
- r = requests.get(model_url, stream=True)
319
  r.raise_for_status()
320
  with open(weights_path, 'wb') as f:
321
  for chunk in r.iter_content(chunk_size=8192):
322
  f.write(chunk)
323
-
324
  model = YOLO(weights_path)
325
  model.add_callback("on_train_epoch_end", on_epoch_end)
 
326
  model.train(
327
- data=os.path.join(dataset_path, 'data.yaml'), epochs=epochs, batch=batch, imgsz=imgsz,
328
- lr0=lr, optimizer=opt, project='runs/train', name=run_name, exist_ok=True,
329
- device=0 if torch.cuda.is_available() else 'cpu'
330
  )
331
  metrics_queue.put("done")
332
  except Exception as e:
333
- logging.error(f"Training thread error: {e}")
334
  metrics_queue.put(f"error: {e}")
335
 
336
  Thread(target=train_thread_func, daemon=True).start()
@@ -339,38 +514,52 @@ def training_handler(dataset_path, model_filename, run_name, epochs, batch, imgs
339
  while True:
340
  item = metrics_queue.get()
341
  if isinstance(item, str):
342
- if item == "done": break
343
- if item.startswith("error"): raise gr.Error(f"Training failed: {item}")
344
-
345
- for key, val in item.items():
346
- if val is not None: history[key].append(val)
347
-
348
- current_epoch = history['epoch'][-1]
349
- progress(current_epoch / epochs, desc=f"Epoch {current_epoch}/{epochs}")
350
-
351
- # Gradio Plotting does not require clearing figures
352
- fig_loss = plt.figure(); ax_loss = fig_loss.add_subplot(111)
353
  ax_loss.plot(history['epoch'], history['train_loss'], "o-", label='Train Loss')
354
  ax_loss.plot(history['epoch'], history['val_loss'], "o-", label='Val Loss')
355
- ax_loss.legend(); ax_loss.set_title("Loss")
356
-
357
- fig_map = plt.figure(); ax_map = fig_map.add_subplot(111)
 
 
 
358
  ax_map.plot(history['epoch'], history['mAP50'], "o-", label='mAP@0.5')
359
  ax_map.plot(history['epoch'], history['mAP50_95'], "o-", label='mAP@0.5:0.95')
360
- ax_map.legend(); ax_map.set_title("mAP")
361
-
362
- yield f"Epoch {current_epoch}/{epochs} complete.", fig_loss, fig_map, None
 
363
 
364
- final_path = os.path.join('runs/train', run_name, 'weights/best.pt')
365
  if not os.path.exists(final_path):
366
  raise gr.Error("Training finished, but 'best.pt' was not found.")
367
-
368
  yield "Training complete!", None, None, gr.File.update(value=final_path, visible=True)
369
 
 
370
  def upload_handler(model_file, hf_token, hf_repo, gh_token, gh_repo, progress=gr.Progress()):
371
- """Handles the model upload to Hugging Face and GitHub."""
372
- if not model_file: raise gr.Error("No trained model file available to upload. Train a model first.")
373
-
 
374
  hf_status = "Skipped Hugging Face (credentials not provided)."
375
  if hf_token and hf_repo:
376
  progress(0, desc="Uploading to Hugging Face...")
@@ -379,54 +568,71 @@ def upload_handler(model_file, hf_token, hf_repo, gh_token, gh_repo, progress=gr
379
  HfFolder.save_token(hf_token)
380
  repo_url = api.create_repo(repo_id=hf_repo, exist_ok=True, token=hf_token)
381
  api.upload_file(
382
- path_or_fileobj=model_file.name, path_in_repo=os.path.basename(model_file.name),
383
- repo_id=hf_repo, token=hf_token
 
 
384
  )
385
  hf_status = f"Success! Model at: {repo_url}"
386
- except Exception as e: hf_status = f"Hugging Face Error: {e}"
 
387
 
388
  gh_status = "Skipped GitHub (credentials not provided)."
389
  if gh_token and gh_repo:
390
  progress(0.5, desc="Uploading to GitHub...")
391
  try:
 
 
 
392
  username, repo_name = gh_repo.split('/')
393
  api_url = f"https://api.github.com/repos/{username}/{repo_name}/contents/{os.path.basename(model_file.name)}"
394
  headers = {"Authorization": f"token {gh_token}"}
395
-
396
- with open(model_file.name, "rb") as f: content = base64.b64encode(f.read()).decode()
397
-
398
- get_resp = requests.get(api_url, headers=headers)
 
399
  sha = get_resp.json().get('sha') if get_resp.ok else None
400
-
401
- data = {"message": "Upload trained model from Rolo app", "content": content, "sha": sha}
402
- put_resp = requests.put(api_url, headers=headers, json={k: v for k, v in data.items() if v is not None})
403
-
404
- if put_resp.ok: gh_status = f"Success! Model at: {put_resp.json()['content']['html_url']}"
405
- else: gh_status = f"GitHub Error: {put_resp.json().get('message', 'Unknown')}"
406
- except Exception as e: gh_status = f"GitHub Error: {e}"
407
-
 
  progress(1)
409
  return hf_status, gh_status
410
 
411
- # --- Gradio UI Layout ---
 
 
 
412
  with gr.Blocks(theme=gr.themes.Soft(primary_hue="sky")) as app:
413
  gr.Markdown("# Rolo: A Dedicated RT-DETR Training Dashboard")
414
-
415
  # State variables
416
  dataset_info_state = gr.State([])
417
  final_dataset_path_state = gr.State(None)
418
 
419
  with gr.Tabs():
420
  with gr.TabItem("1. Prepare Datasets"):
421
- gr.Markdown("### Load Roboflow Datasets\nProvide your Roboflow API key and upload a `.txt` file containing one Roboflow dataset URL per line.")
422
  with gr.Row():
423
- rf_api_key = gr.Textbox(label="Roboflow API Key", type="password", scale=2)
424
  rf_url_file = gr.File(label="Upload Roboflow URLs (.txt)", file_types=[".txt"], scale=1)
425
  load_btn = gr.Button("Load Datasets", variant="primary")
426
  dataset_status = gr.Textbox(label="Status", interactive=False)
427
-
428
  with gr.TabItem("2. Manage & Merge"):
429
- gr.Markdown("### Configure Classes and Finalize Dataset\nRename classes to merge them, set image limits, or remove them. Click **Update Counts** to see a preview of your changes, then click **Finalize** to create the dataset.")
430
  with gr.Row():
431
  class_df = gr.DataFrame(
432
  headers=["Original Name", "Rename To", "Max Images", "Remove"],
@@ -434,9 +640,13 @@ with gr.Blocks(theme=gr.themes.Soft(primary_hue="sky")) as app:
434
  label="Class Configuration", interactive=True, scale=3
435
  )
436
  with gr.Column(scale=1):
437
- class_count_summary_df = gr.DataFrame(label="Merged Class Counts Preview", headers=["Final Class Name", "Est. Total Images"], interactive=False)
 
 
 
 
438
  update_counts_btn = gr.Button("Update Counts")
439
-
440
  finalize_btn = gr.Button("Finalize Merged Dataset", variant="primary")
441
  finalize_status = gr.Textbox(label="Status", interactive=False)
442
 
@@ -444,13 +654,15 @@ with gr.Blocks(theme=gr.themes.Soft(primary_hue="sky")) as app:
444
  gr.Markdown("### Set Hyperparameters and Train the RT-DETR Model")
445
  with gr.Row():
446
  with gr.Column(scale=1):
447
- model_file_dd = gr.Dropdown(label="Select Pre-Trained RT-DETR Model",
448
- choices=[m["filename"] for m in RTDETR_MODELS["detection"]], value=DEFAULT_MODEL)
 
 
 
449
  run_name_tb = gr.Textbox(label="Run Name", value="rtdetr_run_1")
450
  epochs_sl = gr.Slider(1, 500, 100, step=1, label="Epochs")
451
  batch_sl = gr.Slider(1, 32, 8, step=1, label="Batch Size")
452
  imgsz_num = gr.Number(label="Image Size", value=640)
453
- # <<< FIXED: Removed the 'format' argument which is not supported.
454
  lr_num = gr.Number(label="Learning Rate", value=0.001)
455
  opt_dd = gr.Dropdown(["Adam", "AdamW", "SGD"], value="Adam", label="Optimizer")
456
  train_btn = gr.Button("Start Training", variant="primary")
@@ -476,14 +688,34 @@ with gr.Blocks(theme=gr.themes.Soft(primary_hue="sky")) as app:
476
  hf_status = gr.Textbox(label="Hugging Face Status", interactive=False)
477
  gh_status = gr.Textbox(label="GitHub Status", interactive=False)
478
 
479
- # --- Wire UI handlers ---
480
- load_btn.click(fn=load_datasets_handler, inputs=[rf_api_key, rf_url_file], outputs=[dataset_status, dataset_info_state, class_df])
481
- update_counts_btn.click(fn=update_class_counts_handler, inputs=[class_df, dataset_info_state], outputs=[class_count_summary_df])
482
- finalize_btn.click(fn=finalize_handler, inputs=[dataset_info_state, class_df], outputs=[finalize_status, final_dataset_path_state])
483
- train_btn.click(fn=training_handler,
484
- inputs=[final_dataset_path_state, model_file_dd, run_name_tb, epochs_sl, batch_sl, imgsz_num, lr_num, opt_dd],
485
- outputs=[train_status, loss_plot, map_plot, final_model_file])
486
- upload_btn.click(fn=upload_handler, inputs=[final_model_file, hf_token, hf_repo, gh_token, gh_repo], outputs=[hf_status, gh_status])
487
 
488
  if __name__ == "__main__":
489
- app.launch(debug=True)
 
 
 
3
  import stat
4
  import yaml
5
  import gradio as gr
6
+ from ultralytics import YOLO # Ultralytics RT-DETR runner
7
  from roboflow import Roboflow
8
  import re
9
  from urllib.parse import urlparse
 
40
  }
41
  DEFAULT_MODEL = "rtdetr-l.pt"
42
 
43
+
44
+ # ------------------------------
45
+ # Utilities
46
+ # ------------------------------
47
 
48
  def handle_remove_readonly(func, path, exc_info):
49
  """Error handler for shutil.rmtree."""
50
+ try:
51
+ os.chmod(path, stat.S_IWRITE)
52
+ except Exception:
53
+ pass
54
  func(path)
55
 
56
+
57
+ _ROBO_URL_RX = re.compile(
58
+ r"""
59
+ ^(?:
60
+ (?:https?://)?(?:universe|app|www)?\.?roboflow\.com/ # Any roboflow host
61
+ (?P<ws>[A-Za-z0-9\-_]+)/ # workspace
62
+ (?P<proj>[A-Za-z0-9\-_]+)/? # project
63
+ (?:
64
+ (?:dataset/[^/]+/)? # optional 'dataset/<fmt>/'
65
+ (?:v?(?P<ver>\d+))? # optional version 'vN' or 'N'
66
+ )?
67
+ |
68
+ (?P<ws2>[A-Za-z0-9\-_]+)/(?P<proj2>[A-Za-z0-9\-_]+)(?:/(?:v)?(?P<ver2>\d+))? # raw ws/proj[/vN]
69
+ )$
70
+ """,
71
+ re.VERBOSE | re.IGNORECASE
72
+ )
73
+
74
+ def parse_roboflow_url(s: str):
75
+ """
76
+ Accepts:
77
+ - https://universe.roboflow.com/<workspace>/<project>[/vN | /N]
78
+ - https://app.roboflow.com/<workspace>/<project>[/vN | /N]
79
+ - https://roboflow.com/<workspace>/<project>[/vN | /N]
80
+ - raw: <workspace>/<project>[/vN | /N]
81
+ Returns: (workspace, project, version_or_None)
82
+ """
83
+ s = s.strip()
84
+ # Fast path: try regex
85
+ m = _ROBO_URL_RX.match(s)
86
+ if m:
87
+ ws = m.group('ws') or m.group('ws2')
88
+ proj = m.group('proj') or m.group('proj2')
89
+ ver = m.group('ver') or m.group('ver2')
90
+ return ws, proj, (int(ver) if ver else None)
91
+
92
+ # Fallback: parse like URL and split path
93
+ parsed = urlparse(s)
94
+ parts = [p for p in parsed.path.strip('/').split('/') if p]
95
+ if len(parts) >= 2:
96
+ # Try to pull raw version from the 3rd part if it exists
97
+ version = None
98
+ if len(parts) >= 3:
99
+ # Accept 'vN' or 'N'
100
+ vpart = parts[2]
101
+ if vpart.lower().startswith('v') and vpart[1:].isdigit():
102
+ version = int(vpart[1:])
103
+ elif vpart.isdigit():
104
+ version = int(vpart)
105
+ return parts[0], parts[1], version
106
+
107
+ # Fallback raw "ws/proj" without slashes in URL
108
+ if '/' in s and 'roboflow' not in s:
109
+ p = s.split('/')
110
+ if len(p) >= 2:
111
+ # Accept trailing version if present
112
+ version = None
113
+ if len(p) >= 3:
114
+ v = p[2]
115
+ if v.lower().startswith('v') and v[1:].isdigit():
116
+ version = int(v[1:])
117
+ elif v.isdigit():
118
+ version = int(v)
119
+ return p[0], p[1], version
120
+
121
  return None, None, None
122
 
123
+
124
  def get_latest_version(api_key, workspace, project):
125
  """Gets the latest version number of a Roboflow project."""
126
  try:
 
132
  logging.error(f"Could not get latest version for {workspace}/{project}: {e}")
133
  return None
134
 
135
+
136
  def download_dataset(api_key, workspace, project, version):
137
+ """Downloads a single dataset from Roboflow (yolov8 format works fine for RT-DETR)."""
138
  try:
139
  rf = Roboflow(api_key=api_key)
140
  proj = rf.workspace(workspace).project(project)
141
+ ver = proj.version(int(version))
142
+ dataset = ver.download("yolov8")
143
+
144
+ data_yaml_path = os.path.join(dataset.location, 'data.yaml')
145
+ with open(data_yaml_path, 'r') as f:
146
  data_yaml = yaml.safe_load(f)
147
+
148
  class_names = data_yaml.get('names', [])
149
+ splits = [s for s in ['train', 'valid', 'test']
150
+ if os.path.exists(os.path.join(dataset.location, s))]
151
+
152
  return dataset.location, class_names, splits, f"{project}-v{version}"
153
  except Exception as e:
154
  logging.error(f"Failed to download {workspace}/{project}/v{version}: {e}")
155
  return None, [], [], None
156
 
157
+
158
+ def label_path_for(img_path: str) -> str:
159
+ """Convert .../split/images/file.jpg -> .../split/labels/file.txt in a safe way."""
160
+ split_dir = os.path.dirname(os.path.dirname(img_path)) # .../split
161
+ base = os.path.splitext(os.path.basename(img_path))[0] + '.txt'
162
+ return os.path.join(split_dir, 'labels', base)
163
+
164
+
165
  def gather_class_counts(dataset_info, class_mapping):
166
+ """
167
+ Count, per final class, how many images contain at least one instance of that class
168
+ (counted once per image). class_mapping maps original_name -> final_name.
169
+ """
170
+ if not dataset_info:
171
+ return {}
172
+
173
+ final_names = set(class_mapping.values())
174
+ counts = {name: 0 for name in final_names}
175
 
176
  for loc, names, splits, _ in dataset_info:
177
+ # Map from original idx -> mapped name (or None if removed later)
178
+ id_to_name = {}
179
+ for idx, n in enumerate(names):
180
+ id_to_name[idx] = class_mapping.get(n, None)
181
+
182
  for split in splits:
183
  labels_dir = os.path.join(loc, split, 'labels')
184
+ if not os.path.exists(labels_dir):
185
+ continue
186
  for label_file in os.listdir(labels_dir):
187
+ if not label_file.endswith('.txt'):
188
+ continue
189
+ found = set()
190
  with open(os.path.join(labels_dir, label_file), 'r') as f:
191
  for line in f:
192
+ parts = line.strip().split()
193
+ if not parts:
194
+ continue
195
  try:
196
+ cls_id = int(parts[0])
197
+ mapped = id_to_name.get(cls_id, None)
198
+ if mapped in final_names:
199
+ found.add(mapped)
200
+ except Exception:
 
201
  continue
202
+ for m in found:
203
+ counts[m] += 1
204
+
205
  return counts
206
 
207
+
208
  def finalize_merged_dataset(dataset_info, class_mapping, class_limits, progress=gr.Progress()):
209
+ """Core function to merge datasets based on user rules."""
210
  merged_dir = 'rolo_merged_dataset'
211
  if os.path.exists(merged_dir):
212
  shutil.rmtree(merged_dir, onerror=handle_remove_readonly)
213
+
214
  progress(0, desc="Creating directories...")
215
  for split in ['train', 'valid', 'test']:
216
  os.makedirs(os.path.join(merged_dir, split, 'images'), exist_ok=True)
217
  os.makedirs(os.path.join(merged_dir, split, 'labels'), exist_ok=True)
218
 
219
+ # Only classes with positive limits are active
220
+ active_classes = [cls for cls, limit in class_limits.items() if limit > 0]
221
+ active_classes = sorted(set(active_classes))
222
  final_class_map = {name: i for i, name in enumerate(active_classes)}
223
 
224
+ # Collect all candidate images
225
  all_images = []
226
  for loc, _, splits, _ in dataset_info:
227
  for split in splits:
228
  img_dir = os.path.join(loc, split, 'images')
229
+ if not os.path.exists(img_dir):
230
+ continue
231
  for img_file in os.listdir(img_dir):
232
  if img_file.lower().endswith(('.jpg', '.jpeg', '.png')):
233
  all_images.append((os.path.join(img_dir, img_file), split, loc))
234
  random.shuffle(all_images)
235
+
236
  progress(0.2, desc="Selecting images based on limits...")
237
+ selected_images = []
238
  current_counts = {cls: 0 for cls in active_classes}
239
 
240
+ # Build a quick lookup: source_loc -> names list
241
+ loc_to_names = {info[0]: info[1] for info in dataset_info}
242
+
243
+ for img_path, split, source_loc in progress.tqdm(all_images, desc="Analyzing images"):
244
+ lbl_path = label_path_for(img_path)
245
+ if not os.path.exists(lbl_path):
246
+ continue
247
+
248
+ source_names = loc_to_names.get(source_loc, [])
249
  image_classes = set()
250
  with open(lbl_path, 'r') as f:
251
  for line in f:
252
+ parts = line.strip().split()
253
+ if not parts:
254
+ continue
255
  try:
256
+ cls_id = int(parts[0])
257
+ orig = source_names[cls_id]
258
+ mapped = class_mapping.get(orig, orig)
259
+ if mapped in active_classes:
260
+ image_classes.add(mapped)
261
+ except Exception:
262
+ continue
263
+
264
+ if not image_classes:
265
+ continue
266
+
267
+ # Check limits
268
+ if any(current_counts[c] >= class_limits[c] for c in image_classes):
269
+ continue
270
+
271
+ selected_images.append((img_path, split))
272
+ for c in image_classes:
273
+ current_counts[c] += 1
274
+
275
  progress(0.6, desc=f"Copying {len(selected_images)} files...")
276
  for img_path, split in progress.tqdm(selected_images, desc="Finalizing files"):
277
+ lbl_path = label_path_for(img_path)
278
+ out_img = os.path.join(merged_dir, split, 'images', os.path.basename(img_path))
279
+ out_lbl = os.path.join(merged_dir, split, 'labels', os.path.basename(lbl_path))
280
+ shutil.copy(img_path, out_img)
281
+
282
+ # Determine source names by matching the parent dataset root
283
+ source_loc = None
284
+ for info in dataset_info:
285
+ if img_path.startswith(info[0]):
286
+ source_loc = info[0]
287
+ break
288
+ source_names = loc_to_names.get(source_loc, [])
289
+
290
+ with open(lbl_path, 'r') as f_in, open(out_lbl, 'w') as f_out:
291
  for line in f_in:
292
+ parts = line.strip().split()
293
+ if not parts:
294
+ continue
295
  try:
296
+ old_id = int(parts[0])
297
+ original_name = source_names[old_id]
 
298
  mapped_name = class_mapping.get(original_name, original_name)
299
  if mapped_name in final_class_map:
300
  new_id = final_class_map[mapped_name]
301
  f_out.write(f"{new_id} {' '.join(parts[1:])}\n")
302
+ except Exception:
303
+ continue
304
 
305
  progress(0.95, desc="Creating data.yaml...")
306
  with open(os.path.join(merged_dir, 'data.yaml'), 'w') as f:
307
  yaml.dump({
308
+ 'path': os.path.abspath(merged_dir),
309
+ 'train': 'train/images',
310
+ 'val': 'valid/images',
311
+ 'test': 'test/images',
312
+ 'nc': len(active_classes),
313
+ 'names': active_classes
314
  }, f)
315
+
316
  return f"Dataset finalized with {len(selected_images)} images.", os.path.abspath(merged_dir)
317
 
318
 
319
+ # ------------------------------
320
+ # Gradio UI Event Handlers
321
+ # ------------------------------
322
 
323
  def load_datasets_handler(api_key, url_file, progress=gr.Progress()):
324
  """Handles the 'Load Datasets' button click."""
325
+ api_key = api_key or os.getenv("ROBOFLOW_API_KEY", "")
326
+ if not api_key:
327
+ raise gr.Error("Roboflow API Key is required (or set ROBOFLOW_API_KEY).")
328
+ if not url_file:
329
+ raise gr.Error("Please upload a .txt file with Roboflow URLs or lines like 'workspace/project[/vN]'.")
330
 
331
+ with open(url_file.name, 'r', encoding='utf-8', errors='ignore') as f:
332
  urls = [line.strip() for line in f if line.strip()]
333
+
334
  dataset_info = []
335
+ failures = []
336
+
337
+ for i, raw in enumerate(urls):
338
+ progress((i + 1) / max(1, len(urls)), desc=f"Parsing {i+1}/{len(urls)}")
339
+ ws, proj, ver = parse_roboflow_url(raw)
340
+ if not (ws and proj):
341
+ failures.append((raw, "ParseError: could not resolve workspace/project"))
342
  continue
343
+
344
+ if ver is None:
345
+ ver = get_latest_version(api_key, ws, proj)
346
+ if ver is None:
347
+ failures.append((raw, f"Could not resolve latest version for {ws}/{proj}"))
348
  continue
349
+
350
+ loc, names, splits, name_str = download_dataset(api_key, ws, proj, int(ver))
351
  if loc:
352
  dataset_info.append((loc, names, splits, name_str))
353
+ else:
354
+ failures.append((raw, f"DownloadError: {ws}/{proj}/v{ver}"))
355
+
356
+ if not dataset_info:
357
+ # Show a compact failure report to the UI
358
+ msg = "No datasets were loaded successfully.\n" + "\n".join([f"- {u}: {why}" for u, why in failures[:10]])
359
+ raise gr.Error(msg)
360
 
361
  all_names = sorted(list(set(n for _, names, _, _ in dataset_info for n in names)))
362
  class_map = {name: name for name in all_names}
363
+
364
+ # Initial preview uses "keep all" mapping
365
  initial_counts = gather_class_counts(dataset_info, class_map)
366
  df_data = [[name, name, initial_counts.get(name, 0), False] for name in all_names]
367
+ status_text = "Datasets loaded successfully."
368
+ if failures:
369
+ status_text += f" ({len(dataset_info)} OK, {len(failures)} failed; see console logs)."
370
+
371
+ return status_text, dataset_info, gr.DataFrame.update(
372
+ value=pd.DataFrame(df_data, columns=["Original Name", "Rename To", "Max Images", "Remove"])
373
+ )
374
+
375
 
376
  def update_class_counts_handler(class_df, dataset_info):
377
+ """
378
+ Provides live feedback on class counts as the user edits the DataFrame.
379
+ We compute a mapping of original -> final (or None if removed), then count images
380
+ for each final name.
381
+ """
382
+ if class_df is None or not dataset_info:
383
+ return None
384
+
385
+ # Build mapping original_name -> final_name or None if removed
386
+ class_df = pd.DataFrame(class_df)
387
+ mapping = {}
388
  for _, row in class_df.iterrows():
389
+ orig = row["Original Name"]
390
+ if bool(row["Remove"]):
391
+ mapping[orig] = None
392
+ else:
393
+ mapping[orig] = row["Rename To"]
394
+
395
+ # Build final set
396
+ final_names = sorted(set(v for v in mapping.values() if v))
397
+ counts = {k: 0 for k in final_names}
398
 
399
  for loc, names, splits, _ in dataset_info:
400
+ id_to_final = {}
401
+ for idx, n in enumerate(names):
402
+ id_to_final[idx] = mapping.get(n, None)
403
+
404
  for split in splits:
405
  labels_dir = os.path.join(loc, split, 'labels')
406
+ if not os.path.exists(labels_dir):
407
+ continue
408
  for label_file in os.listdir(labels_dir):
409
+ if not label_file.endswith('.txt'):
410
+ continue
411
+ found = set()
412
  with open(os.path.join(labels_dir, label_file), 'r') as f:
413
  for line in f:
414
+ parts = line.strip().split()
415
+ if not parts:
416
+ continue
417
  try:
418
+ cls_id = int(parts[0])
419
+ mapped = id_to_final.get(cls_id, None)
420
+ if mapped:
421
+ found.add(mapped)
422
+ except Exception:
423
+ continue
424
+ for m in found:
425
+ counts[m] += 1
426
+
427
+ summary_df = pd.DataFrame(list(counts.items()), columns=["Final Class Name", "Est. Total Images"])
 
 
428
  return summary_df
429
 
430
+
431
  def finalize_handler(dataset_info, class_df, progress=gr.Progress()):
432
  """Handles the 'Finalize' button click."""
433
+ if not dataset_info:
434
+ raise gr.Error("Load datasets first in Tab 1.")
435
+ if class_df is None:
436
+ raise gr.Error("Class data is missing.")
437
+
438
+ # Mapping and limits
439
+ class_df = pd.DataFrame(class_df)
440
+ class_mapping = {}
441
  class_limits = {}
442
  for _, row in class_df.iterrows():
443
+ orig = row["Original Name"]
444
+ if bool(row["Remove"]):
445
+ continue
446
+ final_name = row["Rename To"]
447
+ class_mapping[orig] = final_name
448
+ # Sum limits for final_name over any merged originals
449
+ class_limits[final_name] = class_limits.get(final_name, 0) + int(row["Max Images"])
450
+
451
+ # Any original not present in mapping will map to itself (keep behavior)
452
+ # BUT we do not want to include classes with 0 limit in the final dataset
453
+ # finalize_merged_dataset uses the limits dict to decide active classes.
454
  status, path = finalize_merged_dataset(dataset_info, class_mapping, class_limits, progress)
455
  return status, path
456
 
457
+
458
  def training_handler(dataset_path, model_filename, run_name, epochs, batch, imgsz, lr, opt, progress=gr.Progress()):
459
+ """Handles the training process with live feedback."""
460
+ if not dataset_path:
461
+ raise gr.Error("Finalize a dataset in Tab 2 before training.")
462
+
463
+ # Ultralytics expects device string, e.g. '0' or 'cpu'
464
+ device_str = "0" if torch.cuda.is_available() else "cpu"
465
 
466
  metrics_queue = Queue()
467
+
468
  def on_epoch_end(trainer):
469
+ # Be defensive about metric keys
470
+ m = trainer.metrics or {}
471
  metrics_queue.put({
472
+ 'epoch': (trainer.epoch or 0) + 1,
473
+ 'train_loss': m.get('train/loss') or m.get('loss'),
474
+ 'val_loss': m.get('val/loss'),
475
+ 'mAP50': m.get('metrics/mAP50(B)') or m.get('metrics/mAP50'),
476
+ 'mAP50_95': m.get('metrics/mAP50-95(B)') or m.get('metrics/mAP50-95')
477
  })
478
 
479
  def train_thread_func():
 
482
  weights_path = os.path.join('pretrained_models', model_filename)
483
  if not os.path.exists(weights_path):
484
  os.makedirs('pretrained_models', exist_ok=True)
485
+ r = requests.get(model_url, stream=True, timeout=60)
486
  r.raise_for_status()
487
  with open(weights_path, 'wb') as f:
488
  for chunk in r.iter_content(chunk_size=8192):
489
  f.write(chunk)
490
+
491
  model = YOLO(weights_path)
492
  model.add_callback("on_train_epoch_end", on_epoch_end)
493
+
494
  model.train(
495
+ data=os.path.join(dataset_path, 'data.yaml'),
496
+ epochs=int(epochs),
497
+ batch=int(batch),
498
+ imgsz=int(imgsz),
499
+ lr0=float(lr),
500
+ optimizer=str(opt),
501
+ project='runs/train',
502
+ name=str(run_name),
503
+ exist_ok=True,
504
+ device=device_str
505
  )
506
  metrics_queue.put("done")
507
  except Exception as e:
508
+ logging.exception("Training thread error")
509
  metrics_queue.put(f"error: {e}")
510
 
511
  Thread(target=train_thread_func, daemon=True).start()
 
514
  while True:
515
  item = metrics_queue.get()
516
  if isinstance(item, str):
517
+ if item == "done":
518
+ break
519
+ if item.startswith("error"):
520
+ raise gr.Error(f"Training failed: {item}")
521
+
522
+ # Append metrics
523
+ for key in ['epoch', 'train_loss', 'val_loss', 'mAP50', 'mAP50_95']:
524
+ val = item.get(key, None)
525
+ if val is not None:
526
+ history[key].append(val)
527
+
528
+ current_epoch = history['epoch'][-1] if history['epoch'] else 0
529
+ total_epochs = int(epochs)
530
+ frac = min(max(current_epoch / max(1, total_epochs), 0.0), 1.0)
531
+ progress(frac, desc=f"Epoch {current_epoch}/{total_epochs}")
532
+
533
+ # Plot Loss
534
+ fig_loss = plt.figure()
535
+ ax_loss = fig_loss.add_subplot(111)
536
  ax_loss.plot(history['epoch'], history['train_loss'], "o-", label='Train Loss')
537
  ax_loss.plot(history['epoch'], history['val_loss'], "o-", label='Val Loss')
538
+ ax_loss.legend()
539
+ ax_loss.set_title("Loss")
540
+
541
+ # Plot mAP
542
+ fig_map = plt.figure()
543
+ ax_map = fig_map.add_subplot(111)
544
  ax_map.plot(history['epoch'], history['mAP50'], "o-", label='mAP@0.5')
545
  ax_map.plot(history['epoch'], history['mAP50_95'], "o-", label='mAP@0.5:0.95')
546
+ ax_map.legend()
547
+ ax_map.set_title("mAP")
548
+
549
+ yield f"Epoch {current_epoch}/{total_epochs} complete.", fig_loss, fig_map, None
550
 
551
+ final_path = os.path.join('runs', 'train', str(run_name), 'weights', 'best.pt')
552
  if not os.path.exists(final_path):
553
  raise gr.Error("Training finished, but 'best.pt' was not found.")
554
+
555
  yield "Training complete!", None, None, gr.File.update(value=final_path, visible=True)
556
 
557
+
558
  def upload_handler(model_file, hf_token, hf_repo, gh_token, gh_repo, progress=gr.Progress()):
559
+ """Handles model upload to Hugging Face and GitHub."""
560
+ if not model_file:
561
+ raise gr.Error("No trained model file available to upload. Train a model first.")
562
+
563
  hf_status = "Skipped Hugging Face (credentials not provided)."
564
  if hf_token and hf_repo:
565
  progress(0, desc="Uploading to Hugging Face...")
 
568
  HfFolder.save_token(hf_token)
569
  repo_url = api.create_repo(repo_id=hf_repo, exist_ok=True, token=hf_token)
570
  api.upload_file(
571
+ path_or_fileobj=model_file.name,
572
+ path_in_repo=os.path.basename(model_file.name),
573
+ repo_id=hf_repo,
574
+ token=hf_token
575
  )
576
  hf_status = f"Success! Model at: {repo_url}"
577
+ except Exception as e:
578
+ hf_status = f"Hugging Face Error: {e}"
579
 
580
  gh_status = "Skipped GitHub (credentials not provided)."
581
  if gh_token and gh_repo:
582
  progress(0.5, desc="Uploading to GitHub...")
583
  try:
584
+ if '/' not in gh_repo:
585
+ raise ValueError("GitHub repo must be in the form 'username/repo'.")
586
+
587
  username, repo_name = gh_repo.split('/')
588
  api_url = f"https://api.github.com/repos/{username}/{repo_name}/contents/{os.path.basename(model_file.name)}"
589
  headers = {"Authorization": f"token {gh_token}"}
590
+
591
+ with open(model_file.name, "rb") as f:
592
+ content = base64.b64encode(f.read()).decode()
593
+
594
+ get_resp = requests.get(api_url, headers=headers, timeout=30)
595
  sha = get_resp.json().get('sha') if get_resp.ok else None
596
+
597
+ data = {"message": "Upload trained model from Rolo app", "content": content}
598
+ if sha:
599
+ data["sha"] = sha
600
+
601
+ put_resp = requests.put(api_url, headers=headers, json=data, timeout=60)
602
+
603
+ if put_resp.ok:
604
+ gh_status = f"Success! Model at: {put_resp.json()['content']['html_url']}"
605
+ else:
606
+ msg = put_resp.json().get('message', 'Unknown')
607
+ gh_status = f"GitHub Error: {msg}"
608
+ except Exception as e:
609
+ gh_status = f"GitHub Error: {e}"
610
+
611
  progress(1)
612
  return hf_status, gh_status
613
 
614
+
615
+ # ------------------------------
616
+ # Gradio UI
617
+ # ------------------------------
618
  with gr.Blocks(theme=gr.themes.Soft(primary_hue="sky")) as app:
619
  gr.Markdown("# Rolo: A Dedicated RT-DETR Training Dashboard")
620
+
621
  # State variables
622
  dataset_info_state = gr.State([])
623
  final_dataset_path_state = gr.State(None)
624
 
625
  with gr.Tabs():
626
  with gr.TabItem("1. Prepare Datasets"):
627
+ gr.Markdown("### Load Roboflow Datasets\nProvide your Roboflow API key and upload a `.txt` file containing one Roboflow dataset URL or `workspace/project[/vN]` per line.")
628
  with gr.Row():
629
+ rf_api_key = gr.Textbox(label="Roboflow API Key (or set ROBOFLOW_API_KEY env)", type="password", scale=2)
630
  rf_url_file = gr.File(label="Upload Roboflow URLs (.txt)", file_types=[".txt"], scale=1)
631
  load_btn = gr.Button("Load Datasets", variant="primary")
632
  dataset_status = gr.Textbox(label="Status", interactive=False)
633
+
634
  with gr.TabItem("2. Manage & Merge"):
635
+ gr.Markdown("### Configure Classes and Finalize Dataset\nRename classes to merge them, set image limits, or remove them. Click **Update Counts** to preview, then **Finalize** to create the dataset.")
636
  with gr.Row():
637
  class_df = gr.DataFrame(
638
  headers=["Original Name", "Rename To", "Max Images", "Remove"],
 
640
  label="Class Configuration", interactive=True, scale=3
641
  )
642
  with gr.Column(scale=1):
643
+ class_count_summary_df = gr.DataFrame(
644
+ label="Merged Class Counts Preview",
645
+ headers=["Final Class Name", "Est. Total Images"],
646
+ interactive=False
647
+ )
648
  update_counts_btn = gr.Button("Update Counts")
649
+
650
  finalize_btn = gr.Button("Finalize Merged Dataset", variant="primary")
651
  finalize_status = gr.Textbox(label="Status", interactive=False)
652
 
 
654
  gr.Markdown("### Set Hyperparameters and Train the RT-DETR Model")
655
  with gr.Row():
656
  with gr.Column(scale=1):
657
+ model_file_dd = gr.Dropdown(
658
+ label="Select Pre-Trained RT-DETR Model",
659
+ choices=[m["filename"] for m in RTDETR_MODELS["detection"]],
660
+ value=DEFAULT_MODEL
661
+ )
662
  run_name_tb = gr.Textbox(label="Run Name", value="rtdetr_run_1")
663
  epochs_sl = gr.Slider(1, 500, 100, step=1, label="Epochs")
664
  batch_sl = gr.Slider(1, 32, 8, step=1, label="Batch Size")
665
  imgsz_num = gr.Number(label="Image Size", value=640)
 
666
  lr_num = gr.Number(label="Learning Rate", value=0.001)
667
  opt_dd = gr.Dropdown(["Adam", "AdamW", "SGD"], value="Adam", label="Optimizer")
668
  train_btn = gr.Button("Start Training", variant="primary")
 
688
  hf_status = gr.Textbox(label="Hugging Face Status", interactive=False)
689
  gh_status = gr.Textbox(label="GitHub Status", interactive=False)
690
 
691
+ # Wire UI handlers
692
+ load_btn.click(
693
+ fn=load_datasets_handler,
694
+ inputs=[rf_api_key, rf_url_file],
695
+ outputs=[dataset_status, dataset_info_state, class_df]
696
+ )
697
+ update_counts_btn.click(
698
+ fn=update_class_counts_handler,
699
+ inputs=[class_df, dataset_info_state],
700
+ outputs=[class_count_summary_df]
701
+ )
702
+ finalize_btn.click(
703
+ fn=finalize_handler,
704
+ inputs=[dataset_info_state, class_df],
705
+ outputs=[finalize_status, final_dataset_path_state]
706
+ )
707
+ train_btn.click(
708
+ fn=training_handler,
709
+ inputs=[final_dataset_path_state, model_file_dd, run_name_tb, epochs_sl, batch_sl, imgsz_num, lr_num, opt_dd],
710
+ outputs=[train_status, loss_plot, map_plot, final_model_file]
711
+ )
712
+ upload_btn.click(
713
+ fn=upload_handler,
714
+ inputs=[final_model_file, hf_token, hf_repo, gh_token, gh_repo],
715
+ outputs=[hf_status, gh_status]
716
+ )
717
 
718
  if __name__ == "__main__":
719
+ # Tip: silence Ultralytics settings warning by setting env var:
720
+ # export YOLO_CONFIG_DIR=/tmp/Ultralytics
721
+ app.launch(debug=True)
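
As a quick sanity check of the new parser, the sketch below exercises the formats listed in the parse_roboflow_url docstring. It assumes app.py is importable from the working directory (importing it builds, but does not launch, the Gradio app), and the workspace/project names are invented:

    # Sketch only: hypothetical names, assumes app.py is on the import path.
    from app import parse_roboflow_url

    examples = [
        "https://universe.roboflow.com/acme-vision/widgets/3",  # full URL with version
        "https://app.roboflow.com/acme-vision/widgets",         # full URL, no version
        "acme-vision/widgets/v3",                               # raw workspace/project/vN
        "not-a-roboflow-link",                                  # should not parse
    ]
    for s in examples:
        print(s, "->", parse_roboflow_url(s))
    # Expected: ('acme-vision', 'widgets', 3), ('acme-vision', 'widgets', None),
    # ('acme-vision', 'widgets', 3), and (None, None, None), respectively.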