Spaces:

cricverse
/

CricAnnotate

Sleeping

App Files Files Community

ashu1069 committed on Mar 29

Commit

6f4b473

1 Parent(s): 624e18c

updates

Browse files

Files changed (1) hide show

app.py +13 -15

app.py CHANGED Viewed

@@ -54,39 +54,39 @@ class VideoAnnotator:
             # --- Start Edit: Filter out already annotated videos ---
             logger.info(f"Checking for existing annotations in {self.annotation_repo_id}")
             try:
                 annotated_files = self.api.list_repo_files(
                     repo_id=self.annotation_repo_id,
                     repo_type=self.annotation_repo_type,
-                    path_in_repo="annotations"
                 )
-                # Extract base video names from annotation filenames (e.g., "annotations/video1.mp4.jsonl" -> "video1.mp4")
                 annotated_video_basenames = set(
-                    os.path.basename(f).replace('.jsonl', '') for f in annotated_files if f.startswith("annotations/") and f.endswith(".jsonl")
                 )
                 logger.info(f"Found {len(annotated_video_basenames)} existing annotation files.")
-                # Filter the video list
                 self.video_files = [
-                    vf for vf in all_video_files
                     if os.path.basename(vf) not in annotated_video_basenames
                 ]
                 logger.info(f"Filtered list: {len(self.video_files)} videos remaining to be annotated.")
             except Exception as e:
                 logger.error(f"Could not list or process annotation files: {e}. Proceeding with all videos, but conflicts may occur.")
                 self.video_files = all_video_files # Fallback: load all if check fails
             # --- End Edit ---
-            # print(self.video_files) # Optional: keep if needed for debugging
-            # logger.info(f"Found {len(self.video_files)} video files") # Updated log message above
-            # print(f"Video files found: {self.video_files}") # Optional: keep if needed for debugging
             if not self.video_files:
                 logger.warning("No videos left to annotate!")
                 # Optionally, display a message in the UI here if possible
             return len(self.video_files) > 0
         except Exception as e:
             logger.error(f"Error accessing HuggingFace dataset: {e}")
@@ -261,7 +261,7 @@ def create_interface():
             with gr.Column(scale=2): # Column for Annotations and Save Button
                 annotation_components = []
-                gr.Markdown("### Annotations") # Header for the annotation section
                 # Display annotation radio buttons vertically in this column
                 for category, options in ANNOTATION_CATEGORIES.items():
@@ -271,7 +271,6 @@ def create_interface():
                     )
                     annotation_components.append(radio)
-                # --- Start Edit: Add Progress Display and attach change listeners ---
                 progress_display = gr.Markdown(value=update_progress(*[None]*total_categories)) # Initial progress
                 # Attach change listener to each radio button
@@ -281,7 +280,6 @@ def create_interface():
                         inputs=annotation_components,
                         outputs=progress_display
                     )
-                # --- End Edit ---
                 save_btn = gr.Button("Save Annotations", variant="primary")

             # --- Start Edit: Filter out already annotated videos ---
             logger.info(f"Checking for existing annotations in {self.annotation_repo_id}")
             try:
+                # List files in the 'annotations' directory of the annotation repo
                 annotated_files = self.api.list_repo_files(
                     repo_id=self.annotation_repo_id,
                     repo_type=self.annotation_repo_type,
+                    path_in_repo="annotations" # Specify the directory
                 )
+                # Extract base video names from annotation filenames
+                # e.g., "annotations/video1.mp4.jsonl" -> "video1.mp4"
                 annotated_video_basenames = set(
+                    os.path.basename(f).replace('.jsonl', '')
+                    for f in annotated_files
+                    if f.startswith("annotations/") and f.endswith(".jsonl") # Ensure it's in the correct folder and has the right extension
                 )
                 logger.info(f"Found {len(annotated_video_basenames)} existing annotation files.")
+                # Filter the video list: keep only videos whose basename is NOT in the annotated set
                 self.video_files = [
+                    vf for vf in all_video_files
                     if os.path.basename(vf) not in annotated_video_basenames
                 ]
                 logger.info(f"Filtered list: {len(self.video_files)} videos remaining to be annotated.")
             except Exception as e:
+                # Log error and fallback to using all videos if the check fails
                 logger.error(f"Could not list or process annotation files: {e}. Proceeding with all videos, but conflicts may occur.")
                 self.video_files = all_video_files # Fallback: load all if check fails
             # --- End Edit ---
             if not self.video_files:
                 logger.warning("No videos left to annotate!")
                 # Optionally, display a message in the UI here if possible
             return len(self.video_files) > 0
         except Exception as e:
             logger.error(f"Error accessing HuggingFace dataset: {e}")
             with gr.Column(scale=2): # Column for Annotations and Save Button
                 annotation_components = []
+                gr.Markdown("## Annotations") # Header for the annotation section
                 # Display annotation radio buttons vertically in this column
                 for category, options in ANNOTATION_CATEGORIES.items():
                     )
                     annotation_components.append(radio)
                 progress_display = gr.Markdown(value=update_progress(*[None]*total_categories)) # Initial progress
                 # Attach change listener to each radio button
                         inputs=annotation_components,
                         outputs=progress_display
                     )
                 save_btn = gr.Button("Save Annotations", variant="primary")