quietlight/skraak_mcp - Change DMMB63IW75MSRMKX63LTIVRVA74FOERMGGCNYGC7BZRV76VIJURQC

first iteration of new calls summarise tool

Created by quietlight on March 12, 2026

DMMB63IW75MSRMKX63LTIVRVA74FOERMGGCNYGC7BZRV76VIJURQC

Dependencies

In channels

main

Change contents

File addition: calls_summarise.go (----------)

[3.22715]

package tools
import (
	"path/filepath"
	"sort"
	"strings"

	"skraak/utils"
)
// CallsSummariseInput defines the input for the calls-summarise tool.
//
// Folder is the directory handed to utils.FindDataFiles to locate the .data
// files that CallsSummarise will read.
type CallsSummariseInput struct {
	Folder string `json:"folder" jsonschema:"required,Path to folder containing .data files"`
}
// CallsSummariseOutput is the result produced by the calls-summarise tool.
//
//   - Segments: one entry per segment found, sorted by file then start time.
//   - DataFilesRead: number of .data files that parsed successfully.
//   - DataFilesSkipped: paths of .data files that failed to parse.
//   - TotalSegments: len(Segments).
//   - Filters: per-filter statistics, keyed by filter name.
//   - ReviewStatus: review-progress counters accumulated over all labels.
//   - Operators / Reviewers: sorted unique non-empty values from file metadata.
//   - Error: set only when the .data files could not be listed.
type CallsSummariseOutput struct {
	Segments         []SegmentSummary       `json:"segments"`
	DataFilesRead    int                    `json:"data_files_read"`
	DataFilesSkipped []string               `json:"data_files_skipped"`
	TotalSegments    int                    `json:"total_segments"`
	Filters          map[string]FilterStats `json:"filters"`
	ReviewStatus     ReviewStatus           `json:"review_status"`
	Operators        []string               `json:"operators"`
	Reviewers        []string               `json:"reviewers"`
	Error            *string                `json:"error,omitempty"`
}
// SegmentSummary describes one segment in the summary output: the file it
// belongs to (as produced by extractRelativePath), its start and end times as
// read from the .data file, and the labels attached to it.
type SegmentSummary struct {
	File      string         `json:"file"`
	StartTime float64        `json:"start_time"`
	EndTime   float64        `json:"end_time"`
	Labels    []LabelSummary `json:"labels"`
}
// LabelSummary represents a single label of a segment in the output.
//
// Filter, Certainty and Species are always emitted. CallType, Comment and
// Bookmark carry `omitempty`, so they are left out of the JSON when they hold
// their zero value ("" or false).
type LabelSummary struct {
	Filter    string `json:"filter"`
	Certainty int    `json:"certainty"`
	Species   string `json:"species"`
	CallType  string `json:"calltype,omitempty"`
	Comment   string `json:"comment,omitempty"`
	Bookmark  bool   `json:"bookmark,omitempty"`
}
// FilterStats contains per-filter statistics.
//
// CallsSummarise updates both fields once for every label that names the
// filter, so a segment carrying several labels from the same filter is counted
// once per label.
type FilterStats struct {
	// Segments is the number of labels recorded for this filter.
	Segments int            `json:"segments"`
	// Species maps a species name to the number of labels with that species.
	Species  map[string]int `json:"species"`
}
// ReviewStatus contains review progress statistics.
//
// All counters are per label, not per segment. Exactly one of Unreviewed,
// Confirmed and DontKnow is incremented for each label; the remaining three
// counters are independent of that classification.
type ReviewStatus struct {
	Unreviewed   int `json:"unreviewed"`   // certainty is neither 0 nor 100
	Confirmed    int `json:"confirmed"`    // certainty = 100
	DontKnow     int `json:"dont_know"`    // certainty = 0
	WithCallType int `json:"with_calltype"` // labels with a non-empty call type
	WithComments int `json:"with_comments"` // labels with a non-empty comment
	Bookmarked   int `json:"bookmarked"` // labels with the bookmark flag set
}
// CallsSummarise reads every .data file that utils.FindDataFiles returns for
// input.Folder and produces a combined summary of their segments and labels.
//
// The output holds one SegmentSummary per segment (sorted by file name, then
// start time), per-filter label counts, review-status counters, and the sorted
// unique operators and reviewers found in the files' metadata. A file that
// fails to parse is not fatal: its path is appended to DataFilesSkipped and
// processing continues with the next file.
//
// A non-nil error is returned only when the .data files cannot be listed; in
// that case output.Error carries the same message.
func CallsSummarise(input CallsSummariseInput) (CallsSummariseOutput, error) {
	// Initialise every slice/map up front so they encode as [] / {} rather
	// than null in JSON, on the error path as well as on success.
	output := CallsSummariseOutput{
		Segments:         make([]SegmentSummary, 0),
		DataFilesSkipped: make([]string, 0),
		Filters:          make(map[string]FilterStats),
		Operators:        make([]string, 0),
		Reviewers:        make([]string, 0),
	}

	// Find all .data files
	filePaths, err := utils.FindDataFiles(input.Folder)
	if err != nil {
		errMsg := err.Error()
		output.Error = &errMsg
		return output, err
	}

	// Track unique operators and reviewers
	operatorSet := make(map[string]struct{})
	reviewerSet := make(map[string]struct{})

	for _, path := range filePaths {
		df, err := utils.ParseDataFile(path)
		if err != nil {
			// Unparseable files are reported, not fatal. The path is recorded
			// exactly as FindDataFiles returned it.
			output.DataFilesSkipped = append(output.DataFilesSkipped, path)
			continue
		}
		output.DataFilesRead++

		if df.Meta != nil {
			if df.Meta.Operator != "" {
				operatorSet[df.Meta.Operator] = struct{}{}
			}
			if df.Meta.Reviewer != "" {
				reviewerSet[df.Meta.Reviewer] = struct{}{}
			}
		}

		// The display name depends only on the file, so compute it once
		// instead of once per segment.
		relPath := extractRelativePath(input.Folder, path)

		for _, seg := range df.Segments {
			// Non-nil even when the segment has no labels, so the JSON shows
			// "labels": [] instead of null.
			labels := make([]LabelSummary, 0, len(seg.Labels))

			for _, l := range seg.Labels {
				labels = append(labels, LabelSummary{
					Filter:    l.Filter,
					Certainty: l.Certainty,
					Species:   l.Species,
					CallType:  l.CallType,
					Comment:   l.Comment,
					Bookmark:  l.Bookmark,
				})

				// FilterStats is stored by value, so read-modify-write it.
				fs, ok := output.Filters[l.Filter]
				if !ok {
					fs = FilterStats{Species: make(map[string]int)}
				}
				fs.Segments++
				fs.Species[l.Species]++
				output.Filters[l.Filter] = fs

				// Each label falls into exactly one certainty bucket.
				switch l.Certainty {
				case 100:
					output.ReviewStatus.Confirmed++
				case 0:
					output.ReviewStatus.DontKnow++
				default:
					output.ReviewStatus.Unreviewed++
				}
				if l.CallType != "" {
					output.ReviewStatus.WithCallType++
				}
				if l.Comment != "" {
					output.ReviewStatus.WithComments++
				}
				if l.Bookmark {
					output.ReviewStatus.Bookmarked++
				}
			}

			output.Segments = append(output.Segments, SegmentSummary{
				File:      relPath,
				StartTime: seg.StartTime,
				EndTime:   seg.EndTime,
				Labels:    labels,
			})
		}
	}
	output.TotalSegments = len(output.Segments)

	// Convert sets to sorted slices (map iteration order is random).
	for op := range operatorSet {
		output.Operators = append(output.Operators, op)
	}
	for r := range reviewerSet {
		output.Reviewers = append(output.Reviewers, r)
	}
	sort.Strings(output.Operators)
	sort.Strings(output.Reviewers)

	// Sort segments by file, then start time. The stable sort keeps segments
	// that tie on both keys in the order they were read.
	sort.SliceStable(output.Segments, func(i, j int) bool {
		a, b := output.Segments[i], output.Segments[j]
		if a.File != b.File {
			return a.File < b.File
		}
		return a.StartTime < b.StartTime
	})

	return output, nil
}
// extractRelativePath derives the .wav file name that a .data file belongs to.
//
// Only the final element of dataPath is used. A trailing ".data" is removed,
// then the name is given a lowercase ".wav" extension: an existing ".wav" in
// any letter case is normalised, otherwise ".wav" is appended.
//
// e.g., "/folder/tx51_LISTENING_20260221_203004.WAV.data" -> "tx51_LISTENING_20260221_203004.wav"
//
// folder is not used by the current implementation; the parameter is kept so
// existing callers keep compiling. dataPath is expected to be a non-empty
// file path.
func extractRelativePath(folder, dataPath string) string {
	// filepath.Base honours the host OS path separator, which a plain search
	// for "/" does not.
	name := strings.TrimSuffix(filepath.Base(dataPath), ".data")

	const wavExt = ".wav"
	// Case-insensitive suffix check without allocating a lowercased copy.
	if n := len(name) - len(wavExt); n >= 0 && strings.EqualFold(name[n:], wavExt) {
		return name[:n] + wavExt
	}
	// No .wav extension present, add one.
	return name + wavExt
}

Insertion in cmd/calls.go at line 30 [5.1]
[4.36733]
[5.278]
```
	case "summarise":
		runCallsSummarise(args[1:])
```

Insertion in cmd/calls.go at line 47 [5.1]

[4.36822]

[5.629]

	fmt.Fprintf(os.Stderr, "  summarise    Summarise all .data files in a folder\n")

Insertion in cmd/calls.go at line 54 [5.1]

[6.6865]

[5.879]

	fmt.Fprintf(os.Stderr, "  skraak calls summarise --folder ./recordings > summary.json\n")

Insertion in cmd/calls.go at line 366 [5.1]

[7.35946]

	}
	// Output JSON to stdout
	enc := json.NewEncoder(os.Stdout)
	enc.SetIndent("", "  ")
	enc.Encode(output)
}
// runCallsSummarise handles the "calls summarise" subcommand
func runCallsSummarise(args []string) {
	fs := flag.NewFlagSet("calls summarise", flag.ExitOnError)
	folder := fs.String("folder", "", "Folder containing .data files (required)")
	fs.Usage = func() {
		fmt.Fprintf(os.Stderr, "Usage: skraak calls summarise [options]\n\n")
		fmt.Fprintf(os.Stderr, "Summarise all .data files in a folder.\n")
		fmt.Fprintf(os.Stderr, "Outputs JSON with segments array and summary statistics.\n\n")
		fmt.Fprintf(os.Stderr, "Options:\n")
		fs.PrintDefaults()
		fmt.Fprintf(os.Stderr, "\nOutput includes:\n")
		fmt.Fprintf(os.Stderr, "  - segments: array of all segments with labels\n")
		fmt.Fprintf(os.Stderr, "  - data_files_read: count of successfully parsed .data files\n")
		fmt.Fprintf(os.Stderr, "  - data_files_skipped: list of files that failed to parse\n")
		fmt.Fprintf(os.Stderr, "  - total_segments: total number of segments\n")
		fmt.Fprintf(os.Stderr, "  - filters: per-filter statistics (segments, species counts)\n")
		fmt.Fprintf(os.Stderr, "  - review_status: unreviewed/confirmed/dont_know counts\n")
		fmt.Fprintf(os.Stderr, "  - operators/reviewers: unique values found\n")
		fmt.Fprintf(os.Stderr, "\nExamples:\n")
		fmt.Fprintf(os.Stderr, "  skraak calls summarise --folder ./recordings > summary.json\n")
		fmt.Fprintf(os.Stderr, "  skraak calls summarise --folder ./recordings | jq 'del(.segments)'  # summary only\n")
	}
	if err := fs.Parse(args); err != nil {
		os.Exit(1)
	}
	// Validate required flags
	if *folder == "" {
		fmt.Fprintf(os.Stderr, "Error: --folder is required\n\n")
		fs.Usage()
		os.Exit(1)
	}
	input := tools.CallsSummariseInput{
		Folder: *folder,
	}
	fmt.Fprintf(os.Stderr, "Summarising .data files in: %s\n", *folder)
	output, err := tools.CallsSummarise(input)
	if err != nil {
		fmt.Fprintf(os.Stderr, "Error: %v\n", err)
		os.Exit(1)

Insertion in cmd/calls.go at line 420 [5.1]

[7.35949]


	fmt.Fprintf(os.Stderr, "Read %d .data files, skipped %d\n",
		output.DataFilesRead, len(output.DataFilesSkipped))
	fmt.Fprintf(os.Stderr, "Total segments: %d\n", output.TotalSegments)
	fmt.Fprintf(os.Stderr, "Filters: %d\n", len(output.Filters))
	fmt.Fprintf(os.Stderr, "Review status: %d unreviewed, %d confirmed, %d don't know\n",
		output.ReviewStatus.Unreviewed, output.ReviewStatus.Confirmed, output.ReviewStatus.DontKnow)

Insertion in CHANGELOG.md at line 4 [8.1]

[8.81]

[2.4218]


## [2026-03-13] Calls Summarise Command
**Feature:** New `skraak calls summarise` command to analyse .data files after classification.
**Changes:**
- `tools/calls_summarise.go` — New tool with `CallsSummarise()` function
- `cmd/calls.go` — Added `summarise` subcommand

Insertion in CHANGELOG.md at line 13 [8.1]

[2.4219]

**Usage:**
```bash
skraak calls summarise --folder ./recordings > summary.json
skraak calls summarise --folder ./recordings | jq 'del(.segments)'  # summary only
```
**Output structure:**
```json
{
  "segments": [...],
  "data_files_read": 27,
  "data_files_skipped": [],
  "total_segments": 47,
  "filters": {
    "opensoundscape-kiwi-1.2": {"segments": 20, "species": {"Kiwi": 15, "Don't Know": 5}}
  },
  "review_status": {
    "unreviewed": 30,
    "confirmed": 10,
    "dont_know": 5,
    "with_calltype": 8,
    "with_comments": 3,
    "bookmarked": 2
  },
  "operators": ["Auto"],
  "reviewers": ["David", "None"]
}
```
**Review status definitions:**
- `unreviewed`: 0 < certainty < 100 (default from detection)
- `confirmed`: certainty = 100 (user pressed bind key)
- `dont_know`: certainty = 0
**Rationale:**
After running `skraak classify` on .data files, it's difficult to understand the state of classifications. This command provides a comprehensive summary with both detailed segments array and aggregated statistics.

first iteration of new calls summarise tool

Dependencies

In channels

Change contents

File addition: calls_summarise.go (----------)

Insertion in cmd/calls.go at line 30 [5.1]

Insertion in cmd/calls.go at line 47 [5.1]

Insertion in cmd/calls.go at line 54 [5.1]

Insertion in cmd/calls.go at line 366 [5.1]

Insertion in cmd/calls.go at line 420 [5.1]

Insertion in CHANGELOG.md at line 4 [8.1]

Insertion in CHANGELOG.md at line 13 [8.1]