Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

CLN/MAINT: Vendor code, fix #262 #263

Merged
merged 14 commits into from
Feb 2, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 3 additions & 5 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -12,12 +12,10 @@ requires-python = ">=3.9"
dependencies = [
"appdirs >=1.4.4",
"attrs >=19.3.0",
"evfuncs >=0.3.5",
"birdsong-recognition-dataset >=0.3.2",
"numpy >=1.21.0",
"pandas >= 1.3.5",
"numpy >=1.22.0",
"pandas >= 1.4.0",
"pandera >= 0.9.0",
"scipy >=1.7.0",
"scipy >=1.8.0",
"SoundFile >=0.12.1",
]
version = "5.0.1"
Expand Down
10 changes: 4 additions & 6 deletions src/crowsetta/annotation.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
"""A class to represent annotations for a single file."""
from __future__ import annotations

from pathlib import Path
import reprlib
from pathlib import Path
from typing import Optional

import crowsetta
Expand Down Expand Up @@ -89,12 +89,10 @@ def __init__(

if seq:
if not (
isinstance(seq, crowsetta.Sequence) or
(isinstance(seq, list) and all([isinstance(seq_, crowsetta.Sequence) for seq_ in seq]))
isinstance(seq, crowsetta.Sequence)
or (isinstance(seq, list) and all([isinstance(seq_, crowsetta.Sequence) for seq_ in seq]))
):
raise TypeError(
f"``seq`` should be a crowsetta.Sequence or list of Sequences but was: {type(seq)}"
)
raise TypeError(f"``seq`` should be a crowsetta.Sequence or list of Sequences but was: {type(seq)}")
self.seq = seq

if bboxes:
Expand Down
194 changes: 188 additions & 6 deletions src/crowsetta/formats/seq/birdsongrec.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,19 +8,201 @@
Boundaries in the Birdsong with Variable Sequences. PLoS ONE 11(7): e0159188.
doi:10.1371/journal.pone.0159188
"""
from __future__ import annotations

import os
import pathlib
import warnings
import xml.etree.ElementTree as ET
from typing import ClassVar, List, Optional

import attr
import birdsongrec
import numpy as np
import soundfile

import crowsetta
from crowsetta.typing import PathLike


class BirdsongRecSyllable:
"""Object that represents a syllable.

Attributes
----------
position : int
starting sample number ("frame") within .wav file
*** relative to start of sequence! ***
length : int
duration given as number of samples
label : str
text representation of syllable as classified by a human
or a machine learning algorithm
"""

def __init__(self, position: int, length: int, label: str) -> None:
if not isinstance(position, int):
raise TypeError(f"position must be an int, not type {type(position)}")
if not isinstance(length, int):
raise TypeError(f"length must be an int, not type {type(length)}")
if not isinstance(label, str):
raise TypeError(f"label must be a string, not type {type(label)}")
self.position = position
self.length = length
self.label = label

def __repr__(self):
return f"BirdsongRecSyllable(position={self.position}, length={self.length}, label={self.label})"


class BirdsongRecSequence:
"""Class from birdsong-recognition
that represents a sequence of syllables.

Attributes
----------
wav_file : string
file name of .wav file in which sequence occurs
position : int
starting sample number within .wav file
length : int
duration given as number of samples
syls : list
list of syllable objects that make up sequence
seq_spect : spectrogram object
"""

def __init__(self, wav_file: PathLike, position: int, length: int, syl_list: list[BirdsongRecSyllable]):
if not isinstance(wav_file, (str, pathlib.Path)):
raise TypeError(f"wav_file must be a string or pathlib.Path, not type {type(wav_file)}")
wav_file = str(wav_file)
if not isinstance(position, int):
raise TypeError(f"position must be an int, not type {type(position)}")
if not isinstance(length, int):
raise TypeError(f"length must be an int, not type {type(length)}")
if not isinstance(syl_list, list):
raise TypeError(f"syl_list must be a list, not type {type(syl_list)}")
if not all([isinstance(syl, BirdsongRecSyllable) for syl in syl_list]):
raise TypeError("not all elements in syl list are of type BirdsongRecSyllable: " f"{syl_list}")
self.wav_file = wav_file
self.position = position
self.length = length
self.num_syls = len(syl_list)
self.syls = syl_list

def __repr__(self):
return f"Sequence(wav_file={self.wav_file}, position={self.position}, length={self.length}, syls={self.syls})"


def parse_xml(
xml_file: PathLike,
concat_seqs_into_songs: bool = False,
return_wav_abspath: bool = False,
wav_abspath: PathLike = None,
) -> list[BirdsongRecSequence]:
"""parses Annotation.xml files from the BirdsongRecognition dataset:
Koumura, T. (2016). BirdsongRecognition (Version 1). figshare.
https://doi.org/10.6084/m9.figshare.3470165.v1
https://figshare.com/articles/BirdsongRecognition/3470165

Parameters
----------
xml_file : str
filename of .xml file, e.g. 'Annotation.xml'
concat_seqs_into_songs : bool
if True, concatenate sequences into songs, where each .wav file is a
song. Default is False.
return_wav_abspath : bool
if True, change value for the wav_file field of sequences to absolute path,
instead of just the .wav file name (without a path). This option is
useful if you need to specify the path to data on your system.
Default is False, in which the .wav file name is returned as written in the
Annotation.xml file.
wav_abspath : str
Path to directory in which .wav files are found. Specify this if you have changed
the structure of the repository so that the .wav files are no longer in a
directory named Wave that's in the same parent directory as the Annotation.xml
file. Default is None, in which case the structure just described is assumed.

Returns
-------
seq_list : list of BirdsongrecSequence objects
if concat_seqs_into_songs is True, then each sequence will correspond to one song,
i.e., the annotation for one .wav file

Examples
--------
>>> seq_list = parse_xml(xml_file='./Bird0/Annotation.xml', concat_seqs_into_songs=False)
>>> seq_list[0]
Sequence from 0.wav with position 32000 and length 43168

Notes
-----
Parses files that adhere to this XML Schema document:
https://github.com/NickleDave/birdsong-recognition-dataset/blob/main/doc/xsd/AnnotationSchema.xsd
"""
if return_wav_abspath:
if wav_abspath:
if not os.path.isdir(wav_abspath):
raise NotADirectoryError(f"return_wav_abspath is True but {wav_abspath} " "is not a valid directory.")
tree = ET.ElementTree(file=xml_file)
seq_list = []
for seq in tree.iter(tag="Sequence"):
wav_file = seq.find("WaveFileName").text
if return_wav_abspath:
if wav_abspath:
wav_file = os.path.join(wav_abspath, wav_file)
else:
# assume .wav file is in Wave directory that's a child to wherever
# Annotation.xml file is kept (since this is how the repository is
# structured)
xml_dirname = os.path.dirname(xml_file)
wav_file = os.path.join(xml_dirname, "Wave", wav_file)
if not os.path.isfile(wav_file):
raise FileNotFoundError("File {wav_file} is not found")

position = int(seq.find("Position").text)
length = int(seq.find("Length").text)
syl_list = []
for syl in seq.iter(tag="Note"):
syl_position = int(syl.find("Position").text)
syl_length = int(syl.find("Length").text)
label = syl.find("Label").text

syl_obj = BirdsongRecSyllable(position=syl_position, length=syl_length, label=label)
syl_list.append(syl_obj)
seq_obj = BirdsongRecSequence(wav_file=wav_file, position=position, length=length, syl_list=syl_list)
seq_list.append(seq_obj)

if concat_seqs_into_songs:
song_list = []
curr_wav_file = seq_list[0].wav_file
new_seq_obj = seq_list[0]
for syl in new_seq_obj.syls:
syl.position += new_seq_obj.position

for seq in seq_list[1:]:
if seq.wav_file == curr_wav_file:
new_seq_obj.length += seq.length
new_seq_obj.num_syls += seq.num_syls
for syl in seq.syls:
syl.position += seq.position
new_seq_obj.syls += seq.syls

else:
song_list.append(new_seq_obj)
curr_wav_file = seq.wav_file
new_seq_obj = seq
for syl in new_seq_obj.syls:
syl.position += new_seq_obj.position

song_list.append(new_seq_obj) # to append last song

return song_list

else:
return seq_list


@crowsetta.interface.SeqLike.register
@attr.define
class BirdsongRec:
Expand All @@ -35,7 +217,7 @@ class BirdsongRec:
ext: str
Extension of files in annotation format: ``'.xml'``.
sequences: list
List of :class:`birdsongrec.Sequence` instances.
List of :class:`BirdsongRecSequence` instances.
annot_path: pathlib.Path
Path to file from which annotations were loaded.
Typically with filename 'Annotation.xml'.
Expand Down Expand Up @@ -85,7 +267,7 @@ class BirdsongRec:
name: ClassVar[str] = "birdsong-recognition-dataset"
ext: ClassVar[str] = ".xml"

sequences: List[birdsongrec.Sequence]
sequences: List[BirdsongRecSequence]
annot_path: pathlib.Path = attr.field(converter=pathlib.Path)
wav_path: Optional[pathlib.Path] = attr.field(default=None, converter=attr.converters.optional(pathlib.Path))

Expand Down Expand Up @@ -140,7 +322,7 @@ def from_file(

# `birdsong-recongition-dataset` has a 'Sequence' class
# but it is different from a `crowsetta.Sequence`
birdsongrec_seqs = birdsongrec.parse_xml(annot_path, concat_seqs_into_songs=concat_seqs_into_songs)
birdsongrec_seqs = parse_xml(annot_path, concat_seqs_into_songs=concat_seqs_into_songs)
return cls(sequences=birdsongrec_seqs, annot_path=annot_path, wav_path=wav_path)

def to_seq(
Expand All @@ -161,7 +343,7 @@ def to_seq(
samplerate : int
Sampling rate for wave files. Used to convert
``position`` and ``length`` attributes of
``birdsongrec.Syllable`` from sample number
``BirdsongrecSyllable`` from sample number
to seconds. Default is None, in which ths function
tries to open each .wav file and determine
the actual sampling rate. If this does not work,
Expand Down Expand Up @@ -262,7 +444,7 @@ def to_annot(
samplerate
Sampling rate for wave files. Used to convert
``position`` and ``length`` attributes of
``birdsongrec.Syllable`` from sample number
``BirdsongRecSyllable`` from sample number
to seconds. Default is None, in which ths function
tries to open each .wav file and determine
the actual sampling rate. If this does not work,
Expand Down
55 changes: 53 additions & 2 deletions src/crowsetta/formats/seq/notmat.py
Original file line number Diff line number Diff line change
@@ -1,18 +1,69 @@
"""Module with functions that handle .not.mat annotation files
produced by evsonganaly GUI.
"""
from __future__ import annotations

import pathlib
from typing import ClassVar, Dict, Optional

import attr
import evfuncs
import numpy as np
import scipy.io

import crowsetta
from crowsetta.typing import PathLike


def load_notmat(filename: PathLike) -> dict:
"""loads .not.mat files created by evsonganaly (Matlab GUI for labeling song)

Parameters
----------
filename : str
name of .not.mat file, can include path

Returns
-------
notmat_dict : dict
variables from .not.mat files

Examples
--------
>>> a_notmat = 'gy6or6_baseline_230312_0808.138.cbin.not.mat'
>>> notmat_dict = load_notmat(a_notmat)
>>> notmat_dict.keys()
dict_keys(['__header__', '__version__', '__globals__', 'Fs', 'fname', 'labels',
'onsets', 'offsets', 'min_int', 'min_dur', 'threshold', 'sm_win'])

Notes
-----
Basically a wrapper around `scipy.io.loadmat`. Calls `loadmat` with `squeeze_me=True`
to remove extra dimensions from arrays that `loadmat` parser sometimes adds.

Also note that **onsets and offsets from .not.mat files are in milliseconds**.
The GUI `evsonganaly` saves onsets and offsets in these units,
and we avoid converting them here for consistency and interoperability
with Matlab code.
"""
filename = pathlib.Path(filename)

# have to cast to str and call endswith because 'ext' from Path will just be .mat
if str(filename).endswith(".not.mat"):
pass
elif str(filename).endswith("cbin"):
filename = filename.parent.joinpath(filename.name + ".not.mat")
else:
ext = filename.suffix
raise ValueError(f"Filename should have extension .cbin.not.mat or .cbin but extension was: {ext}")
notmat_dict = scipy.io.loadmat(filename, squeeze_me=True)
# ensure that onsets and offsets are always arrays, not scalar
for key in ("onsets", "offsets"):
if np.isscalar(notmat_dict[key]): # `squeeze_me` makes them a ``float``, this will be True in that case
value = np.array(notmat_dict[key])[np.newaxis] # ``np.newaxis`` ensures 1-d array with shape (1,)
notmat_dict[key] = value
return notmat_dict


@crowsetta.interface.SeqLike.register
@attr.define
class NotMat:
Expand Down Expand Up @@ -70,7 +121,7 @@ def from_file(cls, annot_path: PathLike) -> "Self": # noqa: F821
"""
annot_path = pathlib.Path(annot_path)
crowsetta.validation.validate_ext(annot_path, extension=cls.ext)
notmat_dict = evfuncs.load_notmat(annot_path)
notmat_dict = load_notmat(annot_path)
# in .not.mat files saved by evsonganaly,
# onsets and offsets are in units of ms, have to convert to s
onsets = notmat_dict["onsets"] / 1000
Expand Down
6 changes: 3 additions & 3 deletions src/crowsetta/formats/seq/textgrid/parse.py
Original file line number Diff line number Diff line change
Expand Up @@ -173,7 +173,7 @@ def parse_fp(fp: TextIO, keep_empty: bool = False) -> dict:
}

tiers = []
for i in range(n_tier):
for _ in range(n_tier):
if not is_short:
fp.readline() # skip item[\d]: (where \d is some number)
tier_type = get_str_from_next_line(fp)
Expand All @@ -182,7 +182,7 @@ def parse_fp(fp: TextIO, keep_empty: bool = False) -> dict:
xmax_tier = get_float_from_next_line(fp)

entries = [] # intervals or points depending on tier type
for i in range(get_int_from_next_line(fp)):
for _ in range(get_int_from_next_line(fp)):
if not is_short:
fp.readline() # skip intervals [\d]
if tier_type == INTERVAL_TIER:
Expand Down Expand Up @@ -246,7 +246,7 @@ def parse(textgrid_path: str | pathlib.Path, keep_empty: bool = False) -> dict:
try:
with textgrid_path.open("r", encoding="utf-16") as fp:
textgrid_raw = parse_fp(fp, keep_empty)
except (UnicodeError, UnicodeDecodeError):
except UnicodeError:
with textgrid_path.open("r", encoding="utf-8") as fp:
textgrid_raw = parse_fp(fp, keep_empty)
return textgrid_raw
Loading
Loading