diff --git a/WavCaps/retrieval/download_bert.py.py b/WavCaps/retrieval/download_bert.py.py new file mode 100644 index 0000000..76a8ac0 --- /dev/null +++ b/WavCaps/retrieval/download_bert.py.py @@ -0,0 +1,11 @@ +from transformers import AutoTokenizer, AutoModel + +tokenizer = AutoTokenizer.from_pretrained('bert-base-uncased') +model = AutoModel.from_pretrained('bert-base-uncased') + +# 简单测试一下 +test_text = "Hello world" +encoded = tokenizer(test_text, return_tensors="pt") +output = model(**encoded) +print(f"Model output shape: {output.last_hidden_state.shape}") +print("模型加载成功!") \ No newline at end of file diff --git a/WavCaps/retrieval/models/audio_encoder.py b/WavCaps/retrieval/models/audio_encoder.py index 40e96a1..2cfbd01 100644 --- a/WavCaps/retrieval/models/audio_encoder.py +++ b/WavCaps/retrieval/models/audio_encoder.py @@ -47,7 +47,8 @@ def __init__(self, config): config=config, ) if config["audio_encoder_args"]["pretrained"]: - audio_ckpt = torch.load("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT.ckpt", map_location="cpu")["state_dict"] + # audio_ckpt = torch.load("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT.ckpt", map_location="cpu")["state_dict"] + audio_ckpt = torch.load("/home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/pretrained_models/HTSAT.ckpt", map_location="cpu")["state_dict"] for key in list(audio_ckpt.keys()): if key.startswith('sed_model') and ('spectrogram_extractor' not in key and 'logmel_extractor' not in key): diff --git a/audioset_vggish_tensorflow_to_pytorch/README.md b/audioset_vggish_tensorflow_to_pytorch/README.md new file mode 100644 index 0000000..e49d533 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/README.md @@ -0,0 +1,32 @@ +# AudioSet VGGish in PyTorch + + +## Introduction +This repository includes: +- A script which converts the pretrained VGGish model provided in the AudioSet repository from TensorFlow to PyTorch +(along with a 
basic smoke test). +**Sourced from:** https://github.com/tensorflow/models/tree/master/research/audioset +- The VGGish architecture defined in PyTorch. +**Adapted from:** https://github.com/harritaylor/torchvggish +- The converted weights found in the [Releases](https://github.com/tcvrick/audioset-vggish-tensorflow-to-pytorch/releases) section. + +Please note that the converted model does not produce exactly the same results as the original model, but should be +close in most cases. + +## Usage +1. Download the pretrained weights and PCA parameters from the [AudioSet](https://github.com/tensorflow/models/tree/master/research/audioset) repository and place them in the working directory. +2. Install any dependencies required by [AudioSet](https://github.com/tensorflow/models/tree/master/research/audioset) (e.g., resampy, numpy, TensorFlow, etc.). +3. Run **"convert_to_pytorch.py"** to generate the PyTorch formatted weights for the VGGish model or download +the weights from the [Releases](https://github.com/tcvrick/audioset-vggish-tensorflow-to-pytorch/releases) section. + +## Example Usage +Please refer to the **"example_usage.py"** script. The output of the script should be as follows. + +``` +Input Shape: (3, 1, 96, 64) +Output Shape: (3, 128) +Computed Embedding Mean and Standard Deviation: 0.13079901 0.23851949 +Expected Embedding Mean and Standard Deviation: 0.131 0.238 +Computed Post-processed Embedding Mean and Standard Deviation: 123.01041666666667 75.51479501722199 +Expected Post-processed Embedding Mean and Standard Deviation: 123.0 75.0 +``` \ No newline at end of file diff --git a/audioset_vggish_tensorflow_to_pytorch/audioset/mel_features.py b/audioset_vggish_tensorflow_to_pytorch/audioset/mel_features.py new file mode 100644 index 0000000..ac58fb5 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/audioset/mel_features.py @@ -0,0 +1,223 @@ +# Copyright 2017 The TensorFlow Authors All Rights Reserved. 
+# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""Defines routines to compute mel spectrogram features from audio waveform.""" + +import numpy as np + + +def frame(data, window_length, hop_length): + """Convert array into a sequence of successive possibly overlapping frames. + + An n-dimensional array of shape (num_samples, ...) is converted into an + (n+1)-D array of shape (num_frames, window_length, ...), where each frame + starts hop_length points after the preceding one. + + This is accomplished using stride_tricks, so the original data is not + copied. However, there is no zero-padding, so any incomplete frames at the + end are not included. + + Args: + data: np.array of dimension N >= 1. + window_length: Number of samples in each frame. + hop_length: Advance (in samples) between each window. + + Returns: + (N+1)-D np.array with as many rows as there are complete frames that can be + extracted. + """ + num_samples = data.shape[0] + num_frames = 1 + int(np.floor((num_samples - window_length) / hop_length)) + shape = (num_frames, window_length) + data.shape[1:] + strides = (data.strides[0] * hop_length,) + data.strides + return np.lib.stride_tricks.as_strided(data, shape=shape, strides=strides) + + +def periodic_hann(window_length): + """Calculate a "periodic" Hann window. 
+ + The classic Hann window is defined as a raised cosine that starts and + ends on zero, and where every value appears twice, except the middle + point for an odd-length window. Matlab calls this a "symmetric" window + and np.hanning() returns it. However, for Fourier analysis, this + actually represents just over one cycle of a period N-1 cosine, and + thus is not compactly expressed on a length-N Fourier basis. Instead, + it's better to use a raised cosine that ends just before the final + zero value - i.e. a complete cycle of a period-N cosine. Matlab + calls this a "periodic" window. This routine calculates it. + + Args: + window_length: The number of points in the returned window. + + Returns: + A 1D np.array containing the periodic hann window. + """ + return 0.5 - (0.5 * np.cos(2 * np.pi / window_length * + np.arange(window_length))) + + +def stft_magnitude(signal, fft_length, + hop_length=None, + window_length=None): + """Calculate the short-time Fourier transform magnitude. + + Args: + signal: 1D np.array of the input time-domain signal. + fft_length: Size of the FFT to apply. + hop_length: Advance (in samples) between each frame passed to FFT. + window_length: Length of each block of samples to pass to FFT. + + Returns: + 2D np.array where each row contains the magnitudes of the fft_length/2+1 + unique values of the FFT for the corresponding frame of input samples. + """ + frames = frame(signal, window_length, hop_length) + # Apply frame window to each frame. We use a periodic Hann (cosine of period + # window_length) instead of the symmetric Hann of np.hanning (period + # window_length-1). + window = periodic_hann(window_length) + windowed_frames = frames * window + return np.abs(np.fft.rfft(windowed_frames, int(fft_length))) + + +# Mel spectrum constants and functions. +_MEL_BREAK_FREQUENCY_HERTZ = 700.0 +_MEL_HIGH_FREQUENCY_Q = 1127.0 + + +def hertz_to_mel(frequencies_hertz): + """Convert frequencies to mel scale using HTK formula. 
+ + Args: + frequencies_hertz: Scalar or np.array of frequencies in hertz. + + Returns: + Object of same size as frequencies_hertz containing corresponding values + on the mel scale. + """ + return _MEL_HIGH_FREQUENCY_Q * np.log( + 1.0 + (frequencies_hertz / _MEL_BREAK_FREQUENCY_HERTZ)) + + +def spectrogram_to_mel_matrix(num_mel_bins=20, + num_spectrogram_bins=129, + audio_sample_rate=8000, + lower_edge_hertz=125.0, + upper_edge_hertz=3800.0): + """Return a matrix that can post-multiply spectrogram rows to make mel. + + Returns a np.array matrix A that can be used to post-multiply a matrix S of + spectrogram values (STFT magnitudes) arranged as frames x bins to generate a + "mel spectrogram" M of frames x num_mel_bins. M = S A. + + The classic HTK algorithm exploits the complementarity of adjacent mel bands + to multiply each FFT bin by only one mel weight, then add it, with positive + and negative signs, to the two adjacent mel bands to which that bin + contributes. Here, by expressing this operation as a matrix multiply, we go + from num_fft multiplies per frame (plus around 2*num_fft adds) to around + num_fft^2 multiplies and adds. However, because these are all presumably + accomplished in a single call to np.dot(), it's not clear which approach is + faster in Python. The matrix multiplication has the attraction of being more + general and flexible, and much easier to read. + + Args: + num_mel_bins: How many bands in the resulting mel spectrum. This is + the number of columns in the output matrix. + num_spectrogram_bins: How many bins there are in the source spectrogram + data, which is understood to be fft_size/2 + 1, i.e. the spectrogram + only contains the nonredundant FFT bins. + audio_sample_rate: Samples per second of the audio at the input to the + spectrogram. We need this to figure out the actual frequencies for + each spectrogram bin, which dictates how they are mapped into mel. 
+ lower_edge_hertz: Lower bound on the frequencies to be included in the mel + spectrum. This corresponds to the lower edge of the lowest triangular + band. + upper_edge_hertz: The desired top edge of the highest frequency band. + + Returns: + An np.array with shape (num_spectrogram_bins, num_mel_bins). + + Raises: + ValueError: if frequency edges are incorrectly ordered or out of range. + """ + nyquist_hertz = audio_sample_rate / 2. + if lower_edge_hertz < 0.0: + raise ValueError("lower_edge_hertz %.1f must be >= 0" % lower_edge_hertz) + if lower_edge_hertz >= upper_edge_hertz: + raise ValueError("lower_edge_hertz %.1f >= upper_edge_hertz %.1f" % + (lower_edge_hertz, upper_edge_hertz)) + if upper_edge_hertz > nyquist_hertz: + raise ValueError("upper_edge_hertz %.1f is greater than Nyquist %.1f" % + (upper_edge_hertz, nyquist_hertz)) + spectrogram_bins_hertz = np.linspace(0.0, nyquist_hertz, num_spectrogram_bins) + spectrogram_bins_mel = hertz_to_mel(spectrogram_bins_hertz) + # The i'th mel band (starting from i=1) has center frequency + # band_edges_mel[i], lower edge band_edges_mel[i-1], and higher edge + # band_edges_mel[i+1]. Thus, we need num_mel_bins + 2 values in + # the band_edges_mel arrays. + band_edges_mel = np.linspace(hertz_to_mel(lower_edge_hertz), + hertz_to_mel(upper_edge_hertz), num_mel_bins + 2) + # Matrix to post-multiply feature arrays whose rows are num_spectrogram_bins + # of spectrogram values. + mel_weights_matrix = np.empty((num_spectrogram_bins, num_mel_bins)) + for i in range(num_mel_bins): + lower_edge_mel, center_mel, upper_edge_mel = band_edges_mel[i:i + 3] + # Calculate lower and upper slopes for every spectrogram bin. + # Line segments are linear in the *mel* domain, not hertz. + lower_slope = ((spectrogram_bins_mel - lower_edge_mel) / + (center_mel - lower_edge_mel)) + upper_slope = ((upper_edge_mel - spectrogram_bins_mel) / + (upper_edge_mel - center_mel)) + # .. then intersect them with each other and zero. 
+ mel_weights_matrix[:, i] = np.maximum(0.0, np.minimum(lower_slope, + upper_slope)) + # HTK excludes the spectrogram DC bin; make sure it always gets a zero + # coefficient. + mel_weights_matrix[0, :] = 0.0 + return mel_weights_matrix + + +def log_mel_spectrogram(data, + audio_sample_rate=8000, + log_offset=0.0, + window_length_secs=0.025, + hop_length_secs=0.010, + **kwargs): + """Convert waveform to a log magnitude mel-frequency spectrogram. + + Args: + data: 1D np.array of waveform data. + audio_sample_rate: The sampling rate of data. + log_offset: Add this to values when taking log to avoid -Infs. + window_length_secs: Duration of each window to analyze. + hop_length_secs: Advance between successive analysis windows. + **kwargs: Additional arguments to pass to spectrogram_to_mel_matrix. + + Returns: + 2D np.array of (num_frames, num_mel_bins) consisting of log mel filterbank + magnitudes for successive frames. + """ + window_length_samples = int(round(audio_sample_rate * window_length_secs)) + hop_length_samples = int(round(audio_sample_rate * hop_length_secs)) + fft_length = 2 ** int(np.ceil(np.log(window_length_samples) / np.log(2.0))) + spectrogram = stft_magnitude( + data, + fft_length=fft_length, + hop_length=hop_length_samples, + window_length=window_length_samples) + mel_spectrogram = np.dot(spectrogram, spectrogram_to_mel_matrix( + num_spectrogram_bins=spectrogram.shape[1], + audio_sample_rate=audio_sample_rate, **kwargs)) + return np.log(mel_spectrogram + log_offset) diff --git a/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_input.py b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_input.py new file mode 100644 index 0000000..f97f08f --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_input.py @@ -0,0 +1,87 @@ +# Copyright 2017 The TensorFlow Authors All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""Compute input examples for VGGish from audio waveform.""" + +import numpy as np +import resampy + +from audioset_vggish_tensorflow_to_pytorch.audioset import mel_features +from audioset_vggish_tensorflow_to_pytorch.audioset import vggish_params + +import soundfile as sf + + +def waveform_to_examples(data, sample_rate): + """Converts audio waveform into an array of examples for VGGish. + + Args: + data: np.array of either one dimension (mono) or two dimensions + (multi-channel, with the outer dimension representing channels). + Each sample is generally expected to lie in the range [-1.0, +1.0], + although this is not required. + sample_rate: Sample rate of data. + + Returns: + 3-D np.array of shape [num_examples, num_frames, num_bands] which represents + a sequence of examples, each of which contains a patch of log mel + spectrogram, covering num_frames frames of audio and num_bands mel frequency + bands, where the frame length is vggish_params.STFT_HOP_LENGTH_SECONDS. + """ + # Convert to mono. + if len(data.shape) > 1: + data = np.mean(data, axis=1) + # Resample to the rate assumed by VGGish. + if sample_rate != vggish_params.SAMPLE_RATE: + data = resampy.resample(data, sample_rate, vggish_params.SAMPLE_RATE) + + # Compute log mel spectrogram features. 
+ log_mel = mel_features.log_mel_spectrogram( + data, + audio_sample_rate=vggish_params.SAMPLE_RATE, + log_offset=vggish_params.LOG_OFFSET, + window_length_secs=vggish_params.STFT_WINDOW_LENGTH_SECONDS, + hop_length_secs=vggish_params.STFT_HOP_LENGTH_SECONDS, + num_mel_bins=vggish_params.NUM_MEL_BINS, + lower_edge_hertz=vggish_params.MEL_MIN_HZ, + upper_edge_hertz=vggish_params.MEL_MAX_HZ) + + # Frame features into examples. + features_sample_rate = 1.0 / vggish_params.STFT_HOP_LENGTH_SECONDS + example_window_length = int(round( + vggish_params.EXAMPLE_WINDOW_SECONDS * features_sample_rate)) + example_hop_length = int(round( + vggish_params.EXAMPLE_HOP_SECONDS * features_sample_rate)) + log_mel_examples = mel_features.frame( + log_mel, + window_length=example_window_length, + hop_length=example_hop_length) + return log_mel_examples + + +def wavfile_to_examples(wav_file): + """Convenience wrapper around waveform_to_examples() for a common WAV format. + + Args: + wav_file: String path to a file, or a file-like object. The file + is assumed to contain WAV audio data with signed 16-bit PCM samples. + + Returns: + See waveform_to_examples. + """ + wav_data, sr = sf.read(wav_file, dtype='int16') + assert wav_data.dtype == np.int16, 'Bad sample type: %r' % wav_data.dtype + samples = wav_data / 32768.0 # Convert to [-1.0, +1.0] + return waveform_to_examples(samples, sr) diff --git a/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_params.py b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_params.py new file mode 100644 index 0000000..a38ce26 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_params.py @@ -0,0 +1,53 @@ +# Copyright 2017 The TensorFlow Authors All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""Global parameters for the VGGish model. + +See vggish_slim.py for more information. +""" + +# Architectural constants. +NUM_FRAMES = 96 # Frames in input mel-spectrogram patch. +NUM_BANDS = 64 # Frequency bands in input mel-spectrogram patch. +EMBEDDING_SIZE = 128 # Size of embedding layer. + +# Hyperparameters used in feature and example generation. +SAMPLE_RATE = 16000 +STFT_WINDOW_LENGTH_SECONDS = 0.025 +STFT_HOP_LENGTH_SECONDS = 0.010 +NUM_MEL_BINS = NUM_BANDS +MEL_MIN_HZ = 125 +MEL_MAX_HZ = 7500 +LOG_OFFSET = 0.01 # Offset used for stabilized log of input mel-spectrogram. +EXAMPLE_WINDOW_SECONDS = 0.96 # Each example contains 96 10ms frames +EXAMPLE_HOP_SECONDS = 0.96 # with zero overlap. + +# Parameters used for embedding postprocessing. +PCA_EIGEN_VECTORS_NAME = 'pca_eigen_vectors' +PCA_MEANS_NAME = 'pca_means' +QUANTIZE_MIN_VAL = -2.0 +QUANTIZE_MAX_VAL = +2.0 + +# Hyperparameters used in training. +INIT_STDDEV = 0.01 # Standard deviation used to initialize weights. +LEARNING_RATE = 1e-4 # Learning rate for the Adam optimizer. +ADAM_EPSILON = 1e-8 # Epsilon for the Adam optimizer. + +# Names of ops, tensors, and features. 
+INPUT_OP_NAME = 'vggish/input_features' +INPUT_TENSOR_NAME = INPUT_OP_NAME + ':0' +OUTPUT_OP_NAME = 'vggish/embedding' +OUTPUT_TENSOR_NAME = OUTPUT_OP_NAME + ':0' +AUDIO_EMBEDDING_FEATURE_NAME = 'audio_embedding' diff --git a/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_postprocess.py b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_postprocess.py new file mode 100644 index 0000000..040a701 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_postprocess.py @@ -0,0 +1,91 @@ +# Copyright 2017 The TensorFlow Authors All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""Post-process embeddings from VGGish.""" + +import numpy as np + +from audioset_vggish_tensorflow_to_pytorch.audioset import vggish_params + + +class Postprocessor(object): + """Post-processes VGGish embeddings. + + The initial release of AudioSet included 128-D VGGish embeddings for each + segment of AudioSet. These released embeddings were produced by applying + a PCA transformation (technically, a whitening transform is included as well) + and 8-bit quantization to the raw embedding output from VGGish, in order to + stay compatible with the YouTube-8M project which provides visual embeddings + in the same format for a large set of YouTube videos. This class implements + the same PCA (with whitening) and quantization transformations. 
+ """ + + def __init__(self, pca_params_npz_path): + """Constructs a postprocessor. + + Args: + pca_params_npz_path: Path to a NumPy-format .npz file that + contains the PCA parameters used in postprocessing. + """ + params = np.load(pca_params_npz_path) + self._pca_matrix = params[vggish_params.PCA_EIGEN_VECTORS_NAME] + # Load means into a column vector for easier broadcasting later. + self._pca_means = params[vggish_params.PCA_MEANS_NAME].reshape(-1, 1) + assert self._pca_matrix.shape == ( + vggish_params.EMBEDDING_SIZE, vggish_params.EMBEDDING_SIZE), ( + 'Bad PCA matrix shape: %r' % (self._pca_matrix.shape,)) + assert self._pca_means.shape == (vggish_params.EMBEDDING_SIZE, 1), ( + 'Bad PCA means shape: %r' % (self._pca_means.shape,)) + + def postprocess(self, embeddings_batch): + """Applies postprocessing to a batch of embeddings. + + Args: + embeddings_batch: An nparray of shape [batch_size, embedding_size] + containing output from the embedding layer of VGGish. + + Returns: + An nparray of the same shape as the input but of type uint8, + containing the PCA-transformed and quantized version of the input. + """ + assert len(embeddings_batch.shape) == 2, ( + 'Expected 2-d batch, got %r' % (embeddings_batch.shape,)) + assert embeddings_batch.shape[1] == vggish_params.EMBEDDING_SIZE, ( + 'Bad batch shape: %r' % (embeddings_batch.shape,)) + + # Apply PCA. + # - Embeddings come in as [batch_size, embedding_size]. + # - Transpose to [embedding_size, batch_size]. + # - Subtract pca_means column vector from each column. + # - Premultiply by PCA matrix of shape [output_dims, input_dims] + # where both are are equal to embedding_size in our case. + # - Transpose result back to [batch_size, embedding_size]. 
+ pca_applied = np.dot(self._pca_matrix, + (embeddings_batch.T - self._pca_means)).T + + # Quantize by: + # - clipping to [min, max] range + clipped_embeddings = np.clip( + pca_applied, vggish_params.QUANTIZE_MIN_VAL, + vggish_params.QUANTIZE_MAX_VAL) + # - convert to 8-bit in range [0.0, 255.0] + quantized_embeddings = ( + (clipped_embeddings - vggish_params.QUANTIZE_MIN_VAL) * + (255.0 / + (vggish_params.QUANTIZE_MAX_VAL - vggish_params.QUANTIZE_MIN_VAL))) + # - cast 8-bit float to uint8 + quantized_embeddings = quantized_embeddings.astype(np.uint8) + + return quantized_embeddings diff --git a/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_slim.py b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_slim.py new file mode 100644 index 0000000..0bb6ea7 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/audioset/vggish_slim.py @@ -0,0 +1,129 @@ +# Copyright 2017 The TensorFlow Authors All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""Defines the 'VGGish' model used to generate AudioSet embedding features. + +The public AudioSet release (https://research.google.com/audioset/download.html) +includes 128-D features extracted from the embedding layer of a VGG-like model +that was trained on a large Google-internal YouTube dataset. Here we provide +a TF-Slim definition of the same model, without any dependences on libraries +internal to Google. 
We call it 'VGGish'. + +Note that we only define the model up to the embedding layer, which is the +penultimate layer before the final classifier layer. We also provide various +hyperparameter values (in vggish_params.py) that were used to train this model +internally. + +For comparison, here is TF-Slim's VGG definition: +https://github.com/tensorflow/models/blob/master/research/slim/nets/vgg.py +""" + +import tensorflow as tf +from audioset import vggish_params as params + +slim = tf.contrib.slim + + +def define_vggish_slim(training=False): + """Defines the VGGish TensorFlow model. + + All ops are created in the current default graph, under the scope 'vggish/'. + + The input is a placeholder named 'vggish/input_features' of type float32 and + shape [batch_size, num_frames, num_bands] where batch_size is variable and + num_frames and num_bands are constants, and [num_frames, num_bands] represents + a log-mel-scale spectrogram patch covering num_bands frequency bands and + num_frames time frames (where each frame step is usually 10ms). This is + produced by computing the stabilized log(mel-spectrogram + params.LOG_OFFSET). + The output is an op named 'vggish/embedding' which produces the activations of + a 128-D embedding layer, which is usually the penultimate layer when used as + part of a full model with a final classifier layer. + + Args: + training: If true, all parameters are marked trainable. + + Returns: + The op 'vggish/embedding'. + """ + # Defaults: + # - All weights are initialized to N(0, INIT_STDDEV). + # - All biases are initialized to 0. + # - All activations are ReLU. + # - All convolutions are 3x3 with stride 1 and SAME padding. + # - All max-pools are 2x2 with stride 2 and SAME padding. 
+ with slim.arg_scope([slim.conv2d, slim.fully_connected], + weights_initializer=tf.truncated_normal_initializer( + stddev=params.INIT_STDDEV), + biases_initializer=tf.zeros_initializer(), + activation_fn=tf.nn.relu, + trainable=training), \ + slim.arg_scope([slim.conv2d], + kernel_size=[3, 3], stride=1, padding='SAME'), \ + slim.arg_scope([slim.max_pool2d], + kernel_size=[2, 2], stride=2, padding='SAME'), \ + tf.variable_scope('vggish'): + # Input: a batch of 2-D log-mel-spectrogram patches. + features = tf.placeholder( + tf.float32, shape=(None, params.NUM_FRAMES, params.NUM_BANDS), + name='input_features') + # Reshape to 4-D so that we can convolve a batch with conv2d(). + net = tf.reshape(features, [-1, params.NUM_FRAMES, params.NUM_BANDS, 1]) + + # The VGG stack of alternating convolutions and max-pools. + net = slim.conv2d(net, 64, scope='conv1') + net = slim.max_pool2d(net, scope='pool1') + net = slim.conv2d(net, 128, scope='conv2') + net = slim.max_pool2d(net, scope='pool2') + net = slim.repeat(net, 2, slim.conv2d, 256, scope='conv3') + net = slim.max_pool2d(net, scope='pool3') + net = slim.repeat(net, 2, slim.conv2d, 512, scope='conv4') + net = slim.max_pool2d(net, scope='pool4') + + # Flatten before entering fully-connected layers + net = slim.flatten(net) + net = slim.repeat(net, 2, slim.fully_connected, 4096, scope='fc1') + # The embedding layer. + net = slim.fully_connected(net, params.EMBEDDING_SIZE, scope='fc2') + return tf.identity(net, name='embedding') + + +def load_vggish_slim_checkpoint(session, checkpoint_path): + """Loads a pre-trained VGGish-compatible checkpoint. + + This function can be used as an initialization function (referred to as + init_fn in TensorFlow documentation) which is called in a Session after + initializing all variables. When used as an init_fn, this will load + a pre-trained checkpoint that is compatible with the VGGish model + definition. Only variables defined by VGGish will be loaded. 
+ + Args: + session: an active TensorFlow session. + checkpoint_path: path to a file containing a checkpoint that is + compatible with the VGGish model definition. + """ + # Get the list of names of all VGGish variables that exist in + # the checkpoint (i.e., all inference-mode VGGish variables). + with tf.Graph().as_default(): + define_vggish_slim(training=False) + vggish_var_names = [v.name for v in tf.global_variables()] + + # Get the list of all currently existing variables that match + # the list of variable names we just computed. + vggish_vars = [v for v in tf.global_variables() if v.name in vggish_var_names] + + # Use a Saver to restore just the variables selected above. + saver = tf.train.Saver(vggish_vars, name='vggish_load_pretrained', + write_version=1) + saver.restore(session, checkpoint_path) diff --git a/audioset_vggish_tensorflow_to_pytorch/convert_to_pytorch.py b/audioset_vggish_tensorflow_to_pytorch/convert_to_pytorch.py new file mode 100644 index 0000000..30bb8c0 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/convert_to_pytorch.py @@ -0,0 +1,128 @@ +import torch +import numpy as np +import tensorflow as tf + +from vggish import VGGish +from audioset import vggish_params, vggish_slim, vggish_input + + +""" +Script which converts the pretrained TensorFlow implementation of VGGish to a PyTorch equivalent, along with +a basic smoke test to verify accuracy. +""" + + +def main(): + with tf.Graph().as_default(), tf.Session() as sess: + # ------------------- + # Step 1 + # ------------------- + # Load the model. + vggish_slim.define_vggish_slim(training=False) + vggish_slim.load_vggish_slim_checkpoint(sess, 'vggish_model.ckpt') + + # Get all of the variables, and use this to construct a dictionary which maps + # the name of the variables to their values. 
+ variables = tf.all_variables() + variables = [x.name for x in variables] + variable_values = sess.run(variables) + variable_dict = dict(zip(variables, variable_values)) + + # Create a new state dictionary which maps the TensorFlow version of the weights + # to those in the new PyTorch model. + pytorch_model = VGGish() + pytorch_feature_dict = pytorch_model.features.state_dict() + pytorch_fc_dict = pytorch_model.fc.state_dict() + + # ------------------- + # Step 2 + # ------------------- + # There is a bias and weight vector for each convolution layer. The weights are not necessarily stored + # in the same format and order between the two frameworks; for the TensorFlow model, the 12 vectors for the + # convolution layers are first, followed by the 6 FC layers. + tf_feature_names = list(variable_dict.keys())[:-6] + tf_fc_names = list(variable_dict.keys())[-6:] + + def to_pytorch_tensor(weights): + if len(weights.shape) == 4: + tensor = torch.from_numpy(weights.transpose(3, 2, 0, 1)).float() + else: + tensor = torch.from_numpy(weights.T).float() + return tensor + + # Convert the weights for the convolution layers. + for tf_name, pytorch_name in zip(tf_feature_names, pytorch_feature_dict.keys()): + print(f'Converting [{tf_name}] ----------> [feature.{pytorch_name}]') + pytorch_feature_dict[pytorch_name] = to_pytorch_tensor(variable_dict[tf_name]) + + # Convert the weights for the FC layers. + for tf_name, pytorch_name in zip(tf_fc_names, pytorch_fc_dict.keys()): + print(f'Converting [{tf_name}] ----------> [fc.{pytorch_name}]') + pytorch_fc_dict[pytorch_name] = to_pytorch_tensor(variable_dict[tf_name]) + + # ------------------- + # Step 3 + # ------------------- + # Load the new state dictionaries into the PyTorch model. + pytorch_model.features.load_state_dict(pytorch_feature_dict) + pytorch_model.fc.load_state_dict(pytorch_fc_dict) + + # ------------------- + # Step 4 + # ------------------- + # Generate a sample input (as in the AudioSet repo smoke test). 
+ num_secs = 3 + freq = 1000 + sr = 44100 + t = np.linspace(0, num_secs, int(num_secs * sr)) + x = np.sin(2 * np.pi * freq * t) + + # Produce a batch of log mel spectrogram examples. + input_batch = vggish_input.waveform_to_examples(x, sr) + + # Run inference on the TensorFlow model. + features_tensor = sess.graph.get_tensor_by_name( + vggish_params.INPUT_TENSOR_NAME) + embedding_tensor = sess.graph.get_tensor_by_name( + vggish_params.OUTPUT_TENSOR_NAME) + [tf_output] = sess.run([embedding_tensor], + feed_dict={features_tensor: input_batch}) + + # Run on the PyTorch model. + pytorch_model = pytorch_model.to('cpu') + pytorch_output = pytorch_model(torch.from_numpy(input_batch).unsqueeze(dim=1).float()) + pytorch_output = pytorch_output.detach().numpy() + + # ------------------- + # Step 5 + # ------------------- + # Compare the difference between the outputs. + diff = np.linalg.norm(pytorch_output - tf_output) ** 2 + print(f'Distance between TensorFlow and PyTorch outputs: [{diff}]') + assert diff < 1e-6 + + # Run a smoke test. + expected_embedding_mean = 0.131 + expected_embedding_std = 0.238 + + # Verify the TF output. + np.testing.assert_allclose( + [np.mean(tf_output), np.std(tf_output)], + [expected_embedding_mean, expected_embedding_std], + rtol=0.001) + + # Verify the PyTorch output. + np.testing.assert_allclose( + [np.mean(pytorch_output), np.std(pytorch_output)], + [expected_embedding_mean, expected_embedding_std], + rtol=0.001) + + # ------------------- + # Step 6 + # ------------------- + print('Smoke test passed! 
Saving PyTorch weights to "pytorch_vggish.pth".') + torch.save(pytorch_model.state_dict(), 'pytorch_vggish.pth') + + +if __name__ == '__main__': + main() diff --git a/audioset_vggish_tensorflow_to_pytorch/example_usage.py b/audioset_vggish_tensorflow_to_pytorch/example_usage.py new file mode 100644 index 0000000..aa23d39 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/example_usage.py @@ -0,0 +1,90 @@ +import torch +import numpy as np +from pathlib import Path +from tqdm import tqdm +from vggish import VGGish +from audioset import vggish_input, vggish_postprocess +import os +import json +import torch.nn as nn + +def main(): + # Initialize the PyTorch model. + + exception_dict=[] + device = 'cuda:0' + + pytorch_model = VGGish() + pytorch_model.load_state_dict(torch.load('pytorch_vggish.pth')) + pytorch_model = pytorch_model.to(device) + pytorch_model.eval() + path = Path("/home/omercea19/akata-shared/omercea19/full_ebird_download") + + root_saved=Path("/home/omercea19/akata-shared/omercea19/full_ebird_download_embeddings_new_model") + + dict = {} + for file in tqdm(path.glob('**/*.wav')): + try: + dict[file] = 0 + loaded_wav=torch.from_numpy(vggish_input.wavfile_to_examples(str(file))) + input_batch = loaded_wav.float().to(device) + input_batch = input_batch.unsqueeze(dim=1) + pytorch_output = pytorch_model(input_batch) + pytorch_output = pytorch_output.detach().cpu().numpy() + post_processor = vggish_postprocess.Postprocessor('vggish_pca_params.npz') + postprocessed_output = post_processor.postprocess(pytorch_output) + #postprocessed_output=postprocessed_output.mean(axis=0) + new_path=str(file.relative_to(path)) + new_directory=Path.joinpath(root_saved,file.relative_to(path).parent) + try: + os.makedirs(new_directory) + except: + pass + new_path=Path.joinpath(root_saved,file.relative_to(path)) + name = str(new_path.name).split('.')[0] + name = name + ".npy" + new_path = Path.joinpath(new_path.parent, Path(name)) + np.save(new_path,postprocessed_output) + 
#zz=np.load(new_path) + #print(zz) + except: + print(str(file)) + exception_dict.append(str(file)) + + with open("./exception.json","w") as g: + json.dump(exception_dict,g) + + + + ''' + + THIS IS THE VARIANT WITH THE BATCHES, WHICH WILL MOST LIKELY WE USED DURING THE TRAINING/INFERENCE + + # Generate a sample input (as in the AudioSet repo smoke test). + x=['../altele/5bS607UKT2U.wav','../altele/5bS607UKT2U.wav'] + input_batch=[] + for i in x: + input_batch.append(torch.from_numpy(vggish_input.wavfile_to_examples(i))) + + input_batch=torch.stack(input_batch) + + # Produce a batch of log mel spectrogram examples. + input_batch = input_batch.float().to(device) + input_batch=input_batch.unsqueeze(dim=2) + input_batch=input_batch.view(-1,input_batch.shape[2],input_batch.shape[3],input_batch.shape[4]) + + # Run the PyTorch model. + pytorch_output = pytorch_model(input_batch) + pytorch_output = pytorch_output.detach().cpu().numpy() + print('Input Shape:', tuple(input_batch.shape)) + print('Output Shape:', tuple(pytorch_output.shape)) + + # Post-processing. 
+ post_processor = vggish_postprocess.Postprocessor('vggish_pca_params.npz') + postprocessed_output = post_processor.postprocess(pytorch_output) + postprocessed_output=np.reshape(postprocessed_output,(len(x),-1,postprocessed_output.shape[1])) + print("final") + ''' + +if __name__ == '__main__': + main() diff --git a/audioset_vggish_tensorflow_to_pytorch/exception.json b/audioset_vggish_tensorflow_to_pytorch/exception.json new file mode 100644 index 0000000..0637a08 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/exception.json @@ -0,0 +1 @@ +[] \ No newline at end of file diff --git a/audioset_vggish_tensorflow_to_pytorch/vggish.py b/audioset_vggish_tensorflow_to_pytorch/vggish.py new file mode 100644 index 0000000..3f81796 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/vggish.py @@ -0,0 +1,58 @@ +import torch.nn as nn + + +class VGGish(nn.Module): + """ + PyTorch implementation of the VGGish model. + + Adapted from: https://github.com/harritaylor/torch-vggish + The following modifications were made: (i) correction for the missing ReLU layers, (ii) correction for the + improperly formatted data when transitioning from NHWC --> NCHW in the fully-connected layers, and (iii) + correction for flattening in the fully-connected layers. 
+ """ + + def __init__(self): + super(VGGish, self).__init__() + self.features = nn.Sequential( + nn.Conv2d(1, 64, 3, stride=1, padding=1), + nn.ReLU(inplace=True), + nn.MaxPool2d(2, stride=2), + + nn.Conv2d(64, 128, 3, stride=1, padding=1), + nn.ReLU(inplace=True), + nn.MaxPool2d(2, stride=2), + + nn.Conv2d(128, 256, 3, stride=1, padding=1), + nn.ReLU(inplace=True), + nn.Conv2d(256, 256, 3, stride=1, padding=1), + nn.ReLU(inplace=True), + nn.MaxPool2d(2, stride=2), + + nn.Conv2d(256, 512, 3, stride=1, padding=1), + nn.ReLU(inplace=True), + nn.Conv2d(512, 512, 3, stride=1, padding=1), + nn.ReLU(inplace=True), + nn.MaxPool2d(2, stride=2) + ) + self.fc = nn.Sequential( + nn.Linear(512 * 24, 4096), + nn.ReLU(inplace=True), + nn.Linear(4096, 4096), + nn.ReLU(inplace=True), + nn.Linear(4096, 128), + nn.ReLU(inplace=True), + ) + + def forward(self, x): + x = self.features(x).permute(0, 2, 3, 1).contiguous() + x = x.view(x.size(0), -1) + x = self.fc(x) + return x + + +def main(): + pass + + +if __name__ == '__main__': + main() diff --git a/audioset_vggish_tensorflow_to_pytorch/xeno_canto_to_seconds.py b/audioset_vggish_tensorflow_to_pytorch/xeno_canto_to_seconds.py new file mode 100644 index 0000000..6be3df6 --- /dev/null +++ b/audioset_vggish_tensorflow_to_pytorch/xeno_canto_to_seconds.py @@ -0,0 +1,93 @@ +import torch +import numpy as np +from pathlib import Path +from tqdm import tqdm +from vggish import VGGish +from audioset import vggish_input, vggish_postprocess +import os +import json +import soundfile as sf + +def main(): + # Initialize the PyTorch model. 
+ + exception_dict = [] + device = 'cuda:0' + pytorch_model = VGGish() + pytorch_model.load_state_dict(torch.load('pytorch_vggish.pth')) + pytorch_model = pytorch_model.to(device) + pytorch_model.eval() + path = Path("/home/omercea19/akata-shared/omercea19/full_ebird_download") + + root_saved = Path("/home/omercea19/akata-shared/omercea19/seconds_waveform_full_ebird_5seconds") + + dict = {} + for file in tqdm(path.glob('**/*.wav')): + try: + + data, sr = sf.read(str(file),dtype='int16') + assert data.dtype == np.int16, 'Bad sample type: %r' % data.dtype + # split + split = [] + noSections = int(np.ceil(len(data) / sr) - 1) + + for i in range(noSections): + # get 1 second + temp = data[i * sr:i * sr + sr] # this is for mono audio + # temp = data[i*sr:i*sr + sr, :] # this is for stereo audio; uncomment and comment line above + # add to list + temp=temp/32768.0 + temp = vggish_input.waveform_to_examples(temp, sr) + new_path = str(file.relative_to(path)) + new_directory = Path.joinpath(root_saved, file.relative_to(path).parent) + try: + os.makedirs(new_directory) + except: + pass + new_path = Path.joinpath(root_saved, file.relative_to(path)) + name = str(new_path.name).split('.')[0] + name = name +"sec"+ str(i)+".npy" + new_path = Path.joinpath(new_path.parent, Path(name)) + np.save(new_path, temp) + # zz=np.load(new_path) + # print(zz) + except: + print("Exception",str(file)) + exception_dict.append(str(file)) + + with open("./exception.json", "w") as g: + json.dump(exception_dict, g) + + ''' + + THIS IS THE VARIANT WITH THE BATCHES, WHICH WILL MOST LIKELY WE USED DURING THE TRAINING/INFERENCE + + # Generate a sample input (as in the AudioSet repo smoke test). + x=['../altele/5bS607UKT2U.wav','../altele/5bS607UKT2U.wav'] + input_batch=[] + for i in x: + input_batch.append(torch.from_numpy(vggish_input.wavfile_to_examples(i))) + + input_batch=torch.stack(input_batch) + + # Produce a batch of log mel spectrogram examples. 
+ input_batch = input_batch.float().to(device) + input_batch=input_batch.unsqueeze(dim=2) + input_batch=input_batch.view(-1,input_batch.shape[2],input_batch.shape[3],input_batch.shape[4]) + + # Run the PyTorch model. + pytorch_output = pytorch_model(input_batch) + pytorch_output = pytorch_output.detach().cpu().numpy() + print('Input Shape:', tuple(input_batch.shape)) + print('Output Shape:', tuple(pytorch_output.shape)) + + # Post-processing. + post_processor = vggish_postprocess.Postprocessor('vggish_pca_params.npz') + postprocessed_output = post_processor.postprocess(pytorch_output) + postprocessed_output=np.reshape(postprocessed_output,(len(x),-1,postprocessed_output.shape[1])) + print("final") + ''' + + +if __name__ == '__main__': + main() diff --git a/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/ActivityNet.csv b/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/ActivityNet.csv new file mode 100644 index 0000000..01db345 --- /dev/null +++ b/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/ActivityNet.csv @@ -0,0 +1,203 @@ +name,description_1,description_2,description_3,,,,,,, +Applying sunscreen,"Applying sunscreen is a protective measure against the sun's harmful UV rays. It involves spreading a protective lotion on skin exposed to sunlight to prevent sunburns and reduce the risk of skin cancer, and it should be reapplied regularly, especially after swimming or sweating.","A person squeezes creamy lotion from a bottle onto their skin, often on exposed areas like arms or face, and rubs it in circular motions until it's absorbed, sometimes leaving a temporary white sheen.","Squirting or squeezing sound of lotion from a bottle, rubbing hands together, slathering sound as it spreads on skin, occasional clicking of spray sunscreen, soft patting as it is applied on the body, and the snapping sound of a cap closing.",,,,,,, +Archery,"Archery is a sport that involves shooting arrows with a bow at a target. 
It requires precision, control, and focus, as archers aim to hit the bullseye from various distances. Originally used for hunting and combat, today it's practiced for recreation and competition globally.","Archery involves an individual wielding a bow to shoot arrows at a target marked with concentric circles, aiming for the center or ""bullseye"". Bows are drawn back using hand and arm strength, and archers often wear finger tabs or gloves for protection. The stance is focused and precise.","The release of a bowstring creates a sharp ""twang"", the arrow's fletching makes a soft whisper as it cuts through the air, and the impact thud as the arrow hits the target, potentially followed by a metallic ring if arrows collide or strike a metal stand.",,,,,,, +Arm wrestling,"Arm wrestling is a competitive sport where two participants face each other with one arm bent and hands clasped, aiming to pin the opponent's arm onto a surface by using strength and technique. This test of upper body power is often regarded as both a sport and a display of brute strength.","Two individuals face each other, elbows planted on a flat surface, hands clasped. They apply opposing force to overpower the other's arm, aiming to pin the opponent's hand to the surface. Muscles are tensed, and expressions show determination or strain. Spectators may watch, cheering for the competitors.","During arm wrestling, one might hear grunts and groans of exertion, the thud of an arm hitting the table, onlookers cheering or shouting encouragement, and the slap of participants' hands gripping and adjusting. Occasional dialogue between competitors or with the audience adds to the aural landscape.",,,,,,, +Assembling bicycle,"Assembling a bicycle involves joining various components—frame, wheels, handlebars, gears, and brakes—following specific instructions to ensure a safe, rideable bike. 
It requires tools, patience, and mechanical skill to align, adjust, and secure all parts properly.","A person combines various parts—frame, wheels, handlebars, gears, brakes—using tools. They attach components, adjust fittings, and secure bolts, often consulting a manual, resulting in a complete bicycle ready for use.","Clicking of tools, metallic clinks, turning of wrenches, snapping of parts fitting together, spinning of wheels, adjusting of gears, rubber grips on handles, tightening of bolts, occasional grunts of effort, and the soft swish of tires being inflated.",,,,,,, +BMX,"BMX, short for Bicycle Motocross, is an action sport involving racing or performing freestyle tricks on BMX bikes. It gained popularity in the 1970s, inspired by motocross, and features compact, durable bikes designed for jumping and stunts. BMX became an Olympic sport in 2008.","BMX features riders on small, robust bikes performing tricks, jumps, and racing on dirt tracks, ramps, and skatepark-like courses, often with bold graphics on their bikes and protective gear like helmets and pads.","BMX riding often involves rhythmic sounds of wheels on ramps, clicks of gear shifting, the clacking of bike chains, screeching brakes, the thud when landing jumps, and the occasional cheers of onlookers. Environmental noises vary by location, from urban din to tranquil parks.",,,,,,, +Baking cookies,"Baking cookies involves combining ingredients like flour, sugar, butter, and eggs according to a recipe, shaping the dough into small portions, and then heating them in an oven until they're golden and delicious. It's a popular home cooking activity that fills the air with sweet, inviting aromas.","In the kitchen, a dusting of flour coats surfaces. Rolled dough awaits cutting into shapes, with scattered cookie cutters nearby. Sheets of raw cookies sit on a tray. The oven glows warmly. 
Finished cookies, golden-brown and varying in forms, cool on a rack, emanating a comforting, sweet aroma.","Crackling of sugar, rustling of packaging, tapping of utensils, whirring of a mixer, timer's ding, oven door creak, cookies' sizzle within the heat, and a faint crack when cooling.",,,,,,, +Ballet,"Ballet is a highly technical performance dance that originated during the Italian Renaissance. Characterized by grace, precision, and formalized steps and gestures, it tells a story or expresses a mood through fluid movement, often set to classical music, and typically includes pointe work in female dancers.","Ballet exhibits graceful, fluid movements by dancers in fitted costumes and slippers, typically on a stage with theatrical lighting. Elegant, controlled, and precise gestures, often accompanied by classical music, define this art form, which emphasizes poise, strength, and flexibility.","Classical music, pointe shoe sounds on wooden stage, swishing of tutus, dancers' soft footsteps, instructor's voice, piano accompaniment, audience applause, the occasional thud of a landing jump.",,,,,,, +Bathing dog,"Bathing a dog involves cleaning it with water and pet-safe shampoo to remove dirt, maintain hygiene, and prevent skin issues. Regular baths, appropriate to the dog's breed and lifestyle, contribute to overall health and wellbeing. It's a bonding experience but can be messy and requires patience.","A person uses soap and water to scrub a wet, possibly resistant dog in a tub or outdoor setting. Bubbles form on the dog's fur; towels, a hose, or a showerhead are often involved. The scene may be messy, with splashes and water spraying around. 
","Splashing water, dog's panting or barking, scrubbing noises, wet fur being ruffled, occasional whining or shaking, faucet running, shampoo bottle clicks, toweling friction, and possibly calm or encouraging human voices directing the dog.",,,,,,, +Baton twirling,"Baton twirling is a rhythmic performance sport combining dance, gymnastics, and skillful manipulation of a metal rod (baton), often involving elaborate routines with spinning, tossing, and catching, performed solo or in groups to synchronized music and often incorporated into marching bands and parades.","Baton twirling is a dynamic performance involving a dancer gracefully manipulating a metal rod (baton) through coordinated flips, spins, rolls, tosses, and catches, often synchronized with dance moves and music, displaying agility, dexterity, rhythm, and sometimes performed in groups for elaborate choreographed routines.","Baton twirling may produce rhythmic sounds from the baton striking hands or catching, the swish of the stick cutting through the air, and possible clicks when two batons collide. Background music often accompanies routines, and audiences might provide applause or cheers, enhancing the auditory experience.",,,,,,, +Beach soccer,"Beach soccer, a fast-paced sport played on sand, is a variant of association football. Teams of five players compete to score goals in temporary arenas with smaller pitches and goals, emphasizing skill, agility, and scoring. Originating in Brazil, beach soccer has grown internationally with its own FIFA-endorsed competitions.","Beach soccer features players barefoot on sand, with a colorful ball, goals, and nets. Teams sport casual summer kits amidst a lively, sun-drenched coastal setting. 
Spectators enjoy the dynamic, high-energy matches under umbrellas or the open sky.","Auditory features of beach soccer include the sound of waves crashing, players calling to each other, the thud of the ball on sand, referee whistles, and the cheers of spectators.",,,,,,, +Beer pong,"Beer pong is a popular party game where players throw ping pong balls across a table aiming to land them in cups of beer. Teams take turns, and when a ball lands in a cup, the opposing team must drink its contents. The goal is to eliminate the opposing team's cups first.","Beer pong is a party game where players throw ping pong balls across a table, aiming to land them in cups of beer arranged in a triangular formation at either end. Cups are removed when hit, and the team that eliminates all opponents' cups wins. The setting is often lively and competitive.","Beer pong typically involves the sound of bouncing ping pong balls, laughter and chatter from players and spectators, clinking of balls against plastic cups, splashing of beer, and occasional cheers or groans depending on the success of the throws.",,,,,,, +Belly dance,"Belly dance is a traditional expressive dance with Middle Eastern origins, characterized by intricate movements of the torso, hips, and abdomen. It emphasizes fluidity, grace, and control, often accompanied by rhythmic music, and is celebrated for its cultural significance and as a form of artistic and physical expression.","Belly dance features fluid hip and abdomen movements. Dancers wear colorful costumes with flowing skirts or harem pants, often using accessories like veils or cymbals. 
Exposed midriffs highlight the torso’s motion.","Belly dance may involve rhythmic shimmies, clinks of coin belts, tapping of finger cymbals (zills), swishes of flowing costumes, and traditional Middle Eastern music with complex drum patterns, melodic strings, and enchanting flutes.",,,,,,, +Blow-drying hair,"Blow-drying hair involves using a handheld dryer to expel warm air, styling and drying the hair after washing. It shapes the hair, increases volume, and can create various hairstyles while reducing moisture. It's a common part of personal grooming routines and professional hairstyling.","A person wields a handheld blow dryer directing hot air towards their damp hair, often using a brush to style it. Warm air flows through the hair causing it to flutter and dry while being shaped. It's a common grooming activity that involves a lot of hand movement.","Blow-drying hair typically produces a consistent, loud roar of heated air, with varying pitch as settings adjust. Intermittent clicks from switches and occasional crackle of wet strands drying can also be heard.",,,,,,, +Blowing leaves,"Blowing leaves is an outdoor maintenance activity that involves using a leaf blower to gather and remove fallen leaves from lawns, gardens, and pathways, ensuring clean and tidy outdoor spaces.","Person wielding a leaf blower, directing forceful air stream at colorful foliage. Swirls of red, yellow, and brown leaves dance and scatter across a lawn or pavement in chaotic yet rhythmic patterns, creating a dynamic, ever-shifting carpet of autumnal hues.","The activity of blowing leaves typically produces a sustained, high-pitched whirring or whining sound from the leaf blower motor, punctuated by the rustling and fluttering of leaves as they are disturbed and moved across the ground. 
Occasionally, there might be softer crunching noises if dry leaves are present.",,,,,,, +Braiding hair,Braiding hair involves interweaving three or more strands of hair in a systematic pattern to create a cohesive plait. This versatile styling technique can range from simple three-strand braids to complex patterns and is used for both aesthetic and practical purposes across various cultures and ages.,"""Braiding hair"" involves systematically crossing strands of hair over one another to create a cohesive, interwoven pattern that lies flat against the head or extends outwards, forming a plait or braid of varying sizes and styles, often secured at the end with a hair tie or accessory.","Soft rustling of hair strands, occasional snaps of hair ties or click of hair accessory clasps, whispered exchanges between stylist and client or self-talk concentrating, and sporadic creaks of the chair as either person adjusts their position.",,,,,,, +Breakdancing,"Breakdancing, also called breaking or b-boying/b-girling, emerged in 1970s Bronx, NYC. This energetic street dance features athletic moves like spins, freezes, and power moves. Performed to hip-hop or breakbeats, it emphasizes creativity, style, and physical prowess.","Breakdancing involves dynamic, acrobatic moves: spinning on the floor or head, handstands, and power moves. 
Dancers showcase swift footwork, freezes in poses, and battle each other with stylistic flair, often forming circles to highlight individual performances amidst pulsating hip-hop beats.","Breakdancing features rhythmic beats, dynamic music with strong bass, percussive body movements generating thuds, tapping sounds of sneakers on floor, occasional whoops or cheers from onlookers, and the swish of clothing as dancers execute fast spins and aerial maneuvers.",,,,,,, +Brushing hair,"Brushing hair is a grooming activity involving running a brush through the hair to detangle, smooth, and style it, while also distributing natural scalp oils to promote hair health and shine. It is a daily routine for many and can help prevent knots and breakages.","A person runs a brush or comb through their hair, typically using one hand to hold the tool, while the other might separate strands. The hair may sway and fall with each stroke, detangling and smoothing as the bristles glide from roots to ends, often in front of a mirror.","Brushing hair may produce soft, rhythmic scraping sounds as bristles slide through strands, interspersed with gentle rustling and the occasional sharper snap when encountering tangles. The frequency varies with brush type and hair texture.",,,,,,, +Brushing teeth,"Brushing teeth is a daily hygiene practice to clean teeth and gums, remove plaque, and prevent oral issues like cavities, gingivitis, and bad breath. It involves using a toothbrush and toothpaste to scrub all tooth surfaces in a systematic manner, typically twice a day.","Person stands at sink, toothbrush in hand, applying toothpaste. Bristles scrub teeth in circular motions, creating white frothy foam. Mirror reflection shows mouth movement, rinsing under faucet follows. 
Toothbrush is rinsed and put away; sparkling clean teeth are revealed with a final rinse and spit, leaving a fresh sensation.","Brushing teeth is typically accompanied by sounds of bristle scrubbing against enamel, rhythmic brush strokes, occasional gargling, spitting into the sink, and running water during rinsing. The electric toothbrushes add a buzzing or whirring motor noise to the auditory mix.",,,,,,, +Building sandcastles,"Building sandcastles is a creative outdoor activity often enjoyed on sandy beaches, where participants shape and sculpt sand into structures, using hands, tools, and water to stabilize the creations. It's a popular pastime for all ages that can range from simple forms to elaborate, artistic designs.","People shape wet sand with hands or tools, creating towers and walls, often using buckets for formwork, focused on constructing miniature sandy fortresses, decorated with shells or flags, on a beach with scattered sand mounds and dug-up moats, against a backdrop of ocean waves and beachgoers.","Building sandcastles may involve the gentle scraping and patting of wet sand, the occasional splash of water to moisten the sand, playful children's chatter, the distant sound of waves, and the soothing ocean breeze creating a rhythmic background.",,,,,,, +Bullfighting,"Bullfighting is a traditional spectacle of Spain, Portugal, southern France, and some Latin American countries, where matadors perform a series of formalized actions concluding with an attempt to kill a bull for audience entertainment. 
It is a controversial practice due to animal welfare concerns.","Bullfighting involves a matador in a traditional costume wielding a cape, facing off in a sandy arena against a charging bull, aiming to perform an artistic and controlled display of dodges and moves before the climactic moment of the fight, which usually intends to kill or subdue the bull.","Bullfighting is associated with the dramatic blare of trumpets, the crowd's passionate cheers and gasps, the matador's vocal cues, the swishing of capes, the dull thud of hooves on the sand, and the tense silence before the bull charges.",,,,,,, +Bungee jumping,"Bungee jumping is an exhilarating activity where individuals leap from a high platform, such as a bridge or crane, secured by a long elastic cord attached to their ankles, experiencing free-fall before the cord recoils, leaving them to oscillate until brought to a rest.","A person, strapped into a harness attached to an elastic cord, leaps from a high platform, freefalling until the cord stretches and rebounds, repeatedly bouncing up and down until the motion gradually subsides.","Bungee jumping may involve the rush of wind, screams of thrill or fear, the creaking or stretching of the bungee cord, a short silence during free fall, safety harness clicks, and potentially instructions or encouragement shouted by operators or spectators.",,,,,,, +Calf roping,"Calf roping, also known as tie-down roping, is a competitive rodeo event where a rider on horseback chases, lassos, and then quickly ties three of the calf's legs together, aiming to complete the task in the shortest possible time while adhering to specific rules ensuring animal safety.","Calf roping involves a mounted cowboy quickly lassoing a calf's neck, dismounting, and restraining the calf by tying three of its legs together, all against the clock. 
The activity features a dynamic scene with a galloping horse, flying rope, and a calf being pursued and ultimately immobilized.","Calf roping involves sounds of horses galloping, ropes whizzing and tightening, calves bleating, crowd reactions, and occasional announcer commentary, alongside the clatter of gates and thuds of tackles.",,,,,,, +Camel ride,"A camel ride is a guided experience on the back of a camel, often in desert areas, where participants enjoy a leisurely pace while observing the landscape. It's a popular tourist activity that offers a unique way to explore natural scenery and experience traditional modes of transportation.","Individuals mount camels, sitting atop their humped backs, often with traditional saddles. Camels are led by guides across scenic landscapes, such as deserts with sand dunes, facilitating a slow and swaying gait as they walk in single file or small groups under the open sky.","Camel rides are often accompanied by the gentle, rhythmic sounds of the camel's padded feet on sand, the creature's distinctive grunts and chews, the creak of the saddle, soothing desert winds, and the occasional chatter or commands from the guide.",,,,,,, +Canoeing,"Canoeing is an outdoor activity where participants paddle a canoe using a single-bladed paddle. It involves navigating rivers or lakes for recreation or competition, offering a full-body workout and a chance to explore nature. Canoeing enhances teamwork and endurance, ranging from peaceful outings to thrilling white water adventures.","Canoeing features one or more individuals paddling a narrow, lightweight boat with pointed ends in water, using single-bladed paddles. 
Participants sit or kneel, facing forward in the canoe, which glides atop rivers, lakes, or seas, often amidst natural scenic beauty.","Canoeing typically entails sounds of gentle water lapping against the canoe's hull, rhythmic splashes of paddles dipping into the river, distant calls of birds or wildlife, occasional creaking of wood or shifting gear, and soft murmurs of conversation or silence amidst nature's tranquility.",,,,,,, +Capoeira,"Capoeira is a Brazilian martial art that fuses dance, acrobatics, and music. It is characterized by quick, intricate movements using power and speed for diverse kicks and spins. Developed by enslaved Africans in 16th-century Brazil, Capoeira is celebrated for its dynamic and fluid techniques.","Capoeira is a dynamic Afro-Brazilian martial art that blends dance, acrobatics, and music. Practitioners move fluidly; often executing spins, kicks, and flips to the rhythm of percussion instruments, embodying a flowing, dance-like fight with strong cultural aesthetics.","Capoeira, a Brazilian martial art, typically features rhythmic music with instruments like the berimbau, pandeiro, and atabaque. Chants and clapping accompany movements, enhancing the flow and interaction between practitioners. This sonic environment is integral, guiding the pace and style of this cultural dance-fight-game.",,,,,,, +Carving jack-o-lanterns,"Carving jack-o'-lanterns is a popular Halloween tradition where pumpkins are hollowed out, and faces or designs are cut into the surface. Candles or lights are placed inside to create a glowing effect. 
The practice is rooted in Irish folklore to ward off evil spirits.","Carving jack-o'-lanterns involves hollowing out pumpkins and cutting out faces or designs to create glowing lanterns when lit with candles inside, often featuring triangular eyes, a jagged smile, and an ambient orange glow.","Scratching and slicing sounds as knives cut through pumpkin flesh, the scoop scraping seeds and strands, occasional thuds when pieces are removed, and the squishy noise of hands removing the innards. Sometimes, there's light laughter or conversation if the activity is shared.",,,,,,, +Changing car wheel,"Changing a car wheel involves lifting the vehicle with a jack, removing the lug nuts, swapping the flat tire for a spare, securing the lug nuts back in place, and lowering the car. It's essential for roadside emergencies and requires a jack, lug wrench, spare tire, and basic safety knowledge.","A person crouches beside a car, removing lug nuts with a wrench. The car is lifted slightly by a jack. A spare wheel is ready nearby. The removed flat tire sits to the side, awaiting replacement. The person shows effort, focused on securely attaching the spare wheel to the car.","When changing a wheel, you can hear the clinking sound of a wrench against metal, the clicking of a jack, the thud of a tire hitting the ground, and other subtle sounds of disassembly and assembly.",,,,,,, +Cheerleading,"Cheerleading is an energetic activity combining gymnastics, dance, and stunts to lead audience cheers and support sports teams, while also competing in organized routines showcasing athletic skills, coordination, and teamwork. 
It's a performance-based sport that promotes spirit, enthusiasm, and athleticism among participants.","Cheerleading involves synchronized team routines with vibrant outfits, pompoms, and acrobatic stunts, including jumps, pyramids, and tumbling, often accompanied by spirited chants and cheers, designed to energize crowds at sports events.","Cheerleading auditory features include vocal chants, clapping, energetic music, sneaker squeaks on gym floors, pom-poms rustling, crowd reactions, coach shouts, and stunts resulting in thuds or team synchronization sounds.",,,,,,, +Chopping wood,"Chopping wood is a physical activity where a person uses a sharp tool, such as an axe, to split logs into smaller pieces, typically for firewood. It requires strength, precision, and safety precautions, serving both as a form of exercise and a practical way to prepare fuel.","A person swings an axe overhead, striking a log on a chopping block. Wood splinters with each chop, and stacked logs await nearby. The rhythmic motion continues as pieces are split and tossed aside to grow the pile of firewood.","Chopping wood may produce rhythmic thuds of the axe striking wood, cracking sounds as the wood splits, rustling leaves if done outdoors, and occasional grunts or exhales from the person exerting effort.",,,,,,, +Clean and jerk,"The clean and jerk is a dynamic Olympic weightlifting movement comprising two distinct phases: the ""clean,"" where the lifter hoists the barbell from the ground to the shoulders, and the ""jerk,"" in which the athlete explosively thrusts the barbell overhead, completing the lift with arms fully extended.","The clean and jerk involves lifting a barbell from the floor to the shoulders (clean), then thrusting it overhead with locked arms (jerk), typically in a split stance or squat position for stability. 
It's a dynamic, two-phase Olympic weightlifting movement showcasing power, coordination, and strength.","The ""clean and jerk"" is accompanied by sounds of heavy breathing, grunts from exertion, clanking of metal weights, the thud of the barbell hitting the platform, and possibly verbal cues from a spotter or coach.",,,,,,, +Cleaning shoes,"Cleaning shoes is the process of removing dirt, stains, and odors from footwear to maintain their appearance and hygiene. It involves using appropriate tools and cleaning agents suitable for the shoe material, and can extend their lifespan and enhance comfort.","A person brushes off dirt and wipes down shoes, sometimes applying polish or cleaner, then buffs them to a shine. Various tools like brushes, cloths, and sprays are typically used, alongside a mat or newspaper to protect surfaces.","Scraping and brushing sounds, water splashing, soap suds squelching, gentle tapping of shoes being banged together, bristles on surfaces during scrubbing, and the soft thud of shoes being set down to dry.",,,,,,, +Cleaning sink,"Cleaning a sink involves removing dirt, grime, and bacteria to maintain hygiene and aesthetics. It typically involves scrubbing the basin with a cleaner, rinsing, and possibly polishing fixtures to restore shine. Regular cleaning prevents build-up and keeps the sink sanitary and visually appealing.","Person scrubbing a sink basin with a sponge or brush, using cleaning spray or soap, water running, bubbles forming, and debris being washed down the drain. Surfaces transition from dirty to shiny and spotless as the person rinses and wipes down the sink's faucet and handles.","Splashing water, scrubbing bristles, clinking of dishes, running faucet, swooshing soap suds, metallic scraping (if sink is stainless steel), and the occasional clatter of utensils or cleaning tools.",,,,,,, +Cleaning windows,"Cleaning windows involves removing dirt, grime, and streaks from glass surfaces to improve transparency and aesthetics. 
It can involve washing with soap and water, using squeegees, cloths, or specialized cleaning solutions, and can be done both indoors and outdoors for better light and view.","A person wipes glass panes with a squeegee or cloth, often using soapy water or cleaner. Streaks vanish as they systematically move across the surface. Ladders or long poles may be used for high windows, with a clear, streak-free shine left behind as evidence of their task.","Squeaks from glass as squeegee glides, spritzing liquid sounds from spray bottles, dripping water, rustling of wiping cloths, clicking of extending handles, and occasional clanking of equipment against window frames.",,,,,,, +Clipping cat claws,"Clipping cat claws is a routine grooming process to prevent scratches and reduce damage to furniture. It involves carefully trimming the sharp tips of a cat's nails, using special clippers, while avoiding the quick to ensure the cat's safety and comfort. Regular clipping promotes healthy paws and behavior.","A person carefully holds a cat's paw, gently pressing to extend the claws. Using specialized pet clippers, they snip the sharp tips off each claw, avoiding the pinkish quick to prevent discomfort or bleeding, while the cat remains still or is gently restrained.","Clipping cat claws may involve the sound of the clipper's cutting mechanism, occasional feline vocalizations ranging from purring to hissing or meowing, and a possible soft click when the claw is trimmed. Background noises might include the cat's movements or rustling if restrained for the procedure.",,,,,,, +Cricket,"Cricket is a team sport involving batting and bowling where two teams of eleven players aim to score runs and dismiss opponents on an oval field, with a 22-yard pitch at its center. 
It's popular mainly in Commonwealth countries and has various formats like Test, One-Day, and Twenty20 matches.","Cricket features players in white uniforms on a grassy field, a flat pitch with stumps at each end, a bowler hurling a red ball, batsmen wielding flat bats, and fielders dispersed around to catch or chase the ball. The scene may include cheering spectators in a stadium or park.","Cricket is accompanied by the sharp crack of a bat striking the ball, the thud of the ball hitting the pitch or pads, the clatter of falling stumps, players' shouted appeals and calls between batsmen, the umpire's announcements, and applause or cheering from spectators.",,,,,,, +Croquet,"Croquet is an outdoor game where players use mallets to hit wooden balls through a series of hoops, or ""wickets"", embedded in a grass playing field, aiming to complete the course in a set sequence and finish by striking a central peg, combining strategy, skill, and precision.","Croquet involves players hitting wooden balls with mallets through hoops or ""wickets"" embedded in a grassy lawn, often dressed in traditional white attire for competitive play. 
The game features brightly colored balls, manicured lawns, and tactic discussions among participants, exuding a genteel, strategic, and leisurely aesthetic.","The click of mallet striking ball, the thud of balls colliding, players' calls and laughter, the rustle of mallets sweeping grass—these are auditory features one might hear during a game of croquet.",,,,,,, +Cumbia,"Cumbia is a lively Colombian dance and musical genre with African, Indigenous, and Spanish influences, characterized by its rhythmic percussion, melodic wind instruments, and swaying hip movements, often enjoyed at social gatherings and reflecting a rich cultural heritage.","Cumbia is a lively dance with couples swirling in colorful, rhythmic movements, often featuring traditional, vibrant outfits with flowing skirts and handkerchiefs, accompanied by the upbeat tunes of accordions, drums, and claves in a festive atmosphere.","Cumbia is characterized by rhythmic drum patterns, claves, shakers, and accordion melodies. Depending on the regional style, you might hear call-and-response vocals, brass, string instruments, and electronic sounds filling the festive, dance-evoking sonic landscape of this traditional Latin American music genre.",,,,,,, +Curling,"Curling is a team sport played on ice, where players slide stones towards a target area. Two teams take turns sliding heavy, polished granite stones down the ice curling sheet towards the house, a circular target marked on the ice. The objective is to have the stones closest to the center.","Curling involves teams sliding polished granite stones across ice towards a target area, with players sweeping the ice to influence the stone's path. The sport features circular scoring zones and competitors wearing special shoes for traction and gliding.","Curling involves the sound of sliding stones across the ice, the scraping of brooms briskly sweeping, shouted strategic commands from teammates, and the gentle clink as stones collide. 
The ambiance often includes the murmurs of the audience and the echo of activity within an ice rink.",,,,,,, +Cutting the grass,"Cutting the grass involves trimming the turf to a uniform height using mowers, keeping lawns neat and healthy and aiding in the control of weeds, pests, and diseases. Regular mowing also encourages lush, dense grass growth and enhances the aesthetic appeal of outdoor spaces.","A person pushes a lawn mower across a lawn, trimming the green grass to a uniform, shorter height, leaving behind freshly cut clippings and the distinct scent of mown grass. The mower's blades whirl, and straight or patterned lines appear where the mower has passed.","The activity ""cutting the grass"" typically includes the steady roar of a lawnmower engine, periodic whirring of the blades, occasional rattling over uneven terrain, and the softer rustle of trimmed grass falling. Higher-pitched squeaks or knocks may suggest mechanical issues with the mower.",,,,,,, +Decorating the Christmas tree,"Decorating the Christmas tree is a festive holiday tradition where families and friends adorn a tree with ornaments, lights, tinsel, and a star or angel topper, creating a centerpiece for Christmas celebrations, reflective of cultural customs and individual styles—combining nostalgia, creativity, and the spirit of joy.","Individuals adorn an evergreen with twinkling lights, colorful ornaments, tinsel, and a star or angel atop while surrounded by boxes of decorations, strands of lights, and scattered tinsel, imbuing the space with festive cheer.","Crinkling tinsel, rustling branches, soft clinks of ornaments, snippets of holiday tunes, laughter, the snap of string lights, and the occasional sound of something delicate being carefully placed or, sometimes, accidentally dropping.",,,,,,, +Disc dog,"Disc dog is a competitive and recreational activity where a handler and a dog work together to perform aerial stunts and catches with a flying disc. 
It showcases the dog's agility, speed, and coordination, as well as the handler's throwing skills, often set to music and judged on difficulty, accuracy, and showmanship.","Disc dog involves a dog leaping through the air to catch flying discs thrown by its handler. It's a dynamic display of agility and coordination, with dogs showcasing intense focus and athleticism against a backdrop of enthusiastic spectators. The vibrant discs add colorful flashes to the high-energy sport.","Disc dog events typically involve barks from excited canines, the whoosh of flying discs, cheers and commands from handlers, applause from spectators, and light-footed movements of dogs on grass as they leap and dash to catch frisbees. Soundscapes may vary with indoor or outdoor settings.",,,,,,, +Discus throw,"Discus throw is an ancient track and field athletics event where competitors hurl a heavy disc called a discus as far as possible. Athletes spin within a designated circle and release the discus with speed and precise technique, aiming to achieve maximum distance within marked sector boundaries.","An athlete spins rapidly within a circle and hurls a heavy, lenticular disc, aiming for maximum distance. The discus thrower combines strength and finely tuned technique, the discus arcing gracefully through the air before landing in a designated sector of the field.","Grunt or exhale from the athlete's effort, whir of the spinning discus, slap of feet against the ground, crowd reactions, and the thud of discus landing on the field.",,,,,,, +Dodgeball,Dodgeball is a team sport in which players on two teams try to throw balls at each other while avoiding being hit themselves. The objective is to eliminate opponents by hitting them with a ball or catching one they throw.,"Dodgeball involves players in two teams on opposite sides of a court, dodging and throwing rubber or foam balls at each other, with the aim to hit opponents. 
The sport is marked by rapid movement, dodges, throws, and occasional group strategies within the defined play area.","Dodgeball auditory features include the thud of rubber balls striking the floor or players, whistles blown by referees, players shouting for coordination or dodges, the buzzing of a timer, and often the squeak of gym shoes on the court surface.",,,,,,, +Doing a powerbomb,A powerbomb is a professional wrestling move where one wrestler lifts another onto their shoulders and then slams them down to the mat back-first. It is a show of strength and often used as a signature or finishing move in matches.,"A powerbomb is a wrestling move where an individual lifts the opponent on their shoulders and then slams them down onto the mat, back-first, often with the attacker squatting before the throw to maximize force.","The auditory features of a powerbomb, a wrestling move, may include the grunts or shouts of exertion, a loud slam as the recipient hits the mat, the reaction of a watching crowd (gasps, cheers, or winces), and possibly the referee's count or announcement following the move.",,,,,,, +Doing crunches,"Crunches are a core-strengthening exercise where one curls their upper body from a lying position, engaging the abdominal muscles to lift the shoulders off the ground. It is commonly used for toning the midsection and improving core stability.","An individual lies on their back with knees bent, feet flat on the floor, hands supporting the head. Engaging the core, they lift their shoulders towards the pelvis, crunching their abdomen, then lower back down. 
The movement is repetitive and focused, involving primarily the upper body.","While doing crunches, one might hear the rhythmic sound of breath exhaling forcefully on the contraction phase, a soft rustling of clothing or exercise mat, occasional grunts of exertion, and possibly the floor or equipment creaking slightly under the movement's strain.",,,,,,, +Doing fencing,"Fencing is a modern combat sport where two competitors duel with foil, épée, or sabre, scoring points by hitting their opponent. It demands precision, strategy, and athleticism, while following rules of movement, attack, and defense. Fencing is steeped in centuries-old swordsmanship traditions.","Two fencers in white protective gear, helmets, and gloves face off with épées, foils, or sabres. They execute agile lunges, thrusts, and parries on a narrow strip, aiming to score points with swift and precise movements.","Doing fencing features sounds of metal blades clashing, footsteps shuffling on the piste, fencers' breaths, electronic scoring beeps, referee commands, and occasional audience reactions.",,,,,,, +Doing karate,"Karate is a martial art originating from Okinawa, Japan, emphasizing self-defense, discipline, and striking techniques including punches, kicks, knee strikes, and elbow blows. Practitioners, known as karatekas, train in katas (forms), sparring, and conditioning for mental and physical development.","Someone doing karate typically wears a white gi (uniform) with a colored belt and performs sharp, precise movements such as punches, kicks, blocks, and stances, often accompanied by loud kiai (shouts) for focus and power.","Karate may involve sounds of sharp exhalations, kiai (shouts), snapping of gis (uniforms), thuds of bare feet on mats, impacts from strikes and blocks, and occasional dialogue between instructor and students, or among practitioners. 
Background may have rhythmic count or traditional Japanese music if practiced during training routines.",,,,,,, +Doing kickboxing,"Kickboxing is a high-energy martial arts discipline combining punches, kicks, and footwork, offering a vigorous full-body workout that improves strength, agility, and cardiovascular health, while also providing practical self-defense techniques.","Individuals wear gloves, performing punches and kicks in the air or on pads. They exhibit focused, swift, and controlled movements, with a mix of offensive and defensive stances, showcasing strength, stamina, and technique. Fitness and combat elements are combined in a high-energy, dynamic environment.","Rhythmic punches and kicks striking pads or heavy bags, the thud of gloves on targets, quick steps and shuffles on the mat, instructor commands, heavy breathing, and the occasional grunt of exertion or encouragement from fellow participants.",,,,,,, +Doing motocross,"Motocross is a high-adrenaline outdoor sport involving racing and stunt riding on off-road motorcycles over rough terrain, featuring jumps, sharp turns, and varied obstacles. Competitors aim for the fastest times or best performance on dirt tracks designed to challenge their speed, skill, and endurance.","Riders clad in colorful protective gear race on dirt bikes, leaping off ramps and navigating sharp turns amidst clouds of dust, on a rough track with hills and obstacles.","Motocross is characterized by the revving of high-powered engines, the roar of motorcycles speeding through rough terrain, punctuated by the sounds of jumps and landings, the occasional crunch of bikes colliding, and the buzzing crowd of spectators cheering on the riders.",,,,,,, +Doing nails,"Doing nails involves shaping, cleaning, polishing, and decorating fingernails and toenails to enhance their appearance. This beauty activity can include trimming, filing, applying nail polish or gel, and adding nail art or artificial enhancements like acrylics. 
It's a popular way to express personal style and maintain grooming.","A person carefully applies colorful polish on fingernails, perhaps with an array of brushes and bottles nearby. Shiny coats or intricate designs adorn the nails, and tools like files and cuticle pushers might be in use for shaping and preparing the nails for decoration.","Clipping, filing, and buffing create rhythmic scraping and clicking sounds. Brushes sweeping over nails make soft swishes, while shaking polish bottles yields a liquid sloshing noise. An electric nail drill hums during use. Occasional conversation with muted background music or a hairdryer can be part of the ambient sounds.",,,,,,, +Doing step aerobics,"Step aerobics is a cardio exercise combining rhythmic steps and music using an elevated platform, enhancing coordination, cardiovascular health, and lower body strength. It can be adjusted to various fitness levels by altering step height and choreography intensity, providing a dynamic and enjoyable workout that burns calories and improves stamina.","Individuals perform choreographed movements on and off a raised platform, often to the rhythm of music. Stepping up, down, and around the bench, they combine cardio and coordination exercises, sometimes using hand weights for added intensity.","""Doing step aerobics"" typically involves rhythmic sounds of feet tapping on a step platform, synchronized with up-tempo music. There's also the instructor's voice guiding movements, participants' synchronized steps, occasional clapping, and the sound of deep, controlled breathing from exerted participants.",,,,,,, +Drinking beer,"Drinking beer is a social and cultural activity where individuals consume beer, a fermented alcoholic beverage made from grains, often for leisure, to unwind, enjoy flavors, and foster social connections. 
It is widely enjoyed globally and is often accompanied by food, games, and conversation.","A person tilts a glass or bottle, sipping the amber-to-golden liquid with a frothy head, possibly relaxing or socializing, with beads of condensation marking the container's surface.","The pop of a bottle or can, the fizz of carbonation, and the pour into a glass create a soft cascade. Glasses clink for a toast, followed by sipping and swallowing amidst relaxed conversation and laughter. Ambient bar or party noise accompanies the thud of setting down a glass.",,,,,,, +Drinking coffee,"Drinking coffee is a popular daily ritual where one consumes a brewed beverage made from roasted coffee beans, known for its stimulating effect due to caffeine, rich aroma, and varied flavors, often enjoyed for its ability to enhance alertness and sociability.","A person holds a mug, steam rises from the dark liquid. They sip, often with a relaxed demeanor, enjoying the warmth and aroma. The coffee might sit on a saucer, and occasionally there's a spoon, sugar, or cream on the table.","Drinking coffee could involve the sounds of a cup clinking against a saucer, gentle slurping, the ceramic clank when setting down the cup, stirring clinks from a spoon, the sizzle of poured hot coffee, and quiet sighs of contentment after sipping.",,,,,,, +Drum corps,"Drum corps is a competitive form of marching ensemble, known for its precision, musicality, and high-energy performances. It combines brass instruments, percussion, and color guard elements to create intricate field shows. Participants often train rigorously and perform in nationwide competitions during the summer season.","Drum corps involves uniformed musicians marching in precise formations with brass instruments, percussion, and color guard. They perform choreographed routines with dynamic, rhythmic music, often incorporating elaborate flag work, rifle tossing, and vivid costumes. 
The spectacle is colorful, energetic, and visually synchronized to the musical performance.","Drum corps performances feature precise, rhythmic percussion patterns with varying dynamics, melodic brass accompaniment, and color guard effects creating a rich, multi-layered soundscape of intense musical arrangements designed for competitive and exhibition events, often characterized by a high level of musical and marching coordination.",,,,,,, +Elliptical trainer,"The elliptical trainer is a low-impact exercise machine that simulates walking, running, or stair climbing without causing excessive pressure on the joints, thus decreasing the risk of impact injuries. It provides a cardiovascular workout, engaging multiple muscle groups simultaneously through smooth, elliptical motion.","An individual stands on pedals, grasps handles, and glides feet back-and-forth in an elliptical motion while arms push and pull in sync, simulating walking or running with less impact.","Whirring of machine, rhythmic thumping of feet, soft hum of rotating components, occasional squeaks of joints or bearings, steady breathing patterns, metallic clinking from pulse sensors or bottle holder, background music or audio from headphones, and the faint beep of control panel as settings are adjusted.",,,,,,, +Fixing bicycle,"Fixing a bicycle involves diagnosing issues, repairing or replacing parts like tires, chains, or brakes, and ensuring the bike is safe and functional for riding. It requires tools and mechanical knowledge and can range from simple tune-ups to complex overhauls.","A person is bent over a bicycle, tools in hand, adjusting gears, aligning wheels, or repairing a tire. 
Parts, screws, and a bike pump might be visible nearby, with focus and concentration evident in the individual's demeanor.","Clicking of gears, whirring of chain, hiss of tires inflating, clanging of tools, scraping of brushes cleaning, clinking of metal parts, snapping of cables, occasional grunts of effort.",,,,,,, +Fixing the roof,"Fixing the roof involves assessing damage, removing old materials, and installing new shingles or tiles to restore the integrity of the roof, protecting a building from weather-related damage. It requires safety measures and skilled labor to ensure the longevity and durability of the roofing structure.","Person on a ladder or rooftop, using tools like hammers or nail guns, replacing shingles or tiles, wearing safety gear like gloves, harness, and helmet, with materials around them such as new shingles, flashing, and debris from old roofing.","Hammering nails, sawing wood, footsteps on shingles, scraping, peeling, application of sealant, conversations between workers, creaking boards, power tools whirring, materials being moved, occasional debris falling.",,,,,,, +Fun sliding down,"""Fun sliding down"" is an exhilarating activity where participants enjoy the thrill of descending down slides or slopes, often found at water parks, playgrounds, or snowy hills, creating joyful memories fueled by speed and laughter, suitable for all ages.","Individuals gleefully descend a smooth, inclined surface, like a slide, their faces alight with joy and excitement as they swoop downwards, some with arms raised, against a backdrop of vibrant colors or natural scenery, showcasing motion and the thrill of the swift, smooth glide to the bottom.","The activity of sliding down typically produces sounds of whooshing due to rapid movement through air, joyful screams or laughter from participants, and potentially a thud or softer impact when landing at the end of the slide. 
The material of the slide may create additional friction noises.",,,,,,, +Futsal,"Futsal is a fast-paced, small-sided soccer game, played indoors on a hard court with five players per team. Originating in South America, it emphasizes ball control, creativity, and technical skill, utilizing a smaller, low-bounce ball in a confined space to enhance close-quarter gameplay and quick decision-making.","Futsal features two teams of five players, including goalkeepers, on a hard court smaller than a football pitch, bounded by lines. Players use a smaller, low-bounce ball, displaying close ball control, rapid passes, and frequent goal attempts with swift, agile movements, in a fast-paced, indoor soccer-like environment.","Futsal's auditory features include the echoing bounce of a heavier ball on a hard surface, quick short passes, referees' whistles, players' vocal communication and shouts, the thud of the ball hitting the walls or goals, and the cheers and reactions of an enclosed, often intimate spectator crowd.",,,,,,, +Gargling mouthwash,"Gargling mouthwash is a hygiene activity involving swishing liquid around the mouth and throat to clean, freshen breath, and potentially reduce oral bacteria, followed by spitting it out.","A person tilts their head back, takes a swig of mouthwash, and vigorously swishes it, puffing their cheeks. Bubbles form as they gargle, occasionally grimacing at the strong flavor, before spitting it out.","Gargling mouthwash produces a bubbling liquid sound as air passes through the mouthwash, a periodic gargle or swishing noise, often followed by a spitting sound when the mouthwash is expelled, and possibly a brief sigh of freshness or relief from the person after completion.",,,,,,, +Getting a haircut,"Getting a haircut involves trimming and styling hair on the head and, sometimes, the face. 
A professional hairstylist or barber uses tools like scissors, clippers, and combs to achieve the desired look, ranging from simple cuts to complex styles, refreshing one's appearance and maintaining hair health.","A person sits in a chair while a hairstylist, armed with scissors and comb, snips and styles their hair; locks of hair fall to the ground as the customer's hairstyle transforms. Mirrors reflect the progress, and there may be hair care products and tools like clippers and blow dryers in use.","The snip of scissors cutting hair, the buzz of electric clippers, the spray from a water bottle, hair rustling, conversations with the barber or stylist, background music or magazine pages turning, occasional laughter or phone ringing, the swish of a cape being removed, and the whoosh of a hairdryer.",,,,,,, +Getting a piercing,"Getting a piercing involves puncturing a part of the body to insert jewelry, often for fashion or self-expression. Performed by professionals in sterile environments, it ranges from ears to noses, navels, and more, and requires proper aftercare to heal and prevent infections.","An individual sits or lies down as a piercing professional cleans the designated area, marks the spot for precision, and uses a sterilized needle or piercing gun to insert jewelry through the skin, often accompanied by brief discomfort and subsequent aftercare instructions.","During a piercing, one might hear the buzz of sterilization equipment, the clinician's gloves snapping, calming background music, the sharp click of the piercing instrument, and possibly a sharp intake of breath or a quiet vocal reaction from the person being pierced.",,,,,,, +Getting a tattoo,"Getting a tattoo involves inscribing a design onto the skin using needles to insert ink permanently, usually as a form of body art or personal expression. 
It's performed by skilled artists and requires consideration of design, placement, pain tolerance, and care during the healing process.","An individual sits or lies down while a tattoo artist, wearing gloves, uses a buzzing tattoo machine to carefully ink a design into their skin, which may show redness. Various colored ink bottles and sterilized equipment are visible. The area being tattooed is often wiped clean regularly.","Buzzing needle, soft hum of the tattoo machine, occasional paper rustling, the artist's gloves snapping, client's sharp intakes of breath, faint background music, and intermittent conversation between artist and client.",,,,,,, +Grooming dog,"Grooming a dog involves cleaning and hygienic care, which can include brushing, bathing, hair trimming, nail clipping, and ear cleaning. Regular grooming maintains a dog's health and appearance, and also provides an opportunity to check for signs of skin issues or parasites.","A person brushes or combs a dog's fur, trims it with scissors or clippers, often while the dog sits or stands calmly, sometimes on a grooming table with various grooming tools visible (brushes, shampoos, nail clippers). The environment is organized, with a focus on the dog's cleanliness and neat appearance.","Grooming a dog involves clipping nails with a sharp snip, splashing water and shampooing, and brushing with soft strokes. Scissors trim fur with cutting sounds, and hair dryers hum constantly. Dogs may pant contentedly or whine anxiously.",,,,,,, +Grooming horse,"Grooming a horse is the process of cleaning and caring for a horse's coat, mane, tail, hooves, and overall body. It promotes health, fosters bonding between horse and handler, and prepares the animal for riding or showing by removing dirt, mud, parasites, and shedding hair.","A person uses brushes and combs to clean a horse's coat, mane, and tail, often while the horse is tethered. Dirt and debris are removed, leaving the horse's hair smooth and shiny. 
Hooves are also picked clean. The process involves close physical interaction, reflecting care and attentiveness.","Soft snorts, steady hoof scrapes, swishes of a brush or curry comb through coarse hair, rhythmic strokes, the jingle of buckles as tack is adjusted, occasional whinnies, leather creaks, and the rustle of hay or straw underfoot.",,,,,,, +Hammer throw,"Hammer throw is a track and field event where athletes compete to throw a heavy metal ball attached to a grip by a steel wire as far as possible. Technique, strength, and coordination are crucial in this Olympic sport requiring athletes to whirl the hammer in a circular motion before release.","An athlete spins inside a circle, gripping a wire-attached heavy ball (hammer), releasing it to soar through the air, landing within a marked field sector. The thrower wears gloves and boots while maintaining balance and coordination to achieve maximum distance within typically four to six allocated attempts.","The hammer throw produces rhythmic whooshing sounds from the rotating hammer, punctuated by the grunt of the athlete's exertion, culminating in a sharp thud as the hammer hits the ground at a distance.",,,,,,, +Hand car wash,"Hand car wash is a manual cleaning service for vehicles where trained workers meticulously wash, wax, and dry cars by hand, often providing personalized attention to detail and using specialized tools and products to ensure a thorough clean without the risk of damage that can occur with automated systems.","Individuals manually scrub and rinse vehicles using sponges, cloths, hoses, and buckets of soapy water, often in an outdoor or open-air facility, with signs advertising the service. 
Cars are wiped down and dried with towels, leaving a gleaming finish.","Splashing water, bristles scrubbing against metal, the hiss of a pressure washer, sudsy swishes, intermittent spraying, dripping, occasional clanking of tools, footsteps on wet ground, ambient traffic noise, and casual conversation between workers or with customers.",,,,,,, +Hand washing clothes,"Hand washing clothes is a traditional method of laundering that involves cleaning garments by manually scrubbing and rinsing them in water, typically using soap or detergent. This process is often used for delicate items or when a washing machine is not available.","Submerging and scrubbing garments in water with soap, hands vigorously agitate fabric, creating soapy suds; clothes are twisted and squeezed to remove dirt; garments are then rinsed and wrung out to eliminate suds and excess water, often laid out or hung to dry.","Splashing water, scrubbing sounds, fabric rubbing against itself, rhythmic movements in water, occasional drips, and the squeezing or wringing of wet clothing.",,,,,,, +Hanging wallpaper,"Hanging wallpaper involves applying decorative paper to walls using adhesive. 
It's done by preparing surfaces, cutting paper to size, and carefully aligning patterns before smoothing out bubbles and edges for a finished look.","An individual measures and cuts strips of decorative paper, applies adhesive to the back, and carefully aligns them on a wall, smoothing out any bubbles or wrinkles with a brush or tool, transforming the wall's appearance with a new pattern or texture.","Rustling of paper, tearing sounds, sloshing and splashing of adhesive, the scrape of tools smoothing surfaces, occasional tapping or thumping aligning panels, and the click of cutters trimming edges.",,,,,,, +Having an ice cream,"Having an ice cream involves selecting and consuming this frozen dessert, which is typically made from dairy and sugar, enjoyed worldwide in various flavors, often served in cones or cups.","A person holds a cone with a swirl of creamy ice cream on top, possibly dotted with colorful sprinkles. They take a joyful lick or bite as the ice cream drips slightly under the warmth of the sun.","Enjoyment of an ice cream may involve sounds of a wrapper or container opening, the tapping of a spoon, the distinctive sound of scooping, soft slurping or licking, occasional contented sighs or exclamations, and ambient noises of the environment where the ice cream is being enjoyed.",,,,,,, +High jump,"High jump is an athletic track and field event where competitors leap over a horizontal bar set at measured heights without dislodging it. Athletes run up to the bar and jump using techniques like the Fosbury Flop, striving for maximum height. 
It requires strength, agility, and precise timing.","An athlete sprints towards a bar set high above the ground, takes a leap, arches their back mid-air to clear the bar without knocking it, and lands on a cushioned mat.","The rhythmic approach run's footsteps, the rustle of sportswear, a brief grunt during take-off, the swoosh of clearing the bar, the landing pad's cushioned thump, and occasional cheers or claps from onlookers.",,,,,,, +Hitting a pinata,"Hitting a piñata involves blindfolded participants taking turns to swing a stick or bat at a colorful, paper-covered clay or cardboard container, often shaped like an animal or character, to break it open and release the candy or small toys within during celebrations such as birthdays or festivals.","Blindfolded individual, swinging a stick at a suspended, colorful paper-mache figure, surrounded by expectant onlookers anticipating candy and treats to burst forth.","Hitting a piñata involves cheerful chants and cheers from onlookers, intermittent whacks from sticks, rustling paper or fringes, and the burst of candy and toys showering down, accompanied by excited squeals and laughter when the piñata breaks.",,,,,,, +Hopscotch,"Hopscotch is a playground game where players toss a small object into numbered spaces drawn on the ground and hop through the spaces to retrieve it, balancing on one foot. It's a classic children's game that combines skill, physical coordination, and strategy.","Hopscotch involves a series of numbered squares drawn on the ground. Players hop on one leg into each square, skipping the square with a marker in it, and must complete the course. The design is typically linear or with a few lateral squares, made with chalk or paint.","Hopscotch typically involves the rhythmic tapping of shoes against pavement, the occasional thud of a stone or beanbag, children's voices counting, laughter, and the occasional exclamation of excitement or disappointment during play. 
These sounds vary in intensity and frequency, depending on the number of participants and the playing surface.",,,,,,, +Horseback riding,"Horseback riding is a sporting and recreational activity where riders mount horses and guide them at various paces. It can include disciplines like dressage, show jumping, and trail riding. Beyond sport, it fosters a bond between horse and rider and requires skill, balance, and communication for proper equestrianism.","An individual sits astride a horse, holding reins for direction and balance. They wear a helmet and appropriate attire. The horse moves through open landscapes or trails, trotting, cantering, or galloping, muscles rippling, mane flowing with each stride, as rider and animal move in synchronized motion.","Clopping hooves, snorting, neighing horses, jingling tack, leather creaks, soft thuds on earthen trails, rustling foliage, riders' voices, and occasional whinnies echoing in the environment are common auditory features of horseback riding.",,,,,,, +Hula hoop,"Hula hooping is a fun physical activity involving the rotation of a large hoop around one's waist, limbs, or neck. Typically performed for exercise, dance, or play, it improves coordination, strengthens core muscles, and can be both a solo and group activity promoting rhythm and creativity.","A performer gyrates their hips to spin a large, colorful circular ring around their waist, maintaining a rhythmic, circular motion to keep the hoop from falling to the ground.","While hula hooping, one might hear the rhythmic swishing or whooshing of the hoop circling around, occasional soft thuds as it taps the body, and the light clattering sound if the hoop drops to the ground. There may also be laughter or music if the activity is recreational.",,,,,,, +Hurling,"Hurling is a fast-paced, traditional Irish field sport, where players use a wooden stick called a hurley to hit a small ball, the sliotar, between the opposing team's goalposts. 
It's known for its high speed, physicality, and skill, often referred to as the ""fastest game on grass.""","Hurling is a fast-paced field sport with players wielding curved wooden sticks called hurleys, using them to hit a small ball (sliotar). They wear helmets, jerseys, shorts, and cleats. The action features swift, sweeping motions, aerial duels, and dynamic runs across a grassy pitch marked with goalposts.","Hurling, an Irish team sport, features the clack of wooden hurleys striking sliotars (balls), players' shouts, referee whistles, and the roar of cheering crowds. Each contact and vocalization contributes to the dynamic soundscape characteristic of this fast-paced, ancient Gaelic game.",,,,,,, +Ice fishing,"Ice fishing is a winter angling practice where individuals catch fish through holes drilled in the frozen surfaces of lakes and ponds, using lines with hooks and often sheltered by temporary structures called ice shanties to protect from the cold.","Ice fishing involves anglers sitting or standing by holes cut into a frozen lake's surface, often with portable shelters or stools, surrounded by snow and ice, using rods or tip-ups to catch fish in the frigid water below. Gear, buckets, and augers are common sights.","Auditory features of ice fishing may include the crisp cracking of ice, the whir of a manual or powered auger drilling, plopping of bait into water, gentle splashes, occasional fish flopping, the wind's howl, muffled chatter, and the subtle creaking of a fishing stool on the ice.",,,,,,, +Installing carpet,"Installing carpet involves measuring the room, cutting the carpet to fit, attaching tack strips and underpad, stretching the carpet with a knee-kicker or power stretcher, and securing it around the perimeter for a smooth, finished floor covering. 
It requires tools and attention to detail for a professional look.","Individuals unroll and smooth large swathes of fabric over a floor's surface, using tools like knee kickers and carpet tuckers to stretch the material and secure it along edges and corners, often trimming excess with a utility knife to ensure a snug, even fit.","Sounds of footsteps and movement, cutting and tearing of carpet and padding, banging of a knee-kicker, thumping of a carpet stretcher, snapping of tack strips, rustling of tools, and occasional communication between installers.",,,,,,, +Ironing clothes,"Ironing clothes is a domestic chore involving the removal of wrinkles and creases from fabric using a heated iron. The process smooths fabrics, giving garments a crisp and polished appearance, often after washing and drying. Different materials require specific heat settings to avoid damage.","A person stands at an ironing board, running a hot, flat iron over wrinkled fabric to smooth it. Steam rises as the iron presses against the clothes, creases vanish, and the scent of warm, clean linen fills the air. The garment gradually becomes crisp and neat.","The sound of steam hissing from the iron, the faint creak of the ironing board, the rhythmic glide of the iron moving over fabric, occasional bursts of water spray, and the quiet background noise of clothes shuffling as they're straightened and adjusted on the board.",,,,,,, +Javelin throw,"Javelin throw is an Olympic event where athletes run to gain momentum and hurl a spear-like javelin for maximum distance, staying within sector lines. Success depends on technique, strength, and aerodynamics.","An athlete sprints briefly before hurling a long, slender spear (javelin) as far as possible into a marked sector on a grass field, seeking both distance and accuracy. 
They exhibit a blend of strength, technique, and coordination, punctuated by the dynamic, extended pose of the release.","In javelin throw, you may hear the whoosh of the javelin cutting through the air, the grunt or exhale of the athlete during the throw, the thud as it strikes the ground, and possibly the cheers and applause of spectators if the throw is particularly impressive or achieves a significant distance.",,,,,,, +Kayaking,"Kayaking is a versatile watersport where individuals paddle across water in a small, narrow watercraft called a kayak. It can range from serene lake paddling to navigating challenging whitewater rapids, suiting both peaceful explorations and adrenaline-fueled adventures.","Kayaking features individuals seated in small, narrow watercraft, paddling with double-bladed oars, navigating rivers, lakes, or oceans. Their vessels, called kayaks, are sleek and often colorful, hugging the water's surface as they glide through varied aquatic environments, often amidst natural scenery or in urban waterways.","Kayaking can include sounds of paddles swooshing through water, splashes when entering or exiting the kayak, gentle waves lapping against the hull, wildlife calls nearby, and the rhythmic creak of the vessel moving with the rower's efforts.",,,,,,, +Kite flying,"Kite flying is a leisure activity where a kite—a lightweight frame covered with fabric or paper—is flown in the air by controlling a string attached to it from the ground, often requiring skill to maneuver and taking advantage of wind currents for lift and aerial acrobatics.","Kite flying involves a colorful kite soaring and dipping in the sky, tethered by a string to a person below, who guides it with hand movements against a backdrop of clouds, with the kite's tail fluttering gracefully.","The whoosh of wind rustling through the kite's material, the steady hum of the string as it cuts through the air, the distant laughter and chatter of those around, and perhaps the faint flapping of 
the kite's tail if it has one.",,,,,,, +Kneeling,"Kneeling is a common posture where one or both knees touch the ground. It can be a form of exercise, a position for prayer or meditation, a respectful gesture, a restful pose, or a functional stance for tasks close to the ground.","In the kneeling position, a person is upright on their knees, with the tops of their feet flat against the ground, buttocks resting on or hovering above the heels, and torso vertical, often used for prayer, submission, or rest.","Kneeling may produce soft sounds of clothing fabric stretching or brushing against a surface, creaks or groans from joints, and possibly a gentle thud if performed on a non-cushioned floor. The person may exhale audibly while moving into the position.",,,,,,, +Knitting,"Knitting is a craft in which yarn is manipulated to create fabric or textiles, typically using long needles to form loops and stitches. It can be a relaxing hobby and is used to make clothing, accessories, and home decor.","Knitting involves looping yarn with needles to create a textile. Fingers manipulate the needles, yarn intertwines, and a fabric pattern emerges. Stitch rows build upon each other, forming a coherent structure, often accompanied by a rhythmic motion of hands.","Knitting's auditory features include a soft, rhythmic clicking of needles, gentle rustling of yarn, and occasional snipping sounds from scissors cutting threads. 
These create a calm, repetitive soundscape indicative of the craft's steady, methodical nature.",,,,,,, +Laying tile,"Laying tile is the process of installing tiles on floors or walls, involving preparing the surface, cutting tiles to fit, spreading adhesive, setting tiles, and applying grout to seal the spaces between them, which creates durable and aesthetic coverings.","The activity ""laying tile"" involves placing square or rectangular pieces of ceramic, porcelain, or stone onto a prepared adhesive-covered surface in a precise, tightly-spaced pattern, followed by grouting between the tiles to ensure a smooth, even finish.","Laying tile often involves sounds of scraping as adhesive is applied, the tapping of a rubber mallet to set tiles in place, occasional cutting or snapping noises from trimming tiles, and the clinking of spacers being inserted between tiles to ensure even spacing.",,,,,,, +Layup drill in basketball,"A layup drill in basketball is a foundational practice routine where players repetitively practice layups, driving towards the hoop to shoot close-range, high-percentage shots often using the backboard, to improve footwork, timing, and finishing abilities under the rim.","Players line up, take turns driving towards the basketball hoop, performing a layup shot, retrieving their ball, and rejoining the line. Continuous motion with players dribbling, shooting off the backboard, and scoring close-range baskets, typically alternating between left and right-handed layups.","Bouncing balls, squeaking sneakers on the court, player communication (calls, shouts), swish of the net, occasional claps, coach instruction, and possibly the reverberation of the gym.",,,,,,, +Long jump,The long jump is a track and field event where athletes sprint down a runway and leap as far as possible from a takeoff board into a sandpit. 
Success is measured by the distance covered from the board to the nearest mark made in the sand.,"An athlete sprints down a runway and leaps horizontally into a sandpit from a wooden take-off board, aiming to cover the greatest distance possible. The jump is measured from the board to the nearest mark in the sand made by any part of the jumper's body.","A long jump activity typically features the rhythmic run-up of the athlete's feet on the track, the sound of heavy breathing, the whoosh of air as they leap, the thud upon landing in the sand pit, and occasional cheers or instructions from coaches and spectators.",,,,,,, +Longboarding,"Longboarding, a skateboarding variant, involves riding a longer board with larger, softer wheels, enabling smooth movement and higher stability. It's popular for cruising, downhill racing, and performing tricks. Longboarding combines balance, coordination, and thrill, appealing to those seeking a relaxed ride or an adrenaline-pumping experience.","Longboarding features a rider gracefully maneuvering on a longer, wider skateboard, usually cruising, carving or downhill racing on urban or mountainous roads with sweeping turns and occasional stunts, displaying balance and control.","Longboarding generates rhythmic rolling sounds of wheels on pavement, punctuated by scrapes during turns or tricks. Wind noise increases with speed and foot friction creates intermittent scraping when pushing off or braking. Board flex may produce subtle creaks on rough surfaces or during rider weight shifts.",,,,,,, +Making a cake,"Making a cake involves mixing ingredients like flour, sugar, eggs, and butter, then baking the batter in an oven until it rises and sets. 
It's a creative cooking activity that often culminates in decorating the finished product with frosting, fondant, or fruits to make it both visually appealing and delicious.","Mixing batter in a bowl; pouring it into cake pans; a rising cake in an oven; spreading frosting on cooled layers; decorating with icing, fruit, or sprinkles; vibrant colors of ingredients and finished product; an overall messy yet creative and delightful culinary process.","Whirring mixer blades, tapping of utensils, crackling eggshells, rustling of ingredient packages, pouring liquids, clinking of glass or metal bowls, beep of a timer, preheating oven's hum, and the final ding of an oven indicating that the cake is baked.",,,,,,, +Making a lemonade,"Making lemonade involves juicing lemons, combining the juice with sugar and water, then stirring until the sugar dissolves. This refreshingly simple beverage can be customized to taste and served cold for a classic, thirst-quenching summer drink.","A person squeezes lemons, pours juice, water, and sugar into a pitcher. They stir the mixture, taste-testing and adjusting for sweetness. Ice clinks as it's added. The liquid is a pale yellow, and condensation forms on the glass pitcher under a sunny backdrop, suggesting a refreshing, cool beverage.","Slice lemons and juice them. Pour water, add ice cubes, and stir, enjoying the clinking sounds. If desired, add carbonated water for fizz. Finish with a refreshing sip, possibly followed by a satisfied “Ahh.”",,,,,,, +Making a sandwich,"Making a sandwich involves layering ingredients such as meats, cheeses, vegetables, and spreads between slices of bread to create a portable, customizable meal that can range from simple to gourmet depending on one's taste preferences and the components used.","Two hands layer ingredients like meat, cheese, vegetables, and condiments between slices of bread. 
Varied textures and colors stack neatly until the sandwich is complete, then it's often sliced diagonally, revealing the cross-section of the layered fillings.","Slicing bread, rustling of packaging, clinking of utensils on plates, spreading condiments, crunchy chopping of vegetables, meats, or cheeses, and the wrapping or unwrapping of ingredients.",,,,,,, +Making an omelette,"Making an omelette involves beating eggs, pouring them into a hot pan, and cooking until set. Ingredients like cheese, vegetables, or meats are often added before folding the omelette over and serving. It's a quick, versatile meal that can be enjoyed for breakfast, lunch, or dinner.","Cracking eggs into a bowl, whisking vigorously. The mix sets at the edges, stirred gently. Fluffy semi-solid mass forms, perhaps filled with diced tomatoes, onions, greens. Edges fold over, encasing fillings; a yellow, crescent-shaped delicacy emerges, steaming and appetizing.","Cracking of eggs, sizzle and bubble as eggs hit the hot pan, clinking of a spatula or whisk, light scraping sounds stirring and flipping, occasional sputtering of oil or butter, timer ding or chef's triumphant ""Done!"" upon completion.",,,,,,, +Mixing drinks,"Mixing drinks involves combining different liquids, typically alcoholic beverages with mixers, to make cocktails. It requires knowledge of ingredients, proportions, and techniques, such as shaking or stirring, to achieve balanced and flavorful concoctions. 
Barware like shakers, jiggers, and strainers are also essential tools for this activity.","Pouring various liquids from bottles into a shaker or glass, often with ice; stirring or shaking; straining into a serving glass; garnishing with fruit or herbs; vibrant colors layering or blending together.","The activity ""Mixing drinks"" may involve the clinking of ice cubes, the sound of liquid pouring, shaker rattles, stirring sounds, the tap of metal on glass, and the sealing or opening whoosh of bottle caps and corks.",,,,,,, +Mooping floor,"""Mooping"" is likely a typo or colloquial mash-up of ""mopping,"" an activity involving cleaning a floor by using a mop to wet-wash it, usually with a combination of water and detergent, to remove dust, dirt, and stains, ensuring the area is neat and hygienic.","A person sweeps and scrubs the floor with a mop, using rhythmic back-and-forth strokes, often wringing out excess water, leaving a trail of glistening floor behind as it gradually dries to a clean shine.","Sloshing water, squelching mop, rhythmic swishing across the floor; occasional splashing; bucket handle creaks; footsteps; and the distinct squeaky-clean sound on the final pass.",,,,,,, +Mowing the lawn,"Mowing the lawn involves cutting the grass in a garden or yard to a uniform, tidy length using a lawn mower. 
This regular maintenance keeps outdoor spaces neat, promotes healthy grass growth, and deters pests.","A person pushes a lawn mower across a grassy area, leaving behind neat, even strips of freshly cut grass, while trimmed clippings are either collected in a bag or dispersed across the lawn.","The auditory features of mowing the lawn include the steady roar of the mower engine, periodic chugging sounds, the slicing noise of blades cutting grass, and occasional rustling when moving over uneven terrain or through thicker patches of vegetation.",,,,,,, +Paintball,"Paintball is a competitive team shooting sport where players eliminate opponents by hitting them with dye-filled, breakable, oil and gelatin paintballs shot from a special paintball gun called a marker. It emphasizes teamwork, strategy, and quick thinking, often played on a course with natural or artificial terrain for tactical cover.","Paintball is characterized by players in protective gear wielding air-powered guns, shooting capsules of colorful, washable gelatin filled with paint, amidst natural or artificial terrain with obstacles used for cover. It's a vibrant, fast-paced activity often resulting in splatters of bright paint against gear and the surrounding objects.","Paintball games feature rapid bursts of gunfire from markers, high-pitched 'splat' sounds upon impact, muffled commands among teammates, rustling from movement in underbrush or obstacles, occasional whistles for game starts/ends, and the release of pressurized air or CO2 during firing.",,,,,,, +Painting,"Painting is the art of applying pigment to a surface, like canvas or paper, using tools such as brushes to create images and express ideas. 
It's a form of visual expression with historical and cultural significance, ranging from realism to abstraction across various mediums and techniques.","An individual holds a brush, applying colorful strokes to a canvas or wall, surrounded by paint containers, palettes, and possibly drop cloths to protect surroundings. The developing image reveals a blend of hues, shapes, and textures that evolve with each brush movement.","Scraping sounds of brushes or palette knives on canvas, swishing sounds of brush strokes, dipping into water or solvents, clinking of glass jars or metal paint tubes, rustling of paper towels or cloths, occasional sighs or sounds of concentration from the painter, subtle background music or environmental noises.",,,,,,, +Painting fence,"Painting a fence involves applying a protective and decorative coating to the surface of wooden, metal, or other material fences using brushes, rollers, or sprayers, often as a DIY home improvement or maintenance task to enhance curb appeal and preserve the material from weathering and rust.","A person brushes or rolls paint onto a vertical wooden fence, coating the planks in fresh paint. Drips may run down the wood's surface while the paint's color revives the fence's appearance, transforming it from weathered to vibrant.","Brush strokes against wood, dipping brush in paint, occasional scraping for prep work, rustling of tarp or drop cloth, stirring paint in a can, sounds of nature if outdoors, and possibly the faint sound of footsteps pacing along the fence line.",,,,,,, +Painting furniture,"Painting furniture involves applying paint or varnish to revitalize or change the appearance of old or plain furniture, often using techniques to create a specific style or finish, such as distressing or stenciling, to enhance a piece's aesthetic and protect its surface.","A person sands down wooden furniture and applies paint methodically with brushes or rollers, covering the surface in smooth, fresh color. 
Tarp or newspaper is often laid out to protect the floor while paint cans, sandpaper, and other tools lie nearby. The updated piece transforms as it dries.","While painting furniture, one may hear the soft bristles of a brush swooshing against wood, the occasional dip and swirl in the paint can, the clinking of tools, the sticky sound of tape being applied for clean edges, and the faint rustle of drop cloths adjusting underfoot.",,,,,,, +Peeling potatoes,"Peeling potatoes is a common kitchen task involving the removal of the outer skin from potatoes using a knife or a vegetable peeler before they are used in cooking various dishes like mashed potatoes, fries, or stews to enhance texture and appearance.","A person holds a potato in one hand and a peeler or small knife in the other, scraping or cutting away the outer skin to reveal the white flesh underneath, often with a growing pile of peelings beside them on a table or cutting board.","The activity of peeling potatoes typically includes the sound of the peeler scraping and slicing through the potato skin, the occasional snapping sound of a potato being cut into, and the thud of peeled potatoes dropping into a bowl or water. There may also be intermittent rustling as potatoes are handled.",,,,,,, +Ping-pong,"Ping-pong, also known as table tennis, is a fast-paced sport where two or four players hit a lightweight ball back and forth using small paddles on a hard table divided by a net. It emphasizes agility, reflexes, and strategy, providing a fun and competitive aerobic activity for all ages.","Two players face off across a small table, hitting a lightweight ball back and forth with small paddles. A net divides the table, and the game is played with fast, sharp movements. 
The ball moves quickly, and players remain alert, ready to respond to rapid volleys.","Ping-pong auditory features include the rhythmic bouncing of the lightweight ball, the sharp click of ball contact with paddles, the sound of play on the table, and potential verbal exchanges between players. Environmental echoes may vary with venue acoustics.",,,,,,, +Plastering,"Plastering involves applying layers of plaster onto an interior wall or ceiling to achieve a smooth or textured surface. It prepares walls for painting or wallpapering, providing durability and a finished aesthetic. This construction technique requires skill to mix and apply the plaster uniformly.","Plastering is the application of a smooth, creamy mixture over walls or ceilings using a flat tool called a trowel, resulting in a uniform, flat surface upon drying, often in preparation for painting or decorating.","Plastering activity may feature the sound of a trowel scraping and smoothing wet plaster, the mix of dry powder with water, occasional tapping to level surfaces, and the crinkling of protective plastic sheeting or paper masking tape used to cover nearby surfaces.",,,,,,, +Plataform diving,"Platform diving is an aquatic sport where athletes perform acrobatic jumps and flips from a fixed platform, typically 10 meters high, culminating in a precise, splash-minimized entry into the water, judged for technical and artistic prowess.","Platform diving involves athletes performing acrobatic jumps and turns from a high, fixed ledge, often 10 meters above the water, before gracefully entering the pool with minimal splash. 
Competitors wear sleek swimsuits and may be observed arching, spinning, or flipping against a backdrop of open sky and pool.","The splash of the diver entering the water, the sound of the wind during descent, the distinct smack of a well-executed dive, distant crowd applause, muffled underwater noises, and the echo inside an indoor pool facility.",,,,,,, +Playing accordion,"Playing accordion involves operating a handheld musical instrument with bellows, keyboard/piano for melody, and buttons for bass and chords. It requires coordinating both hands to compress the bellows and press keys/buttons simultaneously, producing a rich, reedy sound, characteristic of folk, tango, and various musical genres.","A person operates an accordion by expanding and compressing its bellows while pressing keys or buttons, producing music. The musician's fingers dance across the keyboard or buttons, and the instrument's pleated central section moves rhythmically in and out, often accompanied by swaying or foot-tapping.","The playing accordion activity produces distinctive, reedy, bellows-driven musical tones. The sounds include variable pitches, chords, and melodies, with possible rhythmic squeezing and air-release hissing from the bellows during play.",,,,,,, +Playing badminton,"Playing badminton is a fast-paced racket sport where players hit a shuttlecock over a net, aiming to land it within the opponent's court. It can be played singles or doubles, requiring agility, precision, and stamina. It's a popular recreational activity and competitive sport enjoyed worldwide.","Two or four players energetically swing rackets, hitting a feathered shuttlecock back and forth over a high net, on a rectangular court. 
Athletic movements and precise strokes combine with light equipment for a fast-paced, engaging sport, often played indoors with focus and agility on display.","Playing badminton involves sounds of shuttlecock striking, swooshing during fast swings, light footwork on the court, occasional player communication, and the subtle clicking of racket frames.",,,,,,, +Playing bagpipes,"Playing bagpipes involves inflating a bag through a mouthpiece or bellows, then pressing the bag to push air through reeds in attached pipes. The player creates a harmonious array of sounds, often with a distinctive drone, by fingering the melody on the chanter while maintaining constant bag pressure.","A person stands, inflating a large bag under their arm, fingers dancing on chanter pipes while squeezing the bag to emit a resonant, droning sound. Tartan kilt and sporran often complement their attire as they manipulate the iconic Scottish instrument with its projecting pipes and distinctive skirl.","Playing bagpipes typically produces a sustained, loud, and resonant sound. The drone of the pipes is constant, and the chanter creates the melody, often with a sharp, reedy timbre. The skirl of the bagpipes is distinctive and can be heard from a considerable distance.",,,,,,, +Playing beach volleyball,"Playing beach volleyball involves two teams, typically with two players each, competing to send a ball over a net without it touching the sand on their own side, aiming to land it in the opposing team's court or force an error for points, all while barefoot on a sandy surface.","Two teams leap and lunge on sandy courts, hitting a ball over a high net. Participants often wear swimsuits or athletic gear, under the sun, with spectators lounging or cheering around the perimeter. 
The scene is vibrant with movement, characterized by athletic figures against a backdrop of blue sky and beach.","Sounds include the rhythmic bouncing of the ball, players' calls and shouts, sandy footsteps, hand slaps, energetic dives, crowd cheers, waves crashing nearby, wind, and whistles signaling points or fouls.",,,,,,, +Playing blackjack,"Playing blackjack is a card game where players aim for a hand total closer to 21 than the dealer's without exceeding it. It combines luck, strategy, and skill, with players deciding when to hit, stand, double down, or split based on their cards and the dealer's visible card.","Individuals sit around a semicircular table facing a dealer, cards and chips in hand or on the felt surface. The dealer deals from a card shoe. Players focus on their cards, calculating their moves, with moments of excitement or disappointment as cards are revealed and bets won or lost.","Shuffling and dealing cards, chips clinking, players murmuring decisions (""hit,"" ""stand""), dealer announcing outcomes, soft background casino sounds (slot machines, faint music), occasional exclamations from wins or losses.",,,,,,, +Playing congas,"Playing congas involves rhythmically hitting the drumheads of tall Cuban percussion instruments with hands or sticks, producing diverse tones. Congueros use techniques for slaps, open, and muffled tones, often improvising within Afro-Cuban rhythms or other styles.","A person seated or standing taps rhythmically on a pair of tall, narrow drums with tapered sides using the palms, fingers, and heels of the hands for varied tones. The congas are played with fluid, often intricate hand movements and can be accompanied by swaying or body movement to the beat.","Playing congas involves rhythmic tapping and slapping, producing deep resonant bass tones when struck in the center and sharper slapping sounds towards the edges. 
Skilled players can create complex rhythms and varying sound textures, incorporating palm and fingertip strikes for a broad range of percussive effects.",,,,,,, +Playing drums,"Playing drums involves creating rhythm by striking various drums and cymbals arranged in a drum set using sticks or hands. It requires coordination, timing, and a sense of beat, serving as the backbone for many musical genres and providing both tempo and dynamic to ensemble playing.","An individual sits at a drum kit, striking various drums and cymbals with sticks in a rhythmic fashion, often using foot pedals to play bass drums, with focused concentration and coordinated movement between arms and legs.","Playing drums typically involves rhythmic beats, variable intensities, and diverse tones produced by striking different drum surfaces and cymbals, leading to a mix of sharp, resonant strikes, deep bass thumps, and metallic crashes, with potential intricate patterns and tempo changes based on musician skill and style.",,,,,,, +Playing field hockey,"Field hockey is a fast-paced, team sport played by two teams using sticks to hit a ball into the opposing team's goal. It emphasizes speed, strategy, and teamwork, and is played on grass, turf, or indoor surfaces, requiring athletic prowess and skillful handling of the stick and ball.","Individuals equipped with sticks curve to strike a small, hard ball on a large grass or turf field. They wear protective gear like shin guards and often colorful uniforms as they maneuver in formation, aiming to score goals in a netted area guarded by a goalkeeper.","The sound of hard sticks clashing, the thwack of a ball being hit, quick footsteps on turf or grass, players calling for passes, the whistle from referees, and cheering or instructions from coaches and spectators. 
+",,,,,,, +Playing flauta,"Playing the flauta, or flute, involves producing music by directing air across the mouthpiece of the instrument and fingering different notes on the keys to create melodies and harmonies with its distinctive, ethereal sound.","A person holds a flute horizontally to one side of their face, lips poised at the mouthpiece, blowing across it while their fingers press and release the keys along the instrument's long, slender tube. The player stands or sits upright with arms raised, sometimes in front of a music stand, wearing a focused expression.","While playing the flute, one would hear melodious tones varied by pitch and dynamics, characterized by breathy, silver-toned timbres, and articulated through techniques such as tonguing and vibrato, with occasional clicking of keys and breath sounds between phrases.",,,,,,, +Playing guitarra,"Playing guitar involves skillfully manipulating strings with fingers and a pick to produce music. It combines melody, harmony, and rhythm, offering a versatile range of styles from classical to rock, appealing to diverse musical tastes and fostering creativity, coordination, and emotional expression.","A person cradles a guitar across their body, their fingers press strings along the fretboard with one hand, while the other hand strums or plucks the strings near the sound hole, creating music. The guitar's body is usually wooden, with a curvaceous shape and a long neck extending from it.","Strumming or picking strings produces melodic tones, chord changes emit harmonic sequences, fingers sliding on fretboard may create subtle squeaks, percussive sounds when tapping body, rhythmic string rattle with vigorous play, occasional buzz from string contact with frets, tuning peg clicks, soft thuds when switching hand positions or palm-muting.",,,,,,, 
+Playing harmonica,"Playing harmonica involves breathing into or drawing air out of a handheld, reed-based instrument, producing musical notes that can be varied in pitch and tone through mouth shape and technique, often used in blues, folk, and rock music for its soulful, expressive sound.","A person holds a small rectangular instrument, the harmonica, to their lips, and their fingers grip its sides. They intermittently breathe in and out, producing musical notes, while their hands might move the harmonica to create different sounds, their facial expressions changing with the tune's rhythm and emotion.","Playing harmonica produces harmonious notes with bending and vibrato effects. The sound can be airy or crisp, ranging from soothing melodies to energetic blues, amplifying emotions through expressive breath manipulation and rhythm.",,,,,,, +Playing ice hockey,"Ice hockey is a high-energy team sport played on an ice rink where players skate at high speeds, maneuvering a puck with sticks, aiming to score goals against an opposing team while defending their own goal, characterized by strategy, agility, and physicality.","Players wearing helmets and padding glide across an ice rink, maneuvering a puck with sticks. Teams in contrasting jerseys compete, aiming for goals at opposite ends. Spectators surround the rink, watching the fast-paced, physical sport characterized by skating prowess, swift shots, and occasional collisions.","Playing ice hockey features the sounds of skates carving across the ice, sticks clashing, pucks striking the boards or goalposts, players communicating, the goal horn blaring, and sometimes the audience cheering.",,,,,,, +Playing kickball,"Playing kickball is a team sport resembling baseball, where players kick a rubber ball instead of hitting it with a bat, and run bases to score points. 
It's fun, inclusive, requires minimal equipment, and is enjoyed by people of all ages.","Individuals in casual attire are on a field, with some kicking a large rubber ball while others run bases or play defense, under open skies.","The sounds of a rubber ball being kicked and bouncing on the ground, players calling out for passes and positions, laughter, cheers from spectators, the referee's whistle, footsteps on playing field, and occasional claps or high-fives.",,,,,,, +Playing lacrosse,"Playing lacrosse is a fast-paced, high-intensity team sport combining elements of basketball, soccer, and hockey. Players use a stick with a netted pocket to catch, carry, and pass a ball, aiming to score goals by shooting it into the opposing team's net.","Participants wield long-handled sticks, called lacrosse sticks, with netted pouches to catch, carry, and pass a small rubber ball. Players wear helmets and protective gear. They run vigorously across a grassy field, aiming to score goals by shooting the ball into the opponent's netted goal.","Playing lacrosse involves the sounds of quick footsteps on grass or turf, the thwack of sticks clashing, the whistle of a ball slicing through air, shouts and calls between players, the thud of a ball caught in a netted stick, and occasional referee whistles signaling game events.",,,,,,, +Playing piano,"Playing piano involves creating music by pressing keys on a piano, a stringed instrument with a keyboard. It requires coordination, rhythm, and interpretation to perform pieces ranging from classical to modern genres. 
This activity can be both a form of artistic expression and a way to improve cognitive skills.","Individual seated at a piano, fingers moving across black and white keys, body swaying subtly with the music, foot operating pedals, sheet music on the stand, and concentration visible on the face.","Playing piano involves the sound of keys being struck, producing a range of musical notes and harmonies, the clicking of keys, the occasional pedal shift, and the resonance of strings within the instrument's body. The tempo and volume can vary, creating a diverse auditory experience depending on the piece performed.",,,,,,, +Playing polo,"Polo is a dynamic team sport played on horseback where players use long-handled mallets to hit a small ball into the opposing team's goal, combining elements of horsemanship, strategy, and speed, traditionally considered the sport of kings due to its aristocratic history and global prestige.","Playing polo involves riders on horseback, wielding long mallets, galloping across a grass field, striving to hit a small ball into the opposing team's goal for points, clad in helmets, boots, and team-colored attire, surrounded by a dynamic, competitive atmosphere.","Playing polo may involve the thundering of horses' hooves, the knock of mallets striking the ball, the shouting of players communicating, the blowing of a whistle for fouls or goals, and the cheer of spectators.",,,,,,, +Playing pool,"Playing pool, or billiards, is a precision sport where players use a cue stick to pocket balls on a felt-covered table with cushions. It improves focus, hand-eye coordination, and strategy, featuring game types like eight-ball, nine-ball, and snooker.","Individuals wield cues, aiming at colored balls on a green felt-covered table surrounded by rails, trying to pocket them into six holes with precision and strategy. 
The environment is often dimly lit, evoking a casual, social atmosphere.","Cues striking balls, balls clacking together, sinking into pockets, sound of chalk on cue tip, players conversing, background music or bar noise, the subtle slide of felt as balls roll across the table, triumphant cheers or groans of defeat, clicking of ball return mechanisms.",,,,,,, +Playing racquetball,"Playing racquetball involves two players using racquets to hit a hollow rubber ball against the walls of an enclosed court, aiming to outmaneuver the opponent and win points by making the ball unreturnable or by capitalizing on the opponent's mistakes, combining strategy with intense physical exertion.","Two players engage in fast-paced rallies, hitting a small rubber ball against a wall with handheld racquets inside a four-walled court. Movements are swift and agile, with players often backing, lunging, and pivoting to strike and volley the ball in continuous, high-energy exchanges.","Playing racquetball involves sounds of rubber balls striking walls, floors, and racquets; squeaking sneakers on the court; players' heavy breathing and vocalizations; and possibly echoing thuds or bangs in an indoor court environment.",,,,,,, +Playing rubik cube,"Playing with a Rubik’s Cube involves twisting its six 3x3 faces to align colors on each side, solving the puzzle. It challenges spatial reasoning, problem-solving skills, and patience as you work through combinations to achieve a uniform color scheme.","A person manipulates a colorful, 3D, six-sided puzzle comprised of smaller, rotating cubes, aligning colors to achieve uniform faces.","Playing with a Rubik's Cube generally produces soft, plastic-on-plastic clicking sounds as the cube sections are twisted and turned. The frequency and rhythm of these clicks vary with the solver's speed and technique. 
There's no background noise unless the solver is in a non-silent environment.",,,,,,, +Playing saxophone,"Playing the saxophone involves blowing into a reed mouthpiece to create sound, manipulating keys to control pitch, and mastering breathing techniques for tone control. It's a versatile woodwind instrument prominent in jazz, classical, and contemporary music, offering a rich, vibrant sound palette for expressive musical performances.","An individual holds a brass instrument with a curved bell and numerous keys, and presses their fingers on the keys while blowing into a mouthpiece with a reed, often moving their fingers rapidly and swaying slightly with the rhythm, creating soulful or jazzy tones.","Playing the saxophone involves rich, resonant tones varying from mellow to bright, reedy timbres, and a dynamic range from whisper-quiet to piercingly loud. Breath control produces vibrato and honking blasts, while keys clacking and occasional overblown squeaks add to the sonic character.",,,,,,, +Playing squash,"Playing squash is a fast-paced racquet sport for two or four players, played indoors in a four-walled court where players alternate hitting a small, rubber ball against the front wall, with the goal of outmaneuvering their opponent in a test of agility, strategy, and stamina.","Two players energetically rally a small rubber ball against the four walls of an enclosed court using racquets, quickly maneuvering and taking turns to strike the ball before it bounces twice.","Playing squash involves the sound of a small rubber ball being repeatedly struck against the walls, the squeak of athletic shoes on the wooden court floor, players' quick movements, heavy breathing, and occasional calls or communication between the competitors.",,,,,,, +Playing ten pins,"Playing ten pins, commonly known as bowling, is a sport where players roll a heavy ball down a lane to knock down ten pin-shaped targets arranged in a triangular formation at the other end. 
The objective is to topple all pins with as few throws as possible.","Individuals roll a bowling ball down a lane towards ten pins arranged in a triangle, aiming to knock them down. The alley is bordered by gutters, and an automated system resets the pins and returns the ball. Players wear special shoes and often celebrate strikes and spares with animated gestures.","While playing ten pins (bowling), one hears rolling balls thudding on wooden lanes, crashing pins, mechanical pinsetters resetting pins, player cheers/jeers, and background noise from arcade games or music. Sounds of skidding balls and strikes punctuate the rhythmic hum of activity in a bowling alley.",,,,,,, +Playing violin,"Playing violin involves skillfully drawing a bow across strings, expertly pressing fingerboard notes, and producing a rich assortment of sounds, combining technique with expression for musical performance.","An individual holds a violin under their chin with their left shoulder, using their left fingers to press the strings on the fingerboard while their right hand moves a bow horizontally across the strings, eliciting music. Their posture is straight, focused, with subtle movements for string changes and dynamics.","Playing the violin involves the production of rich, resonant tones and harmonics, varying in pitch and dynamics, alongside the occasional friction-induced squeaks and the rhythmic sounds of the bow drawing across the strings, complemented by the soft clatter of finger placement on the fingerboard.",,,,,,, +Playing water polo,"Water polo is a competitive team water sport where players pass a ball with the aim of scoring goals in the opposing team's net. 
It requires swimming skills, teamwork, strategy, and physical endurance as players navigate the pool and defend against opponents without touching the bottom.","Teams in colored caps tread water in a pool, passing a yellow ball, aiming to throw it into the opponent's net; splashing, dynamic movements, and coordinated plays punctuate the action against the blue backdrop of the water.","Playing water polo involves sounds of splashing water, referee whistles, player shouts and communication, the thud of the ball hitting the water or being caught, and periodic crowd noise during competitive matches.",,,,,,, +Pole vault,"Pole vault is an athletic event in which competitors vault over a high bar using a flexible pole. Skill, speed, and strength are needed to propel over the height. Originating from ancient Greece, it's a mainstay in modern track and field competitions, including the Olympics.","An athlete sprints with a long flexible pole, plants it into a box on the ground, and uses its bend to catapult themselves over a high horizontal bar, before landing on a cushioned mat.","Pole vaulting produces distinctive sounds including the fast whoosh of the pole cutting through the air, the rhythmic pounding of the athlete's footsteps on the runway, the creak or flex of the pole during bending, and the click or clack as the pole hits the box, followed by a possible cheer of the crowd.",,,,,,, +Polishing forniture,"Polishing furniture is the process of applying a substance, often a wax or polish, to wooden furniture surfaces to protect them, enhance their appearance, and give them a glossy finish. 
It helps remove scratches and dirt, restoring and maintaining the furniture's beauty and prolonging its life.","A person rubs a soft cloth or brush with polish over wooden furniture, creating a shiny and smooth surface, often accompanied by a gleaming effect as light reflects off the treated areas.","Auditory features include the soft, rhythmic swish of a cloth rubbing surfaces, occasional creaks from wooden items, light clinks of polish bottles or cans, and perhaps the subtle spray sound of liquid polish being applied.",,,,,,, +Polishing shoes,"Polishing shoes is a maintenance task involving cleaning, conditioning, and applying polish to enhance and protect the footwear's appearance and longevity. It rejuvenates leather, adds shine, and can conceal scuffs, ensuring shoes look presentable and are better protected against the elements.","Using a cloth or brush, someone rubs polish onto leather shoes in circular motions, buffing them to achieve a glossy finish. The shoes gradually transform from dull to shiny.","Scraping strokes of the brush, rhythmic buffing, soft swishes of cloth on leather, periodic clinks of the polish tin lid, occasional squelching of cream, and the gentle rustle of newspaper or mat underneath the shoes.",,,,,,, +Powerbocking,"Powerbocking involves jumping and running with spring-loaded stilts, giving the wearer the ability to perform incredible leaps and sprints, mimicking the power and agility of kangaroos, while providing a unique, exhilarating workout.","Powerbocking involves individuals wearing spring-loaded stilts, called powerbocks, that allow them to perform acrobatic jumps and running with enhanced speed and agility, often resembling a blend of running and leaping gazelles with human athleticism.","Powerbocking produces rhythmic thuds due to spring-loaded stilts' impact with the ground, accompanied by whooshing of air and metallic creaks during jumps. 
Laughter and chatter from participants often augment these sounds, as powerbocking is typically a social, outdoor activity.",,,,,,, +Preparing pasta,"Preparing pasta involves boiling water, adding salt for flavor, cooking the pasta until al dente, and then draining it. Optionally, one can toss it with sauce, herbs, or additional ingredients to create a complete dish.","Someone boils water in a pot, adds salt, stirs in uncooked pasta, and occasionally checks the noodles for doneness. Steam rises from the bubbling water as the pasta softens and swells. Tools like a spoon or strainer are nearby for handling the hot pasta.","Boiling water bubbling, pasta hitting water, stirring sounds, the clink of a spoon against a pot, package rustling, salt shaking, straining water whoosh, and a sizzling sound if sautéing with toppings.",,,,,,, +Preparing salad,"""Preparing salad"" is the process of cleaning, cutting, and mixing various fresh ingredients, typically vegetables and fruits, to create a healthy, nutritious dish. It often includes adding dressings or toppings for flavor.","Chopping colorful vegetables, tearing leafy greens, drizzling dressing; hands toss ingredients in a bowl, intermingling textures of crunchy, fresh, and juicy elements.","Preparing salad involves chopping vegetables, tearing spinach, and rustling lettuce. You wash ingredients under running water, spin them dry, and add nuts or croutons. 
Whisk the dressing and lightly toss everything in a bowl with kitchen utensils clinking.",,,,,,, +Putting in contact lenses,"Putting in contact lenses is a hygiene-sensitive task that involves placing soft or rigid lenses directly onto the surface of the eyes to correct vision, following a process that ensures proper alignment, comfort, and cleanliness to avoid irritation or infection.","Holding a tiny, convex clear disc on a fingertip, a person tilts their head back, pulls the eyelid open with the other hand, and gently places the lens onto the exposed eye, blinking several times to secure it in place.","Soft clicks of contact lens case, faint squish of lens suction on fingertip, subtle splash of saline solution, and occasional blink-related sounds (e.g., light fluttering or eyelid movement). Additional sounds may include the gentle rustle of cleansing solution packets or the quiet snap of the case closing.",,,,,,, +Putting on makeup,"Putting on makeup is the application of cosmetic products to enhance facial features, conceal imperfections, and express personal style. It involves steps such as applying foundation, eye shadow, mascara, and lipstick, often using brushes and sponges to achieve a desired look.","A person applies various cosmetic products like foundation, powder, eyeshadow, mascara, and lipstick to enhance or alter their facial features, often using brushes, sponges, and other tools, creating a tailored, polished look.","Putting on makeup includes opening containers with clicks, sweeping brushes with soft swishes, and applying pencils with scratchy lines. Liquid products shake with fluid sounds, mascara wands twist with clicks, and sometimes a hair dryer or mechanical applicator hums or buzzes.",,,,,,, +Putting on shoes,"Putting on shoes is a daily task where one selects footwear, typically after dressing, and places their feet inside, making sure they fit snugly and comfortably.
The process often involves adjusting laces, straps, or buckles to secure the shoes for walking and various activities.","A person bends down, opens the shoe up wide, slides their foot inside, pulls the heel back, and either ties the laces, secures the Velcro, or adjusts the slip-on for a snug fit.","Rustling of fabric or leather, snapping of elastic, thudding as shoes hit the ground, tightening of laces or Velcro, tapping of heels, and a final shuffle or foot-tapping to ensure a snug fit.",,,,,,, +Rafting,Rafting is an exhilarating outdoor sport where participants navigate a river's rapids and currents using an inflatable raft. It's a team activity requiring coordination and can range from serene floats to adrenaline-fueled rides through challenging whitewater. Safety gear and guidance from experienced instructors are essential.,"Rafting involves a group of individuals wearing helmets and life vests, navigating turbulent river waters aboard an inflatable boat, paddling in coordination, often sprayed with white froth as they steer through the rapids against a backdrop of scenic natural landscapes.","Rafting produces a symphony of sounds: rushing and splashing water as the raft cuts through waves, paddles dipping and swooshing rhythmically, the raft's inflatable body creaking, nature's ambient noise on riverbanks, and exhilarated shouts and communication between rafters coordinating maneuvers against the river's roar.",,,,,,, +Raking leaves,"Raking leaves involves using a rake to gather fallen leaves into piles for collection or composting, typically done in autumn to maintain yard tidiness and prevent lawn damage.","A person sweeps a long-handled rake across the ground, gathering scattered, colorful autumn leaves into a pile. The movements are rhythmic and repetitive.
The gathered leaves often create a mound which can be bagged or left as compost.","The rhythmic scraping sound of the rake's tines against the ground, rustling of dry leaves being gathered, and occasional softer thuds as piles are collected. There might be intermittent bird calls or ambient wind rustle through trees in the background.",,,,,,, +Removing curlers,"Removing curlers is the process of carefully taking out rollers from hair after they've set, usually to create curls or add volume. It involves gently unraveling or unsnapping the curlers to reveal the styled hair without causing frizz or ruining the formed curls.","A person unwinds or slides out cylindrical rollers from their hair, which may be clipped or pinned, revealing hair that has been set to have curls or waves, and sometimes fluffing or styling the newly curled locks with their fingers or a brush.","Clicks from unlocking curlers, rustling as they unwind from hair, soft thuds as they're set down, and the swishing sound of newly curled hair settling.",,,,,,, +Removing ice from car,"Removing ice from a car involves clearing frost from the windshield, windows, and exterior for visibility and safety. Common techniques include using scrapers, de-icing sprays, and defrosting systems. 
This winter task prevents impaired sight and protects the vehicle’s surface in cold climates.","A person scrapes a layer of frost or ice off their car's windshield and windows, often using a handheld ice scraper or de-icing spray, revealing clear glass beneath the white, crystalline covering while their breath is visible in the cold air.","Scraping and crunching sounds as ice is chiseled away, shattering or cracking of thick ice layers, soft brushing noises from sweeping off powdery snow, and possibly the gentle hum of a car engine idling as the defroster works to loosen the ice's grip on glass surfaces.",,,,,,, +Riding bumper cars,"Bumper cars is a funfair activity where participants drive small electric vehicles enclosed in a space, deliberately colliding with each other. It's a thrilling amusement ride, emphasizing merry chaos and gentle crashes within a safe, controlled environment.","People steering small electric cars in an enclosed arena, colliding with each other amidst laughter. Cars are brightly colored, surrounded by rubber bumpers, flashing lights, and sparkly poles for power contact.","Auditory features associated with riding bumper cars include the buzz of electric motors, collisions' thuds and clangs, children's laughter and shrieks, the whirring of wheels on the metal floor, repetitive upbeat carnival music, and occasionally a loudspeaker voice giving instructions or warnings.",,,,,,, +River tubing,"River tubing is a relaxing water activity where participants float downstream on large inflatable tubes, enjoying the scenery and serenity of the river at a leisurely pace. It's a popular summer pastime in many regions, suitable for all ages and generally requiring no special skills.","Individuals float downstream on a river, reclining in large, inflated inner tubes.
They often wear swimwear and life jackets, surrounded by tranquil waters, lush greenery, and occasionally joined by fellow tubers enjoying the leisurely ride and the serene natural setting.","River tubing may include sounds of gentle water flow, splashing, birdsong, rustling leaves, and breezy ambiance, alongside human laughter and conversation. Occasional louder rushes of water or wildlife calls could punctuate the tranquil soundscape.",,,,,,, +Rock climbing,"Rock climbing is a physically and mentally demanding sport where participants ascend natural or artificial rock formations. Requiring strength, endurance, and problem-solving, climbers use ropes and safety gear to tackle various routes, known as problems, either indoors or in outdoor settings, aiming to reach new heights and overcome personal challenges.","Rock climbing involves individuals ascending vertical rock formations or artificial walls, using hands and feet to grip holds. Climbers use ropes, harnesses and protective gear, focusing on technique and strength as they maneuver upwards, often adorned with specialized shoes and chalk bags against a backdrop of natural or simulated rock textures.","Rock climbing generates sounds of scraping shoes on rock, heavy breathing, the clink of metal gear, commands between climber and belayer, birds or nature if outdoors, and the occasional sound of falling pebbles or debris dislodged by movement.",,,,,,, +Rock-paper-scissors,"Rock-paper-scissors is a two-player hand game where each player forms one of three shapes: rock (fist), paper (open hand), or scissors (V with fingers). Rock crushes scissors, scissors cuts paper, and paper covers rock.","Two players simultaneously form one of three shapes with an outstretched hand: a rock (fist), paper (flat hand), or scissors (two fingers extended and separated). 
They compare shapes to determine a winner: rock crushes scissors, scissors cut paper, and paper covers rock.","The auditory features of rock-paper-scissors include the sound of participants counting aloud, often using the phrase ""Rock, paper, scissors, shoot!"", accompanied by the slapping of one hand against the other to synchronize their reveals. There may be sounds of victory cheers or disappointment from the players.",,,,,,, +Rollerblading,"Rollerblading is an exhilarating sport and recreational activity where participants glide along surfaces on rollerblades, a type of inline skate with two to five wheels arranged in a single line. It requires balance and coordination, providing a full-body workout and a fun way to improve cardiovascular health.","Rollerblading involves individuals wearing inline skates—boots with wheels arranged in a single line—gliding on surfaces, often performing smooth, fluid movements or tricks like jumps and spins, with a sense of agility and speed, often dressed in casual or athletic wear with protective gear like helmets and pads.","The sound of wheels rolling on pavement, occasional clicks of hard plastic on concrete during tricks, the whoosh of wind passing by, and possibly the low hum of bearings as they spin. Scuffing noises during stops and starts, and muffled chatter or laughter from participants may also be present.",,,,,,, +Roof shingle removal,"Roof shingle removal is the process of taking off old or damaged shingles from a roof in preparation for repairs or replacement. Safety precautions are essential, and special tools like roofing shovels or pry bars are typically used to lift and remove the shingles efficiently.","Workers atop a roof pry up and strip away old, worn shingles. Debris falls into a dumpster as they progress, revealing bare roof decking.
They wear protective gear, and the roof gradually transitions from covered with old shingles to exposed, prepped for new roofing materials.","Auditory features of roof shingle removal may include scraping, prying, and tearing sounds, the clatter of shingles sliding off the roof, thuds as they hit the ground, and occasional hammer or nail gun noises from securing tarps or temporary covers.",,,,,,, +Rope skipping,"Rope skipping, also known as jump rope, is a physical activity involving jumping over a swinging rope repeatedly, which is turned by either the jumper or two others. It improves coordination, burns calories, and can be performed individually or in groups for fitness, competition, or fun.","A person repeatedly jumps over a swinging rope, which passes under their feet and over their head. The rope is held and rotated by the individual or by two others if it's long enough for double Dutch skipping. Coordination and rhythm are visible in the jumper's movements.","Rope skipping produces rhythmic thumps as the rope hits the ground, the swishing sound of the rope cutting through the air, intermittent squeaks of sneakers on the floor, and possibly the jumper's steady breaths or vocal counts.",,,,,,, +Running a marathon,"Running a marathon is a challenging endurance event covering 26.2 miles (42.195 kilometers). It demands rigorous training, proper nutrition, and strategic pacing.
Athletes aim to reach the finish line, showcasing their physical and mental strength.","A diverse crowd of determined runners pacing through streets or nature, sporting athletic gear with bib numbers, often with cheering spectators along the course, and a finish line banner ahead, showcasing exhaustion and triumph.","Heavy breathing, rhythmic footstrikes, cheering crowds, volunteers offering water, race announcements, heart pounding, music from personal devices or live bands along the course, wind whooshing, fabric rustling, occasional conversations between runners, and the beep of timing mats or personal running watches tracking pace and distance.",,,,,,, +Sailing,"Sailing involves harnessing the wind's power to propel a boat or ship across water using large fabric sails attached to masts. Participants navigate using rudders and trim sails, requiring skill, strategic thinking, and an understanding of weather and sea conditions. It can be for recreation, sport, or transportation.","Sailing features a boat with large fabric sails harnessing wind power. The vessel glides across water, often leaning to one side due to wind force. Skippers navigate, adjust sail positions, and steer, while clear skies and open seas or picturesque coasts often surround them.","Lapping waves, flapping sails, creaking rigging, ropes snapping in the wind, the hull cutting through water, calls of seabirds, and the distant sound of a foghorn or a ship's horn.",,,,,,, +Scuba diving,"Scuba diving is an underwater adventure sport where divers use self-contained underwater breathing apparatus (SCUBA) to explore aquatic ecosystems, observe marine life, and experience weightlessness. It requires training in safety and equipment use.","Scuba diving features individuals in wetsuits, masks, and fins, submerged in water, with air tanks on their backs. 
They explore underwater environments, such as coral reefs or shipwrecks, surrounded by marine life like fish and plants, often with bubbles rising toward the surface as they breathe through regulators.","Scuba diving offers a unique auditory experience, including underwater breathing sounds, bubbling air, regulator noises, and marine life sounds. Divers hear wetsuit and equipment movements, water currents, boat engines, coral crackling, and muffled voices or gear echoes, creating a distinctive underwater soundscape.",,,,,,, +Sharpening knives,"Sharpening knives involves honing the blade’s edge to restore cutting ability. This can be done with tools like whetstones, honing rods, or electric sharpeners. Techniques vary by tool and blade type. Regular sharpening ensures optimal knife performance and safety.","A person runs a knife blade at an angle along a rough surface, such as a sharpening stone or rod, honing the edge to a fine point. Sparks may fly, and the rhythmic motion produces a distinct scraping sound.","Sharpening knives typically produces a metallic scraping sound as the blade edge is drawn across a honing rod or sharpening stone, varying in pitch and intensity with the angle, pressure, and speed of the action. +",,,,,,, +Shaving,"Shaving is the practice of removing hair from the body, often facial hair, using a razor or other tool. It's part of personal grooming routines, enhancing appearance, cleanliness, or preparing the skin for other activities, like applying makeup. Today, both men and women shave various body areas.","Shaving involves gliding a razor across lathered skin to remove hair, resulting in smooth skin. 
It often includes a mirror reflection, foamy cream or gel, and occasionally water droplets.","The sounds of shaving include the swish of the razor gliding across skin, the gentle tap of the blade being rinsed, the click of a cartridge being replaced, the fizz of shaving cream dispensed, and the subtle splash of water as it's splashed on the face or rinsed off.",,,,,,, +Shaving legs,"Shaving legs involves using a razor to remove body hair from the legs for cosmetic reasons or personal grooming preferences. It's commonly practiced for skin smoothness, aesthetics, or as preparation for sports. Regular shaving requires maintenance to prevent irritation and achieve consistent smoothness.","A person runs a razor along their wet, usually foamy or gelled legs, methodically removing hair and revealing smooth skin. Sometimes there's a bathtub or shower setting with water rinsing away the shavings.","Sound of running water, hiss of aerosol shaving cream, scraping of razor against skin, occasional tapping of razor on sink edge to dislodge hairs, splashing as rinsing the shaved area.",,,,,,, +Shot put,"Shot put is a track and field event where competitors throw a heavy spherical object (shot) as far as possible from a circular area (the circle), using a pushing motion rather than a throwing technique, aiming to combine strength, form, and technique to achieve maximum distance.","A shot putter stands inside a circular area, leans back gripping a heavy metal ball, and initiates a pushing motion by explosively twisting their body and extending their arm to launch the ball into the air. The ball arcs through the air, landing in a marked sector of a field.","During shot put, one may hear the grunts or exhales from athletes exerting force, the thud of the shot hitting the ground, and the rustle of feet in the circle during the wind-up. 
Additionally, there may be background sounds of spectators and announcements over the loudspeaker.",,,,,,, +Shoveling snow,"Shoveling snow involves using a shovel to clear snow from pathways, driveways, and other surfaces. It's necessary for safety and accessibility during winter and requires physical effort, appropriate clothing for cold temperatures, and caution to avoid overexertion or injury.","A person bundled in warm winter clothing uses a shovel to lift and move white snow from a surface, such as a driveway or sidewalk, often creating piles alongside the cleared path. Visible breath in the cold air and a potentially overcast, snowy sky are common.","Shoveling snow is often accompanied by the crisp crunch of footsteps on fresh snow, the scraping of a shovel's blade against the ground, and the soft thud of snow being lifted and tossed aside. Muffled sounds prevail due to the snow's insulating properties.",,,,,,, +Shuffleboard,"Shuffleboard is a game where players slide weighted pucks down a long, narrow court with the aim of having them come to rest within marked scoring zones, while also possibly knocking opponents' pucks away. It can be played on indoor courts or on deck aboard ships.","Shuffleboard involves players sliding weighted pucks down a narrow, elongated court with numerical scoring zones at the end, aiming to land in high-scoring areas while possibly knocking opponents' pucks away. The court often has a polished, smooth surface with marked scoring sections. Players use cues to push the pucks.","Shuffleboard typically includes sounds of sliding pucks (also called weights or discs), the gentle collision of pucks, the specific auditory cue of a puck gliding across the marked court or table, and possibly players communicating scores or turns. The ambient environment may contribute additional background noise.",,,,,,, +Skateboarding,"Skateboarding is an action sport where riders perform tricks using a skateboard. 
It involves gliding on flat surfaces and performing aerial stunts on ramps and urban landscapes, appealing to those seeking athleticism, creativity, and countercultural expression. Skateboarding is also an Olympic sport as of the 2020 Tokyo Games.","Skateboarding involves a person balancing on a small board with wheels, performing tricks and maneuvers such as jumps, flips, and grinds on various surfaces, often in skate parks or urban landscapes, showcasing agility, speed, and creative expression in athletic movements.","Skateboarding auditory features include the clatter of wheels on pavement, the snapping sound of tricks like ollies, grinding noises as the board slides along edges, clicks from kickflips, the occasional thud from falls, and the rolling hum on smooth concrete.",,,,,,, +Skiing,"Skiing is a winter sport where participants slide over snow on skis—long, flat devices attached to boots. It combines recreation, competition, and travel across snowy landscapes, offering variations like alpine, cross-country, and freestyle. Essential for the sport are skillful balance, control, and mastery of varied terrains and snow conditions.","Skiing features individuals gliding over snow-capped slopes with long, narrow skis attached to their boots, often using poles for balance, dressed in insulated winter gear against scenic mountain backdrops, with movements ranging from graceful linear descents to sharp, agile turns and jumps.","Skiing features include the swish of skis gliding on snow, the crunch of crisp snow underfoot, the whoosh of passing wind while in motion, periodic chatter of ski poles, distant murmurs of other skiers, occasional snowboarders' sharper scrapes, and the distinct silence enveloping remote snowy landscapes.",,,,,,, +Slacklining,"Slacklining involves balancing and walking on a narrow, flexible piece of webbing, usually made of nylon or polyester, which is suspended between two anchor points. 
It is similar to tightrope walking but features a dynamic line that swings and stretches, requiring core strength and focus.","Slacklining involves balancing on a narrow, flexible band of webbing tensioned between two anchor points, usually trees. Participants walk, balance, and perform tricks on the line, which sways and bounces with movement. It resembles tightrope walking, but with a more dynamic and elastic line.","Slacklining may involve the sound of footsteps shuffling on the line, the creak or stretch of the webbing under tension, occasional words of encouragement from onlookers, and perhaps the hum of nature or chatter if performed outdoors.",,,,,,, +Smoking a cigarette,"Smoking a cigarette involves lighting the end of a tobacco-filled stick and inhaling the resulting smoke. This practice, which delivers nicotine and other chemicals to the smoker, is known for its addictive properties and significant health risks, including lung cancer and heart disease.","An individual typically holds a thin, lit cigarette between fingers, inhales, and exhales smoke, often accompanied by the glow of the burning tip and a trail of smoke drifting upwards, which dissipates into the air.","Crackling of burning tobacco, a faint hiss as the smoke is inhaled, the exhalation of breath through the filter, occasional coughing, and the flick of a lighter or match.",,,,,,, +Smoking hookah,"Smoking hookah, also known as shisha or water pipe, involves inhaling flavored tobacco smoke after it passes through water, typically in a social setting. Originating in ancient Persia and India, it's a centuries-old tradition now enjoyed worldwide for its aromatic blends and communal experience.","A person inhales from a mouthpiece connected to a tube leading to a glass-based hookah, from which smoke billows after bubbling through water. 
Aromatic vapor swirls around as the coals atop the bowl heat flavored tobacco, adding to the relaxed, social ambiance often accompanied by dim lighting and plush seating.","Auditory features of smoking hookah may include bubbling water, inhalation sounds, the clink of charcoals being adjusted, gentle exhales, soft conversations, and occasional laughter, contributing to a relaxing and social ambiance.",,,,,,, +Snatch,"Snatch is a fast-paced, explosive Olympic weightlifting movement where a lifter raises a barbell from the ground to overhead in one continuous motion, requiring strength, flexibility, and coordination, typically executed with a wide grip and often used to develop power for athletes across various sports.","""Snatch"" is a dynamic Olympic weightlifting move where an athlete rapidly lifts a barbell from the ground to overhead in one continuous motion, exhibiting power, speed, and flexibility, often squatting before standing tall, arms extended, barbell steadied above.","Snatch, an explosive weightlifting movement, may involve sounds of heavy breathing, grunting, weights clanging, the barbell sliding on its bearings, feet shuffling and stomping on the platform, and sometimes verbal cues from coaches or the lifter's self-encouragement.",,,,,,, +Snow tubing,"Snow tubing is a winter recreation activity where participants slide down snow-covered slopes in large inflatable tubes, relying on gravity for propulsion. It's a family-friendly alternative to skiing or snowboarding, requiring no specialized equipment or skills. Venues often include designated hills with lifts for convenient uphill transport.","Snow tubing involves individuals sitting in large inflatable tubes, sliding down snow-covered slopes. 
It's a winter activity characterized by hills blanketed in white, punctuated by colorful tubes and joyous riders zipping down, with laughter and snow sprays accompanying their descent.","Snow tubing often involves the sounds of laughter and excitement, the swish of the tube sliding over snow, occasional shouts for steering directions, the muffled crunch of fresh snow compacting, and possibly the whistling of the wind as riders pick up speed down the slope.",,,,,,, +Snowboarding,"Snowboarding is a winter sport where participants descend snow-covered slopes on a single board attached to their feet, using a combination of balance and body movements to navigate and perform tricks. It combines elements of surfing, skateboarding, and skiing, offering both recreational and competitive avenues.","Snowboarding involves a rider descending snow-covered slopes standing sideways on a board, executing turns and tricks, often wearing colorful winter sportswear, against a backdrop of white snow and mountainous terrain.","Whoosh of slicing through snow, crunch of carving turns, muffled sounds through beanie or helmet, chatter of bindings, occasional yells or chatter from fellow riders, the occasional thud from falls, and the subtle flapping of clothing in the wind.",,,,,,, +Spinning,"Spinning is a high-intensity, indoor cycling workout. Participants ride stationary bikes to the rhythm of music, guided by an instructor through a series of speed and resistance levels, simulating outdoor biking experiences. It's a cardio exercise designed to build endurance, strength, and promote weight loss.","Spinning involves rapid circular motion, often seen with dizzying, blurring effects, creating whirls of color and shapes. 
The repetitive rotation can convey energy and momentum, with the central axis as a focal point of the activity.","The auditory features associated with spinning may include a whirring or whooshing sound from rotational movement, rhythmic humming from machinery like a spinning wheel or bike, soft thudding from foot pedaling, and background music or instructor cues if in a spin class environment.",,,,,,, +Spread mulch,"Spread mulch involves applying a layer of material, such as bark, compost, or leaves, over soil to conserve moisture, suppress weeds, regulate temperature, and enhance garden aesthetics. It's a key activity in sustainable gardening and landscaping for protecting and nurturing plant life.","A person scatters a layer of organic material, such as bark or straw, over soil using a rake or hands, creating a dark, textured blanket around plants or across garden beds, often emitting an earthy aroma.","Spreading mulch involves shoveling and rustling sounds as the material is distributed, the soft thud of mulch dropping onto soil, and periodic scraping as tools smooth the layers over garden beds. Periodic footsteps and ambient outdoor noises complement the work's rhythmic auditory backdrop.",,,,,,, +Springboard diving,"Springboard diving is an aquatic sport where athletes perform acrobatic jumps and flips from a flexible diving board, typically 1 or 3 meters above the water. 
Divers strive for precise, graceful aerial maneuvers and entry into the water with minimal splash, judged for technique and execution.","An athlete springs off a flexible diving board, performing acrobatic flips and twists before entering the water with minimal splash.","Springboard diving is characterized by sounds that include the steady rhythm of footsteps on the board, the creak and recoil of the springboard flexing, the sharp cut of the diver slicing through the air, and the splash of entry into the water, often followed by the echo of waves in the pool.",,,,,,, +Starting a campfire,"Starting a campfire involves gathering kindling, arranging dry wood, using a spark or flame to ignite, and gradually adding larger logs to maintain the fire, while following safety protocols to prevent wildfires and ensuring adequate ventilation for a steady burn.","Gathering sticks and logs, a person arranges them in a pit. Striking a match, they light small twigs that crackle and catch fire, producing wisps of smoke. Flames grow, licking the larger wood, and soon a warm, flickering campfire glows under the evening sky, casting a comforting light.","Crackling wood, roaring flames, faint snaps of twigs breaking, rustling leaves, a whoosh as the fire ignites, and the occasional pop from moisture escaping the wood, with the background hum of nature or quiet conversation.",,,,,,, +Sumo,"Sumo is a traditional Japanese sport where wrestlers, or rikishi, face off in a circular ring, aiming to either push their opponent out or make them touch the ground with anything other than their feet. 
Matches combine elements of strength, technique, and ritual.","Sumo features large, heavy wrestlers wearing mawashi (traditional loincloths) grappling in a circular ring (dohyo), aiming to push each other out of bounds or make their opponent touch the ground with anything other than the soles of their feet.","Sumo wrestling features deep, guttural calls by rikishi (wrestlers), the resounding impact of heavy bodies colliding, audience cheers, the referee's (gyoji) chanting, and ceremonial stomping that rumbles through the dohyo (ring).",,,,,,, +Surfing,"Surfing is a water sport where individuals ride ocean waves standing on surfboards. It requires balance, agility, and knowledge of wave patterns. Popular in coastal regions, it's both a recreational activity and competitive sport with deep cultural connections, particularly in Hawaii and Australia.","Surfing involves individuals standing on surfboards, riding ocean waves. They balance skillfully, often performing turns and maneuvers against a backdrop of blue water and curling surf, with occasional sprays of white foam. The surfers appear to glide seamlessly across the wave's surface, harmonizing with the sea's rhythm.","Surfing auditory features include the rhythmic crashing of waves, the whoosh of water gliding past the board, the occasional calls of seabirds, the sound of wind whipping past ears, and the murmur of distant chatter from other surfers or beachgoers.",,,,,,, +Swimming,"Swimming is a versatile physical activity that involves propelling oneself through water using the limbs. It is a popular sport, a vital life skill, and an effective workout, offering full-body exercise, cardiovascular benefits, and low-impact movement suitable for various fitness levels and ages while promoting endurance and coordination.","Swimming involves individuals propelling themselves through water using their arms and legs, often in pools or open water. 
Swimmers wear swimsuits, goggles, and sometimes swim caps, with their bodies submerged or partly above the water surface, creating ripples and splashes as they move.","Splashing water, rhythmic breaths, muffled underwater noises, distant chatter, lifeguard whistles, the echo in indoor pools, the occasional sound of swim strokes, starting signals or buzzers during races, and perhaps the gentle lap of waves against the poolside or shoreline in open water environments.",,,,,,, +Swinging at the playground,"Swinging at the playground is a joyful outdoor activity where individuals, often children, use a suspended seat to swing back and forth, propelled by pushing with their legs or being pushed by someone else, enjoying the sensation of movement and temporary weightlessness.","Children sway to and fro on swings, laughter filling the air as they soar upwards. Chains clink rhythmically, feet kick skyward, and the playground's backdrop blends with the joyful motion of swinging.","Laughter, creaking of swing chains, rhythmic squeaking of swing hinges, children shouting, whoosh of swings moving, soft thuds of feet on ground, rustling leaves if trees are nearby, distant chatter, occasional clunk of swing seats hitting poles, and the background hum of a park environment.",,,,,,, +Table soccer,"Table soccer, or foosball, is a competitive game where players manipulate miniature figures mounted on rotating rods to shoot a ball into the opponent's goal, simulating soccer in a tabletop format. It requires hand-eye coordination and strategy, enjoyed casually or in tournaments.","Table soccer, or foosball, features miniature players attached to rotating rods, a small soccer ball, score trackers, and goalposts on a table resembling a soccer field with raised edges to contain the ball. 
Players twist and push the rods to simulate a soccer match, aiming to score goals.","Table soccer features the clicking of rotating rods, the thud of the ball hitting plastic figures, the sliding sound as it moves across the field, and the satisfying clunk when a goal is scored, accompanied by players' cheers and groans.",,,,,,, +Tai chi,"Tai chi is a traditional Chinese martial art practiced for both its defense training and health benefits. It involves slow, flowing movements and deep breathing, promoting physical coordination, relaxation, and mental focus. Its gentle nature makes it accessible to people of all ages and fitness levels.","Tai chi involves slow, flowing movements often performed outdoors. Practitioners adopt gentle, graceful postures, transitioning smoothly from one stance to the next with focused breathing, maintaining an erect spine and relaxed state, creating a meditative, dance-like practice.","Tai chi often involves soft, rhythmic background music to complement the meditative movements, whispered instructions or verbal cues from instructors, and the natural sounds of the environment, such as birds, water, or leaves rustling, which enhance the tranquil and mindful experience.",,,,,,, +Tango,"Tango is a passionate and sensual dance that originated in the late 19th century in Argentina. It involves a fluid, improvisational partnership, marked by close embrace and intricate footwork, set to distinctive rhythmic music. Tango has transcended its cultural roots, becoming a global phenomenon with various styles.","Tango is a passionate and elegant dance characterized by close embraces, dramatic poses, swift footwork, and intricate leg movements, often to the sound of classic Argentine music. 
Dancers typically wear sophisticated attire, with men in suits and women in flowy, embellished dresses and high heels.","Tango music typically features a steady, rhythmic beat accentuated by bandoneóns, violins, and pianos, intertwined with passionate, nostalgic melodies. The dancers' swift footsteps and the occasional whisper of fabric contribute to the auditory experience as they move in sync with the music's dramatic ebb and flow.",,,,,,, +Tennis serve with ball bouncing,"""Tennis serve with ball bouncing"" is an essential skill in tennis where a player launches the ball into the opponent's court by striking it with a racquet, following a bounce, to initiate a point. It requires precise timing, technique, and body coordination to effectively challenge the receiving player.","A player tosses a ball skyward and swings a racket overhead to strike it; the ball arcs over the net, landing and bouncing on the opposite court's service box.","A sharp racquet swoosh, a resonant thwack upon ball impact, a fainter bounce sound as the ball hits the court, and possibly the player's grunt or breath exhale. Subtle background sounds might include opponents' or spectators' movements and ambient court noises.",,,,,,, +Throwing darts,"Throwing darts is a competitive sport and pub game involving precision hand-eye coordination where players hurl small, pointed missiles (darts) at a circular target (dartboard) fixed to a wall, aiming to hit specific marked areas for varying scores. It combines skill, strategy, and concentration.","A person stands at a line, dart in hand, aiming at a circular, numbered dartboard. They execute a focused, precise throw to hit a specific section, usually aiming for high-scoring areas or a bullseye. Dart flights streamline the path, and the dart sticks into the board upon impact.",The sound of darts hitting the dartboard is characterized by a distinct thunk. A soft flutter of flights might be heard during a throw. 
Muffled chatter and applause from onlookers can also form part of the ambient noise in a venue where darts are being thrown.,,,,,,, +Trimming branches or hedges,"Trimming branches or hedges is a gardening task that involves cutting away overgrown or unwanted parts of plants to encourage healthy growth, maintain shape, and enhance the appearance of the landscape. It's essential for plant health, preventing damage, and promoting lush, dense foliage.","An individual is selectively cutting away overgrown or unwanted branches and twigs from trees or shrubs, using tools like shears, loppers, or a hedge trimmer, to shape, control growth, and remove dead material, enhancing the plants' overall health and aesthetic appeal.","Trimming branches or hedges typically produces intermittent snipping or chopping sounds from manual shears or the constant hum and whir from electric or gas-powered hedge trimmers, accompanied by the rustling of leaves and the occasional thud of cut branches falling to the ground.",,,,,,, +Triple jump,"The triple jump is an athletic event where competitors sprint along a runway and perform a hop, a step, and a jump into a sandpit. The aim is to cover the greatest possible distance, combining speed, strength, and agility. 
It is part of track and field competitions such as the Olympics.","An athlete sprints down the track, hops on one foot, steps forward continuing on the same foot, then jumps with both feet into a sandpit, displaying a sequence of fluid, coordinated motions marked by explosive power and graceful athleticism over an extended horizontal distance.","The triple jump involves distinct sounds: the short run-up's accelerating footsteps, rhythmic breathing, three consecutive ""thuds"" as the athlete hits the hop, step, and jump phases, the landing's sandy impact, and occasional crowd reactions—cheers or gasps—depending on the jump's success or form.",,,,,,, +Tug of war,"Tug of war is a competitive team activity where two groups pull on opposite ends of a rope, attempting to drag the opposing team across a central line. Strength, team coordination, and strategy are key in this test of collective force.","Two teams pull opposite ends of a rope, straining and leaning back, attempting to drag the other team across a central line. Observers watch as participants dig their feet into the ground, muscles tensed, faces showing determination and effort, in a classic test of collective strength and teamwork.","Grunt and strain sounds from participants, cheering and encouragement from spectators, the creak and stretch of the rope, occasional thuds of participants' falls, rhythmic chanting or counting, heavy breathing, and the referee's whistle or vocal commands.",,,,,,, +Tumbling,"Tumbling is a gymnastics discipline involving acrobatic moves like flips, rolls, jumps, and twists. It's performed on a springy floor without props, showcasing agility, coordination, and aerial skills in routines executed with fluidity and precision, often part of cheerleading or as a standalone competitive sport.","Tumbling involves gymnasts executing acrobatic moves like flips, rolls, and jumps in a rapid, fluid sequence, often on a springy mat, showcasing agility and coordination. 
It emphasizes grace, strength, and precision, with movements akin to somersaults and aerial spins.","Tumbling involves rhythmic thuds or thumps on a mat, rapid swooshing noises from body movements, occasional heavy breathing from exertion, and possibly soft footsteps or running before a sequence. The sound of hands and feet making contact with the surface can also be a characteristic auditory feature.",,,,,,, +Using parallel bars,"Using parallel bars involves exercises on two horizontal bars set at the same height, where individuals perform a range of gymnastic and calisthenic movements to improve upper body strength, coordination, and balance, such as dips, swings, and leg raises.","An individual grips two horizontal bars at shoulder width, placed at a consistent height, typically performing exercises like dips or leg raises, moving their body weight up and down or in a controlled swinging motion, with the arms or legs supporting the movement depending on the exercise variation.","The sound of hands gripping metal, rhythmic tapping of feet on floor mats, occasional grunts of exertion, the swoosh of body movement through the air, clinking of the bars with slight sway, and soft thuds as gymnasts dismount onto padded surfaces.",,,,,,, +Using the balance beam,"The balance beam, an apparatus in gymnastics, challenges athletes to perform routines consisting of jumps, flips, and dance movements on a narrow, elevated beam. It tests balance, coordination, and grace, requiring rigorous practice to master complex skills and build confidence for competition.","An individual performs gymnastic maneuvers on a narrow, elevated beam, maintaining careful balance while executing turns, jumps, and sometimes flips, often with arms outstretched for stability.","Auditory features may include the sound of footsteps tapping on the wood, occasional thuds when dismounting or adjusting balance, creaks from the beam's flex, and the whir of air during jumps or flips. 
Background gym noise like coaches' instructions and other athletes' activities might also be audible.",,,,,,, +Using the monkey bar,Using monkey bars involves swinging from one bar to the next using hand strength and coordination. It's a popular playground activity that helps develop upper body strength and control in children and can also be part of a fun adult workout routine.,"A child grips overhead horizontal bars, swinging hand-over-hand across a metal frame, body suspended in air, legs dangling or tucked up, moving from one end to the other with focused determination and physical coordination.","Gripping and swinging motions produce rhythmic hand clasps and releases, metallic clangs of bars interacting, children's laughter and chatter, wind whooshing past ears during movement, occasional thuds of feet landing on the ground, and the creaking of equipment under stress or in motion.",,,,,,, +Using the pommel horse,"The pommel horse is a gymnastics apparatus with two handles. Athletes perform continuous movements like circles and flairs, maintaining balance and rhythm. Using their hands for support, they demonstrate strength, flexibility, and coordination while swinging their legs and bodies around the horse.","A gymnast swings and flips around a leather-covered apparatus with wooden handles (pommels), using rhythmic leg movements and precise hand placements to maintain momentum and balance while performing circles, scissors, and flairs without touching the horse with their torso.","Auditory features may include the rhythmic thumping of hands and feet striking the pommel horse, the swishing sound of the gymnast's body and clothing moving through the air, occasional grunts or breaths exerted during maneuvers, and the supportive clapping or cheering from spectators or coaches.",,,,,,, +Using the rowing machine,"Using a rowing machine provides a full-body workout, targeting legs, core, and arms with smooth, low-impact pulling motions. 
It simulates water rowing and is ideal for cardiovascular fitness and strength, allowing adjustable resistance to suit various fitness levels.","An individual sits on a sliding seat, grasping a bar with both hands, pulling it towards the torso while extending the legs, then slides forward bending the knees, resembling the motion of rowing a boat, often accompanied by the rhythmic sound of the machine's moving parts.","Using a rowing machine typically produces rhythmic whooshing from the seat sliding, repetitive swirling water or air from resistance mechanisms, and clicking of the catch and release mechanism. Occasional metallic clinks or thuds may occur during intense workouts. Users may also hear heavy breathing and the strap tightening against their feet.",,,,,,, +Using uneven bars,"Using uneven bars, a gymnastics apparatus, athletes perform aerial routines on two horizontal bars set at different heights, showcasing strength, agility, and coordination. It's a dynamic and artistic Olympic event predominantly contested by female gymnasts.","A gymnast gracefully swings, flips, and transitions between two horizontal bars set at different heights, demonstrating agility, strength, and aerial acrobatics in a fluid routine.","Using uneven bars generates rhythmic metallic clanks as the gymnast transitions between bars, the whir of swinging motions, the slap of hands gripping metal, and occasional thuds of feet on the mat, along with the sounds of heavy breathing and the coach's instructions or encouragement.",,,,,,, +Vacuuming floor,"Vacuuming the floor is a cleaning process that involves using a vacuum cleaner to remove dirt, dust, debris, and pet hair from flooring surfaces, such as carpets and hard floors, in order to maintain a clean and hygienic living or working space.","An individual pushes an upright vacuum cleaner across a carpet or a floor, back and forth, with the machine's nozzle sucking up dirt and debris. 
The vacuum's cord may trail behind, and the surface gradually looks cleaner as the person systematically covers the area.","The activity ""vacuuming the floor"" is characterized by the continuous roar and hum of the vacuum cleaner motor, varied by pitch changes when adjusting settings or encountering different surface types, accompanied by the sound of debris being sucked up and occasional high-pitched whines when airflow is restricted.",,,,,,, +Volleyball,"Volleyball is a team sport where two teams of six players use their hands to hit a ball over a net, aiming to ground it on the opponent's court. Points are scored for forcing errors or winning rallies, with strategy and teamwork being essential components for success.","Two teams, typically of six players each, face off on a court divided by a high net. They hit a spherical ball over the net, aiming to ground it on the opponent's side or force errors. Players wear athletic gear, often with knee pads, and move dynamically in sand or indoor courts.","Volleyball auditory features include the sound of the ball being served and hit, players calling out plays, the whistle of the referee, cheers from spectators, the thump of players' feet on the court, and the occasional dive or skidding sound when saving a ball.",,,,,,, +Wakeboarding,"Wakeboarding is a water sport where riders stand on a wakeboard and are towed behind a motorboat, performing aerial tricks and maneuvers on the boat's wake. It combines elements of snowboarding, surfing, and skateboarding and requires balance, strength, and agility.","Wakeboarding involves a rider standing on a short, wide board, towed on a body of water by a speedboat, performing jumps and tricks over wakes. 
The rider typically wears a life vest and is connected to the boat by a towrope and handle.","Wakeboarding produces sounds of splashing water, the hum of the boat engine, the rush of wind, waves chopping against the board, and occasional shouts of excitement or instruction from participants.",,,,,,, +Walking the dog,"Walking the dog is a popular physical activity that involves taking a canine companion for a stroll outdoors. It promotes exercise, mental stimulation, and bonding time for both the dog and the owner, while also providing opportunities for socialization and obedience training.","An individual strolls with a leash in hand, connected to a dog that trots alongside. They move in sync, occasionally pausing for the dog to explore or attend to nature's call. The owner carries bags for cleanup, and the dog may carry a joyful demeanor, sometimes leading the way.","The potential auditory features associated with walking the dog include the sound of the leash jangling, the dog's panting and barking, the clip-clop of its paws on the pavement, occasional interactions with passersby or other animals, and ambient neighborhood sounds such as birds, traffic, or rustling leaves.",,,,,,, +Washing dishes,"Washing dishes is a household chore that involves cleaning cookware, tableware, and kitchen utensils with water and detergent, typically by hand or using a dishwasher, to remove food residue and maintain hygiene.","Hands scrubbing plates with soapy water, utensils clinking, bubbles forming, steam rising, dishes stacked neatly, faucet running clear water, suds draining in sink.","Splashing water, clinking dishes, scraping utensils, running faucet, gurgling drain, suds fizzing, glassware clanking, porcelain clinking, silverware chiming, dishwasher humming, scrub brush scouring, and occasional utensil dropping sounds.",,,,,,, +Washing face,"Washing your face is a personal hygiene activity that involves using water and often a cleanser to remove dirt, oil, sweat, and other 
impurities from the skin on your face. It's typically done twice daily to maintain clear and healthy skin.","A person splashes water onto their face, applies cleanser with their hands, rubs in circular motions, and then rinses off the soap, often finishing by patting dry with a towel.","Splashing water, running tap, trickling streams from hands/fingers, gentle rubbing sounds, occasional squelching of soap, a towel patting or rubbing on skin, and possibly the unscrewing and squeezing of tubes or pumping of liquid soap dispensers.",,,,,,, +Washing hands,"Washing hands is a crucial hygiene practice where individuals use soap and water to clean their hands, removing dirt, germs, and bacteria to prevent illness and the spread of infections. It involves scrubbing all hand surfaces for at least 20 seconds and is essential before eating and after using the restroom.","Running water flows over interlocked fingers with soapy suds, scrubbing palms and back of hands, between fingers, and under nails. Bubbles form as hands are rubbed together, then rinsed, with droplets scattering and steam rising slightly, finishing with a clean, damp look.","While washing hands, one may hear running water, the lathering of soap, a squelching or scrubbing sound from rubbing hands together, splashing water, and the clicking of the tap or dispenser. There may also be the rustling of a towel or the air dryer if drying hands afterward.",,,,,,, +Waterskiing,"Waterskiing is a thrilling water sport where individuals glide across water on skis, towed by a boat. It combines balance, strength, and coordination as skiers maintain upright positions while performing maneuvers at high speeds. 
It's a popular recreational and competitive activity enjoyed on lakes and calm sea waters.","A person glides over water on skis, towed by a speeding boat via a rope/handle, maintaining balance as they cut through the waves, possibly performing jumps and tricks.","The sound of splashing water, the hum of the boat's engine, the whoosh of skis gliding across the surface, the rhythmic lapping of waves, wind rushing past the ears, and the occasional shout of instructions or encouragement between the skier and the spotter or driver.",,,,,,, +Waxing skis,"Waxing skis is the process of applying a hydrocarbon wax to the bases of skis to enhance glide, improve performance, and protect them from damage. It involves melting and spreading the wax, letting it cool, then scraping and brushing for a smooth finish.","Waxing skis involves smearing or melting a layer of wax onto the ski base, often with a hand-held iron, then scraping and buffing it to a smooth finish, resulting in a glossy, slick surface to enhance glide and performance on snow.","Scraping sounds of wax removal, soft swishing noises as the wax is spread, brief rasps of brush strokes for finish texturing, and occasional clicks of tools or clamps used to secure the skis during the process.",,,,,,, +Welding,"Welding is a fabrication process that joins materials, usually metals or thermoplastics, by applying high heat to melt the parts together and allowing them to cool, causing fusion. It's used in various industries for constructing structures, vehicles, and manufacturing components, requiring skilled technicians to perform.","Welding involves bright, intense sparks and a glowing arc of light as a welder, clad in protective gear, fuses metal with a tool emitting concentrated heat. 
Glowing red-orange metal cools alongside blackened weld lines, amidst a backdrop of smoke and the blue-white light of the welding torch.","Welding often produces loud noise including hissing, buzzing, or popping from the arc, crackling sounds from metal cooling, and clanging of tools and materials, requiring ear protection to prevent hearing damage.",,,,,,, +Windsurfing,"Windsurfing is a water sport where athletes ride on a board equipped with a sail, using wind power for propulsion. Windsurfers maneuver by tilting and rotating the mast and sail, skillfully combining elements of surfing and sailing for recreational racing and acrobatics.","Windsurfing features a person standing on a board with an attached sail, skimming across water's surface, harnessing wind power for speed and performing maneuvers by tilting and steering the sail.","Wave crashing, sail flapping, wind howling, board cutting through water, rigging creaking, splashes as surfer maneuvers, distant cheers, zip and snap of wetsuit and harness, chatter of pulleys and clips during setup, occasional whistles and shouts for communication.",,,,,,, +Wrapping presents,"Wrapping presents is the act of enclosing gifts in decorative paper or materials, often with ribbons and bows, to conceal the contents and enhance the gift-giving experience. It's a common practice for special occasions, such as birthdays and holidays, to add a personal touch to the presented items.","Colorful paper, ribbons, and tape are spread out. Hands fold and crease paper around boxes, securing edges with tape. 
Bows are tied, and gift tags are attached to neatly wrapped presents, adding a festive touch.","Rustling paper, tearing of tape, scissor snips, creasing folds, soft thuds of boxes, occasional ripping sounds, muffled impacts as gifts are placed on a surface, and potentially background music or humming that one might do while engaged in the task.",,,,,,, +Zumba,"Zumba is a high-energy fitness program that blends dance moves from styles like salsa, merengue, and samba with aerobic exercises, driven by Latin and international music beats. It's designed to be fun and effective, offering a party-like experience that helps participants burn calories and improve cardiovascular health.","Zumba is an energetic, dance-based workout where participants perform choreographed movements to Latin and international music, often characterized by vibrant attire, dynamic steps, and infectious enthusiasm within a group setting.","Zumba features rhythmic Latin music that blends upbeat tempos and energetic percussion, encouraging participants to dance. 
It includes vocal encouragement from instructors, the sound of footsteps, and participants' synchronized movements to high-energy beats, creating an immersive and motivating workout atmosphere.",,,,,,, diff --git a/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/wavcaps_word_embeddings_activitynet_normed.npy b/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/wavcaps_word_embeddings_activitynet_normed.npy new file mode 100644 index 0000000..7a72d51 Binary files /dev/null and b/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/wavcaps_word_embeddings_activitynet_normed.npy differ diff --git a/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/word_embeddings_activitynet_normed.npy b/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/word_embeddings_activitynet_normed.npy new file mode 100644 index 0000000..a607dc4 Binary files /dev/null and b/avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/word_embeddings_activitynet_normed.npy differ diff --git a/avgzsl_benchmark_non_averaged_datasets/UCF/class-split/UCF.csv b/avgzsl_benchmark_non_averaged_datasets/UCF/class-split/UCF.csv new file mode 100644 index 0000000..f6c107c --- /dev/null +++ b/avgzsl_benchmark_non_averaged_datasets/UCF/class-split/UCF.csv @@ -0,0 +1,103 @@ +name,description_1,description_2,description_3,,,,,,, +Apply Eye Makeup,"Applying eye makeup is a cosmetic routine involving the use of products like eyeshadow, eyeliner, and mascara to enhance the eyes' appearance, add definition, and accentuate their shape, often following steps tailored to individual styles and preferences for everyday looks or special occasions.","A person carefully applies cosmetic products like eyeshadow, eyeliner, and mascara to enhance and define the eyes, often using brushes or applicators to blend colors on the eyelids and accentuate the lash lines.","Quiet environment with occasional sound of makeup containers snapping open/closed. 
Soft brush strokes might be audible. User may give voice commands to an AI assistant or play music/beauty tutorials in the background, leading to a mix of dialogues, music, or video sounds.",,,,,,, +Apply Lipstick,"Applying lipstick is a cosmetic procedure where one uses a colored substance in stick or liquid form to add color and texture to the lips, enhancing their appearance, defining the lip shape, and often providing hydration or other benefits. It's a common step in makeup routines for aesthetic purposes.","A person smooths colorful cosmetic substance over their lips using a tubular stick or brush for an enhanced, polished look, often looking into a mirror to ensure precise application. The lips become more defined and vibrant after the lipstick is applied.","Applying lipstick may involve subtle sounds: the click of a lipstick tube opening or closing, the slight pull when twisting the mechanism to raise the stick, and the soft swish as the product glides across the lips. There may be a faint smack or pucker afterward to even the application.",,,,,,, +Archery,"Archery is a sport that involves shooting arrows at a target from a set distance using a bow. It requires precision, control, and concentration, and can be practiced competitively or recreationally, indoors or outdoors. Archery has historical roots as a hunting and warfare tool, now enjoying Olympic status.","Archery involves an archer using a bow to shoot arrows at a distant target marked with concentric circles. The archer typically stands with a focused stance, drawing the bowstring back with one hand while the other hand steadies the bow, aiming for the bullseye to score maximum points.","The twang of the bowstring, the whoosh of the arrow soaring through the air, and the decisive thud as it strikes the target are characteristic sounds of archery. 
Remote outdoor locations often feature ambient nature sounds, while indoor ranges may echo with the muted sounds of other archers and equipment.",,,,,,, +Baby Crawling,"Baby crawling is a developmental stage where infants typically learn to move on their hands and knees, exploring their surroundings and strengthening their muscles, usually occurring around 6 to 10 months old. It's key for motor skills and cognitive development, preceding walking.","A baby crawling typically involves a small infant on all fours, moving with alternating hand and knee motions across the floor, often with a determined, focused expression as they explore their surroundings.","Soft coos or babbling, gentle patting sounds on the floor, occasional giggles or laughter, light grunts with effort, rustling of clothing or a diaper, and possibly the curious squeal or cry if met with frustration or surprise from new discoveries.",,,,,,, +Balance Beam,"The balance beam is a gymnastics apparatus used primarily by female gymnasts. It's a narrow platform elevated off the ground, where athletes perform routines including jumps, flips, and dance moves, requiring balance, agility, and coordination. It challenges mental focus and physical precision, and is both a competitive and training tool.","The balance beam is a narrow, rectangular gymnastics apparatus raised off the floor, on which athletes perform acrobatic flips, jumps, and dance movements, requiring exceptional balance and concentration. It typically has a padded, leather-like surface for grip and measures about 4 inches wide and 16 feet long.","Balance beam activity may include rhythmic footsteps, soft thuds of dismounts, coach’s instructions, the creak of the beam with movement, and the occasional gasp or cheer from spectators.",,,,,,, +Band Marching,"Band marching is a coordinated group performance that combines musical play with precise, choreographed movement. 
Participants, known as marchers, play instruments while executing intricate formations and steps during parades, sporting events, and competitions, often led by a drum major.","Uniformed individuals march in synchronized steps, often in formation, while playing musical instruments like brass, woodwinds, and percussion, creating a dynamic spectacle of orderly movement paired with melodic and rhythmic sounds, typically during sporting events or parades. Flags and batons may also be twirled by color guard members.","Loud, synchronized melodies and rhythms; brass, woodwind, and percussion instruments; drumline cadences; marching steps; shouted commands; and possible ambient crowd cheers.",,,,,,, +Baseball Pitch,"Baseball pitch involves a player, called the pitcher, throwing a ball towards home plate to be hit by the batter from the opposing team, striving to strike him out or induce a poor hit, governed by intricate rules regarding pitch styles, speed, and ball movement.","A baseball pitch involves a player winding up and then rapidly extending their arm forward to release a small white ball with red stitching towards another player crouching behind a pentagonal rubber plate, within the confines of a dirt mound enclosed by a grassy field.","The sound of a baseball being thrown includes a whoosh as it cuts through the air, a thud or pop upon hitting the catcher's mitt, the umpire's calls, the crack of a bat if contact is made, and the cheers or groans of spectators.",,,,,,, +Basketball,"Basketball is a fast-paced team sport in which two teams of five players compete to score by shooting a ball through a hoop elevated 10 feet above the ground. Points are scored by getting the ball through the opponent's hoop in various play styles that can include passing, dribbling, and shooting.","Basketball involves players dribbling a round orange ball on a court with marked lines, aiming to shoot it into an elevated hoop with a net while outmaneuvering opponents in athletic attire. 
Brightly lit, indoor or outdoor with bleachers for spectators, it's a dynamic display of teamwork, agility, and skill.","Bouncing balls, squeaking sneakers on the court, swish of the net, players communicating, coach shouting instructions, whistle blowing, crowd cheering, buzzer signaling game end.",,,,,,, +Basketball Dunk,"Basketball dunking involves jumping high and slamming the ball through the hoop from above, often with dramatic flair. It's a high-adrenaline move showcasing an athlete's strength, agility, and skill, and is a crowd-pleaser in games and contests.","An athlete springs upwards, basketball in hand, arm outstretched, and slams the ball down through a hoop with a net, often bending the rim, while in mid-air. Spectators might witness a powerful, gravity-defying leap and the physical prowess on display during this high-energy, dynamic move.","A ""Basketball Dunk"" typically features the sound of sneakers squeaking on the court, the player's breath, the rush of air, the slap of the hand on the ball, the ball hitting the rim, the net swish, the vibration of the backboard, and the crowd's cheers or reactions.",,,,,,, +Bench Press,"The bench press is a strength-training exercise where an individual lies on a bench and lifts a weighted barbell up and down from chest level. 
It primarily targets the chest, triceps, and shoulders, and is a key component of weightlifting and bodybuilding routines, as well as strength testing.","A person lies on a bench, grips a barbell above their chest with arms extended, then lowers and pushes the weight up in controlled motions, activating chest, arms, and shoulder muscles.","During a bench press, one might hear the clanking of metal weights, the sliding of the barbell across the rack, grunts or exhales of the lifter, the thud of weights being set down, and potentially coaching cues or encouragements from spotters or trainers.",,,,,,, +Biking,"Biking is a versatile activity involving riding a bicycle for transportation, recreation, or fitness. It's a low-impact, eco-friendly way to explore terrain, improve cardiovascular health, and enjoy the outdoors, suitable for all ages and skill levels. Biking ranges from leisurely rides to competitive racing.","A person pedals a bicycle, their legs moving in circular motion. Handlebars are held for steering. The wheels roll along a path or road, with the surrounding scenery passing by. 
The cyclist often wears a helmet and may have a focused or exhilarated expression with the wind brushing against them.","Whir of spinning wheels, rhythmic pedal strokes, clicking gear shifts, rush of wind, occasional chain clink, distant hum of traffic, sounds of nature in rural areas, brief exchanges with pedestrians or other cyclists, alert dinging of bike bells, and the rasping breaths of exertion.",,,,,,, +Billiards,"Billiards is a precision sport involving cue sticks and spherical balls on a felt-covered table, where players aim to score points through various games by striking balls into pockets or against each other, depending on the rules of specific disciplines like eight-ball, nine-ball, or snooker.","Billiards involves players using cues to strike colored balls, aiming to pocket them on a green felt-covered table with six receptacles at the corners and midpoints of the long sides.","The auditory features of billiards include the sharp cracking sound of the cue ball striking other balls, the clicking of balls colliding, the softer thud of balls dropping into pockets, and the occasional clatter of the cue stick against the table or the chalk's snap on the cue tip.",,,,,,, +Blow Dry Hair,"Blow drying hair is a styling method that involves using a handheld dryer to apply directed heat and airflow to wet hair, accelerating evaporation of moisture and enabling shaping and volume creation for a desired hairstyle. 
It's often paired with brushes and products to protect hair and enhance results.","A person uses a handheld dryer emitting hot air, often brushing through hair simultaneously, as strands flutter and dry, transforming from wet to styled and voluminous.","The activity ""Blow Dry Hair"" typically involves a consistent whirring sound from the hair dryer's motor, varied by the device's speed settings, occasional clicking of buttons to adjust temperature or speed, and the sound of air rushing and hair strands fluttering as they are dried.",,,,,,, +Blowing Candles,"Blowing candles is a ceremonial activity typically performed on birthdays, where an individual extinguishes a set of candles placed atop a cake with a breath in one go, often while making a silent wish, symbolizing the celebration of another year of life and the hope for future aspirations.","A person puffs cheeks and exhales forcefully towards lit candles on a cake, extinguishing the flames, often amidst a darkened room with soft lighting from the flickering candlelight, surrounded by expectant, smiling faces, and festive decorations indicative of a celebratory event like a birthday or anniversary.","The activity ""Blowing Candles"" features a whooshing sound as air is expelled, possibly a brief sputtering as candle flames flicker out, and often followed by the soft crackling of wicks and applause or cheers from onlookers.",,,,,,, +Bodyweight Squats,"Bodyweight squats are a strength exercise that targets the lower body. Without added weights, one performs a squatting motion to tone the legs, glutes, and core, while also improving balance and flexibility. They're versatile, require no equipment, and can be modified to suit different fitness levels.","A bodyweight squat starts with feet shoulder-width apart, toes facing forward. The individual bends their knees, pushing hips back as if sitting in an invisible chair, while keeping chest upright and arms extended for balance. 
They lower until thighs are parallel to the floor, then push up to standing.","Bodyweight squats may produce rhythmic breathing sounds, soft thuds of feet as they maintain contact with the ground, occasional creaking of knee joints, and potentially the rustle of clothing during movement. Audible exertion or a light grunt could accompany the effort, especially during faster or more intense sets.",,,,,,, +Bowling,Bowling is a recreational and competitive sport in which players roll a heavy ball down a lane to knock down a set of ten pins arranged in a triangular formation. The goal is to score the highest number of points by knocking down as many pins as possible.,"Bowling features a smooth, polished lane, ten pins arranged in a triangle, a heavy, spherical ball with finger holes, and players taking turns to roll the ball towards the pins, aiming to knock them down for points, all under the vibrant glow of overhead lights.","The sound of a heavy ball rolling on a wooden lane, crashing pins, mechanical noise of pinsetter resetting pins, background chatter, occasional cheers or groans from players, squeaking shoes on the approach, electronic scoring beeps, ambient music or announcements over a PA system.",,,,,,, +Boxing Punching Bag,"Boxing with a punching bag is a high-intensity workout that improves strength, speed, and endurance. 
It involves striking a heavy bag with various punch combinations, simulating a real fight, to develop technique and cardiovascular health, while also serving as a powerful stress-reliever.","A boxing punching bag is a heavy cylindrical bag suspended from a secure mount, typically made of leather or synthetic material, swaying slightly upon being struck by gloved fists delivering powerful punches and combinations in a rhythmic, forceful training session.","Boxing with a punching bag produces rhythmic thuds from gloves striking the bag, the swish of the bag moving, occasional grunt sounds from exertion, the creaking of the bag's chains, and the soft patter of the boxer's footwork on the floor.",,,,,,, +Boxing Speed Bag,"Boxing speed bag training involves rhythmically hitting a small, air-filled bag that rebounds quickly. This workout improves hand-eye coordination, timing, and punching speed, and is a staple in a boxer’s reflex and rhythm development, often incorporated into their cardiovascular and skill routines.","A small, teardrop-shaped bag is rhythmically punched by a person, rebounding swiftly on a swivel mount. The boxer’s hands move continuously, delivering rapid, repetitive strikes while maintaining a steady stance and focused concentration. The bag oscillates back and forth with each precise hit.","The rhythmic pounding of fists striking the bag, a consistent tempo-like beating; the swishing of the bag as it swings; the occasional squeak of the rotating swivel; and the boxer's controlled, rhythmic breathing amidst occasional grunts of exertion.",,,,,,, +Breast Stroke,"The breaststroke is a swimming style characterized by frog-like kicks and circular arm movements, performed with the swimmer's head above water between strokes. 
It is known for its efficiency and is often taught to beginners for its simplicity and rhythmic breathing pattern.","The breaststroke involves gliding forward with both arms extended, palms together, then sweeping them outwards and rearwards in a circular motion, while performing a frog-like kick with bent knees and feet turned out, propelling the swimmer's body through the water in a horizontal position.","The breaststroke swimming style produces rhythmic, splashing sounds as arms sweep through the water, a distinct gliding silence, and regular, muffled breathing noises when the swimmer's head breaks the surface for air. Goggles and water movement may also create subtle swishing or bubbling sounds.",,,,,,, +Brushing Teeth,"Brushing teeth is a daily hygiene activity that involves cleaning the teeth and mouth using toothpaste and a toothbrush to remove plaque, prevent cavities, maintain oral health, freshen breath, and decrease the risk of gum diseases like gingivitis. It's generally recommended twice a day for two minutes each session.","Person stands before sink, toothbrush in hand, applying toothpaste. Brushing motions scrub inner, outer, and biting surfaces of teeth, creating a foamy froth. Rinse follows, with water swirling in mouth and spat out, leaving behind a clean, fresh feeling. Toothbrush is cleaned under running water and replaced.","Brushing teeth usually involves the sound of bristles scrubbing against teeth, the splashing of water when rinsing the brush or mouth, and sometimes gurgling or spitting noises as the user clears their mouth of toothpaste. There may also be the clicking of a toothpaste cap or the squeezing of the tube.",,,,,,, +Weight Lifting,"Weight lifting is a physical activity that focuses on increasing muscle strength and mass through the lifting of weighted bars, dumbbells, or other equipment. 
It involves various exercises targeting different muscle groups, and it can improve overall fitness, bone density, and athletic performance.","Weight lifting involves individuals lifting barbells or dumbbells of varying weights, often on a bench or rack, engaging muscles with focused exertion, with bodies tensed and sometimes using gloves or belts for support, in an environment with mirrors and padded flooring.","Weight lifting often entails rhythmic metal clanking of weights, heavy breathing, grunts of exertion, the thud of weights being dropped, and occasionally the encouragement or instructions from trainers or spotters. Background music and gym machinery noises may also be present.",,,,,,, +Cliff Diving,"Cliff diving is an extreme sport that involves jumping from high cliffs into water, performing acrobatic movements during the freefall. Participants leap from heights typically ranging from 18-27 meters, requiring precision, skill, and courage to safely execute dives and minimize the risk of injury.","Cliff diving features individuals leaping from high cliffs into water, embodying grace and fearlessness. The diver often assumes an aerodynamic form mid-air against a backdrop of rugged rocks and open sky, before plunging into the sea or lake with minimal splash.","The rush of wind while falling, the distant roar of waves against the cliff, the sharp, echoing calls of sea birds, the muffled rush approaching water, the loud, splash impact, and the sudden quiet underwater before resurfacing to hear cheers and the ocean's continuous hum.",,,,,,, +Cricket Bowling,"Cricket bowling is the act of delivering the cricket ball to the batsman. Bowlers use various techniques to achieve speed, swing, and spin, aiming to outsmart the batsman, prevent runs, and ultimately dismiss them. 
There are different types of bowlers, including fast, medium, and spin bowlers.","A player runs up, then delivers a ball with a straight arm overhand towards a batsman at the other end of the pitch, aiming to hit the wickets or deceive the batsman. The action is fluid, with a high-speed arm rotation following a leap or stride from the bowler's delivery stride.","Cricketers bowling can produce sounds like the rhythmic run-up thuds, swift whoosh of ball delivery, leather ball hitting the pitch, or seams skidding, occasional grunts of effort, and the loud appeals or cheers from players and spectators reacting to the play's outcome.",,,,,,, +Cricket Shot,"Cricket shot is a batting technique in cricket where a player attempts to hit the ball delivered by the bowler, aiming to score runs while preventing the ball from hitting the stumps or getting caught by fielders. Shot selection is crucial and varies from defensive to aggressive hits.","A batter stands at the wicket, poised with a raised cricket bat. On striking the ball, their arms extend in a fluid, sweeping motion, often with a follow-through that rotates the body. 
The shot ranges from powerful drives to deft glances, executed with precise timing and footwork.","A cricket shot may produce a sharp crack as the ball strikes the bat, the whoosh of the bat swing, the crowd’s cheer or gasp, and potentially the thud of the ball hitting the ground or boundary boards.",,,,,,, +Cut Kitchen,"""Cut Kitchen"" is a challenging culinary activity where participants are tasked with creating innovative dishes from a limited set of ingredients within a set time frame, often with unexpected twists thrown in to test their creativity and adaptability in the kitchen.","""Cut Kitchen"" likely refers to a cooking space bustling with food preparation where chefs chop ingredients with knives, surrounded by cutting boards, vegetable peelings, and a variety of sliced foods, with the sound of swift chops punctuating the air amidst the hum of active culinary work.","The activity ""Cut Kitchen"" may include sounds of chopping, slicing on cutting boards, running water, the clink of utensils, sizzling sounds from cooking on a stove, the hum of appliances like refrigerators or dishwashers, and occasional background conversations or radio music.",,,,,,, +Diving,"Diving is an underwater exploration and sport activity where individuals use special equipment, such as scuba gear or a snorkel, to breathe underwater while observing marine environments, conducting research, or for recreation and adventure in oceans, lakes, and caves. It requires training for safety and proper technique.","Diving typically involves a person clad in swimwear performing acrobatic jumps into water, often from a platform or springboard, executing precise flips and twists before entering with minimal splash. 
It's a graceful, athletic display combining aerial maneuvers with controlled, streamlined entry into the water.","Underwater sounds are muffled due to density; hearing bubble trails, breath exhales; regulator clicks during air compression; distant boat hums; marine life clicks, songs, or calls; pressure changes impacting ear sensation; and potentially the creak of dive equipment or scraping against coral or rocks.",,,,,,, +Drumming,"Drumming involves rhythmically striking drums and percussion instruments to create music or accompany melodies. It can be a solo act or part of a band, ranging from cultural rituals to modern performances. It requires coordination, timing, and can express emotions or tell stories through varied beats and intensities.","A person rhythmically strikes drums with sticks, hands, or brushes, causing vibrations. Movement is coordinated; hands rise and fall in a dynamic flow. Drums of various sizes are arranged around the drummer, who may sit or stand, focused intently on producing sounds with controlled gestures and varying intensity.","Drumming produces rhythmic beats and varying tones depending on drum types and player technique. It creates a range of dynamics from soft taps to resounding thumps, encapsulating tempo changes, patterns like syncopation, and can incorporate additional sounds from cymbals or percussion accessories. Volume can escalate in high-energy passages.",,,,,,, +Fencing,"Fencing is a competitive sport where two opponents duel with slender swords. Aiming to touch each other with the weapon's tip, fencers score points for successful hits. 
The sport emphasizes agility, strategy, and precision and includes three disciplines: foil, épée, and sabre, each with its specific rules and target areas.","Fencing features two competitors clad in white protective gear with masks, wielding slender swords—foils, épées, or sabres—on a narrow strip, executing rapid, precise lunges, thrusts, and parries in pursuit of scoring touches on their opponent under bright lights with electronic scoring systems indicating hits.","Fencing may involve the clashing of metal epees, foils, or sabres, the en garde stance shuffle, athletes' quick footwork on the piste, the buzz of electronic scoring systems when a touch is scored, referees' vocal commands, and the swish of protective clothing during rapid movements.",,,,,,, +Field Hockey Penalty,"Field hockey penalties occur due to infractions, with consequences like penalty corners or penalty strokes. Penalty corners involve an attack from the edge of the field, while penalty strokes are one-on-one shots against the goalkeeper, providing teams opportunities to score under specified rules.","A field hockey penalty typically features a player taking a shot on goal from the penalty spot, often with a goalkeeper defending, and other players poised outside the shooting circle, ready to react to the play. The scene is tense, concentrated, with focused athletes and a sense of anticipation.","Whistle blasts signal penalty starts and ends, stick-on-ball clacks, players' quick footsteps, vocal communication between teammates, heavy breathing, goalie gear thuds, and possibly crowd reactions (cheers, gasps) depending on the match's viewership.",,,,,,, +Floor Gymnastics,"Floor gymnastics is an artistic and athletic discipline, part of artistic gymnastics, where gymnasts perform a choreographed routine to music, including tumbling, flips, and dance elements, showcasing strength, flexibility, and balance on a sprung floor without additional equipment. 
+","Floor gymnastics features athletes performing acrobatic movements like flips, tumbles, and twists on a springy, 12x12 meter mat, combining grace, strength, and flexibility, punctuated by dramatic leaps and dance elements, all choreographed to music for a flowing, expressive display of skill and athleticism.","Floor gymnastics typically includes the sounds of gymnasts' bare feet striking and brushing the mat, rhythmic music for choreographed routines, heavy breathing during exertion, and the cheers and applause of spectators. The sound of body movements and landings can also be prominent, showcasing the power and agility of the gymnasts.",,,,,,, +Frisbee Catch,"""Frisbee Catch"" is an outdoor leisure activity involving two or more players throwing and catching a flying disc called a Frisbee. It fosters hand-eye coordination and can be casually played in parks or at beaches for fun and exercise.","Participants stand apart, tossing a flat, disc-shaped object—the Frisbee—back and forth while running and leaping to catch it in flight, often displaying athletic movements in a park or open field.","The swish of the frisbee gliding through the air, user’s calls and communication, the soft thud of the frisbee's impact when caught or when hitting the ground, clapping, laughter, footsteps on grass or sand, and the occasional bark of a dog participating or watching.",,,,,,, +Front Crawl,"The front crawl, also known as freestyle, is a fast swimming style characterized by the alternate overhand motion of the arms and a flutter kick, with the face in the water and turning to the side to breathe. It's the most common stroke in competitive swimming.","The front crawl features alternating arm strokes slicing water, quick flutter kicks, and a rhythmic side-to-side turning of the head for breaths. 
The body maintains a straight, horizontal position, propelled smoothly and efficiently through the water with coordinated movements.","The front crawl stroke produces rhythmic splashing sounds as hands enter the water, a soft whoosh with each arm pull, bubbles from exhalation underwater, and the distinct gasp of air intake when turning the head to breathe. Gentle lapping of waves against the swimmer’s body can also be heard.",,,,,,, +Golf Swing,"Golf swing is the motion used by golfers to hit the ball with a club, aiming for distance and accuracy. It involves a precise sequence of body movements, including grip, stance, backswing, downswing, and follow-through, requiring technique and practice to perfect for consistent play on the golf course.","A golfer stands laterally, feet shoulder-width apart, gripping a club. Body rotates back with the club lifted in a fluid, arching motion, then swings forward, transferring weight through hips and legs, striking the ball with club face, following through with the motion towards the target, head down, eyeing the ball.","The ""whoosh"" of the club swinging, a crisp ""click"" upon striking the ball, followed by a softer sound as the ball makes contact with the fairway or green. Surrounding sounds may include the rustle of leaves, chatter of spectators, or distant clinking of clubs in a golf bag.",,,,,,, +Haircut,"A haircut involves cutting and styling hair on the scalp, often performed by a professional hairstylist or barber to maintain or change one's appearance according to personal preference or fashion trends. 
It can involve various tools such as scissors, clippers, and razors and can range from simple trims to elaborate styles.","A haircut typically involves someone trimming and styling another person's hair using scissors, clippers, combs, and other styling tools, often with the client seated in a chair at a salon or barbershop, surrounded by mirrors and grooming products.","Snipping of scissors, buzz of electric clippers, spray from mist bottle, rustling of cape, ambient salon chatter, whirring of a hair dryer, and clicking of comb through hair.",,,,,,, +Hammer Throw,"Hammer throw is an Olympic track and field event where athletes compete to hurl a heavy metal ball (the ""hammer"") attached to a grip with a steel wire as far as possible. They spin in a circle to gather momentum before releasing the hammer into the designated sector.","An athlete whirls, holding a wire attached to a heavy metal ball (the hammer), then releases it to send it flying through the air, aiming for distance inside a marked sector. The thrower often spins multiple times within a circular area before releasing the hammer.","The hammer throw produces rhythmic whooshing of the spinning hammer, the grunts of the athlete exerting force, the thud of the hammer landing in the field, and possibly the cheers and applause of spectators.",,,,,,, +Hammering,"Hammering is an activity involving striking objects with a hammer to drive nails, shape materials, break apart items, or forge metals. It requires hand-eye coordination, strength, and precision, commonly used in construction, carpentry, metalwork, and DIY projects.","Hammering involves rhythmic, forceful movements of an arm wielding a hammer, striking down onto the head of a nail or other object, which causes it to drive into a surface. 
Repeated impacts create a visible motion blur of the hammer with each swing, punctuated by brief moments of contact.","Hammering typically produces repetitive, sharp, loud percussive sounds as the hammer strikes a surface. The tempo can vary, and the timbre changes with material impact (metal, wood, etc.). Occasionally, background scraping or shifting noises occur as objects are manipulated between strikes.",,,,,,, +Handstand Pushups,"Handstand pushups are an advanced bodyweight exercise that target the shoulders, arms, and core. By assuming a handstand position against a wall for support, practitioners lower their head to the floor and push back up, combining strength, balance, and control for a challenging upper-body workout.","An individual kicks up into a handstand against a wall, with arms extended. They then bend their arms to lower their head towards the ground before pushing back up to fully extended arms, repeating the movement for multiple repetitions.","During handstand pushups, you might hear rhythmic breathing, straining or exertion grunts, the brush of feet against the wall for balance, and the quiet thud of feet or hands pressing into and lifting off the floor or exercise mat.",,,,,,, +Handstand Walking,"Handstand walking is an advanced gymnastic skill requiring strength, balance, and coordination, where an individual walks on their hands with feet elevated and body inverted, often used in gymnastics, CrossFit, and acrobatic disciplines for training and performance.","An individual inverted on their hands, body straight, legs together, walks forward by alternating hand placements while maintaining balance, resembling an upside-down walk.","Handstand walking may produce intermittent thuds from hand impacts, soft rustling of clothing, occasional grunts or breaths from exertion, and possibly verbal cues or encouragement if performed around others.",,,,,,, +Head Massage,"A head massage is a therapeutic relaxation technique involving the gentle 
manipulation of the scalp, neck, and sometimes shoulders to reduce stress, stimulate circulation, and promote hair health, often providing relief from headaches and inducing a state of calm.","A person uses their fingers to rhythmically knead, stroke, and rub another's scalp, occasionally applying gentle pressure. The recipient typically appears relaxed, often with closed eyes, as the masseur's hands move systematically across their head, sometimes extending to the neck and shoulders.","Soft rustling, gentle tapping, fingers running through hair, ambient calming music, soft-spoken therapist voices, and occasional whispers.",,,,,,, +High Jump,"High jump is an athletic track and field event where competitors leap over a horizontal bar at varying heights without dislodging it. Athletes run up to gain momentum before using techniques like the Fosbury Flop to clear the bar, aiming for the maximum height. It requires agility, technique, and power.","In high jump, an athlete sprints towards a horizontal bar set at a specific height and leaps over it, back-first, using a flexible, arching motion, without knocking the bar off its supports. Landing mats cushion the athlete's fall after clearing the bar.","During a high jump event, one might hear the rapid footsteps of an athlete's approach, the rustling of clothing, a brief grunt during take-off, the thud upon landing on the mat, and possibly the clank of the bar if dislodged. Spectators' applause or encouragement could also be present.",,,,,,, +Horse Race,"Horse racing is a competitive sport where horses, guided by jockeys, race on a track to reach the finish line first. It combines athleticism, strategy, and often betting, showcasing the speed, stamina, and skill of both horse and rider in a thrilling spectator event.","A horse race typically features sleek horses thundering down a track with jockeys perched atop, clad in colorful silks. 
Spectators line the course, cheering, as hooves kick up dirt, with the finish line hosting a flurry of excitement as horses vie for the lead.","A horse race features galloping hooves, cheering crowds, the announcer’s call, the bugle’s “Call to the Post,” jockeys shouting, whips snapping, and the rustle of silks as horses and riders speed by.",,,,,,, +Horse Riding,"Horse riding is an engaging activity that involves mounting and riding horses for sport, recreation or practical purposes. Riders must learn to communicate and control the horse using reins and body signals, developing balance and coordination, while enjoying the connection with the animal and the outdoors.","An individual sits astride a horse, holding reins while the horse trots, canters, or gallops. The rider wears a helmet, boots, and possibly equestrian attire; they move in sync with the horse's rhythmic strides, navigating across varied terrains or within an arena.","Clip-clop of hooves, snorts, and whinnies from horses; creaking leather tack; soft thuds on ground; rustling of trees and wind; rider's commands; occasional neighing; rhythmic trotting sounds; jingling of bits or stirrups; animal breathing; distant galloping echoes.",,,,,,, +Hula Hoop,"Hula Hooping is a popular activity involving spinning a hoop around the waist, limbs, or neck. It improves coordination, flexibility, and core strength, and can be both a form of exercise and performance art, with variations like dance and tricks added for complexity and showmanship.","Activity involves spinning a colorful plastic hoop around the waist, limbs, or neck in rhythmic, fluid circular motions. Participants often sway hips or twirl, keeping the hoop in perpetual motion, exhibiting agility and coordination. 
Hoops may also be employed in dance routines, adding a vibrant, dynamic visual element.","Auditory features of hula hooping may include rhythmic swishing and whirring of the hoop circling the body, occasional soft thuds as it drops and hits the ground, and possibly the huffing and laughter of the participant enjoying the activity.",,,,,,, +Ice Dancing,"Ice dancing is a graceful and athletic form of figure skating that combines dance and sport, focusing on rhythm, interpretation, and partnership as skaters perform choreographed routines to music on ice.","Ice dancing features pairs gliding gracefully across the ice in coordinated costumes, executing intricate footwork, lifts, and spins in sync with music, combining artistry with athleticism, and emphasizing rhythm, interpretation, and fluid movement more so than high-flying jumps and powerful throws typical in pairs skating.","Ice dancing features the crisp, gliding sound of blades cutting across ice, the swish of skaters' costumes, the rhythmic thud of precise steps and jumps, and the accompanying music which ranges from classical to contemporary, shaping the dance's mood and tempo.",,,,,,, +Javelin Throw,"Javelin throw is an Olympic track and field event where athletes hurl a long spear-like implement as far as possible. Technique, strength, and speed combine as competitors run up to a foul line before releasing the javelin with an overhand motion into a marked sector.","An athlete sprints down a runway and hurls a long, spear-like javelin into the air, aiming for maximum distance. 
The javelin arches before landing tip-first on a grassy field, marked for measurement.","A whispering whoosh of the javelin slicing the air, athletes grunting with exertion during the throw, the thud as it pierces the ground, applause and cheers from spectators, and announcements by the event commentators.",,,,,,, +Juggling Balls,"Juggling balls involves tossing multiple spherical objects into the air and catching them in a rhythm, maintaining continuous motion without dropping them. This skill improves hand-eye coordination and concentration, and can be both a leisurely hobby and a performance art.","A person simultaneously tosses and catches multiple balls in a rhythmic pattern, typically in an arc-like motion, with each ball tracing a curved path through the air before being caught and thrown again with alternate hands.","The auditory features of juggling balls include rhythmic thumps as they land in hands, soft swooshing sounds during flight, occasional patter of dropped balls on the floor, and possibly the juggler's focused breathing or light grunts from exertion.",,,,,,, +Jump Rope,"Jump rope is a form of exercise where a rope is swung overhead and passed under the feet in a rhythmic motion, typically used for cardiovascular fitness, agility training, and as a competitive sport, involving various techniques and styles for individuals or teams.","Jump rope involves a person swinging a long rope overhead and jumping over it as it passes under their feet, often in rhythmic patterns or tricks, sometimes alone or in groups, characterized by the rope's arc and the rhythmic hopping or skipping motion of the jumper.","Repetitive thudding of rope on ground, rhythmic whooshing as rope cuts through air, occasional impacts of feet touching down, steady breathing patterns of jumper, intermittent vocal counts or encouragement, sometimes a light tapping from the rope's handle movements, snappy sound when rope hits the ground at high speeds.",,,,,,, +Jumping Jack,"Jumping 
Jack is a physical jumping exercise, performed by jumping to a position with legs spread wide and hands touching overhead, then returning to a position with feet together and arms at the sides. It's a full-body workout used for warm-ups, conditioning, and agility training.","A Jumping Jack is an aerobic exercise where one stands upright, jumps to spread the legs while simultaneously raising the arms overhead, then jumps back to the starting position with legs together and arms at the sides.","Jumping jacks produce rhythmic, repetitive sounds of feet hitting the ground and the swish of clothing or limbs moving through the air, often accompanied by breathing patterns that increase with intensity as the exercise continues.",,,,,,, +Kayaking,"Kayaking is a water sport where individuals paddle across water using a small boat called a kayak. It can be done in various water bodies such as rivers, lakes, and oceans and ranges from serene paddling to navigating whitewater rapids, offering both tranquil experiences and adrenaline-filled adventures.","Kayaking features individuals seated in small, narrow watercraft, using double-bladed paddles to navigate through waterways. The kayaks skim across the surface of rivers, lakes, or seas, often with the paddlers wearing life jackets for safety, surrounded by nature's scenic beauty or challenging white water rapids.","Splashing paddles, rhythmic strokes, water flowing against the hull, wildlife calls, rustling foliage from the shore, the occasional creak of the kayak flexing, and tranquil silence broken by gentle ripples.",,,,,,, +Knitting,"Knitting is a craft involving the interlocking of yarn or thread with needles to create fabric. It's a popular pastime for creating garments, accessories, and home decor. Stitches are looped together in various patterns, resulting in intricate designs. 
Both relaxing and functional, knitting can be a solitary or social activity.","Knitting involves the rhythmic movement of needles looping yarn into a cohesive fabric. Fingers deftly manipulate the strands, creating patterns that emerge row by row in a growing textile piece. The knitter usually appears focused, with skeins of colored yarn and two slender needles in hand.","Knitting produces soft, rhythmic clicking of needles, occasional rustling of yarn, and periodic shifts in fabric. This creates a calming, repetitive soundscape.",,,,,,, +Long Jump,"The long jump is a track and field event where athletes sprint down a runway and leap as far as possible into a sandpit from a takeoff board. It requires speed, agility, and explosive power. The winner is the one who covers the greatest distance from the board to their landing.","In the long jump, an athlete sprints down a track to a takeoff board and leaps horizontally into a sandpit, aiming to cover the greatest distance. The motion is fluid: a quick sprint, an explosive jump with legs extended forward, and a landing often with legs swept back for maximal reach.","In long jump, you might hear the sound of running footsteps accelerating on the track, the jumper's grunt during takeoff, the swift whoosh of air as they leap, and the soft thud when landing in the sand pit, followed by spectators' applause and cheers.",,,,,,, +Lunges,"Lunges are a popular lower-body exercise targeting muscles like the quadriceps, hamstrings, glutes, and calves. They involve stepping forward into a deep stride, bending both knees while keeping the torso upright, and then pushing back to the starting position. Lunges improve strength, balance, and flexibility.","A lunge is performed by stepping forward with one foot, bending both knees at 90 degrees, with the back knee hovering above the ground. The torso remains upright, and the front thigh is parallel to the floor. 
The individual then pushes back to the starting position.","Lunges may involve rhythmic stepping sounds as feet alternate positions, soft thuds when knees approach the ground, rubbing of fabric from gym clothing, and controlled breathing sounds like inhales and exhales, potentially interspersed with grunts or exertion noises from the person performing the exercise.",,,,,,, +Military Parade,"A military parade is a ceremonial event where armed forces march in formation, often accompanied by military bands, to showcase discipline, ceremonial prowess, and a country's military capabilities. It can mark national holidays, honor victories, or commemorate significant historical events.","Uniformed troops march in precise formations, flanked by military vehicles and artillery. Flags and banners flutter. A display of might, with bands playing marching tunes. Crowds line streets, often against a backdrop of iconic landmarks. Soldiers' polished boots, crisp uniforms, and synchronized movements exude discipline and nationalism.","A military parade typically features the rhythmic marching sounds of soldiers' boots, the cadence of drum corps, brass bands playing martial music, commands shouted by drill sergeants, the hum of military vehicles, occasional gun salutes, and sometimes flyovers by aircraft with the associated roar of engines.",,,,,,, +Mixing,"Mixing is the process of combining two or more substances to ensure that they are evenly distributed within each other, resulting in a homogenous mixture. This can be achieved manually or mechanically in various contexts, including cooking, industrial manufacturing, pharmaceuticals, and cosmetics.","Mixing is typically represented by substances combining together, often in a bowl or container. Tools like spoons, whisks, or mixers create a swirling motion, blending ingredients into a uniform consistency. 
The process may show particles melding together and changing texture or color as they integrate.","Mixing may involve sounds of liquids being stirred, whisking, splashing, bottles clinking, ingredients being poured, the scrape of a spatula, the click of a switch, and the hum or whirr of electrical appliances like blenders or mixers.",,,,,,, +Mopping Floor,"Mopping the floor is a cleaning activity involving a mop to wet-wash and remove dirt, grime, and stains from hard floor surfaces, ensuring hygiene and maintaining the floor's appearance by using a combination of water, detergent, and physical action.","A person pushes a wet mop across a floor, spreading water and cleaning solution. The mop's head swabs back and forth, leaving a shiny, damp trail. The individual periodically wrings out excess liquid into a bucket, turning the murky water cloudier with each dip.","Sloshing of water, swirling sound of a wet mop, squelching as it's wrung out, rhythmic swiping on the floor, occasional dripping, bucket handle clinking, footsteps on wet surface.",,,,,,, +Nunchucks,"Nunchucks, or nunchaku, are a traditional martial arts weapon consisting of two sticks connected by a chain or rope, used in various forms of training and demonstrations for coordination, agility, and self-defense. They originated in Okinawa, Japan, and were popularized by Bruce Lee in his films.","""Nunchucks"" involves swinging two sticks connected by a chain or rope, typically in a fluid, circular motion. The practitioner displays rhythmic and coordinated twirls, spins, and strikes, often with impressive speed and agility, creating a dynamic, sometimes hypnotic visual spectacle.","Using nunchucks can produce rhythmic whooshing sounds as they cut through the air, sharp cracks when striking an object, and clicks when the two sticks collide. 
The intensity and tempo of the sounds vary with the practitioner's speed and nunchuck material.",,,,,,, +Parallel Bars,"Parallel bars are an apparatus used in artistic gymnastics and physical therapy, consisting of two horizontal bars aligned in parallel, allowing gymnasts to perform various swinging, balancing, and strength maneuvers, demonstrating coordination and control. The bars are typically adjustable to accommodate different users' heights and skill levels.","Parallel bars in gymnastics feature two horizontal bars aligned in parallel, elevated on upright supports. Gymnasts perform routines of flips, swings, and balances on the bars, showcasing strength and agility within a restricted space. The bars' wooden or fiberglass construction adds a subtle gloss under the bright competition lights.","Gripping and releasing metallic bars, rhythmic movements of the gymnast's hands, occasional metal creaks, athletes’ exerted breaths, soft thuds of landings on mats, spectators’ claps and cheers, and the coach's instructions and encouragement may characterize the auditory experience of parallel bars activity.",,,,,,, +Pizza Tossing,"Pizza tossing is a culinary technique used by chefs to stretch, aerate, and shape pizza dough into a thin base. It involves spinning and flipping dough in the air, which also adds an entertaining visual display to the pizza-making process.","An individual spins, stretches, and flips a circular disc of pizza dough overhead, using dexterous hand movements to shape and aerate it into a larger, thin base, sometimes performing acrobatic tricks for flair.","The rhythmic slapping of dough against hands, frequent flour rustling, soft thuds on the work surface, airy whooshes during tossing, and occasional playful banter between cooks.",,,,,,, +Playing Cello,"Playing the cello involves mastering a versatile string instrument with a rich, resonant tone. 
The cellist uses a bow or fingers to draw sound from its strings, interpreting musical scores while seated, holding the instrument between the knees, and delicately adjusting finger positions on the neck for pitch accuracy.","An individual sits holding a large, curved wooden instrument between their knees, bow in right hand gliding across strings, left hand fingers pressing down on the fingerboard, creating music. The player's posture is straight, focused, and attentive to the resonant, deep tones of the cello.","Resonant, deep, warm tones with variable pitches; smooth bowing sounds on strings; soft finger tapping on the fingerboard; occasional creak of wood; subtle shifts in dynamics; expressive vibrato hums; periodic silence during rests; potential screech from incorrect bowing.",,,,,,, +Playing Daf,"Playing Daf involves mastering a large, frame drum used in Middle Eastern music. Participants learn to produce diverse sounds through various hand techniques, often accompanying powerful, rhythmic compositions, and can engage in both solo and ensemble settings to explore the cultural and spiritual aspects of this traditional percussion instrument.","""Playing Daf"" involves holding a large, circular frame drum with metal ringlets. The player uses fingers to tap and hands to strike the drumhead, creating a variety of rhythms. 
The Daf vibrates, with ringlets jingling, adding a shimmering sound to the rich, resonant beats.","Playing the daf, a large Middle Eastern frame drum, produces deep resonant beats and high-pitched jingles from metal rings attached to its frame, creating layered rhythmic patterns and vibrant timbres when struck with the fingers, palms, or snapped against the player's body.",,,,,,, +Playing Dhol,"Playing Dhol involves rhythmically striking a traditional double-headed drum, originating from South Asia, often accompanying bhangra and other folk dances, using two wooden sticks, and creating high-energy beats that are key in festivals, weddings, and cultural celebrations, embodying a vibrant expression of heritage and joy.","Individuals energetically beat a barrel-shaped, two-sided traditional Indian drum, the dhol, with curved sticks, swaying to rhythmic beats, often accompanied by vibrant dance and festivity, showcasing rich, colorful attire.","Playing the dhol involves rhythmic beats, deep bass tones intermingled with high-pitched slaps, varying intensity, and tempo fluctuations, creating a vibrant, energetic soundscape often associated with cultural celebrations and dance.",,,,,,, +Playing Flute,"Playing the flute involves producing sound by directing a stream of air across the mouthpiece of a woodwind instrument, using finger placements to vary pitch and create melodies. It requires coordinated breathing, embouchure control, and finger dexterity, and is a popular choice for solo and ensemble music.","A person holds a slender, elongated musical instrument horizontally to their lips, fingers poised over its keys, cheeks slightly puffed as they blow air across the mouthpiece, producing melodious sounds.","When playing the flute, one might hear melodic tunes, breathy notes, and the occasional click of keys as fingers move. Variations in pitch, volume, and tone can occur, reflecting the player's skill and the music's dynamics. 
Vibrato and airy hisses might also be auditory features.",,,,,,, +Playing Guitar,"Playing guitar involves strumming or plucking strings to create music. It requires coordinating finger movements on the fretboard to form chords and melodies. There are various styles, including acoustic, electric, and classical. Learning guitar can be self-taught or through lessons, developing skills like rhythm and musical expression.","A person holds a guitar, fingers pressing strings on the fretboard while the other hand strums or plucks the strings, creating music. The player often displays focused expression, coordinating rhythmic hand movements and subtle variations in pressure and technique for different sounds.","Strumming, plucking strings, chord changes, resonant wood vibrations, finger sliding sounds, occasional string buzzing, pick tapping rhythm, soft to loud dynamic variations, harmonics, fret buzzing on certain notes, and the click-clack of fingers on fretboard.",,,,,,, +Playing Piano,"Playing piano involves using fingers to press keys, creating music by striking strings inside the instrument, developing coordination, and rhythm, reading musical notation, and expressing emotions through melody and harmony. It can be a solo activity, accompaniment, or ensemble performance, fostering both technical skill and artistic creativity.","Individuals sit or stand at a keyboard, gracefully moving their fingers across black and white keys, producing music. The pianist’s hands and arms shift in fluid motion while feet may operate pedals below. 
Sheet music often rests on a stand above the keyboard.","Melodic tunes, harmonious chords, rhythmic tapping of keys, soft pedal sostenuto, resonant string vibrations, occasional fingernail clicks, methodical key presses, dynamic volume shifts, felt dampers lifting, subtle bench creaks, and the mechanical action of hammers striking strings.",,,,,,, +Playing Sitar,"Playing sitar involves mastering a plucked string instrument from Indian classical music with a long neck and a gourd resonating body. It requires intricate finger techniques and understanding of raga scales for creating its distinctive, complex, and melismatic melodies.","An individual sits cross-legged, holding the sitar, a plucked string instrument, with its long neck, gourd-shaped base, and sympathetic strings. The fingers of one hand deftly pluck and strum the strings while the other hand presses the frets, eliciting a resonant melody accompanied by intricate rhythmic patterns.","Playing sitar involves plucking strings to create a resonant, twangy sound with long sustain, featuring glissandos, microtonal bends, intricate rhythms, and the harmonious drone of sympathetic strings, characteristic of classical Indian music.",,,,,,, +Playing Tabla,"Playing tabla involves mastering a traditional Indian percussion instrument comprising two drums, producing a variety of sounds and intricate rhythms often accompanying classical, devotional, or popular music, requiring dexterity and rhythmic acumen learnt under systematic tutelage and practice.","Sitting cross-legged, one plays tabla by rhythmically striking two drums: the right hand on the smaller, higher-pitched dayan, and the left on the larger, deeper bayan, adjusting pitch by pressing the drum’s edge.","Playing tabla produces rhythmic beats and resonant percussive sounds. The two drums (dayan and bayan) deliver distinct tones: sharp trebles from the dayan and deep bass from the bayan. 
Skillful finger technique results in complex, melodic phrases within the framework of traditional Indian talas (rhythmic cycles).",,,,,,, +Playing Violin,"Playing the violin involves drawing a bow across strings to create music, mastering finger placement, and learning how to read sheet music. It requires coordination, practice, and an understanding of musical theory, all contributing to the expression of emotion and storytelling through sound.","An individual holds the violin under the chin, resting it on the shoulder, while the left hand fingers the strings on the neck. The right arm gracefully moves the bow across the strings, creating music. The player's focused expression often reflects the emotion of the piece being performed.","Playing violin produces melodic sounds with varying pitch, intensity, and timbre. It involves bowing strings for sustained notes and finger placement for pitch changes, alongside occasional plucking (pizzicato). Subtle string vibrations and resonant wood body contribute to its rich, expressive tones. Vibrato adds warmth and emotional depth.",,,,,,, +Pole Vault,"Pole vault is an athletic event where competitors use a flexible pole to leap over a high bar. They sprint down a runway, plant the pole into a box, and propel themselves upward and over the bar, aiming to clear the greatest height without dislodging it.","Pole vault involves an athlete sprinting with a long, flexible pole, which they then plant into a box to leverage their body over a high bar, clearing it before landing on a cushioned mat.","The swish of the pole slicing through air, the rhythmic run-up of spikes on the track, the creak and flex of the pole bending, the whoosh as the vaulter soars, the soft thud upon landing on the mat, and intermittent cheers and claps from spectators.",,,,,,, +Pommel Horse,"Pommel horse is a male gymnastics apparatus featuring a metal frame with a wooden body and two handles. 
Gymnasts perform continuous circular or swinging movements combined with leg splitting and bending, requiring strength, rhythm, and balance, while keeping their bodies elevated above and around the apparatus.","Gymnasts perform fluid, rhythmic routines on a leather-covered apparatus with two handles (""pommels""), swinging and rotating their bodies in circles, handstands, and scissors motions, while maintaining continuous motion and balance.","Auditory features of pommel horse activity include rhythmic thumping of hands on leather, swooshing sounds as legs cut through the air, occasional heavy breathing, the metallic groan of equipment under stress, and soft thuds when gymnasts dismount onto the mat, often accompanied by applause from spectators.",,,,,,, +Pullups,"Pull-ups are an upper-body strength exercise where you hang from a bar using an overhand grip and pull your body up until your chin is above the bar, primarily working the back, shoulders, and arms. It is a compound movement that requires minimal equipment and is effective for building muscle.","Pullups involve hanging from a bar with palms facing outward or inward and pulling up until the chin surpasses the bar, engaging the upper body muscles, particularly the back, arms, and shoulders. Repeatedly raising and lowering the body, the individual keeps their legs straight or bent to avoid swinging.","During pull-ups, one might hear the rhythmic exhale of breath with each exertion, the creak or groan of the pull-up bar or mounting hardware under strain, the slight rustle of clothing, and occasional grunts or expressions of effort from the person performing the exercise.",,,,,,, +Punch,"Punch is a full-body striking exercise where an individual thrusts their fists into the air or against a target, like a bag, to enhance cardio fitness, muscular endurance, and coordination. 
It's often incorporated into boxing training, martial arts, and fitness routines to improve power and agility.","A punch typically features a closed fist thrusting into a target with force, often involving a quick, straight arm movement starting from the shoulder. The movement is explosive, aimed, and executed with intent to deliver impact, showing engagement of the body's core muscles for power.","The auditory features of a punch may include a sharp, forceful ""thwack"" or ""smack"" upon impact, varying by the surface struck; a ""whoosh"" from the movement of air; muffled thuds on softer material; and possibly grunts or exhales from the person delivering the punch.",,,,,,, +Pushups,"Pushups are a traditional bodyweight exercise targeting the chest, shoulders, and triceps. Performed by elevating and lowering the body using the arms, they strengthen and tone upper body muscles, offering various modifications to suit different fitness levels and goals.","A pushup involves a person in a prone position, hands shoulder-width apart and body straight, who lowers and raises their body by bending and straightening their arms, maintaining a plank-like torso alignment throughout.","During pushups, one might hear rhythmic breathing, occasional grunts or exertion sounds, the soft thud of hands contacting the floor, fabric rustling from clothing movement, and potentially light tapping of feet or toes maintaining stability.",,,,,,, +Rafting,"Rafting is a thrilling outdoor adventure sport where groups navigate downstream on rivers aboard inflatable rafts, tackling varying levels of rapids and currents, fostering teamwork and experiencing the exhilaration of whitewater challenges in a natural setting.","Rafting: A group of people wearing helmets and life vests paddle a large inflatable raft through turbulent river waters, navigating rapids and waves, often getting splashed, with scenic natural landscapes surrounding them.","Rafting involves the sounds of rushing water, the rhythmic 
paddling of oars, the occasional splash as water hits the inflatable raft, shouts and communications between rafters, and possibly wildlife noises along riverbanks.",,,,,,, +Rock Climbing Indoor,"Indoor rock climbing is a physically and mentally demanding sport where individuals ascend artificial rock walls with handholds and footholds, using strength, endurance, and problem-solving skills, typically in a gym with safety equipment like harnesses and ropes, offering a controlled environment for beginners and experienced climbers alike.","Indoor rock climbing features climbers ascending artificial walls with colorful holds of varying shapes and sizes, often in a gym with ropes, harnesses, and mats for safety. The atmosphere is vibrant and active with focused climbers maneuvering through challenging routes.","Indoor rock climbing involves sounds of climbers' equipment clinking, chalk bags rustling, ropes swooshing, periodic verbal communication like calls of encouragement or coordination, the soft thud of falling onto mats, and background music or ambient noise from the facility.",,,,,,, +Rope Climbing,"Rope climbing is a physical activity involving ascending a vertical rope using only the limbs. It builds strength, endurance, and coordination, is practiced both recreationally and competitively, and is also utilized in military training and fitness regimens. 
Different techniques, such as the foot lock, are employed to aid climbing.","Rope climbing entails a person gripping a vertical rope with their hands, using their upper body strength and sometimes their legs to interlace or wrap around the rope, as they ascend upwards, often in a gym or outdoor setting, typically secured by climbing gear for safety.","Rope climbing typically involves the sound of hands gripping and sliding on the rope, heavy breathing from physical exertion, feet shuffling for a good hold, and the creaking or slight swaying of the rope if it's suspended from a structure.",,,,,,, +Rowing,"Rowing is a water sport using oars to propel boats, requiring synchronized teamwork, cardiovascular strength, and endurance. It offers full-body workouts on rivers, lakes, or oceans, for recreation, fitness, or competition, in sculls or sweep boats.","Rowing involves synchronized, fluid movements, with athletes sitting in narrow boats, using oars to propel themselves through water. Their backs move in harmony, legs drive together, and oars slice in and out of the water, creating ripples and splashes, all against the backdrop of scenic waterways.","Rowing generates rhythmic splashes as oars dip into the water, the mechanical slide of seat tracks, the creak of the boat with each stroke, synchronized grunts or breaths of rowers, and occasional calls from the coxswain coordinating the team's movements.",,,,,,, +Salsa Spin,"Salsa Spin is a dynamic dance move found in Salsa, a Latin dance style, where partners perform a coordinated turn or spin, typically executed by the follower under the guiding hand of the leader, adding flair and rhythm to the dance.","""Salsa Spin"" involves dancers in vibrant attire, energetically twirling and stepping to rhythmic Latin music. Partners execute tight spins, maintaining eye contact and fluidity, with hips swaying and feet moving quickly. 
The room is alight with movement, the air charged with the passion of synchronized, intricate dance patterns.","""Salsa Spin"" may include rhythmic Latin music with strong percussion, brass instruments, and vibrant melodies. Syncopated beats and fast-paced rhythms could accompany the spinning dance moves, with occasional shouts or claps for enthusiasm and timing.",,,,,,, +Shaving Beard,"Shaving a beard is the process of removing facial hair using tools such as a razor or electric shaver. It can be a daily routine for personal grooming, style, or hygiene.","A person uses a razor or electric shaver to glide along their lathered or dry skin, trimming and removing the hair growth on their face, leaving smooth skin in its wake, often with strokes upwards or downwards to achieve a clean-shaven look.","The sound of electric clippers buzzing, razors scraping against stubble, water splashing, and the soft swish of a brush applying shaving cream. Occasionally, there's the tap of razor on sink edge to dislodge hairs.",,,,,,, +Shotput,"Shot put is an athletics track and field event where competitors throw a heavy sphere (shot) from a seven-foot circle using one hand, aiming for maximum distance. Proper technique and strength are crucial to excel in this event, which is part of the Olympics and various championship meets.","An athlete in a circular ring bends holding a heavy metal ball (shot) close to their neck. They whirl or glide, then explosively extend their arm, launching the shot into the air. The goal is to achieve maximum distance, with performances judged by how far the shot lands from the circle.","Shot put typically involves grunts or exertion noises from athletes, the dull thud of the shot landing in the sand or field, and possibly the sound of cheers and applause from spectators. 
Additionally, there might be officials' whistles and announcements over a loudspeaker.",,,,,,, +Skate Boarding,"Skateboarding is an action sport involving riding and performing tricks on a skateboard, often in skateparks or urban environments. It combines balance, agility, and creativity, and has evolved into a global subculture with a diverse range of styles and disciplines.","Skateboarding involves riders performing tricks on skateboards, gliding on pavement with agility. They balance on wheeled boards, often flipping or jumping, using rails and ramps in urban landscapes or skate parks. The activity is fluid, dynamic, and sometimes acrobatic, characterized by casual, sporty attire.","Skateboarding produces rhythmic clattering of wheels on concrete, intermittent grinding sounds from rail slides, sharp snaps during tricks, occasional thuds from falls, and the whoosh of wheels during high-speed cruising, creating an unmistakable urban symphony.",,,,,,, +Skiing,"Skiing is a winter sport where participants glide over snow on skis with fixed-heel bindings. It combines recreation and competition, requiring balance, strength, and agility. 
Skiers navigate slopes of varying difficulty or enjoy cross-country trails, with activities ranging from leisurely to high-speed alpine racing.","Skiing features individuals gliding over snow-covered slopes on narrow skis, often wearing insulated clothing and goggles, against a backdrop of mountainous terrain dotted with conifers and ski lifts, with occasional sprays of powdery snow kicked up by swift turns and descents.","Skiing features the swish of skis gliding over snow, the whoosh of wind rushing past, the rhythmic pole plants, occasional crunches when crossing icy patches, distant chatter of fellow skiers, and the muffled ambiance under a thick winter hat or helmet.",,,,,,, +Skijet,"Skijet, also known as jet skiing, is a high-speed water sport where a rider on a small motorized craft skims across a water surface, performing maneuvers or racing on lakes, rivers, or coastal areas. It combines adrenaline-pumping excitement with the challenge of balance and navigation.","A skijet, also known as a jet ski, is a small, agile watercraft ridden astride like a motorcycle, with a handlebar for steering and control. The rider skims across the water surface at high speeds, creating spray and often performing sharp turns and jumps.","A skijet, commonly known as a jet ski, produces a loud, high-pitched whirring from its engine, combined with splashes and waves as it cuts through the water. Wind noise is also prevalent at high speeds, and beeping may indicate operation alerts.",,,,,,, +Sky Diving,"Sky diving is an extreme sport where participants jump from an aircraft, freefall through the air, and use parachutes to control their descent safely back to the ground. It's an exhilarating activity that provides an intense adrenaline rush and stunning aerial views.","Skydiving entails hurtling through the air from high altitude, often with a colorful parachute deploying overhead. 
Divers may wear jumpsuits, goggles, and helmets, freefalling with arms and legs spread before gliding gracefully under an open canopy against a backdrop of expansive skies and the earth below.","Sky diving can involve the intense rush of wind noise during freefall, a fluttering or snapping sound from the parachute, radio communication from instructors, the silence of serene descent under canopy, and the rustling of gear. These auditory elements mix with the adrenaline-fueled excitement of the experience.",,,,,,, +Soccer Juggling,"Soccer juggling involves keeping a soccer ball aloft using feet, knees, chest, and head without allowing the ball to touch the ground, improving ball control, touch, and coordination. It's practiced by tapping the ball repeatedly, challenging oneself to maintain control for as long as possible.","A person repeatedly bounces a soccer ball off their feet, knees, and head without letting it touch the ground, showcasing control and coordination.","Soccer juggling involves rhythmic thuds as the ball strikes the foot, slight swooshes during ball movement, intermittent soft taps when controlled with knees or head, and occasional sharper knocks if it contacts harder surfaces like shoes. Occasional vocalizations from the juggler may also be present.",,,,,,, +Soccer Penalty,"Soccer penalty is a critical moment in the game where a player takes an unobstructed shot on goal from the penalty mark, 12 yards from the goal line, while only the goalkeeper defends the attempt, typically awarded after a foul within the penalty area.","A player stands at the penalty spot, 12 yards from goal, poised to kick the ball. The goalkeeper readies to defend the net. Spectators anticipate the outcome. 
The scene embodies tension, focus, and precision as the striker aims to score, and the goalie to save, in a critical game moment.","Whistle blowing, crowd noise (cheering, booing), player's footsteps, ball being kicked, ball hitting the net/post, goalkeeper diving, and sometimes communication between players or instructions shouted by the coach.",,,,,,, +Still Rings,"Still Rings, a gymnastics apparatus, consist of two rings suspended from a structure. Athletes perform a routine including swings, holds, and strength positions, showcasing control and muscle power while keeping the rings as still as possible. It's an Olympic discipline, demanding immense upper body strength and stability.","A gymnast, often wearing a leotard, performs gravity-defying routines on two steady rings suspended from a metal frame, showcasing strength and control in a series of holds, swings, and handstands.","The still rings event in gymnastics may be characterized by gripping sounds, the creaking of the cables, athletes' grunts of exertion, the thud of landings, and the applause or guidance of coaches and spectators.",,,,,,, +Sumo Wrestling,"Sumo wrestling is a Japanese full-contact sport where wrestlers (rikishi) use strength, technique, and strategy to force opponents out of a circular ring or make them touch the ground. It’s rich in ritual and tradition.","Sumo wrestling features two large, nearly-naked athletes clad in loincloths (mawashi) confronting each other in a circular ring (dohyō). They grapple, push, and try to force each other out of the ring or make any part of the body touch the ground.","Sumo wrestling features big wrestlers stomping and slapping each other in a ring. A referee shouts commands, while ceremonial music plays. The crowd cheers as bodies crash to the ground, and rituals include stomping and salt-tossing.",,,,,,, +Surfing,"Surfing is a water sport where individuals ride ocean waves on a surfboard, skillfully maneuvering along the face of the wave. 
It combines balance, strength, and timing, with surfers seeking to catch and ride waves for as long as possible, often performing dynamic turns and aerial tricks.","Surfing depicts individuals standing on boards, riding ocean waves towards the shore, often performing dynamic maneuvers as they balance against the water's force, occasionally enclosed by the wave's curling tunnel, set against coastal landscapes under various sky conditions.","The sounds of surfing include the rhythmic crashing of waves, the hiss of foam, the splash when entering water, the whoosh of riding a wave, the creak of the surfboard flexing, and the distant calls of seabirds or fellow surfers.",,,,,,, +Swing,"Swing is a playground activity in which a person sits on a seat suspended by ropes or chains from a frame and moves back and forth in an arc, pumping their legs or being pushed to gain height. It's popular with children in parks and backyards, offering gentle exercise and a brief sense of weightlessness.","Swing involves a seat suspended by ropes or chains from a metal or wooden frame, moving back and forth. Riders push their legs to gain momentum, often reaching a high arc, accompanied by feelings of weightlessness at the peak of each swing.","Swings often produce rhythmic creaking or squeaking from metal or rope hinges, the whoosh of air as the swing moves back and forth, and potentially laughter or shouts of joy from users, especially children. The intensity and timbre of sounds vary with swing speed and materials.",,,,,,, +Table Tennis Shot,"Table Tennis Shot is a fast-paced activity in which players use paddles to hit a lightweight ball back and forth over a net on a hard table, aiming for precision, spin, and speed to outmaneuver their opponent and score points.","Two players stand at opposite ends of a table tennis table, paddles in hand. A small, white, spherical ball is struck back and forth, bouncing once on the table surface per side. 
Action is quick, with rapid arm and paddle movements as players attempt to outmaneuver each other.","In table tennis, a shot makes a sharp “click” when the racket hits the ball, followed by a “thud” on the table. Different sounds indicate shot types like loop, smash, or chop, depending on speed, spin, and force.",,,,,,, +Taichi,"Tai chi is an ancient Chinese martial art characterized by gentle, flowing movements combined with deep breathing and mindfulness, often practiced for its health benefits, promoting balance, flexibility, and stress reduction. It's a form of moving meditation and a non-contact, low-impact exercise suitable for all ages.","Taichi involves slow, deliberate movements performed in a fluid sequence. Practitioners often wear loose, comfortable clothing and maintain a calm, focused demeanor, moving with grace and balance in open spaces like parks or studios. The activity emphasizes harmony between body and mind.","Tai chi often involves soft, flowing background music mimicking natural sounds like wind or water, with occasional verbal instructions for movements. The rhythmic sound of deep, controlled breathing is also prominent, enhancing the meditative quality of the practice.",,,,,,, +Tennis Swing,"Tennis swing refers to the motion used by players to hit the ball with a racquet during a game of tennis. 
Key swings include the forehand, backhand, serve, and volley, each requiring precise technique to effectively control the ball's direction, speed, and spin.","A tennis swing involves a player holding a racket with one or both hands, pivoting their body, and swinging their arm in an arc to hit the ball with control, often with a follow-through to impart speed and spin.","A tennis swing may produce a distinct ""whoosh"" from the racket cutting through the air, followed by a sharp ""pop"" or ""thwack"" upon contact with the ball, and possibly a soft squeak of shoes against the court surface during the player's movement.",,,,,,, +Throw Discus,"Throw discus is an ancient track and field event where athletes aim to hurl a heavy, frisbee-shaped disc—typically made of wood and metal—as far as possible from a throwing circle using a prescribed technique, combining strength, speed, and skill. It's a classic Olympic sport that measures power and precision.","An athlete spins with precise footwork in a circle, then hurls a heavy, lens-shaped disc (the discus) with a strong, whipping arm motion into the distance, aiming for maximum range within a marked sector. The body shows tension and release, demonstrating power, balance, and technique.","The whoosh of the discus cutting through the air, the athlete's grunts or exhales during the throw, the thud as the discus lands in the field, and the surrounding crowd's reactions—cheers, claps, or murmurs—can characterize the auditory environment of discus throwing events.",,,,,,, +Trampoline Jumping,"Trampoline jumping is a recreational and competitive activity where participants bounce on a trampoline, using its spring-loaded surface to perform acrobatic maneuvers, exercises, and tricks, enhancing coordination, balance, and cardiovascular fitness. It's fun for all ages and can be done indoors or outdoors.","Participants bounce high on a taut, springy fabric stretched over a steel frame, performing flips and acrobatics while aerially suspended. 
The mesh-like surface flexes and recoils with each jump. Safety nets often enclose the sides, and jumpers display buoyant, gravity-defying movements.","Trampoline jumping produces rhythmic bouncing sounds, squeaky springs stretching and contracting, laughter, shouts, and yelps of delight, the whoosh of air as the jumper ascends and descends, and the occasional sound of feet or body contacting the fabric with a soft thud.",,,,,,, +Typing,"Typing is the action of inputting text by pressing keys on a computer keyboard, typewriter, or touchscreen. It involves the coordination of the fingers to quickly and accurately strike keys to form words and sentences, facilitating written communication in the digital age.","Fingers press keys on a keyboard or touchscreen, often rhythmically. The movement is punctuated by pauses for thought. Eyes may flick between screen and keys while text appears and cursor blinks on the display. If on a physical keyboard, there's a gentle clack with each keystroke.","Typing involves rhythmic keystrokes, varied by keyboard material and typist speed; click-clack sounds from mechanical switches; soft thuds from membrane keys; spacebar thumps; and occasional longer pauses. Background noise may rise from fast typing, while slow typing creates intermittent, discrete taps.",,,,,,, +Uneven Bars,"Uneven Bars is a women's gymnastics apparatus featuring two horizontal bars set at different heights where gymnasts perform a choreographed routine of swings, transitions, releases, and catches, culminating in a dismount. Mastery demands strength, agility, coordination, and precise timing.","Uneven Bars is a gymnastics event featuring two horizontal bars set at different heights. 
Gymnasts perform aerial flips, swings, and transitions with precise timing and fluid motions, alternating between the bars in a display of agility, strength, and grace.","Rhythmic swinging, metallic clinks of hands grasping bars, thuds of dismounts onto the mat, occasional chalk dusting sounds, audience's applause, coaches' instructions, athletes' grunts of exertion, occasional tension release creaks from the apparatus, and the muffled background hum of a gymnasium's atmosphere.",,,,,,, +Volleyball Spiking,"Volleyball spiking is an aggressive, overhead attacking move where a player jumps and forcefully hits the ball downward over the net into the opponent's court, aiming to evade defenders or make the ball difficult to return, often concluding a point-scoring opportunity with power and precision.","A volleyball spiker jumps high near the net, pulling back their arm with an open hand. The body is tensed and angled, eyes focused on the ball. They forcefully swing their arm forward, hand striking the ball sharply, sending it over the net with speed and precision toward the floor.","A volleyball spike is accompanied by the sharp, resonant sound of the palm striking the ball, followed by a thud as the ball hits the ground, often mixed with the anticipatory shouts of players and the cheering of spectators. Sound intensity increases with the force of the spike.",,,,,,, +Walk Dog,"Walking a dog is a physical activity involving an owner taking their canine companion outdoors on a leash for exercise and bathroom breaks, frequently incorporating play, improving both the dog's and owner’s health, and strengthening their bond.","A person holding a leash attached to a dog's collar; the dog may be trotting or sniffing around. They're often in a park or on a sidewalk, surrounded by trees or city streets. 
The dog's tail may be wagging, and both appear to be in motion.","Walking a dog may involve sounds of a leash clinking, the dog’s collar jangling, paws padding against the ground, occasional barking or panting, and ambient noises such as birdsong, traffic, human voices, or rustling leaves, depending on the environment.",,,,,,, +Wall Pushups,"Wall pushups are a beginner-friendly exercise that serves as an easier alternative to traditional pushups. They target the chest, arms, and shoulders by using the resistance of one's own body weight against a wall, promoting upper body strength and endurance through pushing away and lowering towards a vertical surface.","An individual stands facing a wall, places palms flat against it at shoulder width, steps back to lean in, and bends elbows to lower their chest to the wall before pushing back to the starting position, replicating a pushup motion vertically.","Wall pushups may produce rhythmic tapping or slapping sounds as hands repeatedly contact and push off the wall, with varying intensity reflecting pushup force. Soft foot shuffling can accompany stance adjustments, and exhales might be audible with exertion, often synchronized with the push motion.",,,,,,, +Writing On Board,"""Writing on board"" is an instructional activity where a facilitator or participant conveys information, solves problems, or teaches by inscribing words, numbers, or drawings on a surface, typically using markers or chalk, to visually communicate and engage an audience in a collaborative or educational setting.","A person stands facing a board, holding a marker or chalk, with hand movements indicating inscription. 
Words or drawings appear on the board's surface, often accompanied by erasing and revising as ideas are developed or explained.","Scraping or squeaking sounds of chalk or marker on the surface, tapping of the writing utensil, faint rustle of clothing as the writer reaches and moves, occasional erasing sounds—like brushing or swiping, soft clicking of pen caps or chalk pieces being picked up or set down.",,,,,,, +YoYo,"YoYo is a classic toy consisting of a spool connected to a string, which is wound and unwound to perform gravity-defying tricks and maneuvers. It's both a hobby and competitive sport, with enthusiasts striving to master intricate techniques and create new combinations of spins and movements.","YoYo involves a player holding one end of a string with the other end attached to two symmetrical discs, through which the string runs. The player performs tricks by looping, tossing, and twirling the YoYo, which rolls up and down the string using its spinning momentum.","While playing with a yo-yo, one might hear the hum of the spinning string, the gentle whir of the yo-yo's rotations, intermittent soft thuds upon catching, and occasional snaps as the yo-yo changes direction or performs tricks. 
Sound intensity varies with speed and surface contact.",,,,,,, diff --git a/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/VGGSound.csv b/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/VGGSound.csv new file mode 100644 index 0000000..1ea2bb7 --- /dev/null +++ b/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/VGGSound.csv @@ -0,0 +1,311 @@ +name,description_1,description_2,description_3 +air conditioning noise,"Air conditioning noise is the background hum or drone produced by air conditioning units when operating, typically including steady mechanical sounds from the fan and compressor, along with occasional clicking from thermostat controls or expansion and contraction of parts.","A vibrating air conditioning unit with undulating sound waves emanating from it, creating ripples in the surrounding air, depicted against a backdrop of a slightly disturbed, serene room where a person is visibly tense or annoyed by the persistent, monotonous mechanical hum.","Air conditioning noise typically includes a steady hum or drone, often with a low-frequency rumble and a consistent whirr. It may have periodic whooshes as the compressor cycles on and off and can include vibrations or rattling from the unit's hardware." +air horn,"An air horn is a pneumatic device designed to create an extremely loud noise for signaling purposes. It uses compressed air to vibrate a diaphragm, which produces a sound that can be heard over long distances, commonly used in ships, trucks, and sports events as an attention-getting device.","An air horn blasts loudly, startling people nearby. Many cover their ears as the sound dominates, causing vibrations and slight trembling of objects. The intense noise captures everyone’s immediate attention amidst a chaotic backdrop.","An air horn produces a loud, piercing sound, often with a fundamental frequency around low-to-midrange Hz. 
Its sharp, blaring tone can rapidly rise in volume, carrying a sustained, uniform note that reverberates and can be heard over long distances due to its high intensity and narrow frequency band." +airplane,"The sound event ""airplane"" refers to the audible experience related to aircraft, which includes the roar of jet engines during takeoff and landing, the whoosh of planes flying overhead, and the general hum of airborne travel, often associated with travel and transportation.","A visual representation might depict a plane in flight with lines or ripples emanating from it to indicate sound waves, or it may show people's hands over their ears, with onomatopoeic words like ""roar"" suggesting the loud, distinctive sound of an airplane.","The sound event ""airplane"" typically features a deep, resonant rumble with varying pitch due to engine thrust, a whooshing caused by air displacement, and may include higher-pitched whining from jet turbines, often accompanied by a doppler effect as the plane approaches and then recedes from the listener." +airplane flyby,"An airplane flyby is an event where an aircraft passes overhead, characterized by the distinctive roar of engines and the change in pitch due to the Doppler effect, often associated with aviation shows, military exercises, or routine flights.","A fast-moving aircraft sweeps across the sky, the sound crescendoing as it approaches, peaking overhead before fading into the distance, leaving contrails against a clear or cloud-dotted backdrop.","A long, deep roar that crescendos as the airplane approaches; a mix of engine hum, wind noise, and air displacement; followed by a Doppler shift to a lower pitch as the plane moves away; finally, a gradual fade in volume until inaudible." 
+alarm clock ringing,"An alarm clock ringing is a designated sound emitted by an alarm clock to awaken someone from sleep at a predetermined time, often featuring repetitive, high-pitched tones designed to attract attention and prompt action to switch it off.","A bedside table with a buzzing alarm clock flashing a bright LED time. In the background, a bed with a startled person partly covered by crumpled sheets, reaching to hit snooze, their hand suspended in motion and their eyes groggily squinting at the sudden disturbance.","High-pitched, repetitive beeping or ringing, usually with a steady rhythm, designed to be loud and penetrating to effectively wake a person from sleep. Some variations may include a buzz or a melody that escalates in volume to ensure alertness." +ambulance siren,"An ambulance siren is a distinct, loud, oscillating sound used by emergency vehicles to alert and clear traffic, indicating an urgent need to reach a destination quickly for medical purposes, often signaling an emergency involving human health or life.","An ambulance with flashing red and white lights speeds through traffic, its loud siren blaring as drivers pull aside to create a path, signaling an urgent medical emergency.","An ambulance siren is characterized by a loud, piercing wail that alternates between high and low pitches, designed to signal urgency and prompt others to clear the way. It often has a fluctuating frequency that can modulate between continuous and rhythmic patterns to attract attention." +arc welding,"Arc welding is a fabrication process that joins metals using the heat generated from an electric arc, creating a pool of molten material that cools to form a strong joint. 
It produces characteristic sounds such as buzzing or crackling, due to the intense electrical discharges and rapid heating/cooling cycles involved.","Intense white sparks flying as a masked welder fuses metal parts with a glowing electrode, casting a bright, localized light amidst the dark surroundings of a workshop.","Arc welding produces a consistent, high-pitched hissing or buzzing sound, punctuated by crackling or popping noises as the electrode melts and sparks fly, alongside occasional sizzling as metal fuses. The intensity of the sound varies with equipment and technique, but it generally requires hearing protection due to high decibel levels." +auto racing,"Auto racing is a motorsport involving the racing of automobiles for competition, characterized by high speeds, roaring engines, and intense competition. It encompasses various categories like Formula One, NASCAR, and rallying, each with unique vehicles and rules, drawing massive global audiences to its thrilling, adrenaline-fueled events.","A racetrack lined with cheering crowds, a blur of colorful racing cars zipping by, engines roaring, tires screeching around tight turns, checkered flags waving, and pit crews geared up for swift mechanical work.","Auto racing features high-revving engines roaring, tires squealing on asphalt, rapid gear shifts, crowds cheering, the whoosh of speeding cars, intermittent announcer commentary, and the wave-like crescendo and decrescendo of noise as vehicles zoom past." +baby babbling,"Baby babbling is an early speech development stage where infants produce repetitive syllables, like ""ba-ba"" or ""da-da,"" exploring vocalization and practicing language skills before forming meaningful words. It typically begins around 6 months of age and is a key part of linguistic growth.","A baby sits propped up with colorful toys around, mouth open, eyes bright and curious. 
Gentle, repetitive sounds escape their lips, forming incoherent but rhythmic syllables as they experiment with vocalizations, occasionally smiling or giggling at their own efforts.","Baby babbling features repetitive syllables, rhythmic patterns, cooing and gurgling sounds, intermittent high-pitched tones, and exploratory voice inflections, often with a conversational intonation, indicative of early language development stages." +baby crying,"A baby crying is a vocalization infants use to communicate needs or distress, ranging from hunger or discomfort to a desire for attention, characterized by a high-pitched, often rhythmic wail that humans are evolutionarily attuned to respond to.","A red-faced infant with clenched fists, tears streaming down their cheeks, mouth wide open in a wail, with furrowed brows indicating distress, while a caregiver tenderly tries to soothe the baby, rocking or holding it close in a comforting embrace.","A baby crying typically features high-pitched, loud wails and sobs with varying intensity and intervals, often characterized by repetitive patterns that can indicate distress, hunger, or need for attention. The sound may fluctuate in pitch and volume, and can be piercing and attention-grabbing." +baby laughter,"Baby laughter is a joyful, contagious vocal expression typically produced by infants and young children. This sound event, often emerging around 3 to 4 months of age, signifies pleasure and is a key milestone in social and emotional development, eliciting strong positive emotions and bonding in listeners.","A bubbly infant giggles joyfully in a sunlit nursery, chubby cheeks dimpling with each merry chuckle, eyes twinkling with delight. Soft toys and pastel decor surround the contented baby, creating a warm, serene tableau of innocence and happiness.","Baby laughter typically features high-pitched, melodic giggles and chuckles, often in short, variable bursts and repetition, with a vocal timbre reflecting joy and innocence. 
The sound may fluctuate in volume and pitch and is generally rhythmic and contagious to listeners." +baltimore oriole calling,"The Baltimore Oriole calling is a melodic series of whistles and chatters, characteristic of this brightly colored songbird. Found in eastern North America, males perform these calls to establish territory and attract mates, especially during spring migration and breeding seasons, adding a sweet, flutelike soundtrack to the environment.","Perched amidst lush greenery, a vibrant orange-and-black Baltimore Oriole tilts its head back, throat vibrating as it emits melodious whistles and chatters, resonating through the serene woodland ambiance.","The Baltimore Oriole’s call consists of flute-like whistles with short, clear, high-pitched notes. The sound varies in pitch and includes melodious, chattering qualities. It may feature a musical warble or a single-note “tuck,” signaling its presence in treetops." +barn swallow calling,"The ""barn swallow calling"" sound event features the distinctive, chirping vocalizations of the barn swallow, a small, agile bird known for its sleek body and forked tail, commonly heard in rural areas and open fields where these birds nest and forage for insects.","A sleek barn swallow perches under the eaves of a rustic barn, head tilted skyward, beak open as it releases a series of melodic chirps that mingle with the warm breeze over a golden field.","The barn swallow’s call features melodic chirps and twitters with clear, repeated notes. It’s cheerful and swift, reflecting the bird’s aerial agility. The high-pitched sound varies in tempo, depending on the context." 
+basketball bounce,"A basketball bounce is the rhythmic, thumping sound produced when a basketball strikes a hard surface and rebounds, commonly heard in association with the sport of basketball during dribbling, passing, and game play on indoor or outdoor courts.","A basketball rhythmically hits the hardwood floor, rebounding back into a player's hand amidst the squeaks of sneakers and the echo of the dribble resonating through the gym.","A basketball bounce produces a rhythmic, repetitive thudding sound, with variations in pitch and volume depending on the force of the bounce and the ball's inflation level. The sound has a resonant quality with a short decay as it echoes slightly off indoor court surfaces or becomes muted outdoors." +bathroom ventilation fan running,"The sound of a bathroom ventilation fan running is a consistent whir of the fan blades as they rotate, designed to circulate air and remove moisture, odors, and airborne pollutants from the bathroom space to improve air quality and prevent mold.","A ceiling-mounted fan spins rapidly within a small, tiled bathroom, its blades generating a steady hum as steam clears from the air above a shower or bathtub.","A bathroom ventilation fan typically emits a steady, monotonous hum or whirring sound, indicative of rotating blades within a grille. The pitch is medium to low and the volume can range from soft to moderately loud, often accompanied by occasional rattling or buzzing due to the vibration of the fixture." +beat boxing,"Beatboxing is a vocal percussion art form where performers create drum beats, rhythms, and musical sounds using their mouth, lips, tongue, and voice. It emulates DJ scratch sounds and instruments, originating within hip-hop culture but now spans various music genres as a unique performance technique.","A person rhythmically vocalizes percussion sounds, their mouth a flurry of movements, lips popping, cheeks hollowing, and tongue flicking. 
They mimic a drum machine with dynamic facial expressions and enthusiastic body language, creating a vibrant atmosphere of improvised musical beats.","Beatboxing involves vocal percussion that mimics drum machines. It includes deep throat pulses for bass kicks, sharp ‘ts’ for hi-hats, and ‘pf’ or ‘kch’ for snares. Various melodic and rhythmic patterns are created by manipulating breath, vocal cords, and mouth shape." +bee buzzing,"The sound event ""bee buzzing"" is a distinctive humming noise made by bees' wings beating rapidly as they fly or hover, typically indicative of bees' activity around flowers or their hive, and is a common auditory cue signaling the presence of these important pollinators in the environment.","A bee flits erratically among flowers, its wings a blur of motion. Vibrant pollen dusts its legs. The surroundings hum with its persistent, rhythmic drone, capturing the essence of a serene, sunlit day.","A bee buzzing emits a continuous, high-pitched tone, characterized by a rapid succession of vibrations or wing flaps that produce a resonant, oscillating hum in the frequency range of around 200 Hz to 450 Hz, with periodic variations in pitch and amplitude due to movement." +bird chirping,"Bird chirping refers to the melodic sounds produced by birds, often to communicate, attract mates, mark territory, or signal alarm. Each species has distinct chirps, which can vary by context and individual. The acoustic event is a defining characteristic of natural habitats and a symbol of the dawn chorus.","Dawn breaks as a watercolor sky blushes pink and orange. A silhouette of trees lines the horizon, leaves rustling gently. 
Perched on swaying branches, small birds flit energetically, their beaks opening and closing in rhythmic song, filling the crisp morning air with melodious chirping.","Bird chirping typically involves a series of high-pitched, rhythmic, and melodic vocalizations with varying tones and patterns, emanating from avian vocal cords, potentially interspersed with silence or background environmental noise, and often characteristic of specific bird species or contexts." +bird squawking,"A bird squawk is a loud, harsh, and often repetitive noise produced by a bird. It serves as a vocalization for communication, signaling alarm, defending territory, or social interaction among avian species.","A flustered bird with open beak, wings possibly flapping, perched or mid-flight amid a serene or disrupted setting, with concentric sound waves indicating its loud, piercing squawks.","High-pitched, repetitive, sharp squawks with variable pitch and rhythm, often piercing and loud, conveying alertness or distress, featuring brief bursts of sound with sudden onset and decay, and sometimes intermixed with softer chirping or clicking sounds depending on the bird species." +bird wings flapping,"Bird wings flapping produce rhythmic, soft whooshing sounds as feathers brush against air during flight. These distinctive noises vary among species and can indicate bird size, speed, and proximity.","A pair of birds hovering midair, wings blurring in rapid movement, feathers rustling gently, creating a rhythmic beat emblematic of flight, as they navigate the skies or prepare for takeoff amidst a backdrop of open skies or dense foliage.","Bird wings flapping produce a rhythmic, soft whooshing or rustling noise, varying in intensity with the bird's size and speed. The frequency signature is typically low to mid-range, and the sound carries short distances, often accompanied by other bird sounds such as chirping or squawking." 
+black capped chickadee calling,"The black-capped chickadee call is a distinctive, clear whistle that often sounds like ""phoe-be"" or ""cheeseburger,"" functioning as communication among these small North American songbirds, particularly for mate attraction and territory defense.","A small, round-bodied bird with a distinctive black cap and bib, white cheeks, and gray wings perched on a swaying branch, tilts its head back to emit a sharp, high-pitched ""chick-a-dee-dee-dee"" call into the tranquil forest air.","The black-capped chickadee call typically features clear, high-pitched notes that resemble the phrase ""chick-a-dee-dee-dee"" with an ascending pitch at the beginning and additional ""dee"" notes when alarmed. " +blowtorch igniting,"A blowtorch igniting produces a sharp, hissing sound as gas is released and combusts with a popping noise, creating a sustained roar from the intense, focused flame burning steadily once ignition is successful.","A focused, intense flame bursts forth from a blowtorch's nozzle, accompanied by a sharp hissing noise as the tool ignites, casting a bright blue and orange glow on nearby surfaces.","A blowtorch ignites with a sharp click, followed by a whoosh of intense flame. The gas combusts into a hot, steady stream, producing a high-pitched hiss and subtle crackling from the material or metal being worked." +bouncing on trampoline,"The sound event ""bouncing on trampoline"" is characterized by rhythmic boinging noises, spring compression thuds, and the occasional creaking of tensioned metal, often accompanied by laughter or exclamations from jumpers enjoying the rebounding activity.","A figure with flexed knees and arms outstretched for balance is depicted mid-air above a trampoline, with concentric circles emanating from the trampoline surface, indicating the reverberating effect of the bounce. 
A joyful expression and dynamic posture suggest motion and energy.","Repetitive boinging or springy noises, rhythmic squeaking of springs or fabric, occasional whoosh of air as the jumper descends and ascends, soft thuds upon landing, giggles or exclamations if people are involved, varying intensity based on jumper's weight and force." +bowling impact,"A bowling impact sound event is the audible noise created when a bowling ball strikes the pins at the end of a bowling alley lane, typically characterized by a heavy rolling sound followed by a loud, resonant clatter and crash as the pins are hit and knocked over.","A bowling ball strikes the pins with force, scattering them in an explosive clatter. The pins flail in different directions, some spinning, others toppling, amidst the resonant echo of collision in the alley. The kinetic energy is almost palpable, visually mimicking the auditory intensity of the impact.","A bowling impact event typically features a sharp, resonant crash as the ball strikes the pins, mixed with the rolling thunderous rumble of the ball on the lane, followed by a clattering cascade as pins scatter, sometimes concluding with a quieter clunk of pins settling." +bull bellowing,"A bull bellowing is a deep, prolonged roar typically emitted by male cattle (bulls) to signal their presence, display dominance, attract females, or express distress. This resonant vocalization can be heard over considerable distances and is characteristic of livestock behavior in various cultures.","A large, muscular bull stands in a dusty field, head lowered, nostrils flared. Its mouth is wide open, emitting a deep, resonant roar that echoes through the air, signaling its presence and dominance. 
Surrounding animals pause, acknowledging the commanding sound.","A bull bellowing produces a deep, resonant, and often sustained roar characterized by low-frequency tones with a rumbling quality, varying in pitch and intensity, signaling aggression, distress, or communication with other cattle. Vibrations may be felt, and the sound carries across long distances in open fields." +canary calling,"Canary calling is a form of animal communication where canaries produce intricate vocalizations, often characterized by melodies, trills, and chirps, used for mating, signaling danger, or expressing themselves within their social groups. Bird enthusiasts may also train canaries for singing competitions based on song quality and variety.","A yellow canary perches on a branch, its beak open in song as melodious chirps fill the air, with musical notes floating amidst a sunlit, leafy backdrop.","A canary's call features high-pitched melodic whistles and chirps, with rapid sequences of clear, varying tones. Each burst is typically short-lived and repetitive, with a rhythm that can be both musical and complex, demonstrating a wide range of frequencies, often piercing compared to ambient noise." +cap gun shooting,"A cap gun shooting is a playful mimicry of real gunfire using a toy gun that generates a loud pop. This sound event is created when a small amount of explosive material, usually a shock-sensitive compound, is ignited to produce a sudden, sharp noise for entertainment purposes, especially in children's games.","A small toy gun held by a child emitting puffs of smoke with quiet miniature popping sounds; bystanders show little reaction, dismissing the noise as harmless play.","A cap gun shooting produces a sharp, high-pitched cracking sound with a quick onset and rapid decay. It lacks echo due to low sound energy, mimicking a miniature version of a real gunshot, and may be followed by a faint smoke-hiss if the cap residue burns off." 
+car engine idling,"The sound event ""car engine idling"" refers to a vehicle's engine running while the vehicle is stationary, producing a steady, low-intensity rumbling noise indicative of an engine in minimal power mode awaiting the driver's next action.","A stationary car with its engine running emits a steady, low rumble, as exhaust gently puffs from the tailpipe; the vibration subtly shakes the hood, while the dashboard lights are illuminated, and the driver waits, hands on the wheel or perhaps checking a device.","The sound of a car engine idling features a steady, rhythmic hum or purring, with a low-to-mid frequency rumble. There may be minor fluctuations in pitch and volume, as well as the occasional burst from engine knocks or accessory belts. Vibrations are often felt along with the sound." +car engine knocking,"Car engine knocking is a rattling noise that occurs when fuel burns unevenly in an engine's cylinders, often caused by improper fuel-to-air ratio, low octane fuel, or faulty ignition timing, potentially leading to engine damage if not addressed.","A dashboard lit with warning lights, a driver's concerned face, a car hood open with steam rising. Underneath, a depiction of a piston and cylinder with exaggerated gaps, showing erratic movement and collision, accompanied by onomatopoeic text ""knock knock"" to indicate the distinctive sound of a malfunctioning engine.","""Car engine knocking,"" also known as ""engine detonation,"" is characterized by a rapid, rhythmic tapping noise that often accelerates with engine speed. It's a metallic pinging or knocking sound that can vary in loudness and can signal engine issues." 
+car engine starting,"A car engine starting is a common auditory event characterized by an initial ignition sound followed by steadily increasing vibrations and a combustion roar, indicating the engine's activating and coming to life, ready to power the vehicle's movement.","A driver turns a key in the ignition or presses a start button, the dashboard lights flicker, and the engine emits a growing hum, culminating in a steady purr, indicating readiness. Under the hood, metal components engage seamlessly, sparking fuel combustion that breathes life into the vehicle.","A car engine starting typically features a short burst of mechanical whirring or cranking followed by a steady rumbling or roaring that stabilizes as the engine idles, often accompanied by the initial sputter or cough as fuel ignites and the engine turns over." +car passing by,"The sound event ""car passing by"" is an auditory occurrence marking a vehicle moving through a space, typically characterized by a crescendo and decrescendo of engine noise and tire friction, often accompanied by changes in pitch due to the Doppler effect.","A streak of a vehicle blurs across the frame, with lines indicating motion. The surrounding scenery is slightly bent around the car's path, suggesting the Doppler effect of sound. Waves emanate from the car, symbolizing the fading ""vroom"" as it speeds away.","A ""car passing by"" typically features a Doppler effect, where the pitch rises upon approach, peaks nearest the listener, and falls as the car moves away. There is a rush of varying engine noises, tire friction, and possible wind whooshing, often followed by a fading away of sound." +cat caterwauling,"Caterwauling refers to the loud, wailing noises made by cats, especially during mating season. These distressing yowls or howls serve as communication between cats and are often heard at night.","Under a moonlit sky, a cat with an arched back and puffed tail howls, showing sharp fangs. 
Its fur stands on end, eyes wide with fear or agitation, as it defensively faces an unseen opponent.","Cat caterwauling is a loud, high-pitched howl or screech with fluctuating pitch. This prolonged, erratic sound is linked to distress, aggression, or mating behavior and can be piercing to human ears." +cat growling,"A cat growling is a low, throaty vocalization expressing discontent, fear, or territorial aggression. It serves as a warning to perceived threats, signaling a cat's readiness to protect itself.","A cat, back arched and fur standing on end, bares its teeth and lets out a deep, menacing growl, eyes fixated intensely, possibly with ears flattened against its head, signaling irritation or a defensive stance against an unseen threat or rival.","A growling cat emits a low, guttural rumble, often vibrating, indicating aggression or discomfort. The volume can vary, and it may include hissing. The growl starts and stops abruptly, reflecting the cat’s agitation level." +cat hissing,"A cat hissing is a sharp, distinctive sound produced by cats as a defensive gesture. Characterized by a long ""s"" sound, it signals fear, aggression, or territoriality, often accompanied by an arched back, puffed fur, and bared teeth to ward off threats or express discomfort.","An arched-back cat, with fur standing on end, displays wide-open eyes and bared teeth, as its ears flatten sideways. A sharp, sibilant sound seems to emanate from its open, snarling mouth.","A cat hissing creates a harsh “ssss” sound with varying pitch and volume, often accompanied by growls or spits. This broad-spectrum noise signals agitation or aggression, with intensity reflecting the cat’s emotional state." 
+cat meowing,"A ""cat meowing"" is a vocalization made by cats, often as a form of communication with humans or other animals, characterized by a distinctive high-pitched tone that typically conveys a need or desire, such as for attention, food, or entry into a space.","A cat with its mouth slightly open, whiskers perked forward, ears upright, and eyes possibly wide. Sound waves or musical notes may be illustrated near its mouth to indicate meowing.","The sound event ""cat meowing"" typically features a high-pitched vocalization, varying in intensity and duration, with frequency-modulated tones expressing different emotions or needs. Its timbre is distinct with a sharp, resonant character often described as plaintive or demanding." +cat purring,"A cat purring is a continuous, soft, vibrating sound made by cats in a state of contentment, often felt as a gentle rumble. It involves the rapid movement of the muscles within a cat's larynx, creating a soothing effect for both the cat and nearby humans.","A contented cat, with closed or half-closed eyes, is curled up or sprawled comfortably, its body vibrating subtly as it emits a rhythmic, throaty hum. The scene exudes tranquility and the bond between the cat and its environment or companion.","A cat purring produces a continuous, soft, vibrating sound with a frequency range of 25 to 150 Hertz, often characterized as a rhythmic, low-pitched hum or rumble, typically associated with contentment and relaxation, and can have a calming effect on both the cat and nearby humans." 
+cattle cowbell,"The cattle cowbell is a metallic bell worn by cows to help farmers locate and track their herd by the distinctive sound it makes when the cow moves, aiding in managing livestock in expansive pastures or rugged terrain.","A herd of cattle grazing in a lush green field, with each cow wearing a cowbell around its neck, clanking rhythmically as they move, the tranquil scene backed by distant hills and a clear sky.","The ""cattle cowbell"" produces a metallic clinking sound with a resonant, dull clang. Its timbre is rich in mid-low frequencies, and it exhibits a consistent rhythmic pattern based on cattle movement. The sound carries well over distance due to its piercing, sustained overtones." +cattle mooing,"Cattle mooing is the characteristic vocalization made by cows or bulls, often deep and resonant, used for communication within herds, expressing needs or emotions, and for signaling distress or the presence of food. The sound is a familiar aspect of rural and agricultural environments.","A pastoral scene unfolds with cows scattered across a lush, green meadow, heads down grazing or looking up attentively, their mouths open as gentle moos break the quiet of the countryside, all under a wide, open sky.","Cattle mooing features low-pitched, resonant “moo” sounds with modulating tones. These vocalizations vary in length and intensity, containing rich harmonic tones. They are often soothing or plaintive, reflecting the animals’ communication or emotional state." +cell phone buzzing,"A cell phone buzzing represents the vibration mode of mobile phone notifications. 
When set to silent, the device emits a rhythmic, tactile hum to alert users of incoming calls, messages, or app notifications without an audible ringtone, allowing discreet or noise-sensitive notification acknowledgment.","A smartphone trembles on a sleek surface, its screen lit up with a cascade of notifications, vibrating rhythmically as it pushes against the silent room's stillness.","A cell phone buzzing typically features a low to mid-frequency hum or vibration sound, with a rhythmic pulsing pattern. It may include variations in intensity, mimicking the physical sensation of a phone vibrating against a surface, often with short bursts followed by brief pauses." +chainsawing trees,"""Chainsawing trees"" refers to the process of cutting down or removing sections of trees using a chainsaw, a portable, mechanical saw powered by a gasoline engine or electric motor, characterized by its sharp, rotating chain. The activity is marked by loud, rhythmic buzzing and wood splintering sounds.","A chainsaw roars and buzzes, cutting into tree bark and spewing wood chips. In the forest, a lumberjack in protective gear fells towering trees, causing birds to scatter. The air vibrates with the mechanical growl, contrasting raw nature with human activity.","The chainsaw’s high-pitched buzz and rhythmic tearing cut through wood, accompanied by the crackling of splintering timber and thuds of falling branches. Leaves rustle, operators shout, and distant thumps echo as larger trees hit the ground." +cheetah chirrup,"The ""cheetah chirrup"" is a high-pitched, bird-like call used by cheetahs for communication, particularly between a mother and her cubs, as well as between possible mates, signifying curiosity or contentment. This distinctive sound plays a crucial role in social bonding within the species.","In the golden savannah grass, a sleek cheetah crouches with perked ears and focused eyes. 
It emits high-pitched, birdlike “chirrup” calls, a rare sound that ripples through the silent landscape, possibly signaling its cubs or expressing contentment in its tranquil habitat.","The ""cheetah chirrup"" is a high-pitched, bird-like call typically comprising a rapid succession of short, sharp notes. It's used for intimate communication, often between a mother and her cubs, characterized by a staccato rhythm and a frequency that can range from 2 to 3 kHz." +chicken clucking,"A chicken clucking is the characteristic sound produced by chickens, often hens, consisting of short, repetitive vocalizations that can signify contentment, alarm, or communication within a flock.","A flurry of hens pecking at the ground, heads bobbing rhythmically, feathers ruffling as they move about a barnyard. The sound of clucking permeates the air amidst the flutter of wings and the occasional squabble over pecking spots.","A chicken’s clucking consists of short, staccato sounds like “bok-bok” or “cluck-cluck,” varying in pitch and tone. These vocalizations range from soft murmurs to louder calls, often communicating social behaviors or alertness within the flock." +chicken crowing,"A rooster’s crow is a loud, distinctive sound, often heard in the early morning. This rhythmic vocalization serves as a natural alarm clock, marking territorial presence or signaling the start of a new day.","A rooster stands tall at dawn, silhouetted against the early morning sky, its beak wide open and head tilted back as it emits a loud, distinct ""cock-a-doodle-doo,"" signaling the start of a new day on a rustic farm.","A chicken’s crowing features loud, piercing “cock-a-doodle-doo” calls with high, clear, fluctuating pitch. The rhythmic crow starts high and drops at the end, with each repetition lasting a few seconds and varying in duration." 
+child singing,"""Child singing"" refers to the melodic vocal expression of a child, typically characterized by a higher pitch and often associated with innocence or playfulness. It can range from casual, spontaneous tunes to more formal performances, capturing the unique timbre of young voices.","A small child sings with a sweet, melodic voice, eyes sparkling and hands gesturing expressively. Notes float in a soft glow. The audience, whether a delighted crowd or a proud parent nearby, watches in admiration.","A child singing typically exhibits higher pitch, a variable tonal quality due to developing vocal cords, and possibly imperfect pitch control. The timbre is usually clear and light, and may include background noises such as breaths or environmental sounds if not in a professional setting." +children shouting,"""Children shouting"" is a sound event characterized by the elevated vocal expressions of young individuals, often energetic or excited in tone, typically heard in playgrounds, schools, or during group activities, reflecting playfulness, communication, or sometimes distress.","A group of lively kids with mouths open wide, expressions of excitement and exuberance on their faces; hands might be raised or waving, as sound waves emanate from them to convey the cacophony of their collective shouting.","High-pitched, varied pitch ranges, intermittent bursts, loud, overlapping, chaotic, unstructured, high energy, spontaneous, can include laughter or squeals, potentially shrill or piercing quality, more erratic in timing compared to adult speech, typically conveys excitement or playfulness." +chimpanzee pant-hooting,"Chimpanzee pant-hooting is a unique vocalization for communication, conveying messages like location, social status, or food alerts. 
It consists of alternating low and high-pitched hoots that travel long distances in forests.","A group of chimpanzees gathered in a lush forest canopy; one dominant individual climbs a tree, inflates its cheeks, and releases a series of loud, rhythmic hoots, while others join in, creating a cacophony that echoes through the trees, signaling communication or excitement amongst the troop.","Chimpanzee pant-hooting features loud, rhythmic pants that rise to modulated high-pitched hoots with pitch variations and crescendos, indicating social status or group cohesion in the forest." +chinchilla barking,"A ""chinchilla barking"" is a distinctive sharp, short, repetitive sound emitted by chinchillas, often as a warning sign or response to a threat, showing fear or distress. It resembles a series of high-pitched barks, alerting others or signaling the presence of danger.","A chinchilla stands on its hind legs, mouth slightly open, in a defensive posture within its enclosure, emitting sharp, high-pitched sounds, alerting others around of perceived danger or expressing annoyance, while its ears pivot towards the source of its distress.","A chinchilla’s bark consists of short, sharp, high-pitched “kii-kii-kii” sounds, similar to small dog barks but higher. These rapid barks vary in intensity and duration, reflecting the chinchilla’s stress level. Each bark lasts only a fraction of a second." +chipmunk chirping,"Chipmunk chirping is a high-pitched, repetitive vocalization produced by chipmunks as a form of communication. 
These sounds can convey alarm, signal territory, or help to facilitate social interactions within their species.","A small, fluffy chipmunk perched on a forest floor, cheeks bulging with stored food, rapidly opens and closes its mouth emitting high-pitched, repetitive chirps as its tail twitches in sync, alerting others to a potential threat or communicating with nearby chipmunks amidst the verdant underbrush.","Chipmunk chirping features high-pitched, rapid sequences of short, sharp notes, resembling squeaky or bird-like sounds. The varied pitch conveys excitement or alarm, occurring in intervals or as a continuous stream, often increasing in urgency when disturbed." +chopping food,"Chopping food is the sound event characterized by rhythmic, sharp, slicing or cutting noises created when a knife makes contact with ingredients on a cutting board, typically heard during food preparation in kitchens.","A rhythmic slicing noise as a knife swiftly dices vegetables on a chopping board, hands deftly maneuvering the ingredients with precision, amidst a kitchen brimming with culinary activity.","Chopping food typically includes rhythmic, sharp slicing or dicing sounds with varying intensities depending on the food's hardness. The knife's impact against the cutting board creates a distinct ""chop"" or ""thud,"" with higher pitches for vegetables and duller sounds for meats. Rapid succession indicates quick chopping." +chopping wood,"Chopping wood is an auditory event characterized by a rhythmic series of sharp, cracking sounds made when an axe splits wood into pieces, typically punctuated by brief silences as the chopper prepares for the next strike. 
It evokes the essence of manual labor and nature.","A sturdy figure wielding an axe rhythmically swings down onto a log, each stroke resulting in a sharp crack that echoes through the forest; chips scatter as the wood gradually splits under the force of the impacts, revealing the textured grain within.","The sound event ""chopping wood"" is characterized by a sharp, resonant ""thwack"" as the axe strikes wood, occasional splintering or cracking sounds, and a deeper ""thud"" when wood segments hit the ground. The rhythm can be steady or irregular, depending on the chopper's pace." +church bell ringing,"Church bell ringing is a ritualistic and musical practice where bells housed in a tower are rung in patterns to signify times of worship, mark special occasions, and celebrate events. This resonant and harmonious sound tradition is deeply rooted in religious and community life.","A towering, steepled church stands against the sky; its bell sways in a lofty belfry, sending sonorous peals across a serene village or bustling cityscape, as pigeons scatter and the reverberations are echoed in the ripples of a nearby pond.","Church bells emit a resonant, metallic clanging with a reverberating decay. The pitch is often rich with harmonics and the volume usually loud. Rhythmic patterns vary, but pacing is often steady, signifying time or a ceremonial call. Vibrations may be felt at close distances." 
+civil defense siren,"A civil defense siren is a loud warning system used to alert the public about emergencies such as severe weather, wartime threats, or other disasters, prompting immediate protective action.","A civil defense siren sound typically cues an urgent, visually tense scene: people scattering frantically, seeking shelter, with emergency personnel mobilizing, against a backdrop of unnerving, deserted streets or imminent danger, like approaching storms or signs of conflict.","A civil defense siren typically emits a loud, penetrating wail or whoop, often rising and falling in tone, designed to carry over long distances. It may cycle through a sequence of tones to command attention for emergency alerts, warnings of severe weather, or threats like an impending disaster." +cow lowing,"A cow lowing is the characteristic deep, moaning sound that cows make, typically referred to as a moo. This vocalization serves as communication within the herd and can express a range of emotions or needs, such as calling for calves, indicating distress, or signaling the presence of food.","A serene pasture at sunrise, with mist clinging to the grass, where a placid cow stands silhouetted against the soft morning light, head bowed, opening its mouth to emit a deep, resonant moo that echoes through the calmness of the countryside.","A cow lowing emits a deep, resonant mooing sound with a tonal, drawn-out quality that can vary in pitch and duration. This vocalization often conveys contentment or discomfort and can fluctuate between low and higher frequencies, usually within the lower range of human hearing." +coyote howling,"A coyote howling is a high-pitched, drawn-out call emitted by the North American canid, used for communication. 
These vocalizations maintain social bonds, convey warnings, or establish territorial presence, often occurring at dusk or night, creating an eerie yet quintessential sound of the wild.","Under a silver moon, a solitary coyote stands atop a windswept hill, its silhouette sharply defined against the night sky. The coyote's head tilts back, muzzle pointing toward the stars as it releases a long, plaintive howl that echoes through the quiet wilderness.","A coyote howling typically exhibits a high-pitched, quavering vocalization that may start with a few short barks and transition into a prolonged, melodic wail with rising and falling pitches, often heard during dusk or nighttime, conveying long-distance communication among pack members or territorial presence." +cricket chirping,"Cricket chirping is a distinctive, rhythmic sound produced by certain species of crickets as a means of communication. This sound, known as stridulation, is created when crickets rub their wings together. It serves various purposes, including mating calls and territory establishment.","A serene night, a lone cricket silhouetted against the moonlight, perched on a leaf. Rhythmic chirps fill the air, a soundtrack to the stillness, as gentle waves of sound ripple through a field of dew-kissed grass, punctuated by the occasional glow of a firefly.","Cricket chirping typically involves repetitive, high-pitched trills or chirps, each consisting of short, sharp sounds made by stridulation (rubbing wings together). The rhythm can be steady or variable, often increasing with temperature, resulting in a characteristic, persistent nighttime or warm-weather soundscape element." +crocodiles hissing,"Crocodiles produce a hissing sound as a warning signal or sign of agitation, created by expelling air through their glottis when threatened or disturbed, serving as a communication method or defensive mechanism. 
It's an auditory cue of their presence, signaling to respect their space and avoid confrontation.","A group of menacing crocodiles gather by a murky water's edge, mouths agape revealing sharp teeth, as they emit threatening hisses that disrupt the heavy silence of a dense swamp, sending ripples across the water surface and startling nearby wildlife.","Crocodile hissing emits a low-frequency, guttural sound with sibilant qualities, including raspy breaths and growls. The intensity escalates, ending in a sudden, sharp hiss, creating a startling effect due to its unexpected and aggressive nature." +crow cawing,"The sound event ""crow cawing"" refers to the distinctive, loud, and harsh vocalization made by crows, typically characterized by a series of ""caw"" syllables. This vocalization can signal various behaviors such as territory defense, communication, or alerting others to potential threats.","Perched on a rustic fence, a solitary black crow caws loudly, breaking the silence of a misty morning while barren branches sway gently in the background, evoking an eerie, serene landscape.","The sound event ""crow cawing"" typically features harsh, guttural calls; repetitive series of ""caw-caw-caw"" with varying pitch; strident tone; may include background ambient noise depending on the environment." +cuckoo bird calling,"The sound of a cuckoo bird calling, often signifying the arrival of spring, is characterized by a distinctive two-note call—""cu-coo""—which is produced by males as a territorial signal and mate attraction. The call varies among species, with some resembling musical notes or human whistles.","A cuckoo bird emerges from a forest, perching on a branch; its beak opens wide, emitting distinct calls. 
Leafy trees act as a backdrop, with occasional fluttering leaves and perhaps a dappled sun casting moving shadows, creating a serene, yet lively, portrayal of nature's symphony.","The call of a cuckoo bird is characterized by a distinctive, melodic two-note ""cu-coo"" sound, with the first note typically higher pitched and the second note lower and longer. The timbre is clear and fluty. Calls are often repetitive and heard in spring and summer during breeding season." +cupboard opening or closing,"The sound event ""cupboard opening or closing"" is an everyday audio cue indicating the action of a cupboard door being moved, characterized by a distinct creaking or clicking noise followed by a thud or latch click as it opens or closes.","A cabinet door swings on its hinges, either revealing its contents as it opens with a creak or shutting with a soft thud, obscuring the items within while the knob and wood grain detail indicate the action's direction.","A cupboard opening may produce a creaking noise if hinges are tight or squeaky, followed by a slight thud as the door swings open. Closing typically results in a solid, dull thud or click as the door shuts, potentially accompanied by the rattling of contents inside." +cutting hair with electric trimmers,"Cutting hair with electric trimmers is an auditory activity characterized by the buzzing and humming of the trimmer blades as they move across the scalp, shearing through hair with varying intensity based on thickness and motion, creating a rhythmic, mechanical sound punctuated by changes in pitch and volume.","A hand grips electric trimmers buzzing close to a head, locks of hair falling as the blades move through, leaving behind a neat, trimmed path.","The sound of cutting hair with electric trimmers is characterized by a steady buzzing or humming sound of the motor, punctuated by the clipping noise as blades slice through hair, varying in pitch and intensity with hair thickness and trimmer movement." 
+dinosaurs bellowing,"The sound event ""dinosaurs bellowing"" refers to the imagined, deep, and resonant vocalizations that these prehistoric creatures are theorized to have made, based on scientific extrapolations from fossil evidence and comparisons with modern animals, such as elephants and reptiles.","A scene of towering dinosaurs lifting their heads, open-mouthed, and roaring into a prehistoric sky with deep, guttural calls that reverberate through a lush, fern-covered landscape, causing flocks of small creatures to scatter in a haze of primordial mist and the ground to tremble subtly.","Low-frequency roars, thunderous bellows, resonant vibrations, possible hisses or snarls interspersed, echoing through prehistoric landscapes, conveying size, power, and primal ferocity of dinosaurs; similar to amplified, bass-heavy sounds of large modern-day reptiles or mammals. " +disc scratching,"Disc scratching is a DJ technique involving the rhythmic manipulation of a vinyl record on a turntable to produce distinct sound effects, characterized by a scratching or scrubbing noise that is blended into music mixes, often associated with hip-hop and turntablism.","A DJ energetically moves a record back and forth under a stylus on a turntable, creating rhythmic disruptions in the music. Spectators watch as the DJ's hands artfully manipulate the vinyl, with sound waves visually emanating from large speakers in a dimly lit club with vibrant, flashing lights.","Disc scratching produces a distinctive, high-pitched screeching sound with rapid, rhythmic fluctuations and scratching or scraping noises, often resulting in a rhythmic pattern that syncopates with music. These sounds are characterized by their varying pitch and tempo changes controlled by the DJ's hand movements on the turntable." 
+dog barking,"Dog barking is an auditory signal typically produced by dogs as a form of communication, expressing various emotions from excitement to distress or signaling alertness to territory defense. The sound's pitch, duration, and frequency can vary widely among breeds and contexts.","A dog with its mouth open mid-bark, showcasing sharp teeth, with sound waves emanating from its mouth, and a possibly startled or attentive stance with ears perked up or fur bristling.","A dog barking typically features a series of sharp, loud, repetitive noises with varying pitches and lengths. Auditory characteristics include a staccato rhythm and a timbre that can range from deep and throaty to high-pitched yapping, depending on the dog's size and breed." +dog baying,"Dog baying is a distinct, deep, and prolonged howling sound made by dogs, often associated with hound breeds. It signals excitement, hunting behavior, or a response to certain stimuli, and differs from barking in its melodious and drawn-out tones.","A hound with its snout lifted skyward, mouth agape, emitting a prolonged, deep howl, perhaps with a backdrop of a full moon, trees silhouetting the night sky, communicating urgency or alerting to a presence.","A ""dog baying"" typically presents a prolonged, deep, mournful howl with a repetitive cadence, often rising and falling in pitch. It's distinct from barking, and commonly associated with hunting dogs signaling the pursuit or sighting of prey." 
+dog bow-wow,"The sound event ""dog bow-wow"" refers to the vocalization of a dog, typically characterized as a bark or barking sound, which is represented onomatopoeically in English as ""bow-wow,"" imitating the pattern and tone of the noise that dogs commonly make to communicate or alert.","A cartoonish illustration of a cheerful dog, tail wagging, tongue out, with a speech bubble containing the onomatopoeic words ""Bow-Wow"" above its head, possibly with musical notes or sound waves to emphasize the noise it's making.","The ""dog bow-wow"" sound event features a rhythmic barking pattern with varying pitch and volume, often in a mid to low frequency range. The timbre is resonant and harsh, with abrupt onsets and decays that create a distinctive woofing texture characteristic of a dog's vocalization." +dog growling,"A dog growling is a low, guttural vocalization made by a dog, often indicating aggression, fear, or a warning to stay away. It's part of canine body language, signaling that the dog may be ready to escalate its response to a perceived threat if provoked.","A tense dog with bared teeth, ears pinned flat, alert eyes, and fur bristled stands in a defensive posture, emitting a deep, guttural rumble from its throat, signaling discomfort or a warning to back off.","A dog growling typically includes a low-pitched, throaty rumbling tone, with a varying pitch fluctuating depending on the dog's size and aggression level. The sound often has a guttural quality and can incorporate snarls and snapping sounds as warning indicators. Growls can be prolonged or short and repetitive." +dog howling,"A dog howling is a prolonged, mournful vocalization by a dog, often triggered by stimuli such as isolation, sirens, or other environmental cues. This behavior is considered a form of communication that can express distress or social connection.","A silhouette of a dog, head tilted upwards, mouth wide open mid-howl, with sound waves radiating outward. 
The atmosphere conveys nighttime, with a full moon perhaps serving as a backdrop, enhancing the quintessential imagery associated with a dog's mournful or communicative howling.","A dog howling typically presents a sustained, high-pitched vocalization, often starting with a rising note before plateauing. It can include variations in pitch and volume, with a mournful or eerie tonal quality, and may occasionally involve harmonics or overtones when multiple dogs join in or the howl echoes." +dog whimpering,"A dog whimpering is a soft, high-pitched sound typically made by dogs to communicate discomfort, anxiety, fear, or a desire for attention. It's a form of vocalization that differs from barking or growling and often elicits a caregiving response from their human companions.","A dog with its ears back, tail tucked, eyes wide or averted, perhaps pawing gently or pacing, occupies a small, shadowed corner. Its quivering body and occasional soft whines convey distress, seeking comfort or signaling fear, its gaze occasionally seeking its owner or a source of solace.","A dog whimpering typically features high-pitched, repetitive, softer sounds that can be short or elongated and may be interspersed with pauses. These sounds express distress or seeking attention and can fluctuate in pitch and volume, often conveying a sense of urgency or discomfort." +donkey braying,"A donkey braying is a loud, distinctive call characterized by a sharp, oscillating vocalization. It's often heard as a repetitive ""hee-haw"" sound used for communication within their species or to signal distress.","A donkey stands in a rustic field, head tilted back, mouth agape, as it emits a loud, harsh braying noise. Ears pivot forward with each raspy hee-haw resonating in the tranquil countryside, drawing amused or annoyed glances from nearby animals and humans alike.","A donkey’s bray features high-pitched, grating sounds starting with a sharp inhale and a loud exhale. 
It has strong harmonics, variable frequency (0.8 to 2.5 kHz), and an oscillating pattern with pauses, often heard at dawn or dusk." +door slamming,"A door slamming is a loud, sharp noise from forcefully closing a door against its frame, often due to wind, anger, or carelessness. It creates a sudden, startling sound peak, conveying a sense of finality or urgency.","A hand forcefully pushes a door shut, casting a sharp shadow through a hallway. The door nearly vibrates with the impact, and the adjacent walls seem to shudder. A swirling draft lifts papers in a brief dance as echoes fade into a tense silence.","A door slamming is characterized by a sharp, loud impact sound with a brief, high amplitude peak, followed by a lower-pitched reverberant tail as the sound reflects off surrounding surfaces, often accompanied by the rattle of door hardware or vibration of the door within its frame." +driving buses,"""Driving buses"" encompasses the auditory experience associated with operating a bus, featuring engine sounds, gear shifts, the hiss of hydraulic doors, the dinging of stop requests, and the ambient noise of passenger chatter or movement, all contributing to the distinctive acoustic environment of urban and intercity transit.","A row of buses in motion, engines humming rhythmically, wheels turning on asphalt, with the occasional hiss of air brakes and the closing of hydraulic doors. Visuals of bustling streets, passengers embarking and alighting, and the synchronized dance of traffic lights guiding the orchestrated movement of the urban commute.","Driving buses typically exhibit features like deep engine rumbling, air braking hisses, pneumatic door swooshes, signal indicator clicks, passengers chatting, occasional ticket machine beeps, and varying road noises depending on the speed and surface." 
+driving motorcycle,"The sound event ""driving motorcycle"" involves the revving of an engine, the whir of wheels on pavement, and the characteristic roar and shifts in pitch as a biker accelerates, decelerates, and maneuvers, often overlaid with the hum of wind and mechanical clicks of gear changes.","A rider clad in a helmet and leather gear roars down an open road on a sleek motorcycle, the landscape blurring by, with handlebars vibrating and the exhaust pipe releasing a powerful rumble, embodying freedom and speed.","Revving engine, wind rush, exhaust pops, tire hum on pavement, mechanical clicks from gear shifts, intermittent horn beeps, and distant traffic buzz." +driving snowmobile,"""Driving snowmobile"" is the activity of operating a motorized vehicle designed for travel over snow. It involves the sound of a revving engine, crunching snow, and the whistle of cold wind, characteristic of winter sports and transportation in snowy regions.","A figure clad in cold-weather gear maneuvers a snowmobile over a white, snowy landscape, with snowflakes streaking past and engine rumble blending with the muffled sounds of winter wildness.","The sound event ""driving snowmobile"" is characterized by a loud, continuous engine roar, punctuated by the whirring of the tracks against the snow, mechanical rattles, and the swoosh of displaced snow powder. It also includes subtle shifts in pitch corresponding to speed changes." 
+duck quacking,"A duck quacking is a characteristic sound made by ducks, typically a series of short, rhythmic quacks produced by the bird's voice box as a form of communication with other ducks or as a response to stimuli in their environment.","A duck with glossy feathers floats on a tranquil pond, its orange beak opening and closing rhythmically while ripples spread outward, as the distinctive ""quack"" echoes softly through the reeds and over the water's surface.","A ""duck quacking"" produces a series of short, rhythmic, and repetitive quacks often varying in pitch and volume, characterized by a nasal, sometimes harsh tone. This sound typically involves a mid-frequency range and can include background water sounds if the duck is in an aquatic environment." +eagle screaming,"An eagle screaming is a distinctive, high-pitched call used by these birds of prey for communication, often associated with territorial claims or signaling to their mates. This sharp, piercing sound echoes across the landscape, illustrating the eagle's prowess and presence in its natural habitat.","An imposing eagle soars high above mountain peaks, its wings spread wide against a clear blue sky. Suddenly, it tilts its head back and emits a piercing scream, echoing through the vastness, signaling its dominion over the tranquil landscape below.","The sound of an eagle screaming is a high-pitched, piercing whistle or screech often with a smooth, clear tonality that carries over long distances. It can have slight variations in pitch and often ends on a downslurred note." 
+eating with cutlery,"""Eating with cutlery"" encompasses the various sounds made while using knives, forks, and spoons to cut and consume food, such as clinking, scraping, and cutting noises, often associated with the social ambiance of dining events.","In the visual representation, a figure is seated at a dining table, fork in one hand and knife in the other, delicately slicing and spearing food, with subtle lines or musical notes emanating from the cutlery to suggest the gentle clinking sounds of eating.","The sound of “eating with cutlery” includes metallic clinks of utensils on plates, soft cutting scrapes, and occasional clattering. Chewing and muffled conversation may also be present. The overall volume is moderate, varying with the eater’s vigor and environment." +electric grinder grinding,"The sound event ""electric grinder grinding"" is a loud, consistent, abrasive noise generated when a power-driven grinding tool is used to wear away material through friction and abrasion, often producing a high-pitched, mechanical whirring.","A rotating abrasive disc of an electric grinder throws sparks as it smoothly cuts into or polishes a hard surface like metal, creating a blend of bright light flashes against a backdrop of mechanical motion and intense friction.","High-pitched whirring, buzzing noise with variable intensity; underlying hum; occasional metallic screech; sporadic change in pitch and volume corresponding to material resistance." +electric razor shaving,"The sound event ""electric razor shaving"" comprises the continuous buzzing or humming noise produced by an electric razor as it cuts hair, often including intermittent changes in pitch and intensity as the device moves across different facial areas during grooming.","A man stands before a bathroom mirror, gliding an electric razor across his jawline. Stubble disappears under the buzzing blades; tiny hairs fall into the sink. His focused expression softens as he achieves a smooth, clean shave. 
The rhythmic hum of the device punctuates the quiet morning air.","The sound of an electric razor shaving is a consistent, buzzing hum with variations in pitch and intensity as it moves across different facial contours and cuts through varying lengths and thicknesses of hair. Additional intermittent crackling may occur as hairs are trimmed." +elephant trumpeting,"Elephant trumpeting is a loud, distinctive call produced by an elephant forcefully expelling air through its trunk, typically signaling excitement, distress, or communication with other elephants across long distances. This versatile sound serves various functions including coordination within the herd and deterring threats.","A majestic elephant stands with its trunk lifted high, its mouth open, and its ears flared out to the sides. The surrounding air seems to vibrate with the powerful, resonant sound of its trumpeting.","An elephant trumpeting emits a loud, high-pitched, and powerful blast of sound that can range from 2 to 4 seconds long. This distinctive trumpet-like call, characterized by a modulating tone, is produced through the elephant's trunk and can be heard over long distances." +eletric blender running,"The sound of an electric blender running is a consistent, mechanical whirring noise created by its motor and spinning blades chopping or liquifying food at high speeds, often producing a variable pitch as the contents are blended to the desired texture.","A whirring electric blender with a vortex of liquid inside, possibly mixed with fruits or vegetables, the blades spinning rapidly, creating a frothy mixture, while the appliance vibrates slightly on a kitchen countertop.","An electric blender running emits a loud, continuous, high-pitched whirring sound with variable speed and intensity. The noise is often harsh, mechanical, and may contain grinding or rattling if blending hard items. Vibrations or changes in pitch occur when blending consistency varies." 
+elk bugling,"Elk bugling is a unique and powerful vocalization made by male elk, typically during the autumn mating season, known as the rut. The eerie, high-pitched call can carry over long distances, signaling the bull's presence and strength to attract females and ward off rival males.","A majestic elk stands in a misty, forested landscape at dawn, its head thrown back and antlers silhouetted against the soft light of sunrise while emitting a powerful, eerie call that echoes through the trees, signaling its presence to others during the rutting season.","Elk bugling is characterized by a high-pitched, resonating whistle with multiple harmonic overtones, which starts at a low frequency and ascends rapidly to a peak before tapering off. This eerily haunting call often contains grunts or barks and can last from a few seconds to over 20 seconds." +engine accelerating,"An ""engine accelerating"" sound event is the audible increase in an engine's RPMs, typically characterized by a rising pitch and volume as the engine's speed intensifies, often associated with a vehicle gaining speed.","A car's rev counter needle climbs swiftly, exhaust pipes rumble and roar, and the vehicle's body leans back slightly as the wheels grip the asphalt, propelling it forward with increasing velocity.","The engine accelerating features increasing pitch, loudness, and intensity, transitioning from a deep rumble to a smooth, high-frequency whir. Harmonic richness grows as gears shift, with rhythmic surges in mechanical and exhaust notes. Vibrations intensify, highlighting the engine’s power." +female singing,"Female singing refers to a sound event characterized by a woman's voice producing musical tones in varying pitches and rhythms, often used to convey emotion or tell a story through songs across diverse genres.","A woman with a microphone or musical instrument, her mouth open in song, musical notes adrift. An engaged audience or a quiet backdrop highlighting her alone. 
Emotion exudes from her expressive face, waves of sound suggested by abstract lines or colorful imagery emanating from her or the environment around.","The auditory features of a female singing may include varied pitch, usually in the soprano to alto range, melodic vocalizations, vibrato, harmonious sequences, dynamic volume, emotional expression, and potential accompaniment by music. Timbre would be specific to the individual voice, often described as smooth, clear, or powerful." +ferret dooking,"""Ferret dooking"" is a distinctive clucking or chuckling noise made by ferrets when they're excited or happy, often during play. It's a sign of contentment and joy, comparable to a cat's purr.","A curious, slender-bodied ferret bounces around playfully, arching its back and puffing out cheek pouches. It makes a series of chuckling or clucking noises—dooking—as it joyfully engages with its surroundings or fellow ferrets, suggesting excitement or happiness.","Ferret dooking is characterized by a series of clucking or chuckling sounds, which vary in pitch and rhythm, often conveying excitement or happiness. The noise resembles a mix of birdlike tweets and chattering, and tends to be expressive, with a rhythm akin to a warble or giggle." +fire crackling,"Fire crackling is the auditory experience of small, rapid, and varying sounds produced as materials combust, with the popping noise being caused by moisture escaping and expanding in the heat of the fire. It evokes warmth and is often associated with campfires or cozy fireplaces.","Flickering orange flames leap and dance on logs, casting a warm, inviting glow. Sparks occasionally pop, sending tiny embers into the cool night air as trails of smoke rise, blurring the starry backdrop. 
Shadows play on the faces of those gathered around, mesmerized by the hypnotic, crackling symphony.","The sound of fire crackling typically includes intermittent, sharp pops and snaps, a steady sizzling and hissing, with variable pitches and erratic rhythms as wood combusts and releases gases, producing a soothing, warm, and organic ambiance." +fire truck siren,"A fire truck siren is a loud, distinctive warning sound produced by emergency vehicles, typically heard as a wailing, yelping, or continuous tone to alert pedestrians and motorists to clear the way for their fast approach during emergencies.","A bright red fire truck races down the street, its flashing lights reflecting off buildings. A loud, urgent siren wails, slicing through the din of city noise as firefighters clad in heavy gear and helmets rush to respond to an emergency.","A fire truck siren typically emits a loud, high-pitched wailing or yelping sound, alternating between multiple tones. It's designed to be piercing and attention-grabbing, often with a doppler effect as the vehicle passes, modulating in pitch due to movement relative to the listener." +fireworks banging,"""Fireworks banging"" refers to the loud, explosive sounds made when fireworks are ignited, often characterized by sharp, concussive bursts and echoing reports, associated with celebrations, festivals, and public displays. These sounds contribute to the auditory spectacle accompanying the visual fireworks display in the sky.","A night sky bursts with vibrant colors as dazzling fireworks explode, creating cascading showers of light while the air pulsates with their resounding booms, the crowd below gazes in awe at the pyrotechnic spectacle.","Fireworks create loud, explosive bursts with varying pitches and rhythmic pops. They include echoing booms, crackling, and whistling ascents. Sounds range from low to high frequencies, with sudden onsets and decaying trails, often accompanied by high-pitched fizzing from trailing sparks." 
+firing cannon,"A firing cannon event is a loud, explosive occurrence marked by a rapid release of gases, a distinctive boom, and a recoil as the cannonball is projected. It embodies a sudden burst of energy, historically associated with military use during battles or as ceremonial salutes.","A visual representation may include a large cannon with a long barrel recoiling backward amidst swirling gunpowder smoke, as bright, fiery orange flashes emerge from the muzzle against a backdrop of startled onlookers covering their ears from the thunderous boom.","A firing cannon exhibits a loud, sharp initial blast, followed by a long, rumbling echo. The sound has a low-frequency boom with high-intensity peak, often accompanied by the hiss of a fuse before detonation, producing shockwaves that can be felt physically." +firing muskets,"Firing muskets refers to discharging muzzle-loading firearms used from the 16th to the 19th century, characterized by a distinct loud bang and smoke produced by igniting black powder in the firing mechanism, often associated with historical military conflicts and reenactments.","Smoke billows from the barrels of muskets as soldiers in 18th-century uniforms stand in formation, firing volleys. The scene is punctuated by bright flashes and the acrid smell of gunpowder, with echoing reports cutting through the air.","The firing of muskets is characterized by a sharp, loud report or bang, accompanied by the mechanical click of the flintlock mechanism, a brief hissing of gunpowder ignition, and a faint, lingering smoky smell afterward. Multiple firings create a staccato series of blasts echoing over distance." 
+fly buzzing,"A fly buzzing is a common and recognizable sound event, characterized by the continuous, rapid flapping of a fly's wings, resulting in a persistent, low-pitched hum or buzz that can vary in volume and frequency depending on the species and activity of the insect.","A close-up of a singular, iridescent fly, its wings a blur, hovers near an open window with a gently swaying curtain. The sun casts a warm glow over a still room, highlighting dust motes dancing in the air, all underscored by the persistent, droning buzz of the fly's flight.","A fly’s buzzing is a persistent, high-pitched drone, modulating with its wingbeat frequency of 150-200 Hz. The sound starts and stops abruptly as the fly moves, with softer, irregular bursts when it adjusts its flight path." +foghorn,"A foghorn is a deep, loud horn used on ships and at coastal and river locations to emit warning signals in foggy conditions or poor visibility to prevent collisions and guide vessel navigation.","A thick blanket of fog envelopes a shadowy seascape, with faint lights glimmering from a distant lighthouse. Waves gently lap against the shore, and a deep, resonant foghorn periodically breaks the silence, signaling caution to unseen ships amidst the opaque, misty veil.","A foghorn produces a deep, long, resonant sound with a low frequency, often characterized by a monotone pitch and a vibrating, rumbling quality that can travel long distances. It typically includes a pattern of repeated blasts to signal presence in foggy conditions for navigational safety." +footsteps on snow,"Footsteps on snow are the audible crunch or soft compression sounds created when someone walks over a snow-covered surface, varying with snow type and temperature, conveying the distinct, quiet atmosphere of a wintry landscape.","A blanket of pristine snow covers the ground. Each step creates a crisp, crunching noise as footprints form a lonely trail, disrupting the untouched surface. 
The air is sharp, carrying the echo of the deliberate, steady pacing through the serene, wintry landscape.","Crunchy, crisp, compacting sounds, with a slight squeakiness, reflect the compression of snow. The sound's intensity varies by snow type: fresh snow emits soft, muffled thuds, while icy snow produces sharper, clearer crunches. Rhythmic patterns of footsteps create a distinct cadence." +forging swords,"Forging swords involves heating metal in a forge, hammering it into shape, and refining the edges to create bladed weapons. This process produces a symphony of sounds: the roar of the forge, rhythmic clanging of hammer on anvil, and the hiss of quenching hot steel.","A rhythmic clanging reverberates as fiery sparks fly from red-hot metal; burly blacksmiths, illuminated by forge's glow, hammer and shape the nascent blades on sturdy anvils, muscles straining with each precise, forceful strike.","Clanging hammers striking metal, anvils resonating deep, metallic rings, intermittent grinding sounds, occasional sizzle of quenched steel, underlying hum of the forge, rhythmic pounding, echoes in a workshop." +fox barking,"The sound event ""fox barking"" refers to the distinct call made by foxes which is sharp, short, and often mistaken for a dog's bark. This vocalization is used for various reasons, including communication with other foxes, signaling dominance, or as an alert mechanism.","In the twilight, a russet fox stands alert in a meadow, head tilted upward, with its mouth slightly open emitting short, sharp barks. The nearby foliage casts long shadows, while curious, attentive eyes of woodland creatures peek from the undergrowth, illuminated by the glint of fading sunlight.","A fox's bark is typically high-pitched, sharp, and brief, sometimes described as a ""wow-wow-wow"" sound, with varying pitches and intervals. It can resemble a dog's bark but is more erratic and shrill, often used for communication during the nocturnal hours." 
+francolin calling,"The francolin’s call is a distinct sound from gamebirds in the Francolinus and Peliperdix genera. Their loud, repetitive vocalizations vary by species and are used for communication, often heard at dawn or dusk in habitats like grasslands and forests.","A gentle dawn creeps over a dew-laden landscape, lush with foliage. Amidst the rustling leaves, a plump, speckled francolin emerges, perched on a twisted branch, tilting its head back to release a series of clear, flute-like calls that resonate through the quiet of the early morning.","A francolin calling typically produces a series of loud, repetitive, and rhythmic cackles or chuckles, with a vocal pitch that varies depending on the species but often includes low to mid-tones. It's a distinctive birdcall that can carry over long distances and is commonly heard in the early morning or evening." +frog croaking,"Frog croaking is the vocalization produced by certain species of frogs, characterized by a repetitive, often guttural sound. This behavior serves various purposes, including territory establishment and attracting mates during the breeding season, and is a distinctive sound of wetland ecosystems, particularly at night.","Amidst a tranquil pond, under a crescent moon, a silhouette of reeds sways lightly. Shadows of lily pads speckle the water's surface while a group of frogs perch atop. Ripples echo out as one frog inflates its throat, the air around charged with the rhythmic symphony of their croaks.","Frog croaking features a repetitive, guttural “ribbit” or “croak” with low to mid-range frequency, irregular rhythm, and pitch variations. Commonly heard at night during mating season, the volume and timbre differ across species." +gibbon howling,"Gibbon howling is a vocal behavior of gibbons, characterized by loud, melodious sequences of calls used to communicate with other gibbons, establish territory, and strengthen social bonds. 
This distinctive and complex vocalization can travel long distances through forest habitats, aiding in the survival of these arboreal primates.","In a misty forest, a gibbon energetically swings through the canopy, emitting a haunting, melodic call. The sound resonates in the morning stillness, and other gibbons may join, forming a symphony of echoing songs.","The sound event ""gibbon howling"" features a series of modulated whoops and cries that can vary in pitch and intensity, often starting soft and building to loud, piercing calls. The vocalizations are rhythmic and may include complex patterns, with each gibbon's howl being slightly unique." +goat bleating,"Goat bleating is the characteristic sound made by goats, consisting of a nasal-toned, wavering cry used to communicate distress, hunger, or to maintain contact with the herd. Each goat's bleat is unique, serving as an audible identifier to other goats and their human caretakers.","A goat stands amidst a pastoral setting, mouth open in mid-bleat, with a possible echo of countryside peace or urgent communication to its herd. Hills roll in the background, and there's a rustic quality to the image, possibly with other goats or farm life in the vicinity.","A goat bleating typically involves a nasal, medium-pitched ""maa"" or ""meh"" sound, repeated at various intervals. The tone can fluctuate in volume and pitch, indicating distress, recognition, or communication with other goats. The sound can have a vibrato or wavering quality." +golf driving,"Golf driving refers to striking a golf ball with a driver club off the tee to achieve maximum distance and accuracy, initiating play on par-4 and par-5 holes. This critical skill combines power, technique, and precision, setting the tone for subsequent shots toward the hole.","A golfer clad in sporty attire stands poised on a lush fairway, club swung back in preparation. 
At the moment of impact, the sharp ""whack"" of the ball echoes, as it sails against a clear sky, leaving a faint trail as it heads towards a distant green.","A golf drive typically features a sharp, crisp ""click"" or ""clack"" at the moment of impact between club and ball, followed by a decreasing whizz as the ball soars through the air. Background sounds may include the rustle of grass, birdsong, or distant chatter, depending on the environment." +goose honking,"Goose honking is a distinctive, trumpet-like vocalization produced by geese when communicating with each other, signaling distress, or protecting their territory. This sound is emblematic of wild or domesticated geese, often heard in migratory flocks or at bodies of water where they congregate.","A flock of geese flies in a V-formation against a crisp blue sky, their wings flapping in unison. Below, a tranquil lake reflects their image. The air resonates with their loud, distinctive honking as they communicate during their migratory journey.","A goose honking is characterized by its loud, nasal honk, which is a series of short, repetitive, penetrating notes with a frequency range of 1 to 4 kHz, often varying in pitch and intensity, sometimes punctuated by longer, drawn-out calls in a cacophony when in a flock." +hail,"Hail is a type of solid precipitation consisting of ice pellets, called hailstones, that form during thunderstorms when updrafts carry raindrops into extremely cold areas of the atmosphere, freezing them. It can cause significant damage to crops, vehicles, and structures.","A barrage of ice pellets bounces off surfaces with a cacophony of sharp, cracking noises; leaves tremble, and water splatters as each frozen bead impacts the ground, cars, and rooftops, creating a pervasive, drumming echo that fills the scene with the chaos of a sudden hailstorm.","Hail produces irregular, sharp tapping sounds as ice pellets strike various surfaces. 
The intensity varies with pellet size, with larger hailstones creating louder, more resonant impacts. The frequency can range from sporadic to a rapid succession, mingled with occasional thuds on softer materials and metallic pings on hard surfaces." +hair dryer drying,"The sound event ""hair dryer drying"" typically involves the consistent rumble and whoosh of warm air blown at high speeds, often accompanied by a slight mechanical hum from the hair dryer's motor as it operates to evaporate moisture from wet hair.","A handheld device directs warm air towards wet hair, causing loose strands to flutter slightly. Steam rises as moisture evaporates, and the user manipulates the dryer, aiming at different sections of their head.","A hair dryer emits a consistent, high-pitched whirring sound with a strong airy component from the blowing air. It can produce varying intensity levels based on the setting, often overlayed with a slight mechanical hum from the operating motor and occasional hand manipulation noises." +hammering nails,"Hammering nails is a common sound event characterized by repetitive metallic strikes as a hammer drives nails into a surface, typically wood, producing sharp, rhythmic tapping with varying intensity depending on the force applied and materials involved.","A rhythmic, echoing clang of metal striking metal, with each sharp tap, a nail is driven deeper into wood, the forceful arm of a worker raises and lowers a sturdy hammer, embedding fasteners into a surface, amidst a backdrop of a construction site or a simple DIY project.","Repetitive, sharp metallic strikes with varying intensity; rhythmic succession; occasional wood splintering sounds; echo depending on environment; high-decibel, transient impact noises with a reverberating tail." 
+heart sounds,"Heart sounds are acoustic phenomena produced by the heartbeat, commonly including two primary sounds: the ""lub"" of the closing mitral and tricuspid valves (S1) and the ""dub"" of the aortic and pulmonary valves closing (S2), used to assess cardiac function and identify abnormal cardiac conditions.","An image of a stethoscope placed over a stylized heart with audio wavelength lines pulsating around or emanating from it, possibly with an EKG heartbeat monitor line integrated into the background, symbolizing the rhythm and sound of a beating heart.","Heart sounds are characterized by rhythmic beats of low to medium frequency, typically described as ""lub-dub,"" corresponding to the closing of heart valves, with the first heart sound (S1) being longer and lower-pitched than the second heart sound (S2), and separated by silent intervals." +hedge trimmer running,"A hedge trimmer running produces a consistent, buzzing, and mechanical noise as the motor drives blades to rapidly oscillate, cutting through foliage. It's a common auditory cue in garden maintenance, characterized by its high-intensity, grinding sound reflecting the power tool's operation.","A person stands in a lush garden, wearing safety goggles and gloves, gripping a vibrating hedge trimmer as it slices through green foliage, leaving behind neat, manicured bushes under a bright sun.","A hedge trimmer running emits a continuous, high-pitched buzzing or whirring noise, with intermittent, sharper chopping sounds as the blades snip through branches. The sound intensity can vary as the trimmer moves through different thicknesses and the motor's load changes." +helicopter,"A helicopter is an aircraft with rotating blades, known for its distinctive chopping sound as it flies. 
Its sound event combines pulsating engine noise with rhythmic blade chopping through the air, often used to signify aerial arrival or surveillance in audio contexts.","A rapidly spinning rotor with blurred blades atop a sleek body, slicing through the air with a distinctive chop-chop rhythm against a backdrop of sky, often with a wisp of wind denoting motion, and concentric circles emanating from the machine to represent the echoing throb of the engine.","A helicopter sound event typically features rhythmic, pulsing blade chops, low-frequency whooshing due to rotor rotation, mechanical engine hum, and intermittent high-pitched whines, all with Doppler effect variations as it approaches and departs, and reverberations if near structures or terrain." +horse clip-clop,"The sound event ""horse clip-clop"" refers to the distinctive, rhythmic noise made by a horse's hooves striking a hard surface, typically associated with walking or trotting. This iconic sound echoes the gait's tempo and the interplay of the hooves with the ground.","A horse trots along a cobblestone road, its hooves rhythmically striking the ground, head bobbing gently with each stride, mane fluttering, as the echo of each clip-clop bounces off the surrounding buildings and trees.","A horse clip-clop is characterized by rhythmic, hollow, and muted clopping sounds made by hooves striking the ground, with variations in tempo depending on the horse's gait, often accompanied by occasional snorts, the rustle of its mane, and the jingle of harness or tack if equipped." +horse neighing,"A horse neighing is a distinct, high-pitched vocal sound made by a horse, often characterized by a strong, whinnying or squealing tone. It is typically used to communicate with other horses or express emotions such as excitement, discomfort, or curiosity.","A horse stands with flared nostrils, its mouth open, and head raised. 
Its eyes are bright, and it tilts its neck as it emits a loud, distinctive whinny, mane flowing slightly with the vibration of the sound.","A horse’s neigh is a high-pitched, whinnying sound starting with a prolonged snort, followed by resonant vibrations and pitch fluctuations. It varies in duration, often ending in a softer, breathy note, with vibrato and harmonic overtones enhancing its distinctness." +ice cracking,"The sound event of ice cracking often features sharp, sudden pops and fractures as the crystalline structure of frozen water cleaves and breaks. These audible cues can range from delicate tinkling to thunderous booms, depending on the scale and conditions of the ice involved.","A frozen expanse glistens under harsh cold light. Web-like fissures rapidly spread, fracturing the once solid ice surface. Each crack contributes to an intricate pattern, signifying the precarious state of the increasingly unstable frozen layer, as echoes of the splintering resonate through the stark, chilly air.","The sound event of ice cracking typically features sharp, sudden fractures or snaps followed by a series of echoes. These sounds are often high-pitched with a brittle timbre, and can contain a cascade of lesser cracks and pops as the ice continues to break apart." +ice cream truck,"An ice cream truck is a mobile vending vehicle that plays distinctive music to announce its presence and attract customers to buy frozen desserts, such as ice cream, popsicles, and snow cones, especially during warm weather. Children and adults alike are drawn to its nostalgic and joyful melody.","A colorful vehicle adorned with pictures of frozen treats, playing a cheerful, repetitive jingle drives slowly through a sunny neighborhood, as excited children run towards it, clutching coins in anticipation of buying cold ice cream on a warm day.","An ice cream truck typically features a distinctive, high-pitched melody loop, often chiming or electronic, inviting in tone. 
This melody is usually recognizable and repetitive, played through speakers as the truck travels slowly through neighborhoods to alert potential customers of its presence." +kayak rowing,"Kayak rowing is an outdoor activity involving a small, narrow watercraft propelled by means of a double-bladed paddle. The sound includes rhythmic splashing of water, the paddle's gentle swoosh with each stroke, and the occasional wildlife and environment noises blending with the paddler's movements.","A serene lake, its surface an unbroken mirror, reflects the lush greenery of its shores. A kayak glides through the water, a paddler rhythmically dipping their oars, sending ripples across the calm, with each stroke accompanied by the soft swish of water swirling around the blade.","Paddles gently dipping into water, rhythmic splashing, water droplets tapping kayak's surface, soft whooshing with each stroke, occasional creaking of the vessel, distant bird calls or nature sounds blending with the subtle movement of the kayak through a calm river or lake, creating a serene, meditative soundscape." +kid speaking,"A ""kid speaking"" sound event captures the vocal expressions of a child, encompassing a range of pitches and articulations characteristic of youthful speech, often marked by a higher pitch, less pronounced enunciation, and a playful or inquisitive tone, as they communicate or attempt to articulate thoughts and emotions.","A visual of ""kid speaking"" might show a child with an open mouth, sound waves emanating from their position, or a speech bubble with playful, childlike font. Their expression could be enthusiastic or curious, with attentive listeners or toys around to indicate an informal, youthful context.","A child’s speech is high-pitched with distinct intonation, possibly slower cadence, and simple word choice. Pronunciation may be errant, with varied dynamics showing emotion or excitement. 
The voice can be nasal, often accompanied by background noises like toys or playground sounds." +lathe spinning,"Lathe spinning refers to the process of shaping metal, wood, or plastic using a machine tool called a lathe, which rotates the workpiece against cutting tools. The sound event encompasses the hum and whir of the spinning lathe and the rhythmic cutting noises as the material is shaped.","A rotating lathe with a workpiece clamped tightly, emitting a steady, rhythmic whirring as sharp tools sculpt the material, sending curls of debris spiraling away, accompanied by the gentle hum of machinery in a workshop bathed in the warm glow of overhead lights.","A lathe spinning emits a steady, rhythmic whirring or humming due to its rotating spindle. There may be intermittent scraping or grinding sounds as the cutting tool shapes the material, and the pitch may change with adjustments to speed or material resistance. Vibrational undertones often accompany the primary noises." +lawn mowing,"Lawn mowing is the activity of cutting grass to an even height using a machine known as a lawn mower, which can be manual or powered. It's a common maintenance task for gardens and public greenspaces, often associated with spring and summer, producing a distinctive, rhythmic mechanical sound.","A person pushes a mower across a grassy yard, its blades whirring, neatly trimming the green expanse. Sunlight glimmers off the machine as grass clippings scatter, the rhythmic sound punctuating a calm suburban setting.","Lawn mowing emits steady, rhythmic mechanical drone interspersed with higher-pitched whirring of blades, occasional grass rustling, and sometimes lower, sputtering noises on denser patches. The volume ebbs with distance or obstacles and fluctuates with mower's speed or engine power variations." 
+lighting firecrackers,"Lighting firecrackers involves igniting a fuse attached to small explosive devices, which upon detonation produce loud, sharp noises and bright flashes, traditionally used in celebrations and festivals for their spectacular auditory and visual effects, symbolizing joy and warding off evil spirits.","Sparks fly as a series of small, colorful explosives burst in rapid succession, illuminating faces with a warm glow while plumes of smoke drift upward, accompanied by the sharp, intermittent crackles and pops of igniting pyrotechnics that punctuate the excited chatter of onlookers.","Lighting firecrackers typically involves sharp, loud cracks and pops with varying frequencies and intensities, a rapid succession of explosive sounds, accompanied by the hiss of fuses burning and possibly a faint whistling prior to detonation, creating a staccato rhythm that can startle and echo in the surrounding environment." +lions growling,"Lion's growling is a deep, resonating roar often used as a form of communication among lions to establish territory, show dominance, or signal distress. This powerful sound event can carry over long distances, conveying the strength and presence of one of the most formidable predatory cats.","A pride of fierce lions, manes bristling, deep-set eyes fixed ahead, unleash throaty roars that reverberate across the savanna, their powerful jaws wide open as they assert dominance and communicate with one another against the backdrop of tall grass swaying in the wind.","A lion’s growl is a deep, resonant sound with low-frequency vibrations felt and heard. It modulates in pitch and intensity, signaling dominance or aggression, and includes harmonic overtones for a rich timbre." +lions roaring,"A lions' roaring is an iconic, deep, and powerful vocalization used by lions for communication, establishing territory, and signaling dominance. 
This intimidating sound can carry over 5 miles, signifying the lion's presence and strength to other animals within its habitat.","A pride of majestic lions with thick manes stands majestically on a savannah. Their mouths wide open, they release powerful, resounding roars that reverberate across the golden landscape, asserting their domain and communicating with each other under the vast, open sky.","A lion's roar is a deep, resonant sequence of sounds that include grunts and growls extending over several seconds. It has a low-frequency rumble that can reach 114 dB and carry over 5 miles, typically starting quieter and building in volume, often described as fearsome, commanding, and powerful." +lip smacking,"Lip smacking is a common, non-verbal mouth sound typically made by pressing lips together and then separating them quickly, creating a wet clicking or smacking noise, often used to express hunger, appreciation for food, or to attract attention.","A person's close-up, lips part repeatedly, touching in a moist, pronounced manner, creating a distinctive, wet clicking noise often associated with hunger, taste enjoyment, or anticipatory behavior, possibly accompanied by wide eyes or raised eyebrows emphasizing eagerness or satisfaction.","The sound event ""lip smacking"" is characterized by wet, repetitive clicking noises produced by pressing lips together and then parting them, often associated with eating or anticipation of food, producing a range of mid to high frequencies with brief, rhythmic bursts and a resonant quality." 
+machine gun shooting,"A ""machine gun shooting"" sound event is characterized by rapid, rhythmic bursts of gunfire emanating from a machine gun, typically used in military or law enforcement scenarios, producing a distinct, intimidating series of loud, mechanical reports at a high rate of fire.","Rapid, successive flashes from a firearm's barrel, with shell casings ejecting, amidst a chaotic backdrop of scattering individuals, debris flying, and possible muzzle smoke with the loud, echoing crack of gunfire piercing the air.","Rapid, repetitive, sharp cracking sounds; high-intensity; staccato rhythm; bursts of echo depending on environment; metallic clinking of shell casings; potential mechanical whirring or clicking between bursts." +magpie calling,"The sound event ""magpie calling"" refers to the vocalization produced by magpies, which are intelligent birds known for their complex, varied calls and vocal mimicry. Their distinctive calls can include chatters, warbles, and other melodious notes, often signaling communication, territory defense, or social interaction among magpies.","A magpie perches on a branch, its black and white feathers stark against the clear sky. It rhythmically chatters, its calls echoing through the serene landscape, alerting curious onlookers and animals.","A magpie call is a high-pitched, warbling melody with intermittent chortles and clicks. It is a distinctive, flute-like song that can include a variety of whistles, trills, and sometimes mimicry of other birds or noises. It typically has a chattering quality, often heard during morning or dusk." 
+male singing,"""Male singing"" refers to the creation of musical tones and rhythmic patterns using the human male voice, often with varying pitch, tone, and volume to produce melody and express emotion, distinguishable from speaking or non-musical vocalizations.","A man's silhouette with a microphone stands in a spotlight, notes flowing from his open mouth, conveying dynamic energy and musical passion against a dark background, suggesting an intimate performance or a lively concert atmosphere.","A “male singing” event features a pitch range of 85-180 Hz (baritone/tenor), with tonal quality, varying timbre, melodic structure, and lyrical articulation. It includes vibrato, rhythm aligned with music, dynamic volume range, and harmonic overtones." +man speaking,"A ""man speaking"" sound event involves the auditory output of a male individual articulating words or sentences. It encompasses a range of frequencies and intonations unique to the speaker's voice and language, conveying information or expressing thoughts and emotions through spoken communication.","A speech bubble emanating from a male figure, possibly including typographic representations of speech like quotation marks or sound waves near his mouth, indicating verbal communication. The man's posture may suggest active talking with mouth open and facial expressions conveying the tone of the speech.","A “man speaking” sound event features a voice with a fundamental frequency of 85-180 Hz, varying intonation, rhythm, and stress patterns. It includes articulated vowels and consonants, potential background noise, and room acoustics like reverb." 
+metronome,"A metronome is a device used by musicians to mark time at a selected beat per minute, providing a consistent rhythmic pulse for practicing precise tempo and improving timing skills.","A sequence of evenly spaced ticks, accompanying the pendulum-like swing of a metronome's arm, which oscillates back and forth with precision, marking a steady rhythm for a musician's practice session, set against the backdrop of sheet music and instruments.","A metronome produces a consistent and rhythmic ticking or clicking sound at a set tempo, generally measured in beats per minute (BPM). The auditory pattern is regular, with evenly spaced intervals, and the pitch and timbre can vary depending on the metronome's design—mechanical or digital." +missile launch,"A missile launch is the event of a projectile being propelled by a rocket or other launching device, often characterized by a loud roaring noise, the generation of heat, and release of exhaust gases. It's commonly associated with military operations or space exploration missions.","A missile soars into the sky, leaving a trail of fiery exhaust; alarms blare, lights flash at a launch pad, and military personnel watch with intense focus as the projectile ascends with a thunderous roar, cutting through the atmosphere.","A missile launch typically features a sudden, loud roar or whoosh, deep rumbling, increasing in intensity, possibly with a high-pitched whistling. These sounds are followed by a rapid fading as the missile distances. Additionally, there may be secondary explosions and mechanical noises from the launcher." 
+mosquito buzzing,"A mosquito buzzing is the high-pitched whine produced by the rapid flapping of a mosquito's wings at a frequency of 400 to 600 Hz, often heard during still nights and usually indicating the proximity of these small, blood-feeding insects.","A single mosquito hovers in the dimly lit room, its wings a blur as it darts erratically near a person's ear, their face contorted in annoyance while swatting the air in a futile attempt to dismiss the persistent, high-pitched whine.","The mosquito buzzing is characterized by a high-pitched, persistent whining tone, typically ranging between 400 Hz to 1 kHz. Its rapid wing flaps produce a buzzing or humming sound with a frequency modulated pattern due to the beating wings, creating slight variations in pitch and intensity." +motorboat acceleration,"A ""motorboat acceleration"" sound event encompasses the audible increase in engine revs and the resultant rise in pitch and volume as a motorboat speeds up, typically accompanied by the churning and splashing of water as the craft gains momentum.","A motorboat accelerates, its engine roaring louder. Waves churn more fiercely as the vessel's speed increases, water sprays outward, and the bow lifts slightly. The surrounding scenery blurs past while the boat leaves a frothy wake trailing behind it.","Motorboat acceleration is characterized by a low-pitched, throbbing hum that increases in frequency and volume as the engine revs higher, accompanied by the churning of water and the resultant splashing sounds as the boat gains speed and cuts through the water's surface." 
+mouse clicking,"A mouse click is a distinct, short, sharp sound created by pressing and releasing a button on a computer mouse, signifying an action or command input by a user, typically for selecting or interacting with elements on a screen in a graphical user interface.","A human finger presses down on a computer mouse button, causing a sharp, short ""click"" noise, often accompanied by a cursor moving or selecting something on a digital screen in a quiet room with the sound emanating clearly.","A mouse click produces a short, high-pitched clicking sound with a rapid attack and a quick decay. It frequently has a plastic or mechanically resonant quality, featuring a single, distinct, ""snappy"" actuation point often punctuated by a moderate-intensity initial peak followed by little to no sustain or echo." +mouse pattering,"Mouse pattering refers to the soft, scurrying sounds made by mice as they move across surfaces, often heard in quiet environments like homes during night hours, indicating the presence of these small rodents.","A small, nimble mouse scurries across a wooden floor, its tiny claws tapping rhythmically. Shadows flicker as it weaves through scattered debris, the faint pattering sound echoing softly in the quiet space.","Quiet, high-pitched scurrying noises with intermittent soft clicks of tiny claws against hard surfaces, indicative of fast, rhythmic movements; often erratic with occasional pauses, reflecting skittish behavior typical of a mouse in motion." +mouse squeaking,"A mouse squeaking is a high-pitched sound typically produced by mice as a form of communication, to signal distress, or attract mates. The frequency varies, but it often falls within the ultrasonic range, which can be inaudible to human ears without special equipment.","A small mouse with twitching whiskers and round ears emits high-pitched squeaks, possibly standing on hind legs in a dimly lit room. 
Shadowy objects create an ominous feel, suggesting the mouse’s anxious attempt to communicate or evade danger.","High-pitched, brief, repetitive squeaks with a frequency range from 1 to 70 kHz, often ultrasonic, characterized by rapid onset and decay, and variable in rhythm and pitch, indicative of communication or distress in the rodent's vocalization." +mynah bird singing,"A mynah bird singing is a melodic audible event characterized by a series of vocalizations that the bird uses to communicate or mimic sounds, showcasing its capacity for complex, varied, and often enchanting birdsong.","A mynah bird perches on a branch, beak open, vibrant feathers ruffled slightly as melodious sounds fill the air, with a backdrop of lush green foliage and the soft glow of morning light filtering through the leaves.","The mynah bird's song is characterized by a series of melodious whistles, clicks, and squawks, often mimicking natural and artificial sounds with uncanny accuracy. It exhibits a wide range of pitches and tones, demonstrating remarkable vocal versatility and complexity in its multi-note sequences." +ocean burbling,"Ocean burbling refers to the tranquil, continuous sound made by water motion within the ocean, often characterized by the gentler aspects of waves rolling, water bubbling, and currents mingling, emitting a soothing and rhythmic acoustic experience reminiscent of nature's own lullaby.","A serene seascape with gentle waves lazily lapping on the sandy shore, small bubbles forming and popping as the water retreats, the rhythm accompanied by the soothing, continuous soft noise of water interacting with the coastline and the occasional distant call of seagulls.","“Ocean burbling” involves low to mid-frequency sounds, with continuous bubbling, splashing, rhythmic ebbing, and gurgling. The interplay of water movement, underwater terrain, and life creates a soothing yet chaotic blend of predictable and random acoustic elements." 
+opening or closing car doors,"The sound event ""opening or closing car doors"" involves the distinct mechanical and aural cues associated with a vehicle's door being unlocked, opened, shut, or locked, often characterized by a series of clicks, thuds, and latches engaging or disengaging.","A sequence of car doors swinging open or shut with corresponding thuds, possibly involving people entering or exiting vehicles, often accompanied by interior lights flickering on or off, and the sound conveying arrival or departure.","The sound of opening or closing car doors typically includes a metallic latch click, followed by a thud from the heavy door-seal compression, and occasionally a faint creak if hinges are worn. Closing also features a resonant reverberation as the door snugly fits into the frame." +opening or closing car electric windows,"The sound event ""opening or closing car electric windows"" refers to the distinct mechanical and electronic noise produced when car windows are powered up or down using the vehicle's electrical system, typically involving motor whirring and glass movement against the seal.","A hand presses a button on a car door panel. The window glass slides smoothly up or down within its frame, with the whir of an electric motor accompanying the movement, altering the view from opaque to transparent or vice versa.","The sound of opening or closing electric car windows typically includes a low-pitched hum or whirring noise from the motor, a smooth, consistent mechanical sliding or rolling sound, and sometimes a soft thud or click when the window reaches its full open or closed position." +opening or closing drawers,"The sound event of opening or closing drawers typically involves a series of mechanical noises, including the pull and slide of drawers on their runners, often accompanied by a creak, thud, or click as they are fully opened or closed and secured in place. 
+","A sequence of images depicting a hand pulling handles to slide drawers open, revealing contents inside, followed by pushing them shut, creating a rhythmic sequence of wooden thuds and creaks, capturing the tactile essence of the action and its auditory accompaniment.","Opening or closing drawers typically involves sliding or rolling sounds, wood-on-wood or metal glides, and possibly a soft thud or click when the drawer is closed. The intensity can vary based on the force used and drawer contents, with potential rattling of items inside." +orchestra,"An orchestra is a large ensemble of musicians playing a variety of instruments, such as strings, brass, woodwinds, and percussion, typically led by a conductor. It performs intricate compositions, ranging from classical to contemporary pieces, creating rich, dynamic soundscapes.","Rows of seated musicians with various instruments—a blend of strings, brass, woodwinds, and percussion—focused on a conductor standing at a podium, baton in hand, energetically guiding the ensemble through a harmonious, dynamic performance on a grand stage with an attentive audience immersed in the music.","An orchestra sound event features complex layers of instruments including strings, woodwinds, brass, and percussion. It is characterized by harmonious melodies, dynamic ranges from soft to loud, varying tempos, and rich textures. The soundscape can be both densely orchestrated and punctuated by distinctive solo moments." +otter growling,"An otter growling is a vocalization made by an otter, potentially indicating aggression or discomfort. This guttural sound serves as communication within otter communities or as a warning to perceived threats.","An agitated otter's fur is bristled, its body tensed, with sharp teeth bared. 
It may be standing on its hind legs or crouched, emitting a low guttural growl towards a perceived threat, perhaps another animal or human, with eyes locked in a firm, defensive stance.","An otter growling typically produces a low-to-medium frequency rumble with a guttural quality, characterized by abrupt starts and stops. This sound may include gruff, throaty harmonics and can vary in volume and duration depending on the otter's size and behavioral context." +owl hooting,"Owl hooting is the haunting vocalization used by owls for communication. This distinctive call, typically performed at night, serves to establish territory, signal alarm, locate mates, or communicate with offspring, varying greatly among species in pitch, frequency, and pattern.","A silhouetted owl perches on a gnarled branch under a moonlit sky, its round eyes glowing, while the haunting ""hoo-hoo"" echoes through the tranquil forest, adding an eerie yet serene undertone to the nocturnal landscape.","Owl hooting typically features low-pitched, resonant calls with a distinct ""who"" sound. Hoots often have a rhythmic sequence and are used to communicate territorially or with potential mates, exhibiting a haunting quality that can echo through forested areas during the night." +parrot talking,"A parrot talking is a fascinating sound event where these vocal birds mimic human speech or sounds from their environment using their syrinx, often with surprising clarity and intelligence, reflecting extensive learning and social interaction capabilities.","A vibrant parrot perched on a branch or stand, tilting its head, with its beak open and colorful feathers ruffled, as musical notes or speech bubbles emanate from it to signify the mimicking of human speech in a dynamic and whimsical setting.","A talking parrot produces mimicked human speech with varying pitch and tone, often high-pitched and nasal. 
Speech may exhibit erratic rhythm and abrupt changes in volume, with occasional interspersed squawks, clicks, or whistles unique to avian vocalization." +penguins braying,"Penguins braying is a vocalization that resembles the sound of a donkey's bray, typically used by penguin species like the African and Gentoo penguins for communication within their colonies, often during mating rituals or as a contact call between mates and offspring.","A group of animated penguins stand amidst icy surroundings, necks stretched upwards and beaks open wide, as a chorus of honking noises similar to donkeys' brays fills the air, reverberating through the frigid Antarctic landscape.","Penguins braying resemble a chorus of short, loud, donkey-like honks or trumpet blasts, with repetitive, rhythmic patterns varying in pitch and intensity among individuals, often with background chatter of a bustling colony, and may include flapping or slapping sounds as birds move or interact." +people babbling,"""People babbling"" refers to the background noise created by a crowd of individuals talking simultaneously, often indistinguishable as a collective murmur or hubbub. It's a common sound event in social settings like parties, receptions, or public spaces where groups of people gather and converse.","A chaotic scene of multiple animated figures with open mouths, speech bubbles containing nonsensical symbols or ellipses, overlapping lines to suggest noise, and possibly furrowed brows or exaggerated expressions conveying confusion or lack of comprehension.","A cacophony of overlapping voices at varying pitches and volumes, with indistinct speech sounds, intermittent laughter, and the murmur of multiple conversations blending into a constant, unintelligible hum reminiscent of a crowded place like a party or busy restaurant." 
+people battle cry,"A ""people battle cry"" is a powerful, emotive shout used by a group to express unity and determination, often associated with rallying troops or sports teams to boost morale and intimidate opponents before or during a confrontation.","A fervent crowd brandishes weapons, faces contorted with passion. They raise clenched fists to the sky, roaring a unison chant that echoes with defiance, their bodies tense and poised for action, as banners ripple above this sea of resolute warriors, ready to surge forward at the call to arms.","A ""people battle cry"" typically features a loud, high-energy collective shout or roar, often with a rising intonation. There may be a unison of voices, conveying determination or aggression, possibly accompanied by the clashing of weapons or the sounds of movement. It's an intense, rallying vocal expression." +people belly laughing,"The sound event ""people belly laughing"" involves a group spontaneously erupting in deep, robust laughter, typically characterized by loud, unrestrained chuckling that comes from the diaphragm, often indicating amusement or joy amongst the participants.","A group of individuals with heads tilted back, mouths wide open in uncontrolled mirth, eyes crinkled or closed with tears of joy possibly forming, bodies convulsing or doubled over, hands on bellies, and unabashed expressions of pure amusement and joy.","A “belly laughing” sound event includes variable-pitch, rhythmic laughter, deep tones, and breathy gasps from diaphragm use. It features harmonic chuckles, sporadic snorts, background chatter, and may include clapping or slapping sounds." 
+people booing,"The sound event ""people booing"" is a collective vocal expression of disapproval or contempt, where a group of individuals emit a loud ""boo"" to show dissatisfaction, usually during public events, performances, or speeches.","A crowd with thumbs down, frowning faces, and open mouths, perhaps with accompanying ""boo!"" speech bubbles, to convey dissent and displeasure. Some individuals might have arms crossed or be shaking their heads, while the ambiance is tense and unwelcoming.","A sound event of people booing typically features a chorus of discordant vocalizations with low-pitched, elongated ""boo"" sounds, often varying in intensity and pitch, expressing disapproval or disappointment, and may include whistles or hisses, all superimposed over a background of general crowd noise." +people burping,"The sound event of ""people burping"" refers to the audible release of gas from the digestive tract through the mouth, commonly producing a characteristic belch noise. It can vary in volume and pitch, and while often considered a social faux pas, it is a normal physiological process.","A group of people with wide-open mouths and raised hands to their chests. Their faces show a mix of surprise and relief, as comic-style sound effect bubbles emblazoned with ""BURP!"" erupt from their mouths. Others nearby react with exaggerated disgust or laughter.","A burp typically exhibits a low to mid-frequency range, resonant quality, often with a brief, guttural rumble. The duration is short, and may contain tonal elements based on the shape of the vocal tract, and may vary in volume from soft to loud." +people cheering,"""People cheering"" is a sound event characterized by a group of individuals clapping, shouting, and making vocal expressions of joy, enthusiasm, or support, often encountered at sports events, concerts, or celebratory gatherings.","A throng of individuals is depicted with wide smiles, upraised arms, and open mouths in a dynamic scene. 
Some may be clapping, waving flags or banners, others high-fiving or embracing, reflecting an atmosphere of joy and enthusiasm amidst a vibrant background noise of applause and shouts.","Cheering involves rhythmic clapping, whistles, shouts, and high-intensity vocalizations. It includes variations in pitch and volume, with a crescendo of noise as excitement builds. This sound event typically has a broad frequency range due to diverse voices and acoustics of the environment." +people clapping,"People clapping is a common sound event characterized by the repeated, rhythmic noise created when a group or an individual percussively slaps their hands together, often as a gesture of applause or to show appreciation, approval, or enjoyment in social gatherings, performances, and celebratory contexts.","A crowd of individuals with smiling faces, a variety of open hands coming together in repeated motion amidst a scene of appreciation, celebration, or approval, possibly accompanied by cheering expressions and an atmosphere of excitement.","People clapping produces a series of sharp, percussive sounds with variable intensity and rhythm, often synchronous, creating a crescendo and decrescendo, depending on the number of participants and their enthusiasm. The claps can blend into a consistent applause or be distinct individual sounds." +people coughing,"""People coughing"" is a common sound event characterized by explosive exhalations from the throat, often a reflex to clear the airway or a symptom of illness. 
This distinctive noise varies in intensity, duration, and frequency, easily recognizable and sometimes contagious in group settings.","A group of individuals are depicted with hands over their mouths or tissue in hand, expressions of discomfort on their faces, with sound lines or musical notes indicating coughing emanating from them, possibly surrounded by concerned onlookers or a medical setting backdrop.","A ""people coughing"" sound event typically features sporadic, abrupt expulsions of air from the throat, producing a harsh, sometimes guttural noise. Accompanying sounds can include breathy wheezing and throat clearing, with volume and pitch varying based on individual and the intensity of the cough." +people crowd,"A ""people crowd"" sound event encompasses the collective noise produced by a gathering of individuals, typified by a mixture of speech, laughter, movement, and potentially other associated sounds like clapping or footsteps, creating a buzzing atmosphere indicative of social activity or communal presence.","A dense gathering of individuals fills a space, with bodies close together, faces blending into a sea of heads. The collective chatter, laughter, and murmurs create a buzzing atmosphere, signaling a lively social event or a busy public place.","A ""people crowd"" sound event features a blend of overlapping conversations, individual voices, laughter, footsteps, occasional shouts or claps, and the general murmur of activity, creating a lively and dynamic auditory environment often characterized by varying pitch and volume levels, with indistinct language content." 
+people eating,"The sound event ""people eating"" encompasses the array of noises made by individuals while consuming food, such as chewing, crunching, swallowing, utensil clinking, and occasional talking or sighing, contributing to a multifaceted auditory experience of a communal or individual meal.","A graphic depicting a group of individuals seated around a table filled with food, heads inclined towards plates, with lines or musical notes emanating from their mouths to symbolize the sounds of chewing, munching, and utensils clinking against dishes.","Sound of chewing, crunching, lip-smacking, swallowing, utensil clinks, occasional talking or murmuring, possible slurping, and the rustle of napkins or packaging." +people eating apple,"The sound event ""people eating an apple"" involves crunching and chewing noises made as individuals bite and masticate the firm, juicy flesh of apples, often characterized by crisp, repetitive biting sounds followed by softer, wetter sounds of chewing.","A group or individual is depicted with apples in hand, biting into the crisp fruit. The image might capture the moment of teeth sinking into the apple's flesh, accompanied by the characteristic crunching sound, with expressions of enjoyment or refreshment on their faces.","The sound event of people eating an apple typically involves a crisp, sharp bite accompanied by the crunching noise of teeth breaking through the flesh, followed by muffled chewing and occasional squelching as the juicy fruit is masticated." 
+people eating crisps,"The sound event ""people eating crisps"" involves the audible crunching and rustling typically associated with individuals consuming crispy snack foods like potato chips, characterized by a series of repetitive, high-pitched crackling noises interspersed with the softer sounds of hand and bag movement.","A waveform with regular spikes corresponding to the sharp, high-pitched crunching noises, interspersed with soft rustling from hands reaching into crisp bags, against a backdrop of muffled, irregular chewing sounds.","The sound event ""people eating crisps"" typically features repetitive, sharp crunching noises with varying intensity, along with possible rustling of packaging and intermittent chewing or smacking sounds. Frequencies are often high due to the brittleness of the crisps." +people eating noodle,"The sound event ""people eating noodles"" involves auditory cues such as slurping, chewing, and the clinking of cutlery on bowls, capturing the essence of individuals consuming this popular dish, often associated with Asian cuisine and communal dining experiences.","A group of individuals huddled over bowls, slurping strands of noodles with chopsticks or forks, brows furrowed in concentration, cheeks moving while chewing, steam rising from the hot broth, and the occasional satisfied sigh or smile exchanged over the comforting meal.","Chewing sounds, slurping, intermittent sucking noises, occasional lip-smacking, and maybe the clink of utensils against a bowl, or quiet background conversation if in a social setting." +people farting,"""People farting"" refers to the natural release of intestinal gases through the rectum, producing a variety of sounds from quiet puffs to loud trumpets, often accompanied by a characteristic odor. This bodily function is a normal result of digestion and the breakdown of food in the gut.","A group of individuals stand with comical, embarrassed expressions. Some are blushing while others laugh awkwardly. 
A few are frozen mid-action, clenching their stomachs. Diverse cartoon-style puffs of gas escape from behind each person, with wavy lines indicating the dispersal of the sound.","The sound event ""people farting"" typically features short-duration bursts of low to mid-frequency flatulence sounds, which can vary from soft, quiet releases to loud, resonant expulsions, often accompanied by a range of pitches and possibly resulting in a humorous or embarrassing social reaction." +people finger snapping,"A ""people finger snapping"" sound event typically involves one or more individuals producing sharp, rhythmic clicking noises by briskly pushing their thumb against one or more fingers, usually the middle finger, creating a sound that is often used in musical contexts or as a non-verbal communicative gesture.","A group of individuals with extended arms and raised hands is captured mid-motion, their fingers executing a brisk pinch and release motion. An animated ripple or a small burst of lines emanates from the fingertips, visually manifesting the sharp, rhythmic ""snap"" that punctuates the air.","A finger snap produces a sharp, high-pitched clicking noise, with a short attack and quick decay. The transient sound often has a rich timbre due to the mix of frequencies, and the volume can vary from soft to moderately loud, depending on the force of the snap and the acoustics of the environment." +people gargling,"The sound event ""people gargling"" involves individuals swishing liquid in their throats, typically water or mouthwash, creating a bubbling and swishing noise as air passes through the liquid to clean or soothe the throat.","A group of individuals tilts their heads back, mouths open, liquid swishing visibly inside. Their cheeks are puffed out, eyes squinted in concentration, as the echoing, bubbly noise of gargling resonates. 
Some might hold bottles or cups, indicating the source of their rinse.","The sound of people gargling involves bubbling and liquid agitation sounds, often rhythmic with a gargle cycle, interspersed with muffled vocalizations. It varies in pitch and has a resonant quality due to mouth cavity effects." +people giggling,"""People giggling"" refers to the sound event characterized by light, repetitive, vocal laughter, often shared amongst individuals in response to humor, joy, or social interaction. This high-pitched, contagiously cheerful noise signifies amusement and can signal bonding and positive emotional connections among humans.","A group of individuals with wide smiles, their heads thrown back in mirth, eyes sparkling, and perhaps holding their stomachs or slapping their knees, as laughter ripples through the air, embodying a sense of joy and shared amusement.","High-pitched, irregular, spontaneous sounds characterized by short, repetitive bursts, varying in pitch and rhythm, frequently conveying light-heartedness or amusement, and often accompanied by breathy exhalations." +people hiccup,"The sound event ""people hiccup"" involves a quick, involuntary diaphragm contraction followed by the vocal cords snapping shut, creating a distinctive ""hic"" noise, often triggered by eating too quickly, excitement, or digestive disturbances. Hiccups are usually harmless and temporary.","A diverse group of individuals suddenly clutching their chests or throats, faces contorted in surprise or mild annoyance, as intermittent, sharp ""hic!"" sounds punctuate the air, with some possibly holding a glass of water or a spoonful of sugar in attempts to quell the spasms.","Hiccup sounds typically feature irregular, spasmodic, sharp inhalation noises followed by abrupt glottal stops, creating a characteristic ""hic"" or ""hiccup"" sound. The timbre may vary among individuals, but the pattern is usually distinctive and recognizable." 
+people humming,"""People humming"" refers to the sound event where individuals produce a consistent, musical tone by vocalizing with closed lips, creating a soothing, resonant noise often used in music or as a calming activity.","A group of individuals with closed or slightly parted lips, heads tilted upward, eyes perhaps closed in concentration, possibly swaying gently, fills the space with a soft, musical drone emanating from their throats—a harmonious blend of various pitches and tones creating a resonant hum.","The sound event ""people humming"" typically features a steady, tonal drone with a warm, resonant quality. Humming consists of voiced, mouth-closed sounds that vary in pitch and volume based on the number of individuals and their vocal ranges, producing a harmonious or layered auditory texture." +people marching,"A sound event ""people marching"" is characterized by rhythmic footsteps in unison, often accompanied by chants or cadences, typically signifying coordinated movement by a group for a demonstration, parade, or military drill.","A group of individuals stride in unison, their feet thudding rhythmically against the ground. Banners may be held aloft, and the determined expressions on their faces are evident as they move forward together with a shared purpose or cause. Signs and chanting may accompany their march.","The sound of people marching features rhythmic footsteps synchronizing on hard surfaces, occasional shuffling of feet, murmur of voices or commands, periodic heavier thuds from boots, and potential accompanying sounds of gear or instruments if it's a military or band procession." 
+people nose blowing,"The sound event ""people nose blowing"" refers to the audible noise produced when an individual clears their nasal passages by forcefully exhaling through the nose, often into a tissue, typically associated with relieving nasal congestion or clearing mucus.","A group of individuals are depicted with tissues pressed to their faces, some have reddened noses, furrowed brows showing discomfort. Their cheeks are inflated while they expel air forcefully through their nostrils, possibly during cold or allergy season.","The sound event of ""people nose blowing"" typically involves a forceful, snorting expulsion of air through the nostrils, which can vary in pitch and volume but often has a resonant, honking quality with possible muffled, wet sounds if the nasal passage is congested." +people running,"The sound event ""people running"" encapsulates the rhythmic pounding of footwear against a surface, with varying intensities depending on speed and the number of individuals, often accompanied by associated noises like breathing, voices, and clothing rustle.","A chaotic scene depicts diverse individuals in various states of motion—sprinting, darting forward, faces etched with urgency or fear—conveying a rush of movement, perhaps with blurred lines suggesting their swift paces against a dynamically composed backdrop signaling speed and haste.","Rapid, rhythmic footsteps; varying intensities depending on the surface; syncopated breathing sounds; possibly clothing rustle and vocal exclamations; fluctuating pace and volume as runners move towards or away." +people screaming,"""People screaming"" is a sound event characterized by loud, often high-pitched vocalizations, typically reflecting fear, excitement, or distress. 
It can occur in various contexts, ranging from enjoyment at events to reactions to danger or emergency situations, signaling the need for attention or help.","A chaotic scene with open-mouthed individuals, faces contorted in fear or panic, hands possibly raised to their ears or flailing, with waves or lines emanating from mouths to symbolize the shrillness of their screams.","“Screaming” features high-pitched, loud, shrill human vocal tones with varying frequencies and chaotic modulations, indicating fear, pain, excitement, or alarm. It lacks harmony, with discordant, overlapping cries and brief silences followed by intense screeches." +people shuffling,"""People shuffling"" refers to the soft, rustling noise created when individuals move their feet across a surface without lifting them completely, often heard in quiet, crowded spaces like libraries or lecture theatres.","A crowded room depicted with blurred feet and indistinct figures, moving in a disjointed rhythm, their steps a muted cacophony on a soft carpet or a hard floor, suggesting the hustle of a busy, confined space where individuals are in motion, perhaps queuing or navigating a congested area.","A sound event characterized by soft, intermittent rustling or dragging noises, with variations in tempo and intensity as people's feet lightly brush or scrape against a floor surface. This repetitive sound is generally low-pitched, with a non-rhythmic pattern that reflects the movement of a crowd or individual through a space." +people slapping,"The sound event ""people slapping"" is characterized by the sharp, percussive noise produced when a person's open hand forcefully hits the body of someone else, often resulting in a loud smack indicative of physical conflict or disciplinary action.","A sequence of cartoon-like figures stands in a line, arms extended, with hands connecting in a slap to the next person's cheek. Bold lines indicate movement while ""SMACK"" sound effects are visibly highlighted. 
Facial expressions range from surprise to comedic exaggeration, conveying the chaotic yet humorous nature of the scene.","“Slapping” produces a sharp, high-frequency sound at contact, followed by a lower thud if hitting a body. It has a quick decay and minimal reverberation unless in an enclosed space, with possible additional sounds from object impact or reactions." +people slurping,"""People slurping"" refers to the audible suction noise made when someone draws liquid, typically a soup or noodle broth, into their mouth with an intentional, continuous inhalation, often considered rude in Western dining etiquette but accepted in some cultures as a sign of enjoying the meal.","Individuals are depicted with heads tilted, lips puckered, intently sucking up liquids through straws or directly from bowls, eyes possibly closed in satisfaction. Echoing lines or musical notes may illustrate the ambient ""slurping"" noises in the scene.","The sound of people slurping typically features intermittent, wet, suction noises as liquid is rapidly drawn past the lips, often accompanied by airy, gurgling sounds when air mixes with the liquid and resonates in the mouth and throat, creating a distinctive aural signature of consumption and savoring." +people sneezing,"Sneezing is a reflex to nasal irritation, often from allergens or illness, involving a forceful expulsion of air and droplets with a distinctive “achoo” sound. It naturally clears nasal irritants.","An illustration of multiple individuals with eyes closed and mouths open in a mid-sneeze expression. Some are covering their noses with tissues, elbows bent to shield their faces, while others are unguarded. Fine spray droplets fan out around them. Expressions of surprise or discomfort are common on bystanders' faces.","A sneeze produces a sharp, explosive burst of air often preceded by inhaling and followed by characteristic sounds from the mouth and nose. 
It may include vocalizations like ""achoo,"" multiple sequential sneezes, and variations in pitch and loudness depending on the individual." +people sniggering,"""People sniggering"" refers to the sound of one or more individuals emitting a suppressed, quiet laugh, often indicative of amusement, irony, or mockery in a discreet or half-suppressed manner.","A group of individuals are depicted with smirks and raised eyebrows, secretly chuckling to each other. One may be covering their mouth to stifle laughter, while their eyes gleam with amusement, subtly indicating their shared joke or ridicule. Their body language suggests a communal, mocking secrecy.","Low-volume, stifled laughter characterized by brief, subdued chuckles or nasal intonations suggests people are trying to conceal their amusement or sarcasm without drawing attention." +people sobbing,"""People sobbing"" is a sound event characterized by the audible expression of deep sorrow or emotional pain. This phenomenon often involves a series of loud, convulsive inhales and exhales, with tears frequently accompanying the distinctive crying sounds.","An image captures individuals with downturned mouths, tears streaming down their cheeks, and pained expressions. Some might be embracing, offering comfort, or burying their faces in hands, while others stare forlornly into the distance, their eyes red and puffy, shoulders shaking with each heavy sob.","Auditory features of people sobbing include intermittent, uneven breaths; quiet to loud weeping sounds; sniffles; and whimpers. Vocalizations may vary in pitch and intensity, often overlaid with trembling or quivering tones indicative of distress. Sounds may be rhythmic or erratic in pacing." +people whispering,"People whispering refers to a soft, hushed conversational sound, characterized by quiet, breathy vocalization. It is typically associated with privacy, secrecy, or the need to remain undetected. 
Whispering reduces the volume and energy of speech sounds, making it harder to overhear.","A cluster of individuals lean in closely, heads almost touching, mouths near ears. Their expressions hold a mix of secrecy and urgency, with fingers pressed to lips, and eyes darting. The background fades, emphasizing the hushed, conspiratorial atmosphere the noisy whispers create.","People whispering typically involves soft, hushed vocalizations with a breathy quality and minimal vocal fold vibration, resulting in low volume and high-frequency hissing or rustling sounds that convey speech in a subdued manner, often perceived as private or covert communication." +people whistling,"Whistling involves creating a clear, high-pitched tone by blowing air through puckered lips. It’s used for signaling, expressing cheerfulness, or gaining attention. Whistling conveys tunes and rhythms, serving as a form of non-verbal communication and musical expression.","A diverse group of individuals stands scattered, some with heads tilted back, others with eyes closed, all puckering their lips. Their cheeks are ballooned with exerted breath, creating a chorus of high-pitched tones while their hands are casually tucked in pockets or swinging by their sides.","High-pitched, clear-tone, melodious or tuneless variations, can be rhythmic or sustained, may include multiple pitches if multiple individuals are whistling, incorporates breath control, sometimes airy or with vibrato; volume ranges from soft to piercing based on intensity and number of participants." +pheasant crowing,"Pheasant crowing is a distinctive, loud call typically made by male pheasants during the mating season to establish territory and attract females. 
The sound is a series of rapid, repetitive notes, often described as a coarse, fluting crow or kok-kok-kok chorus, echoing through rural landscapes especially at dawn.","A colorful pheasant stands on a rustic wooden fence at dawn, its beak open mid-call, as morning mist blankets the rolling countryside, and the first rays of sunlight peek over the horizon.","A pheasant crowing typically emits a short, loud, repetitive call. The sound often starts with a rapid, staccato note, followed by longer, clearer notes that descend in pitch. The timbre is somewhat harsh and nasal, carrying well across open fields, characteristic of early morning and late afternoon." +pig oinking,"A pig oink is a distinctive, guttural noise produced by pigs, serving as communication that varies in pitch and duration, often indicating hunger, contentment, or social interaction.","A plump pig with a pink or muddy complexion stands in a sty or farmyard, its snout raised and mouth open, as it emits a distinctive ""oinking"" noise, perhaps accompanied by other pigs or amidst a farming backdrop with barns, mud, and troughs.","A pig oinking produces a distinctive series of grunting sounds, which can vary in pitch and volume. These vocalizations are often nasal and repetitive, with abrupt starts and stops, creating a rhythmically irregular pattern. The sounds can range from low, guttural tones to higher-pitched squeals." +pigeon cooing,"The sound event ""pigeon cooing"" refers to the soft, throaty call typical of pigeons, often heard in both urban and rural settings. 
This repetitive vocalization plays a role in communication, especially in courtship and signaling presence within their territory.","Early morning light dapples a cobblestone square where a flock of grey pigeons pecks at scattered seeds, their gentle coos echoing softly as they flutter and prance around an old, gently bubbling stone fountain, with a few birds perched on the rim, heads tilted, serenading the quiet sunrise.","Pigeon cooing is characterized by soft, throaty coos or murmurs consisting of repeated, rhythmic patterns with a low frequency, often with a soothing and gentle tone, typically perceived as a form of avian communication or territorial presence, commonly occurring during the early morning or late evening hours in urban or wooded areas." +planing timber,"""Planing timber"" is the process of shaving wood to a desired thickness or smoothness using a tool called a plane. As the plane glides along the wood surface, it creates a characteristic swishing and scraping sound, often accompanied by the rhythmic shavings that curl from the timber.","A skilled woodworker pushes a hand plane across a wooden plank's surface, shavings curling up as the sharp blade smooths the wood, generating a rhythmic, satisfying scrape that echoes through a sawdust-scented workshop.","High-pitched whirring, rhythmic buzzing and cutting noises, occasional scraping sounds, and wood chips' rustle; the sound intensity fluctuates with the tool's movement through the wood grain." +plastic bottle crushing,"The sound event ""plastic bottle crushing"" is characterized by a distinctive crunching or cracking noise produced when a plastic bottle is squeezed or compressed, often resulting in deformation or breakage of the bottle and creating a sequence of sharp, crinkling sounds.","A hand compresses a translucent plastic bottle, causing it to crumple with sharp creases forming. 
The bottle's structure gives way with a crunch, as jagged lines spread where the material folds, and the typically smooth surface becomes a chaotic array of distortions reflecting light irregularly.","Crackling, popping sounds of varying pitches, brief in duration; crescendo of scrunching noises as plastic deforms; possible air whoosh if bottle is sealed; ends with softer crinkles as material settles." +playing accordion,"The sound event ""playing accordion"" involves the melodic and rhythmic manipulation of a portable keyboard wind instrument, producing music through the expansion and compression of bellows paired with key or button presses to control pitch. It is characterized by its rich, full, and often resonant sound.","A person stretches and squeezes an accordion, fingers pressing keys and buttons. Bellows flex rhythmically, emitting melodic tones. The environment may reflect a folk or festive setting, with listeners enjoying the dynamic, lively music often associated with cultural dances or social gatherings.","The sound event of ""playing accordion"" features a rich, harmonic melody with variations in volume and pitch, characterized by the wheezing of bellows and the clicking of keys or buttons, producing a vibrant, often rhythmical, resonant sound that can convey a range of musical styles from folk to classical." +playing acoustic guitar,"Playing an acoustic guitar involves strumming or plucking its strings to produce melodious sounds with a warm, rich resonance characteristic of its hollow wooden body, used across various music genres for rhythm and lead instrumentation.","A person with a relaxed posture cradles an acoustic guitar, fingers gracefully plucking or strumming the strings. Soft, warm lighting enhances the intimate setting, possibly with music notes subtly floating in the air to suggest the melody emanating from the instrument.","Playing acoustic guitar involves strumming or plucking to produce resonant chords and harmonic overtones. 
The sound varies with technique: soft, mellow tones for fingerpicking and crisp, rhythmic sounds for strumming. It features a warm, wooden reverberation and dynamic volume levels." +playing badminton,"The sound event ""playing badminton"" is characterized by rhythmic swooshing as shuttlecocks cut through the air, punctuated by sharp strikes from rackets hitting the shuttlecock, occasional footwork shuffles, and player exclamations during energetic rallies.","A kinetic scene with the rhythmic swishing and popping sounds as a shuttlecock is hit back and forth, accompanied by the movement of agile players lunging and leaping with rackets in hand, their focus sharply tuned to the flying object against a backdrop of a net and court lines.","Playing badminton features the sharp “thwack” of the shuttlecock hitting racquets, the soft fluttering as it flies, and occasional shoe squeaks on the court. Players’ light footwork is accompanied by claps or shouts from observers." +playing bagpipes,"The sound event ""playing bagpipes"" involves producing music through a wind instrument comprised of air-filled bags and pipes. Blown by mouth or bellows, bagpipes emit a resonant, continuous drone accompanied by a melodic line, often associated with Scottish and Irish cultural traditions.","A person stands, puffing cheeks, fingers dancing on chanter pipes as tartan kilt sways, with the ballooning bag underarm, and drones extend over the shoulder; the haunting, sonorous drone of the bagpipes fills the air.","Playing bagpipes involves a droning bass from the air-filled bag, overlaid with a high-pitched melody from the chanter. This creates a unique, resonant sound with ceremonial or mournful qualities, featuring distinctive volume and pitch variations in traditional or martial tunes." 
+playing banjo,"""Playing banjo"" refers to the act of performing music with a banjo, a stringed instrument featuring a distinctive twangy tone, played using fingerpicking or strumming techniques, often associated with folk, country, and bluegrass genres.","A person sits on a porch, fingers plucking at a banjo's strings, notes twanging rhythmically. Nearby, folks tap their feet, a dog lies dozing, and the air carries the warmth of a setting sun.","Playing banjo produces bright, twangy tones with rapid finger-picking or strumming. It features metallic string plucks, a resonating sound chamber, and occasional fret buzz. The music often follows a rhythmic, melodic, and syncopated pattern, with pitch and dynamics varying by style and technique." +playing bass drum,"The sound event ""playing bass drum"" is characterized by deep, resonant beats when a drummer strikes the drum with a mallet, producing a powerful, low-pitched percussion rhythm foundational to music genres like rock and orchestral compositions.","A musician with mallets striking the large, resonant head of a bass drum, creating deep, rhythmic booms. The vibrations are visually depicted by concentric sound waves emitting from the drum, illustrating the pulsating energy of the beat.","Playing a bass drum produces a deep, resonant thump with a low-frequency tone. The sound has a strong, palpable attack with a brief sustain and quick decay. It can vary in pitch and loudness based on drum size, tension of the drumhead, and striking force. Vibrations are felt physically." +playing bass guitar,"Playing bass guitar involves plucking or slapping strings to produce deep, rhythmic low-pitched sounds critical to the harmony and groove in various music genres, from rock and jazz to funk and metal.","A person with their fingers skillfully plucking or slapping the thick strings of a bass guitar, sending rhythmic vibrations as the deep, resonant tones provide the groovy foundation for a song. 
Waves emanate from the guitar's body, symbolizing the rich, reverberating sound filling the space.","Deep, resonant tones; plucking or picking of strings; varying pitch; rhythmic strums; potential for fret noise; amplification buzz; sustain and decay of notes; potential slapping and popping sounds in certain playing styles." +playing bassoon,"""Playing bassoon"" involves a musician producing rich, deep tones by blowing air through a double-reed attached to a long, wooden wind instrument, often used for orchestral, chamber, or solo performances, providing a distinctive, resonant sound that can range from somber to lively.","A musician sits, holding the long, wooden bassoon vertically, fingers moving deftly over the silver keys while their cheeks puff slightly and air flows through the double reed, producing a deep, resonant melody that fills the room with its rich, warm tones.","Playing bassoon creates a deep, reedy timbre with warm tones, ranging from soft, mellow notes in the lower register to bright, edgy sounds in the higher octaves. Dynamics vary from gentle murmurs to robust blasts, with pitch controlled by fingerings and breath." +playing bongo,"Playing bongo involves rhythmically tapping hand-held drums with fingers and palms, producing a variety of rich, resonant tones used in Afro-Cuban, jazz, and world music.","A person sits with a pair of bongo drums between their knees, hands tapping rhythmic patterns on the drumheads while they sway to the beat. The background may feature vibrant colors or a cozy setting, emphasizing the lively and casual atmosphere of the music session.","Rhythmic tapping, varying pitch based on hand position, soft thuds, resonance of hollow drum bodies, potential for rapid successions or slow sequences, syncopated patterns, potential for hand-slapping sounds, and subtle background buzzing from drum skin vibration." 
+playing bugle,"The sound event ""playing bugle"" involves the performance of a tune or signal on the bugle, a brass wind instrument used in military and ceremonial contexts, known for its clear, piercing tone and lack of valves, which produces notes through the player's embouchure and breath control.","A person in uniform stands at attention, bugle pressed to lips, filling the air with solemn notes. A flag might ripple in the background, with a focused or emotive expression on the bugler's face, suggesting a ceremonial or military setting.","The sound of a bugle playing typically features clear, resonant brass tones with a strong, piercing timbre capable of carrying over long distances. It consists of a melodious series of notes often characterized by military or ceremonial motifs, played in a staccato or legato style depending on the context." +playing castanets,"Playing castanets involves creating rhythmic clicking sounds by snapping together pairs of concave shells, typically made of wood. As a traditional percussive instrument, they are prominent in Spanish music and dance forms like flamenco, where they accentuate the rhythm with their distinctive, resonant clatter.","A pair of hands skillfully clapping together small, concave shell-like percussion instruments, creating rhythmic clicking sounds. The instruments are often associated with flamenco dancing, vibrant Spanish music, and traditional performances, where dancers often accompany their steps with the sharp, staccato beats of the castanets.","The sound event of ""playing castanets"" is characterized by sharp, clicking, or clacking sounds with a rhythmic pattern that varies in tempo and intensity, often associated with flamenco music, displaying a crisp staccato effect produced by wooden shells being struck together in the hands of the performer." 
+playing cello,"The sound event ""playing cello"" involves the resonant production of rich, deep tones by drawing a bow across the strings of a cello, a large stringed instrument. The musician skillfully manipulates the strings and bow to create expressive melodies and harmonies characteristic of classical and contemporary music.","A musician's poised fingers dance along the strings of a cello; the bow elegantly glides as rich, deep tones resonate. The player is in a focused trance, immersed in the rhythmical sway of the melody, expressing a harmonious blend of passion and discipline in every stroke.","The sound of playing a cello consists of rich, deep, and resonant tones with a warm timbre. It includes the smooth bowing across strings, varying dynamics from soft to loud, and occasional fingering noises as fingers press and release the strings, creating a melodious and expressive musical experience." +playing clarinet,"Playing clarinet is the act of producing music through a woodwind instrument using a single-reed mouthpiece, manipulating finger holes and keys to vary the pitch, and breath control for dynamics and tone, creating a warm, rich sound across various genres from classical to jazz.","A musician with pursed lips, fingers gracefully dancing on silver keys, raises a sleek, black clarinet to their mouth, eliciting soulful, woody tones. Swirling musical notes float in the air around them as the melody unfolds.","When playing clarinet, you hear a smooth, resonant woodwind tone with a reedy quality, melodic lines with a potential range from warm, rich lower registers to bright, piercing higher notes, accompanied by the subtle clicking of keys and occasional breath intake sounds from the player." +playing congas,"Playing congas involves rhythmically striking tall, single-headed drums with hands, creating diverse sounds essential to Latin and Afro-Caribbean music. 
Different drum areas produce varied tones, forming intricate patterns and rich harmonies that drive tempo and embellish melodies.","A person seated with a pair of conga drums between their legs, rhythmically tapping and slapping the drumheads with their hands, creating vibrant percussive beats, often accompanied by lively music or a band, evoking a joyful and energetic atmosphere.","Playing congas produces rhythmic tapping and deep, resonant tones with pitch variation depending on hand placement and drum size. The sound includes slaps, open tones, and bass tones, characterized by warm, round acoustic textures and distinct percussive patterns reflective of Afro-Cuban origins." +playing cornet,"The sound event ""playing cornet"" entails the production of musical notes through the brass instrument called a cornet, which is similar to a trumpet but with a mellower tone. It involves the vibration of lips and manipulation of valves to create melodic and harmonic phrases.","A musician holds a brass cornet to their lips, cheeks puffed, fingers deftly pressing valves. Smooth golden tones flow amidst a backdrop of nodding heads and tapping feet, evoking a cozy ambiance of a jazz club with soft lighting, intimate seating, and an audience immersed in the warmth of the melody.","Playing a cornet typically involves melodic brass tones, varying dynamics from soft to loud, a clear attack at note onset, a warm, rich timbre, with possible vibrato, and a resonance characteristic of metal wind instruments. Breath sounds and valve clicks may be audible between notes." +playing cymbal,"Playing cymbals involves striking two large, concave brass plates together, which produces a loud, sustained, clashing sound. 
Used in music for dramatic emphasis, they range in sound from gentle taps to powerful crashes, essential in orchestras, bands, and ceremonial events for their rhythmic and accentuating effects.","A pair of brass plates held by straps are clashed together by a musician, creating a bright, penetrating crash that reverberates, with golden ripples visually depicting the sound waves emanating from the point of impact.","Metallic resonance, sharp attack, sustained shimmering decay, varying pitch depending on strike location and intensity, complex overtones, possible crescendo or diminuendo effect, and potential undertones of clashing if played together with other cymbals or percussive elements." +playing darts,"""Playing darts"" involves players throwing small, sharp-tipped missiles at a circular target (dartboard) fixed to a wall, aiming to hit specific marked areas for varying points, combining skill, precision, and often social competition.","In a dimly lit pub, focused individuals stand at a line, throwing small, sharp projectiles at a circular target hung on the wall. Spectators sip drinks, observing as darts punctuate the board with thuds amidst casual laughter and the murmurs of friendly competition.","The sound of playing darts typically includes the soft thud of darts striking a sisal fiber dartboard, faint rustling as players retrieve darts, occasional metallic clicking from contact with wire dividers, and the background chatter or cheers of onlookers reacting to the players' performance." +playing didgeridoo,"The playing of the didgeridoo involves producing a deep, resonant drone by vibrating lips and using circular breathing, allowing for continuous sound flow from this indigenous Australian wind instrument, typically made from hollowed-out eucalyptus trunks.","Sitting with focused determination, a person uses circular breathing to play a wooden didgeridoo. The instrument emits hypnotic, droning vibrations that captivate listeners. 
Decorated with Aboriginal patterns, it evokes the Australian outback, as haunting sound waves visually undulate through the air.","A didgeridoo produces a deep, resonant, droning sound with rhythmic variations and overtones. It can also include vocalizations and rhythmic patterns made by the player's tongue and breath control, adding complexity to the drone." +playing djembe,"Playing djembe involves rhythmically striking an African drum, typically with the hands, to create a variety of tones. It's a dynamic sound event characterized by energetic, pulsating beats that are integral to West African music and are used in ensembles or solo performances to evoke emotions and tell stories.","Seated, a person rhythmically taps a goblet-shaped djembe with swift hand strokes, producing vibrant, resonant beats. The drum’s skin visibly vibrates with each impact, creating an ambiance of musical energy, while onlookers clap or move to the rhythm.","A djembe produces rhythmic thumping and resonant slaps, with a deep bass tone when struck at the center and higher-pitched, crisp sounds around the rim. The hand-drumming sequences vary in tempo and complexity, creating a rich tapestry of percussive beats and vibrant African musical patterns." 
+playing double bass,"""Playing double bass"" involves a musician using a bow or fingers to produce deep, resonant tones from the largest string instrument in the violin family, vital in orchestras and jazz ensembles for its rich, sonorous sound that anchors harmonies and rhythm.","A musician stands, cradling a large wooden double bass between their legs, bowing gently across the strings, fingers deftly pressing the fingerboard, resonating deep, rich tones that fill the room with a warm vibrato, while the audience listens intently to the soulful expression of the upright bass's sonorous melody.","Deep, resonant tones; low frequency rumble; rich harmonic overtones; varied dynamics from soft to forceful; intermittent plucking or consistent bowing sounds; woody timbre; string vibration and finger movement noise; subtle squeaks during position shifts." +playing drum kit,"""Playing drum kit"" refers to the act of creating rhythm and beats by striking various percussion instruments like snare, bass drums, cymbals, and toms, typically in musical performances, using hands or drumsticks.","A person sits behind a set of drums, sticks in hand, striking the snare, toms, and cymbals rhythmically, with foot pedals thumping the bass drum, all resonating in a synchronized beat, conveying a vibrant and energetic musical performance.","The sound event ""playing drum kit"" features rhythmic percussive impacts, varied pitches from deep bass of the kick drum to higher snare/toms, cymbal crashes, hi-hat clicks or shimmers, and potential dynamic range from soft taps to loud hits, often creating a tempo-setting backdrop for music." 
+playing electric guitar,"Playing the electric guitar involves strumming or plucking its strings, which creates vibrations amplified electrically to produce a distinct, rich sound that can be modified with effects for various genres, from rock and blues to jazz and metal.","Holding an electric guitar, one hand presses frets while the other strums or plucks strings, producing vibrant, amplified tones. Colorful sound waves symbolize the dynamic, powerful music, with the player often immersed in the performance’s intensity.","Strumming or picking strings produces sustained notes with varying pitch and timbre; possible use of distortion or effects yields a rich, textured sound; amplifier feedback and finger sliding on frets may be audible; rhythmic chord progressions and melodic solos with dynamic attack and decay characterize this sound event." +playing electronic organ,"The sound event ""playing electronic organ"" involves producing music by triggering electronic circuits or digital samples through a keyboard interface, emulating the tones of a traditional organ or creating new sounds, often used in various musical genres from classical to rock and electronic music.","A musician's hands dance across an electronic organ's multiple keyboards, fingers pressing keys to produce rich, layered tones. Cool, blue lights from the instrument's panel illuminate their focused expression, while foot pedals are worked in a rhythm, all against a backdrop of enthralled listeners swaying to the melodic waves.","Playing an electronic organ involves a rich tonal palette, layered harmonies, sustained chords, and dynamic volume fluctuations, with a potential range from deep bass to piercing high notes, often accompanied by the clicking of keys and occasional switching of register buttons or foot pedals during performance." 
+playing erhu,"The sound event ""playing erhu"" involves the emotive tones of a traditional two-stringed Chinese instrument, known for its mournful yet beautiful sound, often compared to a human voice. It is played with a bow and produces a distinctive, haunting music that deeply resonates with listeners.","A musician gracefully bows a slender, two-stringed erhu, fingers pressing into its long neck, producing soulful melodies. The curvaceous wooden body rests against the player's chest, as a backdrop of ancient Chinese architecture or a serene park scene enhances the poignant and expressive ambience of the traditional performance.","The sound of playing the erhu features a mellow, resonant tone with a distinctive vibrato, characterized by smooth bowing on two strings, producing sustained, sliding pitches, and sometimes rapid, staccato articulations, evoking a sense of traditional Chinese music." +playing flute,"Playing flute involves a musician blowing air across the mouthpiece of the instrument, manipulating finger holes or keys to produce melodious notes, creating a soft, ethereal sound that resonates with a warm or bright timbre depending on the technique and flute type used.","A serene image of a person with closed eyes, gently holding a flute to their lips, fingers poised elegantly on the keys. Soft, melodious notes float in the air, surrounded by tranquil scenery like a flowering meadow or a quiet forest with dappled sunlight filtering through the leaves.","Soft, melodic tones; breathy articulation; purity of pitch; occasional airy hisses during fingering; clear, sustained notes with vibrato; pitch variation with key presses; resonant harmonics; and gentle attack and decay of sound when starting and ending notes." 
+playing french horn,"The sound event ""playing French horn"" involves the production of rich, mellow tones from a brass instrument by buzzing lips into a mouthpiece, manipulating pitch with hand gestures inside the bell, and pressing rotary valves to alter the length of tubing the air travels through, creating a harmonious melody.","A musician with cheeks puffed, intensely focused, fingers deftly pressing valves on a curving, golden brass french horn, producing rich, warm tones, amidst an orchestra setting or solo with sheet music on a stand, embodying classical elegance and sophisticated harmony.","Playing the French horn produces rich, warm tones, ranging from mellow lows to bright highs. It features smooth, legato articulation and can deliver majestic fanfares or delicate passages, characterized by its resonant sustain supported by circular breathing." +playing glockenspiel,"The sound event ""playing glockenspiel"" refers to the act of striking the tuned metal bars of a glockenspiel with mallets, producing a bright, resonant, and melodic percussion tone commonly used in orchestras and bands for its distinct, bell-like timbre.","A musician gently strikes the tuned metal bars of a glockenspiel with small mallets, producing clear, bell-like tones. The instrumentalist is focused, and the shimmering notes float through the air, accompanying a festive or orchestral scene.","The sound of playing a glockenspiel features clear, bright, and resonant tones with a metallic timbre. Each note strikes with a plinking sound that decays rapidly; the pitch is high and can vary depending on the size of the metal bars. It often creates a delicate, crystalline ambiance." 
+playing gong,"The sound event ""playing gong"" involves striking a large metal disc, creating a resonant, reverberating tone with a deep pitch used for musical, ceremonial, or signaling purposes, characteristic of its long sustain and shimmering quality.","A musician striking a large, shimmering brass gong with a mallet, creating a deep, resonant sound wave that visibly ripples through the air, while the audience watches in anticipation, feeling the vibration emanate from the instrument.","Playing a gong typically produces a deep, resonant tone with a sustained, reverberating sound that fades gradually. The initial strike can have a sharp attack if hit forcefully, followed by complex overtones that mellow out as the sound decays. Volume and pitch can vary based on gong size and striking technique." +playing guiro,"Playing the guiro involves stroking a ribbed percussion instrument with a stick, creating a raspy, rhythmic scraping sound commonly heard in Latin American music. The player varies pressure and speed to produce different tones and rhythms, adding texture to the musical ensemble.","A person uses a stick to rhythmically scrape along the ridged surface of a handheld cylindrical or gourd-like instrument (guiro), producing a distinctive percussive sound often used in Latin American music.","Playing the guiro produces a raspy, rhythmic scraping sound with variable pitch and intensity, depending on the stroke length and force. It exhibits a distinctive high-frequency, percussive pattern as the stick or tines rub against the instrument's grooved surface." 
+playing hammond organ,"""Playing the Hammond organ"" refers to the act of creating music using the distinctive Hammond organ, an early electric keyboard instrument known for its rich, harmonic tones and unique rotary speaker system, often heard in jazz, blues, rock, and church music.","A musician with expressive hands on a dual keyboard, feet on bass pedals, surrounded by a wooden, warm-toned Hammond organ, with spinning Leslie speakers imparting a rich, soulful vibrato to the bluesy, jazz-infused sound filling an intimate, dimly lit venue with an enraptured audience tapping their feet.","The sound of playing a Hammond organ is characterized by warm, rich tones with a distinctive rotating Leslie speaker effect, creating a swirl of harmonics and Doppler-like modulation. It often involves percussive key clicks, sustained chords, and the use of drawbars for dynamic tonal shifts." +playing harmonica,"""Playing harmonica"" involves a musician using their breath to create music by blowing and drawing air through reed chambers in a handheld harmonica, producing a distinctive, soulful sound with a wide range of tones and rhythms suited for genres like blues, folk, and rock.","A person's lips press against a small, metal reed instrument, fingers deftly adjusting its position. Cheeks puff rhythmically, eyes often closed in concentration, as soulful, bluesy notes spill forth in undulating waves, the harmonica's distinctive timbre filling the air with a heartfelt, melodic breathiness.","Playing a harmonica produces a series of clear, melodious tones with a reedy quality, often featuring bending notes and vibrato. The sound can vary from soft, haunting echoes to loud, piercing notes, characterized by breathy accents and rapid changes in pitch reflecting the musician's breathing pattern and techniques." 
+playing harp,"Playing a harp involves delicately plucking its strings, producing ethereal, resonant tones that can vary from soft, angelic whispers to vibrant cascading melodies, often evoking a sense of serenity and classical elegance.","A serene image of slender fingers gracefully plucking the strings of a golden harp, producing a cascade of soft, melodious notes, as soothing light filters through a peaceful setting, perhaps with elements of nature or an intimate, cozy interior space illuminated by warm, ambient lighting.","Plucking strings produces resonant, melodic tones with a soft, ethereal quality; there's a broad range of pitches depending on the strings played. Sustain and reverberation are noticeable as the harmonic vibrations linger after being plucked. Volume varies from gentle to dynamic based on the force applied to the strings." +playing harpsichord,"Playing the harpsichord involves creating music by pressing keys on a keyboard, which activates small plectra to pluck the strings inside the instrument, producing a bright, resonant sound distinctive to Baroque and Renaissance compositions.","An elegant room with baroque decor; a musician's poised fingers dance across the ivory keys of an ornate harpsichord, as the instrument's rich, plucked string notes weave through the air, mingling with the ruffle of sheet music and the warm glow of candlelight.","Playing the harpsichord produces a bright, metallic timbre with crisp, resonant tones that decay rapidly, creating a staccato effect. It has a distinct Baroque texture and lacks the dynamic range of a piano." 
+playing hockey,"Playing hockey is characterized by sounds of skates slicing ice, sticks clashing, pucks ricocheting off boards, players communicating, and occasionally the buzz of a goal horn.","An image of players gliding across an ice rink, sticks in hand, puck sliding over the ice, with the sharp sound of skates carving the ice, the swish of sticks, and the thump of the puck hitting the boards or goals.","Staccato of hockey sticks clacking, puck gliding on ice, players skating with sharp blade swooshes, boards rattling with body checks, whistle blows, crowd cheering, buzzer for period ends, goalie pads thudding from blocked shots." +playing lacrosse,"Playing lacrosse encompasses the swish of netted sticks passing the ball, the thud of rubber on turf, sharp referee whistles, and the shouts of players coordinating plays, celebrating goals, and colliding in athletic combat, all set against a backdrop of cheering spectators.","A dynamic scene: athletes cradling sticks, swiftly running, dodging across the field. Intermittent clacks of stick-on-stick contact mix with the sharp sound of rubber lacrosse balls being caught and shot at goal, accompanied by vibrant team shouts and the referee's whistle piercing through the rhythmic stomping of cleats.","Whistle blows, rapid footsteps, the thwack of sticks clashing, the crisp sound of a rubber ball being caught in the netted stick-head, players calling out to teammates, and the occasional cheer from onlookers as goals are scored or key plays are made." +playing mandolin,"""Playing mandolin"" involves creating music by strumming or plucking the strings of a mandolin, a small, pear-shaped stringed instrument with a distinctive, high-pitched, resonating sound, commonly associated with folk, bluegrass, and classical music genres.","An individual sits on a rustic wooden chair, fingers deftly plucking the strings of a mandolin. 
Soft, melodious tunes fill the air, accompanied by the gentle strumming that resonates with a folksy charm. The scene is warm, cozy, and imbued with a sense of traditional musicality.","Plucking or strumming strings produces resonant, bright, and twangy tones with a quick decay. Chordal or melodic sequences can be heard, often with a crisp, clean sound. Vibrato and tremolo may add variability, while fretting creates pitch changes and metallic finger slides." +playing oboe,"The sound event ""playing oboe"" involves producing rich, reedy musical tones through a woodwind instrument by blowing air through a double reed, which vibrates to create sound, executed with fingerings on various keys to alter pitch.","A musician plays the slender, wooden double-reed oboe, fingers moving across silver keys with focus. Soft, warm notes create a rich melody with lilting vibrations, immersing listeners in the oboe’s resonant, penetrating timbre.","The oboe produces a high-pitched, penetrating tone with a nasal quality and rich harmonics. Its reedy character allows for expressive articulation in both legato and staccato, dynamically ranging from soft whispers to bold, resonant blasts." +playing piano,"Playing piano involves creating harmonious sound by pressing keys which trigger hammers to strike strings inside the instrument, producing musical notes that can be combined into melodies and chords, integral to genres from classical to jazz.","A person sits at a piano, fingers gracefully dancing across black and white keys, sheets of music on a stand, soft light illuminating the instrument while notes seemingly float in the air, encapsulating the harmony and movement of a melodic performance.","Playing piano features melodic sequences, harmonic chords, the percussive strike of hammers on strings, varying dynamics from soft to loud, resonant decay of notes, and the mechanical sounds of keys and pedals being depressed and released, often with a sustain effect from the damper pedal." 
+playing saxophone,"Playing the saxophone involves producing rich, resonant sounds by blowing into a mouthpiece with a single-reed, while pressing keys to control pitch and tone on this brass woodwind instrument, often associated with jazz and classical music performances.","A person with a saxophone, fingers dancing on keys, cheeks puffed, and a burst of musical notes swirling around, set against a backdrop of soft, blue-toned lighting, creating a moody, jazz club atmosphere.","Playing saxophone produces a rich, resonant tone varying from mellow to bright. It involves breathy notes, reedy vibrations, occasional key clicks, dynamic range from soft whispers to piercing loudness, and expressive elements like vibrato, pitch bends, and versatile articulation characteristic of jazz, classical, or other musical styles." +playing shofar,"The ""playing shofar"" event involves blowing a traditional ancient musical horn typically made from a ram's horn and used in Jewish religious ceremonies, particularly during Rosh Hashanah and Yom Kippur, to create a range of blasts and tones that hold significant spiritual symbolism.","A person blows into a polished ram’s horn, the shofar, with puffed cheeks. The sound waves symbolize the rich, reverberating tones that fill the air during Jewish rituals or celebrations, conveying spirituality and cultural heritage.","The shofar, a traditional Jewish horn, produces a resonant, trumpet-like sound. It starts with a low, sustained tone that may rise to a higher pitch, characterized by its raw, vibrating, and primal timbre." +playing sitar,"The sound event ""playing sitar"" involves the resonant strumming and plucking of strings on the sitar, a classical Indian instrument characterized by its long neck, gourd body, and distinctive, complex, and melodious twang.","A serene setting with an individual gracefully plucking the strings of a sitar, surrounded by intricate tapestries, dim lighting, and the faint aroma of incense. 
Delicate, resonant notes fill the air, conveying a sense of tranquility and cultural richness.","The sound of playing a sitar involves resonant, twangy plucks accompanied by continuous, droning strings. It exhibits complex overtones and a distinctive buzz, often with intricate, melodic patterns and sliding pitches due to the use of frets and a variety of playing techniques unique to Indian classical music." +playing snare drum,"Playing a snare drum involves striking a drum with wires stretched across its bottom, producing a sharp, crisp sound. It's a central component in percussion sections for its rhythmic accents and is widely used in various music genres, from military marches to rock and jazz.","A snare drum image with tight, crisscrossed wires on the bottom, paired with drumsticks in mid-motion above, capturing rhythmic hits and vibrations, possibly amidst a musical performance setting with blurred background suggesting movement and energy.","A playing snare drum produces a sharp, crisp crack with a bright, high-pitched tone. It consists of rapid, staccato hits and buzzing rattle from the snares (metal wires) on the drum's underside. Volume levels can vary from soft taps to loud strikes." +playing squash,"Playing squash involves rapid movement on a court with sounds of a small rubber ball being struck by rackets, echoing thuds against walls, players' quick footsteps, and occasional grunts or calls between competitors.","A rapid succession of thuds and squeaks echoes in a confined space with two players wielding rackets, a small rubber ball ricocheting off walls, and intense movements with occasional shouts, reflecting the fast-paced and energetic nature of a squash game.","The sound of a squash game includes the rhythmic thud of the rubber ball against the walls, the squeak and scuffle of players' shoes on the court floor, occasional grunts of exertion, and the sharp sound of rackets striking the ball with variable force." 
+playing steel guitar,"The sound event ""playing steel guitar"" involves sliding a metal bar or bottleneck along the strings of a steel guitar, producing a characteristic twangy, sustained tone used in various music genres like country, blues, and Hawaiian music.","A musician sits or stands with a steel guitar on their lap or on a stand before them, fingers deftly sliding a metal bar along the strings, other hand picking or strumming, eliciting soulful, resonant twangs. The ambiance is likely intimate, reminiscent of country blues or Hawaiian melodies.","Playing a steel guitar involves resonant, sustained notes with a smooth, gliding pitch. The twangy, metallic timbre comes from sliding a metal bar along the strings, creating a unique weeping, singing quality. Vibrato and volume swells enhance expressiveness." +playing steelpan,"""Playing steelpan"" involves creating music with a steel drum, an instrument originating from Trinidad and Tobago, where mallets strike different areas of the pan to produce varied pitches and tones, producing a distinctive, resonant sound that's often associated with Caribbean music and calypso.","A person with rhythmic precision gently strikes concave metal pans with rubber-tipped mallets, producing melodious Caribbean tones, as the reflective surfaces shimmer under warm, festive lights, with swaying palms in the background and an enraptured audience tapping their feet to the syncopated harmony of the steelpan's echo.","Playing steelpan produces melodic tones with resonant metallic timbres, characterized by a blend of percussive taps and sustained harmonics, achieving a cheerful and rhythmic soundscape with distinct pitches depending on the area struck. Variations in volume and tempo can create complex, layered musical patterns." 
+playing synthesizer,"""Playing synthesizer"" refers to the act of using a keyboard-like electronic instrument that generates audio sounds through digital or analog circuits, shaping and combining tones in diverse ways to mimic instruments or create new sonic textures, widely used in music genres like pop, rock, and electronic dance music.","Colorful oscillating waveforms and neon-lit keys dance against a backdrop of digital interfaces, with fingers gracefully sliding over touch-responsive pads and knobs tweaking electronic textures amidst a dimly lit studio aura.","Playing a synthesizer produces electronic tones that can vary widely in pitch, timbre, and dynamics, typically characterized by oscillating waveforms, filters, and modulations creating unique and layered sounds, with potential for sustained notes and rhythmic patterns, often accompanied by key-press actions and knob adjustments." +playing tabla,"The sound event ""playing tabla"" refers to the distinctive percussive beats produced by striking the tabla, a pair of Indian drums with differing pitches, typically used in classical and devotional music. The player creates complex rhythms by tapping and sliding fingers across the drumheads.","In a scene depicting the sound of playing tabla, two small, distinct drums rest before a seated musician, fingers deftly tapping the skins, creating rhythmic beats. Waves of vibration might be shown emanating from the instruments, suggesting the pulsating, captivating tones that underpin traditional Indian music.","Playing tabla typically involves rhythmic tapping patterns, varied pitch between the smaller high-pitched dayan and the deeper bayan, intricate fingerwork producing complex beats and resonances, and occasionally sliding or rubbing motions to create modulating tones, all combining to create a rich tapestry of percussive sounds." 
+playing table tennis,"Playing table tennis involves rhythmic bouncing sounds from the hollow ball hitting the table and paddles, mixed with players’ movements and vocalizations. The game features sharp taps, quick volleys, and the shuffle of feet, creating a fast-paced, precise experience.","A rhythmic back-and-forth ping of the ball, with intermittent clacks from paddle strikes and occasional louder pops when a shot is more forceful. Subtle sounds of player movement and table contact accompany the central play sounds, all set against a backdrop of muted spectator murmurs and footwork shuffles.","The sound of playing table tennis typically includes a repetitive, rhythmic clicking of a lightweight ball being struck by paddles, interspersed with occasional bounces on the table, and possibly the sounds of player movements and verbal expressions during the rally." +playing tambourine,"""Playing tambourine"" refers to the act of striking or shaking a small drum with metal jingles, creating a percussive, rhythmic sound often used in music ensembles for its bright, crisp accentuation.","A person with a bright, joyous expression rhythmically shakes a handheld tambourine, its metallic jingles clashing merrily. Notes and musical symbols might float in the air, representing the sound's lively beat, capturing the essence of the festive and musical atmosphere typically associated with playing such a percussion instrument.","Playing a tambourine produces jingling and shaking sounds with varying intensities and rhythms, dependent on how it's struck or shaken; it resonates with a bright, metallic timbre due to the small cymbals (zils) attached to its frame." 
+playing tennis,"The sound event ""playing tennis"" includes distinct noises such as the rhythmic thwack of the ball hitting rackets, the soft thud when it strikes the court, intermittent player grunts, and the occasional shuffle of feet as players move swiftly across the court surface.","Two individuals are swinging rackets, hitting a yellow tennis ball back and forth over a net on a green rectangular court, with a rhythmic ""thwack"" each time the ball is struck, characters dressed in athletic attire ready in anticipatory stances.","The sound of tennis includes rhythmic bouncing of a ball, sharp swishes of racquets slicing the air, forceful thwacks at impact, occasional shoe squeaks on the court, and intermittent grunts from player exertion. There may also be applause or commentary if played before an audience." +playing theremin,"The theremin is an early electronic musical instrument controlled without physical contact. Playing it involves moving hands in proximity to two antennas, one controlling pitch, the other volume. The resulting sound is eerie and unique, often associated with sci-fi or horror soundtracks, demonstrating an ethereal and haunting musical experience.","A musician waves their hands near two metal antennas of a box-like instrument, creating eerie, swooping sounds without physical contact. Ethereal tones fluctuate with hand movements, capturing a sense of invisible interaction between player and theremin, often evoking a vintage or otherworldly atmosphere.","Whistling and wavering tones with continuous pitch variance; no fixed rhythm; eerie, electronic timbre from sweeping hand movements near antennas; volume and pitch altering dynamically; resembles human vocal or violin-like sounds; ethereal, haunting ambiance with possible vibrato effect from the performer's precise hand oscillations." 
+playing timbales,"Playing timbales involves rhythmically striking a pair of shallow, single-headed Cuban drums with sticks, producing high-pitched tones essential in Latin music genres like salsa, cha-cha, and mambo, often punctuating the music with dynamic, syncopated patterns and improvised drum fills.","A musician passionately plays timbales, striking metal-shelled drums with sticks. Fingers dance over cascara surfaces, creating vibrant Latin beats. Syncopated notes fill the air, accented by sharp cowbell clangs, as hips sway and feet tap to the salsa rhythm.","""Playing timbales"" features rhythmic, high-pitched metallic tapping and resonant drumming sounds, with occasional sharp rimshots, producing intricate patterns that vary in tempo and dynamics, punctuated by the sizzle of the cymbals." +playing timpani,"""Playing timpani"" involves striking a set of large, tunable drums with mallets to produce pitch-varied, resonant tones, key in orchestral and percussive music to create rhythmic depth and dramatic emphasis.","A musician strikes large kettle drums with mallets in a concert hall, precise rhythmic thuds resonate, punctuating an orchestral performance, intensity conveyed by focused expressions and dynamic arm movements.","Deep, resonant tones with varying pitches; rhythmic tapping and rolling sounds; subtler nuances include the tension of drumheads and mallet selection, influencing timbre and attack; reverberation reflecting room acoustics; occasional pedal adjustments altering pitch." +playing trombone,"Playing the trombone involves a musician blowing into a mouthpiece and sliding a telescopic tube to change pitches, producing a rich, brassy sound distinctive to this brass instrument, often heard in jazz, classical, and marching bands.","A person holds a trombone, sliding its extendable arm confidently while lips buzz into the mouthpiece. Musical notes float in the air, suggesting rich, brassy tones. 
The musician's cheeks are puffed, and the audience's faces show enjoyment or foot-tapping to the rhythm of the iconic sliding pitch.","A trombone playing delivers rich, brassy tones with a wide dynamic range, from soft, mellow pitches to loud, resonant blasts. Sound features include slide movements creating smooth glissandos, varied articulations such as legato and staccato, and potential flutter-tonguing, resulting in a vibrato effect." +playing trumpet,"""Playing trumpet"" refers to producing music by blowing air through pursed lips into a brass instrument with a flared bell, controlling pitch with three valves, and creating a vibrant, bold sound used across genres from classical to jazz. The trumpet player manipulates breath and fingerings to create melodies.","A musician, lips pursed, passionately blows into a trumpet, fingers dancing on the valves. Brass gleams under the spotlight, and a wave of vibrant notes fills the air, suggesting a lively jazz band performance or a solo act, engulfed in the rhythm of the music.","When playing a trumpet, you can expect a vibrant, brassy tone with a dynamic range from soft murmurs to piercing highs. There's a mix of clear, resonant notes and potential breathy sounds or valve clicks, often interspersed with the stylistic use of vibrato and occasional muffled notes when muted." +playing tuning fork,"A tuning fork emits a pure musical tone when struck, typically used to tune instruments or for auditory demonstrations. 
The sound results from the resonating vibration of the fork's prongs, creating a consistent pitch that aids in achieving the desired musical harmony.","A visual representation might show a tuning fork with animated lines or waves emanating from its prongs, symbolizing the vibrations and the resonant, pure musical tone produced when struck, typically against an object or surface, then held in the air or against a resonant body.","A playing tuning fork typically emits a clear, pure, sustained musical note at a fixed frequency. It presents a steady pitch with minimal overtones and a smooth decay as vibrations diminish, often producing a subtle humming or ringing quality perceived as a sinusoidal waveform." +playing tympani,"Playing tympani involves striking tuned drums with mallets to produce rhythmic tones that vary in pitch and intensity, commonly featured in orchestras, adding depth and drama to musical compositions. Tympanists skillfully manipulate the pedal mechanism to change pitches during performances, creating resonant, melodic percussive effects.","A musician strikes a large kettle drum with mallets in a rhythmical pattern, creating deep resonant notes. The scene might include several timpani with varying sizes set up on a concert stage, possibly with an orchestra, under bright stage lights, highlighting the intense concentration and precise movements of the performer.","Playing tympani involves rhythmic, resonant beats with varying pitch and dynamics. Each strike produces deep, booming sounds, ranging from soft whispers to thunderous roars, depending on the force and mallet used. The drum’s large, kettle-like cavity adds a subtle sustain to the tones." 
+playing ukulele,"Playing ukulele involves strumming or plucking the strings of a small, guitar-like instrument to produce a light, melodic sound characteristic of Hawaiian music and popular in various musical genres for its cheerful tone.","A person strums a small four-stringed ukulele, notes floating in the air, with a relaxed, joyous expression against a backdrop of a sunny beach or a cozy room; the instrument's petite body cradled gently, capturing the essence of a carefree, melodic moment.","Strumming chords, plucking nylon strings; bright, warm, Hawaiian-inspired tones; mellow, rhythmic, soft twangs; distinct higher pitch compared to a guitar; occasional finger sliding noises; cheerful, melodic, harmonious sound." +playing vibraphone,"Playing the vibraphone involves striking its metal bars with mallets to create melodious, resonant tones. It often features in jazz and orchestral music, with motor-driven rotating disks inside resonator tubes creating its characteristic vibrato effect.","A musician stands with mallets in hand, poised over a large metallic instrument with bars arranged like a keyboard, often with resonator tubes hanging below. Soft, resonant notes fill the air as the player strikes and sustains tones, perhaps with a foot pedal enhancing the vibrato effect.","The playing of a vibraphone produces resonant, metallic tones with a sustained, mellow decay. It can vary in pitch depending on the note struck and often exhibits a soft, vibrato effect due to motor-driven rotating dampers beneath the bars, creating a wavering, ethereal quality to the sound." 
+playing violin,"Playing the violin involves drawing a bow across the strings to produce melodious notes, employing finger placement for pitch control, creating a rich tapestry of sound that ranges from vibrant and energetic to soft and melancholic in classical, folk, and contemporary music genres.","A musician drawing a bow across violin strings, producing elegant notes, standing under a spotlight or amidst an orchestra, with focused concentration and graceful hand movements.","The sound of playing violin involves resonant, continuous tones varying in pitch and dynamics, with possible vibrato. It features distinct bowing textures, from smooth legato to sharper staccato sounds, and can convey emotional nuance ranging from soft, mellow timbres to bright, intense expressions." +playing volleyball,"The sound event ""playing volleyball"" includes distinctive noises such as the thud of the ball hitting the sand or floor, slaps from players' hands striking the ball, whistles, cheers from spectators, and calls from teammates communicating during a game.","A series of waveforms depicting rhythmic thuds of the ball being struck, intermittent sharper spikes from hand slaps, and a consistent background murmur of sand movement and player communication. Sound frequency would vary from low (ball hits) to high (whistle blows, cheers).","A volleyball game features sounds of the ball being struck and bounced, players calling out and communicating, occasional whistles from referees, sand or court floor impacting noises, and audience reactions if present, including clapping and cheering." +playing washboard,"""Playing washboard"" refers to using a ribbed metal or wooden board, traditionally a laundry tool, as a musical instrument by scraping or tapping it with thimbles or fingers to create a rhythmic, percussive sound often used in folk, zydeco, and jug band music.","A musician rhythmically strokes a ribbed metal washboard with thimbled fingers, creating a percussive backdrop. 
Around them, an upbeat folk or jazz band enhances the rustic, lively ambiance.","Playing a washboard typically produces rhythmic, high-pitched scraping or percussive sounds with a metallic timbre, varying in amplitude and tempo based on the scrubbing motion's intensity and speed, evoking an old-timey, traditional folk or jug band musical feel." +playing xylophone,"The sound event ""playing xylophone"" involves striking tuned wooden bars with mallets, producing a distinct, resonant, and melodic percussion. Each bar corresponds to a musical note, allowing various tunes to be played rhythmically and harmonically.","A person with mallets in hand strikes the tuned metal or wooden bars of a xylophone, producing melodic notes. The sequence of hits creates a ripple of musical tones, depicted with vibrant notes floating in the air and the happy, focused expression of the player.","A xylophone produces melodious, percussive tones with varying pitches depending on the bar struck. It creates a resonant, wooden, often bright sound, with a quick decay, and can present a range of dynamics from soft to loud depending on the force of the mallet strike." +playing zither,"The sound event ""playing zither"" is characterized by the delicate plucking or strumming of strings on the zither, a family of stringed instruments, producing melodious, resonant tones that can evoke a sense of tranquility and classic elegance.","Playing the zither involves gentle hands gracefully plucking strings on a long, horizontal instrument. This produces melodious tones and resonant vibrations that create a tranquil ambiance. Soft light reflects off the polished wood, enhancing the serene and contemplative setting.","Plucking strings, resonant tones, delicate harmonics, varying pitch, soft wooden timbre, intermittent string buzzes, sustained notes, occasional fingernail clicks, and the gentle background noise of hand movement across the instrument's body." 
+police car siren,"A police car siren is an auditory signaling device used by law enforcement vehicles. It emits a distinctive, piercing wail or yelp to alert the public and clear traffic when officers are responding to emergencies, pursuing suspects, or signaling urgent warnings.","Flashing blue and red lights atop a speeding police car, piercing the night with urgent wails, slice through traffic, alerting citizens as the vehicle weaves through the streets in response to an emergency.","A police car siren typically features a high-pitched, oscillating wail with a rapidly alternating frequency, often moving between two tones (yelp and wail modes). It is designed to cut through ambient noise, signaling urgency and prompting immediate attention. Its loudness varies, increasing as the vehicle approaches." +police radio chatter,"Police radio chatter consists of rapid, concise communications exchanged between law enforcement officers and dispatch over a dedicated radio frequency, often coded and including status updates, alerts, and coordination of police activities.","A scene filled with flashing blue lights, uniformed officers bustling, squad cars parked haphazardly, radios crackling with dispatch voices, and officers hurriedly relaying information through handheld transceivers amidst an atmosphere of urgency and alertness.","Police radio chatter is characterized by crisp, static-laden bursts of speech, often in a compressed, urgent tone, with procedural codes, brief pauses, and squelchy beeps signaling transmission start or end, overlaid by intermittent background radio noise and occasionally overlapped by multiple voices." 
+popping popcorn,"Popping popcorn is a rapid, staccato sound event that occurs when the heated kernels of the popcorn maize expand and burst, releasing moisture and creating a characteristic ""pop"" as they transform from hard kernels into fluffy, edible snacks.","An image of popcorn kernels in a pot or machine, with several puffed-up white pieces mid-air, steam rising, as they burst from their golden shells, capturing the dynamic and erratic motion typically associated with the ""popping"" sound.","Popping popcorn produces sharp, intermittent crackles at irregular intervals, with a crescendo as the rate increases, followed by a lull as it tapers off. The timbre is high-pitched and bursting, with a textured, airy quality, and a distinct popping characteristic of expanding kernels." +printer printing,"A ""printer printing"" sound event typically consists of rhythmic mechanical whirring and clicking as paper is fed through rollers, combined with the buzz or hum of a printer's moving parts as text or images are transferred onto the page, creating a recognizable office ambiance.","A printer's mechanical parts move with precision, as paper smoothly feeds through rollers. The rhythmic hum and intermittent buzz accompany the synchronized dance, while a freshly inked sheet emerges, patterned by the distinctive sound of information being transferred from digital to physical form.","The sound of a printer printing typically includes intermittent mechanical whirring, clicking of moving parts, rhythmic rolling as paper feeds through the mechanism, the buzz of motors, and occasional softer thuds as the print head adjusts or paper is deposited into the tray." 
+pumping water,"Pumping water is the auditory occurrence characterized by rhythmic mechanical and liquid sounds emitted when a pump moves water from a source to a desired location, typically involving a repetitive whooshing or splashing as liquid flows through the mechanism.","A visual might depict a hand-operated water pump with a spout gushing clear liquid rhythmically into a bucket, the handle moving up and down, and sound waves indicating the distinctive mechanical creaks and the slosh of water exiting the spout.","The ""pumping water"" sound event includes rhythmic mechanical noises, water splashing, gurgling as water moves through a hose, and possibly the creaking of the pump handle or motor hum if powered. There may be intermittent sounds of water flow increasing and decreasing with each pump action." +railroad car,"A ""railroad car"" sound event typically refers to the noises associated with train cars, such as the clattering of wheels on tracks, the rumbling of heavy machinery, the screech of metal on metal, and the sound of cargo or passenger movement.","An image might show a train car in motion with lines or musical notes emanating from it, indicating the rhythmic clacking of wheels on tracks, or a vibration effect to suggest the deep rumble and screeching of metal associated with trains moving or braking.","A railroad car typically produces rhythmic clacking from wheels on tracks, metallic screeches during turns or braking, the rumble of heavy machinery in motion, and occasionally the sound of cargo shifting or couplings clanging when cars are joined or separated." +raining,"The sound event ""raining"" encompasses the ambient noises produced when droplets of water fall from clouds, striking various surfaces, often creating a calming, rhythmic, and continuous patter that can vary from a soft drizzle to a heavy downpour.","Wavy lines or musical notes cascade downward like droplets in a stylized representation. 
Speakers, instruments, or clouds could be depicted at the top, emphasizing the auditory nature, while objects below might show ripples or vibrations, suggesting the impact of the falling ""rain"" of sound.","""Raining"" is characterized by a continuous, rhythmic pattering of raindrops, varying in intensity from gentle to torrential. It can include the splashing on various surfaces, subtle rolling thunder in the background, and occasionally the swish of wind-blown rain." +rapping,"Rapping is a musical form characterized by rhythmic, rhymed speech often set to a beat, central to hip-hop culture. It showcases verbal dexterity and wordplay, allowing artists to express complex ideas, emotions, and stories.","A figure leans into a microphone, mouth open in mid-verse, hand gestures punctuating the air. Stylized sound waves emanate, while an audience nods to the rhythmic beats. Graffiti backgrounds and urban attire complete the scene, encapsulating the essence of hip-hop culture.","Rapping is characterized by rhythmic speech with rhyme and wordplay, often laid over a beat. Vocal tones can vary, with emphasis on flow, delivery, and timing. There's a percussive element to the vocalization, with artists using pitch variation, cadence changes, and vocal inflection to create a dynamic performance." +reversing beeps,"Reversing beeps, or backup alarms, are warning sounds emitted by vehicles when they are moving backward, alerting pedestrians and other drivers to their presence to prevent accidents. These beeps are usually a series of high-pitched tones or pulses that increase in frequency as the vehicle gets closer to an object.","A vehicle, such as a truck or forklift, is pictured in reverse gear, with caution lights blinking. An audible series of rhythmic beeps accompanies the movement, alerting bystanders to the vehicle's backward motion for safety.","Reversing beeps typically consist of repetitive, high-pitched, piercing tones that are rhythmically emitted. 
This distinctive pattern of short beeps is designed to alert passersby to the presence of a vehicle backing up, increasing in frequency as urgency or proximity danger escalates." +ripping paper,"Ripping paper is the abrasive, tearing sound produced when paper fibers are forcefully separated, typically characterized by a sharp, high-pitched noise that fluctuates depending on the paper's thickness, size, and tearing speed.","A hand grips a corner of a sheet of paper, fingers poised and tensed. As the arm pulls, fibers stretch before tearing along a jagged path, creases forming while edges flutter. The sound resonates as the two separate pieces move apart, betraying the paper's once smooth, intact state.","The sound event ""ripping paper"" typically includes a sharp, high-frequency tearing sound with variations in pitch and intensity depending on the paper weight and tearing speed, accompanied by brief periods of lower-frequency rustling. It has a brief, non-repetitive, and distinctive crescendo-like profile." +roller coaster running,"A ""roller coaster running"" sound event captures the rumbling roar and screeching of a roller coaster's cars gliding along tracks, filled with clattering mechanics, wind rush, and occasional shouts of thrilled riders, embodying the exhilaration and dynamism of a theme park ride.","A twisting, looping roller coaster rapidly navigates steep drops and sharp turns, its chain clanking and wheels rumbling on the tracks, with screams of thrilled riders piercing the air, amidst a backdrop of a bustling amusement park.","The sound of a roller coaster running features a mechanical symphony of clattering tracks, the whoosh of brisk wind, screams of thrilled riders, rhythmic clanks of the chain lift, sharp swooshes during drops and turns, and the final decelerating grind as the ride slows to a stop." 
+rope skipping,"Rope skipping is a rhythmic activity combining coordination, agility, and fitness, where an individual or group jumps over a swinging rope at varying speeds and techniques, creating a distinct sound pattern of the rope hitting the ground and whooshing through the air with each revolution.","A rhythmic thwacking echoes as a rope slaps the ground. A focused individual hops, timing their jumps with precision. Observers might see the rope blur in a swift arc above the head and under the feet, creating a cycle of motion, accompanied by the constant beat of the rope's contact.","The auditory features of rope skipping include rhythmic whooshing or swishing sounds as the rope cuts through the air, intermittent light thudding when the rope hits the ground, and repetitive tapping from the jumper's feet making contact with the surface, often accompanied by occasional breath sounds or exertion grunts." +running electric fan,"A running electric fan produces a steady, whirring sound created by the rotation of its blades, which circulate air. The noise includes a consistent hum from the motor with occasional slight variations due to changes in speed or airflow disturbances.","A spinning fan with rotating blades creates a gentle breeze, as its motor hums steadily. The fan's oscillation suggests movement, and the sound waves imply a consistent, soothing white noise. The scene is often associated with a cool, airy environment, possibly providing relief on a warm day.","A running electric fan produces a steady, whirring hum or buzz resulting from the rotation of its blades. The pitch may vary with speed, and there can be intermittent clicking or rattling if the fan is unbalanced or encountering resistance." +sailing,"Sailing is an outdoor sport involving the navigation of a boat powered by wind in sails. The sound event typically includes flapping sails, the hull cutting through waves, rigging clinks, and the wind's rush. 
It is a harmonious blend of natural and human-made sounds associated with nautical travel.","A scene with undulating audio waveforms or musical notes floating like boats on a stylized, wavy blue sea, with the soft glow of a sunset in the background, creating a serene and rhythmic atmosphere akin to the tranquil movement of sailing on calm waters.","The auditory features associated with the sound event ""sailing"" typically include the flapping of sails, the creaking of ropes and masts, the sound of wind whistling through the rigging, the gentle splashing of water against the hull, and the rhythmic lapping of waves." +scuba diving,"Scuba diving is an underwater activity where divers use self-contained underwater breathing apparatus (scuba) to explore marine environments, observe wildlife, and examine sunken structures. It requires training and certification to manage equipment and safety while experiencing the weightlessness and tranquility of the aquatic world.","A tranquil underwater scene with a diver, surrounded by bubbles and marine life, the sun's rays piercing the blue water, with sounds of breaths through a regulator and the muted, distant ocean ambiance.","Bubbling breaths, regulator exhalation, underwater ambience, muffled movements, gear clinks, wetsuit squeaks, distant marine life, pressure equalization pops, fin strokes against water." +sea lion barking,"The sound event ""sea lion barking"" refers to the loud, distinctive calls made by sea lions, often resembling dog barks. 
This vocalization serves communication purposes, such as territory establishment, identification, and social interactions within colonies, and is characterized by its deep, repetitive nature.","A sea lion lounges on a rocky coastline, or in a crowded marine sanctuary, head tilted back, mouth wide open emitting a loud, distinctive bark, as waves crash in the background and other sea lions possibly join in the cacophony, lazing or interacting on the sun-drenched shore.","The sound event ""sea lion barking"" features rhythmic, repetitive deep barks or roars, often with a rumbly quality, varying in pitch and length. These vocalizations can resemble a dog bark but have a more guttural tone and are usually heard in a sequence or chorus from a colony." +sea waves,"Sea waves are natural phenomena where ocean water undulates rhythmically, creating soothing sounds as the water swells and crashes onto the shore, often associated with coastal ambience and maritime activity.","Blue-green hues ripple across a serene seascape, with undulating waves rhythmically rolling toward a sandy shore under a tranquil sky, while seagulls soar and dive amidst gentle sea breezes.","Sea waves emit rhythmic crashes and whooshes, characterized by a broad spectrum of frequencies, with a soothing white noise quality. The ebb and flow create a natural oscillation, varying in volume as waves break and recede, offering a calming, consistent backdrop interspersed with occasional sharper sounds from pebbles and bubbles." +sharpen knife,"The sound event ""sharpen knife"" typically involves the abrasive interaction between a knife blade and a sharpening tool, such as a whetstone or honing rod, producing a distinct, consistent scraping noise as the blade is honed to restore its cutting edge.","A close-up showing a knife blade being dragged across a honing steel, creating a rhythmic metallic scraping sound. 
Bright sparks occasionally fly off the edge, reflecting focused intensity and the meticulous action of refining the blade's sharpness.","The sound event ""sharpen knife"" typically includes a repetitive, rhythmic scraping noise as the blade is swept across a sharpening stone or steel, characterized by a high-pitched, metallic, and sometimes gritty resonance that varies in intensity with the applied pressure and motion consistency." +sheep bleating,"A sheep bleating is the characteristic vocalization of sheep, sounding like a nasal ""baa"" or ""meh."" It conveys communication within a flock, expressing needs or emotions such as distress, hunger, or social bonding.","A pastoral scene unfolds with fluffy white sheep scattered across a verdant field, some grazing peacefully, others lifting their heads to emit soft, repetitive ""baa"" sounds under a bright, expansive sky as a shepherd watches over the tranquil tableau.","Sheep bleating is characterized by a distinctive, vibratory ""baa"" sound with a moderate to high pitch, fluctuating volume, and a nasal tone. The duration varies, often repeated in sequences, conveying stress levels or social communication among flock members." +shot football,"""Shot football"" refers to the specific sound made when a soccer player kicks or shoots the ball during a game, often characterized by a sharp, powerful thud or bang, indicative of the force and contact between the ball and player's foot or head.","During a game, a player swings a leg and strikes the football cleanly, sending it flying toward the goal. The ball compresses against the boot at the moment of impact while the goalkeeper dives, and teammates and a watching crowd follow the ball's path across the pitch.","The sound event ""shot football"" features a sharp, succinct thump or thud of a foot striking the ball, possibly followed by a brief whooshing air sound as the ball accelerates, and potentially distant cheers or shouts if in a game context. Reverberation might occur in an enclosed stadium." 
+singing bowl,"A singing bowl is a type of bell, typically made from metal alloys, that produces a rich, harmonic and sustaining musical note when the rim is struck or rubbed with a mallet, used for meditation, music, relaxation, and personal well-being.","In a serene, dimly lit room, a person sits cross-legged, gently striking and rubbing a metallic singing bowl with a wooden mallet, producing soothing, resonant tones that ripple through the air, accompanied by gentle vibrations and a sense of calmness enveloping the space.","A singing bowl produces resonant, harmonic vibrations with sustained tones when struck or circled with a mallet. The sound is rich with overtones, often starting with a bright strike note that smoothens into a continuous ringing or humming, varying with the bowl size and material, often perceived as calming and meditative." +singing choir,"A singing choir is a group of singers who perform together, blending their voices in harmonious arrangements. Choirs can vary in size and often include a range of voice types such as soprano, alto, tenor, and bass, covering a broad spectrum of musical works, both secular and sacred.","A diverse choir stands united, mouths open mid-song, holding sheet music. Positioned on risers, a conductor energetically guides their harmonious performance. The ornate hall or church interior enhances the solemnity and resonance of their voices.","A singing choir features harmonized voices with varying pitches, timbre, and dynamics; it presents sustained vowel sounds, rhythmic patterns from lyrical articulation, and possibly reverberation within an acoustically resonant space, creating a rich, layered, and melodic auditory experience." 
+skateboarding,"Skateboarding is an action sport that involves riding and performing tricks on a skateboard, characterized by distinct sounds such as wheels rolling on pavement, board impacts from jumps and tricks, and the scrape of grinding on rails and ledges.","A skateboarder glides across a concrete landscape as the wheels rumble and clack over pavement seams. Mid-trick, the board taps and scrapes on rails and ledges, punctuated by the occasional snap of a clean landing.","Skateboarding sound events include rhythmic clattering of wheels on concrete, grinding of trucks against metal rails, occasional thuds from jumping and landing, and occasional distinctive popping sounds from kickflips or ollies. The overall timbre is a mix of rolling, scraping, and intermittent impacts." +skidding,"Skidding is a friction-induced sound event characterized by the high-pitched squealing noise produced when an object, typically a tire, rapidly moves across a surface while resisting motion, resulting in audible vibrations commonly associated with loss of traction or abrupt stops.","A vehicle's tires lose traction against the roadway, leaving streaks as they slide askew with puffs of smoke, accompanied by the sharp, screeching noise of rubber scraping the surface.","A skidding sound event features a high-pitched screeching or shrieking noise with varying intensity, often accompanied by a rough, abrasive quality. It can include fluctuations depending on traction loss and surface texture. The sound quickly decays once the vehicle stops." 
+skiing,"Skiing sound events encapsulate the distinctive swishes and whooshes of skis gliding across snow, punctuated by periodic clicks of ski poles, often accompanied by the soft crunch of snowpack and the sounds of the surrounding wintry environment, conveying the brisk motion and ambience of this winter sport.","A crisp, white snowscape bisected by smooth, carved tracks, with a skier in snug attire swooshing down a slope, poles alternating in rhythm, as puffs of powder lift with each turn, and the sharp sound of skis slicing the cold air merges with the muted ambiance of a mountain expanse.","The sound of skiing typically features the crisp crunch of skis slicing through snow, soft swishes of powder displacement, rhythmic tapping of ski poles, and occasional whooshes of wind as the skier gains speed down slopes. Sometimes, distant chatter from other skiers or the mechanical hum of ski lifts accompanies these sounds." +sliding door,"A sliding door sound event is characterized by the noise produced when a door glides along a track, often resulting in a smooth, continuous motion with a distinctive mechanical whirr or whoosh as the panels move and a soft thud or click when the door settles into its closed or open position.","A split screen depicts two parallel outcomes: on one side a figure hesitates then misses a closing elevator door, while the other confidently strides in before it shuts. The shared backdrop features sleek, metallic surfaces and a flickering light accentuating the echoing 'whoosh' as each door glides shut.","A sliding door typically produces a low-threshold whooshing sound from the movement, combined with a series of clicks or clacks from the door's mechanisms engaging, and may end with a soft thud or bump as it closes, all of which can vary with speed and materials." 
+sloshing water,"Sloshing water is a liquid movement sound, characterized by a rhythmic, splashing noise created when water moves back and forth, often within a container, like a tank or a bucket, typically due to motion or disturbance.","A container partially filled with liquid is agitated, causing the liquid to oscillate and lap against the walls, creating a fluctuating, splashing noise, visually exemplified by rippling surfaces and intermittent splashes or waves inside the vessel.","Sloshing water typically manifests as a low to mid-frequency, rhythmic, repetitive sound with a liquid quality, often containing splashing and bubbling components with varying intensity and pitch depending on the movement intensity and the container's size." +slot machine,"A slot machine sound event typically includes a blend of spinning reel noises, clicking of stops, jingling of coins, and celebratory sound effects upon winning or activating bonuses, creating an iconic casino atmosphere designed to enhance the gaming experience and stimulate feelings of anticipation and excitement.","Flashing neon lights, spinning fruit symbols, and cherries aligning on a screen amidst a casino backdrop, with jubilant coins clinking into a metal tray as a jackpot is hit.","A ""slot machine"" sound event often features a blend of mechanical reels spinning, coins clinking, electronic beeps, melodies signifying a win, and a lever being pulled or buttons pressed. The repeated plunks of coins and celebratory sounds create an atmosphere of anticipation and excitement." +smoke detector beeping,"A smoke detector beeping is an audible alarm signal emitted by the device to alert occupants to the potential presence of smoke, indicative of a fire, or to a need for battery replacement or maintenance. 
It typically sounds as repetitive, high-pitched chirps or beeps for immediate attention.","A ceiling-mounted smoke detector flashes a red light with intermittent beeps, signaling either smoke presence or a low battery. Anxious inhabitants look up or stand on chairs to reach the device, some covering their ears, while others wave towels to clear potential smoke or address the nuisance alarm.","A smoke detector beeping typically emits a sharp, piercing, repetitive high-pitched sound, usually around 3,150 Hz, designed to alert occupants with a loud volume exceeding 85 dB, repeated at regular short intervals, often with a temporal pattern of three successive beeps." +snake hissing,"A snake hiss is a defensive sound produced by the expulsion of air through the serpent's glottis, warning predators or threats of its presence and readiness to protect itself. It's characterized by a distinctive sibilant noise that can vary among snake species.","A coiled serpent with its head raised and forked tongue flickering, its scales glistening, as it emits a sharp, continuous sibilant sound from its slightly opened mouth, signaling a mix of aggression and defensiveness in a tense, silent environment.","A snake hiss typically includes a sustained, high-frequency sibilant sound with a broad spectral range, lacking a tonal melody and fluctuating slightly in volume and pitch, evoking a sense of warning or threat, often with an abrupt start and finish." +snake rattling,"The snake rattling sound is a distinctive warning noise produced by the rattlesnake, a venomous reptile. 
It occurs when the snake vibrates its tail, causing the segments of the rattle to collide and create a rapid, buzzing noise to deter potential threats.","A coiled rattlesnake poised in a defensive posture with its tail raised, segments shaking rapidly to produce a warning buzz, amidst arid brush under the harsh sun, as onlookers freeze, alerted to the potential danger of an imminent strike.","A snake rattling produces a continuous, high-pitched buzzing sound, created by the rapid shaking of keratin segments in the rattle. Its frequency and tempo can vary but typically has a sharp, percussive quality that can serve as a warning signal to potential predators or threats." +splashing water,"Splashing water is the auditory event characterized by the distinct, liquid sound produced when an object or substance strikes or moves rapidly in water, dispersing droplets and creating ripples and bubbles in a fluid, dynamic interaction.","Transparent droplets scatter energetically from a disturbed water surface, creating ripples and catching the light while some liquid splashes onto nearby surfaces or objects.","Splashing water involves a mix of high, rapid, irregular, non-harmonic, and repetitive sounds. It has a transient, percussive quality with bubbling noises and a resonant background, reflecting the volume and nature of the liquid body." 
+spraying water,"A spraying water sound event typically consists of a continuous, hissing or splattering noise as liquid forcefully ejects and disperses into fine droplets, often associated with applications like watering plants, using a hose, or operating a spray bottle.","A high-pressure nozzle ejects a fine mist of water droplets, refracting light into a subtle rainbow as they cascade against a backdrop of shimmering beads bouncing off surfaces, accompanied by the continual hiss and rhythmic splattering against the wettened ground or objects.","Spraying water typically features a continuous, hissing or splashing sound with varying pitch and intensity, often accompanied by intermittent drips or droplets and the reverberation of spray impact depending on the surface it contacts." +squishing water,"The sound event ""squishing water"" refers to the distinct, often rhythmic, wet and soft crushing noise produced when water is pressed and moves between surfaces, such as footsteps in a puddle or a hand squeezing a wet sponge.","An individual steps onto saturated, muddy ground, pressing down as water oozes out around their footwear, creating ripples and bubbles with each squelching, sodden step, vividly exemplifying the ""squishing water"" sound in a damp, maybe grassy environment.","The sound event ""squishing water"" typically includes low to mid-frequency dampened squelching, intermittent liquid displacement, rhythmic sloshing, and subtle popping air bubbles, all conveying a sense of soft, wet compression and release." +stream burbling,"Stream burbling refers to the relaxing, natural sound created as water flows, gurgles, and bubbles over rocks and down the course of a stream, producing a calming, rhythmic noise often associated with serenity and the presence of a clean, vibrant ecosystem.","A gentle stream meanders through a lush forest; clear water flows over smooth pebbles and between moss-covered rocks, creating a soft, soothing symphony. 
Bright sunlight glimmers on the babbling water's surface as it travels downstream.","The auditory features of a burbling stream include: a continuous low-pitched gurgle, irregular high-pitched tinkles, the rippling sound of water flowing over rocks, and intermittent splashes, all creating a soothing and rhythmically complex natural soundscape." +strike lighter,"A ""strike lighter"" sound event is the audible result of flicking a lighter's wheel against its flint, producing a spark that ignites fuel, creating a brief, distinctive scratching and clicking noise followed by a soft whoosh as the flame ignites.","A hand flicks a flint wheel, igniting a flame with a bright burst. Sparks shower, then settle as a flame steadies at the lighter's tip, casting a soft glow on nearby objects, accompanied by the crisp, sharp click and whoosh of the ignition.","A ""strike lighter"" sound event includes a brief, sharp metallic scrape followed by a short fizzle and a soft, sustained hissing or gentle roar as the gas ignites, producing a warm, flickering sound if the lighter stays lit." +striking bowling,"The sound event ""striking bowling"" typically involves the collision of a heavy bowling ball with pins, producing a loud, distinctive crash that signifies the successful knocking down of the pins during a bowling game. This event combines the rolling sound of the ball and the subsequent pin impact.","A series of bowling pins scatter dramatically as a gleaming ball hurtles down the lane, culminating in a resounding crash. Pins fly in various directions, a few spinning in mid-air, reflecting the bright lights overhead, while the ball continues its triumphant path into the shadows of the back end.","A ""striking bowling"" sound event typically features a rolling rumble followed by a crescendo into a sharp, crashing clatter of pins, often with resonant echoes in a large, enclosed space, and intermittent cheers or groans from observers." 
+striking pool,"""Striking pool"" refers to the sound event characterized by a sharp, clear noise produced when an object makes contact with the surface of water in a pool, causing a splash and subsequent ripples, often associated with diving or dropping an item into the water.","A shimmering swimming pool, a diver poised mid-air, a moment before breaking the surface, ripples radiating, capturing a frozen splash, the crystalline water disturbed, emitting a resonant, sharp echo bouncing off surrounding tiled walls.","A ""striking pool"" sound event typically features a sharp, crisp splash with varying pitches depending on the size/weight of the object, followed by subsequent ripples and smaller splashes, possibly accompanied by the sounds of water movement and disturbed water settling back to a calm state." +swimming,"Swimming is a sound event characterized by splashes, water movements, and rhythmic strokes as a swimmer propels through water, along with occasional gasps for air. It's often heard at pools, beaches, or during competitions, evoking a sense of exertion, fluidity, and sometimes, tranquility or intense activity.","Waves of translucent blue notes undulate fluidly across the space, flowing like water around a silhouetted figure seemingly immersed in the melody, with sound vibrations visibly rippling outwards from a central point, creating a serene, aquatic ambiance.","The sound event ""swimming"" typically involves splashing, rhythmic water movement, muted underwater noises, occasional breathing or gasping sounds, and the distinct lapping of water against the pool edge or swimmer's body." 
+tap dancing,"Tap dancing is a percussive performing art where dancers use shoes with metal taps to create rhythmic sounds, blending footwork with musical expression and often involving improvisation and syncopated rhythms, originating from African, Irish, and English dance traditions.","A stage is alive with a dancer's rhythmic feet clattering, tapping metal-plated shoes striking wooden floorboards, creating a percussive musical performance. Their swift, precise movements are accompanied by graceful arm gestures and a beaming smile under the spotlight.","Tap dancing produces rhythmic, syncopated clicking and tapping sounds, with varying tempo and intensity, created by metal plates on the dancer's shoes striking hard surfaces, often accentuated by patterns and sequences that can include shuffles, flaps, and slides." +tapping guitar,"Tapping on a guitar involves using the fingers of both hands to 'tap' the strings on the fretboard, creating a percussive and melodic effect, often associated with electric guitar solos but also used in various musical genres on acoustic guitars.","A musician's fingers rhythmically press and flick strings on the guitar's fretboard, producing melodious percussive plucks, as the instrument resonates with warm, vibrant tones. The player's focused expression mirrors the intricate dance of touch and sound.","The sound of ""tapping guitar"" features rhythmic taps and clear metallic resonances from fingers striking strings against frets, creating percussive tones interspersed with brief harmonies and overtones peculiar to a guitar's timbre." +telephone bell ringing,"A telephone bell ringing is an auditory signal produced by a telephone to alert recipients of an incoming call. The sound typically comprises a repetitive chiming or ringing tone, often mechanical or electronic, designed to capture attention without being overly disruptive.","A telephone, possibly vintage, occupies the foreground with sound waves emanating from the receiver. 
The bell inside the phone may be visible, vibrating. An urgency or curiosity may be reflected in the surrounding scene, suggesting an impending action to answer the call.","A telephone bell ringing typically features a repeated high-pitched chime or ring, with a clear, resonant tonal quality. It can have a pattern of rings followed by a brief pause. The sound often has a piercing characteristic designed to grab attention, and its volume decreases if unanswered." +thunder,"Thunder is the loud, rumbling sound that follows a lightning flash, caused by the rapid expansion and contraction of air heated instantaneously by the electric discharge. It can vary from a sharp, loud crack to a long, low rumble, depending on the distance and nature of the lightning.","Dark clouds loom overhead; jagged lightning bolts pierce the sky. Shadows flicker as flashes illuminate the ominous landscape. Trees sway wildly in the gusty wind, and rain pelts the ground. The air is charged, tense, before a deafening crack resonates, leaving a brief silence in its wake.","Thunder is characterized by a sudden, loud, and deep rumble or sharp crack. Its sound varies from a low, resonating roar to a quick, explosive snap, with reverberations that may echo. The pitch can shift, reflecting the distance and nature of the lightning strike causing it." 
+toilet flushing,"Toilet flushing is the sound created by the swift flow of water in a toilet bowl that removes waste, typically triggered by a handle or button, marked by a distinct rush followed by a decrease in intensity as the tank refills.","A swirling whirlpool of water cascades down a porcelain bowl, carrying away its contents, as the resonant sound of gushing water echoes in a tiled bathroom, signifying cleanliness and the disposal of waste.","A toilet flushing emits a distinct, rushing water sound with a strong initial surge, followed by a swirling, gurgling decline, and concludes with a resounding water refill in the toilet's tank, typically lasting several seconds." +tornado roaring,"A tornado's roar is a powerful auditory event, characterized by a continuous deep rumble, often likened to a freight train, caused by intense wind velocity and turbulence as the tornado moves and interacts with structures and debris.","A ferocious tornado spirals with debris swirling around its core. Darkened skies, lightning flashes, and bent trees under the might of howling winds embody the chaos as the twister's roar dominates the landscape, evoking fear and awe.","The sound of a tornado roaring includes a continuous low rumble, overlaid with a whistling and whooshing as debris and wind swirl. It's often likened to a freight train due to its intense, deep, and powerful vibration that can be felt physically as well as heard." +tractor digging,"A tractor digging sound event is characterized by the deep, rumbling noise of the engine, combined with the clanking of metal as the tractor's attachments, like a bucket or shovel, break ground and move earth during agricultural or construction tasks.","A heavy-duty tractor excavates soil with its metal scoop, engine growling and metal clanging. 
Dirt flies while hydraulic arms operate the bucket, carving into the earth, under a cloud of dust against the backdrop of an active construction site or a farm.","A tractor digging emits a low-pitched rumbling engine noise, intermittent backup alarm beeping, and metallic scraping and clanging as the shovel hits soil or rocks. It also produces a cyclic whirring from mechanical parts and muffled thuds when scooping or dumping earth." +train horning,"Train horning refers to the loud, resonant sound blast from a locomotive's air horn, used to warn of a train's approach or presence, especially at crossings to alert vehicles and pedestrians for safety reasons. It's characterized by its long-distance carrying power and distinctive echoing note.","A blaring train horn cuts through the stillness as a powerful locomotive barrels down the tracks, its commanding presence signaled by the urgent sound, warning all nearby as it speeds past a crossing, steam pluming, and wheels clacking rhythmically on the rails.","A train horn produces a loud, resonant blast, often comprising multiple tones or a harmonic series. It carries a prolonged, echoing quality with a decreasing pitch and fading volume over distance, and may include the rhythmic chugging or clattering of a moving train." +train wheels squealing,"Train wheels squealing is a high-pitched, abrasive sound emitted when a train's metal wheels grind against the rails, typically during sharp turns or sudden stops due to the frictional forces at play. 
This acoustic occurrence is common in rail transport systems.","A stationary train departs with a loud, high-pitched screech as its wheels grind against the metal rails, releasing puffs of smoke, with the friction visibly etching marks on the tracks, vibrations subtly shaking the platform.","The sound event of ""train wheels squealing"" features high-pitched, prolonged shrieks with fluctuating intensity, often accompanied by rhythmic clacking of tracks and underlying metallic groans, evoking a sense of friction and resistance between wheel and rail, especially noticeable during deceleration or tight turns." +train whistling,"A train whistling is a sharp, loud sound produced by a train to signal its presence, warn of its approach at crossings, or communicate with rail workers. Trains use different whistle patterns to convey specific messages or alerts, and it serves as an important safety feature in rail transport.","A sleek locomotive barrels across the countryside, its sharp whistle piercing through the tranquil landscape, signaling its presence as it hurtles along the gleaming tracks, with plumes of steam billowing into the clear sky.","A train whistle typically harbors a loud, piercing tone with a slightly wavering pitch. It carries a prolonged, echoing quality and can vary from a single blast to a repeated pattern. The sound decreases in volume and pitch due to the Doppler effect as the train moves away." +turkey gobbling,"A turkey gobble is the distinctive clucking sound made by male turkeys, known as toms, often used to attract females during mating season and establish dominance within their territory. 
It's a loud, rapid series of throaty notes that may echo through their woodland habitats.","A plump turkey with iridescent feathers struts across a rustic farmyard, periodically puffing its chest and fanning its tail while lifting its head to emit a series of throaty ""gobble-gobble"" sounds, the call reverberating through the crisp autumn air.","A turkey gobble begins with a low, hollow roll, escalating into rapid, throaty pulsations in a resonant “gobble-gobble” rhythm. It fluctuates in pitch and volume, often carrying far. Each turkey’s gobble is unique, varying slightly in tone and cadence." +typing on computer keyboard,"Typing on a computer keyboard produces distinct, rhythmic tapping sounds made by fingers striking keys, often associated with office environments, data entry work, or writing activities.","A person's hands hover over a keyboard, fingers tapping the keys rhythmically, with onomatopoeic words like ""click-clack"" or sound waves emanating from the keyboard to symbolize the distinct sound of typing.","Typing on a computer keyboard typically features rhythmic tapping sounds, with varying intensities dependent on key pressure; the spacebar often has a deeper tone. The tempo fluctuates with typing speed, and there may be subtle plastic clicking and the springy release of keys." +typing on typewriter,"Typing on a typewriter is characterized by rhythmic, mechanical clicks as keys strike the paper, punctuated by an occasional ding at the line's end, and the sliding motion of the carriage return lever.","A figure types on an old typewriter, fingers creating rhythmic clacks. The ink ribbon imprints characters on paper, forming text-filled sheets beside the machine. 
The scene is lit by a desk lamp, with the room filled with the scent of parchment.","Typing on a typewriter produces rhythmic, mechanical keystrokes, with a sharp click-clack sound for each character imprinted, interspersed with soft thuds of spacebar presses and a distinctive zipping sound of the carriage return at the end of a line." +underground,"An ""underground"" sound event typically refers to an audio occurrence within subterranean environments, such as subway stations, mines, or natural caves, characterized by unique acoustics, reverberations, and potential interactions with geological structures, often distinct from surface-level soundscapes.","A shadowy, subterranean space filled with obscured figures, vibrant graffiti on rough walls, and dim, flickering lights that pulse in sync with the gritty, raw beats of music that reverberates through the close, air-thick atmosphere of an elusive, urban setting.","Thrumming echoes, a low-frequency rumble, metallic clanking, muffled distant voices, irregular drips, grinding of machinery or trains, resonance of footsteps, and the muting effect of earth insulating the space from above-ground sounds." +underwater bubbling,"Underwater bubbling is the emission of gas bubbles from a liquid, typically water, resulting in a distinctive sound as the bubbles rise and burst at the surface, often associated with underwater geological or biological activity or human-induced processes like diving or submerged machinery operation.","Submerged in a clear blue expanse, clusters of iridescent bubbles rise rhythmically from the ocean floor, rippling and refracting light as they ascend toward the undulating surface, where they burst softly, merging with the aqueous world above.","Underwater bubbling sounds feature bursty, gurgling noises with a muffled resonance. They range from low to mid frequencies, with bubble size affecting pitch and intensity. Sound travels faster and more efficiently in water due to its density." 
+using sewing machines,"Using sewing machines entails the rhythmic hum and repetitive mechanical clicks of needles piercing fabric, often accompanied by the buzz of the motor and occasional sound of scissors cutting threads or the rustle of material being handled.","Multicolored threads, rhythmic motion of needle and fabric, fingers deftly guiding materials, the whir of electric motors, and the steady clack of mechanical parts create an imagery that captures the essence of using sewing machines.","The sound of a sewing machine is characterized by rhythmic, repetitive mechanical whirring, punctuated by clicks as the needle punctures fabric; the pitch and tempo may vary with speed and fabric type, and occasional softer spool unwinding sounds or fabric rustling may be audible, complementing the steady hum." +vacuum cleaner cleaning floors,"A vacuum cleaner cleaning floors produces a distinctive, continuous hum or whirring noise while it sucks up dirt and debris from carpets and hard surfaces, often accompanied by occasional louder thumps or rattles when larger particles are ingested.","A vacuum cleaner, its nozzle moving methodically across the carpet or floor, emits a steady hum while it sucks up dirt, dust, and debris, with visible particles being whisked into the machine. The rhythmic back-and-forth motion indicates the area being methodically cleaned.","The sound event ""vacuum cleaner cleaning floors"" typically features a loud, sustained, monotonous roar with high and low-frequency hums, punctuated by intermittent crackles and pops as debris is sucked up, often with a whirring motor sound and air suction noise." +vehicle horn,"A vehicle horn is an auditory signaling device commonly installed in automobiles and other forms of transportation, used to warn others of the vehicle's presence or to signal the driver's intention, providing a means of avoiding potential hazards or accidents.","A busy city street scene with cars, buses, and bikes in congested traffic. 
A driver's arm extends from a car window, pressing the horn impatiently, causing others to look irritated. Sound waves emanate from the vehicle indicating the loud, blaring noise of the horn amidst the urban hustle.","A vehicle horn typically produces a loud, sharp sound ranging from 250 to 500 Hz, designed for audibility over distance. The tone is often harsh, insistent, and brief, with a rapid onset to alert nearby individuals of the vehicle's presence, serving as a warning or communication signal in traffic." +volcano explosion,"A volcano explosion is a catastrophic natural phenomenon where a volcanic mountain erupts, forcefully ejecting ash, lava, and gases with intense sound blasts, often causing widespread damage and posing serious risks to nearby life and property.","A towering volcano erupts, spewing a fiery column of ash and lava into the sky, while plumes of smoke and glowing molten rock burst from the crater amidst a backdrop of trembling ground and chaotic escape of wildlife and people.","A volcano explosion features deep, low-frequency rumbling, explosive booms, rising pitch as pressure builds, sudden loud blasts, echoes bouncing off surrounding terrain, crackling or fracturing sounds from rock breaking, and a prolonged roar during eruption, possibly mixed with the hiss of escaping gases or steam." +warbler chirping,"Warbler chirping is the melodic, flutelike vocalization of small passerine birds known for their intricate songs. 
These sounds, often heard in spring and summer, are used for communication, territory defense, and mating purposes, showcasing a range of frequencies and patterns unique to each warbler species.","A small, vibrant warbler perched on a leafy branch, its throat vibrating with melody in a tranquil forest, sunlight filtering through the canopy, casting dappled light on the mossy undergrowth around it.","A warbler chirping emits a series of high-pitched melodic trills and whistles, with a variable pitch and rhythm, often incorporating rapid frequency modulation, clear tonal quality, and sometimes repetition of short, distinct phrases, evoking a cheerful or plaintive quality typical of their bird song." +waterfall burbling,"The sound event ""waterfall burbling"" captures the continuous, soothing murmur produced by water cascading over rocks, typically creating a rhythmic, calming ambiance associated with nature and tranquility.","A stream cascades down a rocky incline, with crystal-clear water bubbling over stones and moss, forming frothy pools below, surrounded by lush greenery, as sunlight filters through the leaves, creating a serene, picturesque backdrop for the gentle, rhythmic sound of the waterfall.","The auditory features of a ""waterfall burbling"" typically include a continuous, soothing white noise comprising low frequencies, persistent rushing sounds, with varying tones and volumes depending on the waterfall's size and water flow, often intermingled with higher-pitched trickling and splashing as water interacts with rocks and terrain." +whale calling,"Whale calling involves the vocalizations produced by whales to communicate with each other. These complex calls vary by species and can include songs, clicks, and whistles, often heard over vast ocean distances, playing a crucial role in social interactions, navigation, and foraging.","An immense, calm sea spans the horizon, mist wafts above gentle waves. 
A colossal whale's silhouette emerges, water cascading off its back. Its mouth opens, emitting deep, sonorous calls that ripple through the water, mingling with the calls of distant brethren, connecting across the vast, serene ocean expanse.","Whale calls are low-frequency, melodic moans and pulses that can travel long distances underwater, varying in pitch and duration, often with patterned sequences unique to species like the humpback whale's complex, repeating song structures." +wind chime,"A wind chime is a decorative assembly of tubes, bells, or other objects that produce melodious ringing sounds when moved by the breeze, creating a soothing auditory experience often used for ambiance or as a sensory garden feature.","Gentle breezes sway an array of whimsical chimes, each tinkling harmoniously. Sunlight glints off metal and glass, casting dancing patterns as the chimes strike a serene, melodic symphony propelled by the wind's invisible touch.","Wind chimes produce a series of melodic tinkling sounds of varying pitches when stirred by the breeze, creating a harmonious, soothing resonance. The pitch and volume are influenced by wind strength and the material and size of the chime elements—typically metal, bamboo, or glass." +wind noise,"Wind noise is the rushing, whistling, or rumbling sound caused by air flowing over, around, and into structures or objects, including microphones and ears. It is often an unwanted background sound in recordings and can impair communication and the enjoyment of outdoor activities.","Turbulent air swirls, bending tree branches, and whisking leaves dance across a blustery landscape. 
Objects flutter and vibrate as the invisible force of wind hums and howls, visually encapsulated by motion and the chaotic flight of debris caught in the gusts.","Wind noise comprises whooshing, rustling, and whistling sounds with fluctuating volume and pitch, broadband frequencies, and white noise characteristics, which vary with wind speed and interactions with the environment, such as trees or buildings." +wind rustling leaves,"The sound of wind rustling leaves is a soothing, natural noise produced when breezes cause tree foliage to flutter and rub against each other, often yielding a calming, harmonic rustle that can evoke a sense of serenity and connection with nature.","A tree's branches sway gently under a clear sky, its leaves dancing and shimmering in the sunlight, creating a symphony of light rustling sounds as the breeze passes through them, evoking a sense of tranquility and harmony with nature.","The sound of wind rustling leaves is characterized by a gentle, continuous white noise with varying frequencies and a soft rustling or whispering quality. It ebbs and flows in intensity and pitch as the wind's strength and direction change, creating a soothing and dynamic natural rhythm." +woman speaking,"A sound event of a ""woman speaking"" involves the auditory occurrence of a female voice articulating words or sentences, incorporating distinct pitch, tone, and speech patterns characteristic of a female's vocal range and communication style.","A visual representation might include an image of a woman with her mouth open mid-speech, possibly with sound waves emanating from her or a speech bubble to signify communication. Her expression could convey engagement or passion, and audience members might be depicted to show she is being listened to.","A woman’s voice generally has a higher pitch range than a man’s, with a fundamental frequency between 165 and 255 Hz. It features melodic intonation, vocal warmth, varied rhythm, and dynamic timbre. 
Consonant articulation and vowel resonance add to its distinct auditory characteristics." +wood thrush calling,"The wood thrush calling is a melodic bird song that is often considered a quintessential sound of Eastern U.S. forests. This flute-like call, typically heard during spring and summer, has a haunting, ethereal quality that birds use to defend territories and attract mates.","Amidst the twilight hues of a dense, leafy forest, a solitary wood thrush perches on a gnarled branch, its throat vibrating melodically, filling the tranquil air with its flute-like song while dappled sunlight filters through the canopy overhead.","The sound event of a wood thrush calling features melodic, flute-like tones in a series of ethereal, warbling phrases, each composed of a different combination of notes with a distinct, clear whistle quality, often resonating through deciduous forests during dawn and dusk in the Eastern United States." +woodpecker pecking tree,"A woodpecker pecking a tree is a rhythmic tapping sound created when the bird rapidly beats its beak against the trunk to find insects, communicate, or excavate nesting holes.","A woodpecker rhythmically hammers its beak into the bark of a tree, head bobbing with each impact. Wood chips scatter, and the repetitive tapping echoes through the forest, signaling the bird's search for insects or nest building.","A woodpecker pecking a tree produces a rapid, rhythmic tapping or drumming sound, with a sharp, resonant quality. The tempo can vary, and there are brief pauses between bursts of pecks. It can echo through a forested area, indicative of the bird's method of foraging or communication." 
+writing on blackboard with chalk,"The sound event ""writing on blackboard with chalk"" is characterized by a distinct scraping noise as the chalk contacts the rough surface, resulting in audible friction, varying in pitch and intensity with the pressure and speed of writing.","A hand clasps a piece of chalk, squeaking across a dark slate blackboard, leaving trails of white, dusty lines forming letters and numbers, a powdery residue dusting the ledge below.","Writing on a blackboard with chalk creates sounds like screeching and scratching, varying in pitch and intensity based on pressure and speed. Softer skittering noises occur as the chalk skips over the board’s irregularities." +yodelling,"Yodelling is a singing technique involving rapid alternation between the low-pitch chest register and the high-pitch head register, creating a distinct sound. It originated in the Central Alps and is associated with traditional folk music, embraced in various cultures and music genres worldwide.","A figure stands on a mountain slope, mouth open mid-song, dressed in traditional alpine attire with lederhosen and a hat. Echoes of the melodious yodel ripple through the picturesque valley, bouncing off the Swiss chalets and distant snowy peaks under a bright blue sky.","Yodelling is characterized by rapid alternation between the low-pitch chest register and the high-pitch head register, creating a distinctive echo-like quality. It often involves sustained notes that fluctuate in pitch with a clear, powerful vocal tone, which may include melodic patterns repeated at different pitches." +zebra braying,"A zebra’s bray is a unique sound, blending a donkey’s bray and a horse’s whinny. Used for herd communication, it expresses emotions like excitement, agitation, or distress, and helps maintain social bonds. 
The sound includes high-pitched squeals and snorts.","A black and white striped zebra stands on a sun-bathed savanna, with its mouth wide open and ears pulled back, as it emits a high-pitched, braying call that pierces the quiet of the wild landscape.","A zebra braying is characterized by a series of hoarse, high-pitched calls with a sequence of ascending then descending tones. The sound is somewhat like a donkey's bray but with more variation, often starting with a barking noise and transitioning into a prolonged, squealing whinny." diff --git a/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/wavcaps_word_embeddings_vggsound_normed.npy b/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/wavcaps_word_embeddings_vggsound_normed.npy new file mode 100644 index 0000000..6a83490 Binary files /dev/null and b/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/wavcaps_word_embeddings_vggsound_normed.npy differ diff --git a/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/word_embeddings_vggsound_normed.npy b/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/word_embeddings_vggsound_normed.npy new file mode 100644 index 0000000..159843d Binary files /dev/null and b/avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/word_embeddings_vggsound_normed.npy differ diff --git a/c3d/c3d.py b/c3d/c3d.py new file mode 100644 index 0000000..8a96ebe --- /dev/null +++ b/c3d/c3d.py @@ -0,0 +1,77 @@ +import torch.nn as nn + + +class C3D(nn.Module): + """ + The C3D network as described in [1]. 
+ """ + + def __init__(self): + super(C3D, self).__init__() + + self.conv1 = nn.Conv3d(3, 64, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.pool1 = nn.MaxPool3d(kernel_size=(1, 2, 2), stride=(1, 2, 2)) + + self.conv2 = nn.Conv3d(64, 128, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.pool2 = nn.MaxPool3d(kernel_size=(2, 2, 2), stride=(2, 2, 2)) + + self.conv3a = nn.Conv3d(128, 256, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.conv3b = nn.Conv3d(256, 256, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.pool3 = nn.MaxPool3d(kernel_size=(2, 2, 2), stride=(2, 2, 2)) + + self.conv4a = nn.Conv3d(256, 512, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.conv4b = nn.Conv3d(512, 512, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.pool4 = nn.MaxPool3d(kernel_size=(2, 2, 2), stride=(2, 2, 2)) + + self.conv5a = nn.Conv3d(512, 512, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.conv5b = nn.Conv3d(512, 512, kernel_size=(3, 3, 3), padding=(1, 1, 1)) + self.pool5 = nn.MaxPool3d(kernel_size=(2, 2, 2), stride=(2, 2, 2), padding=(0, 1, 1)) + + self.fc6 = nn.Linear(8192, 4096) + self.fc7 = nn.Linear(4096, 4096) + self.fc8 = nn.Linear(4096, 487) + + self.dropout = nn.Dropout(p=0.5) + + self.relu = nn.ReLU() + self.softmax = nn.Softmax() + + def forward(self, x): + + h = self.relu(self.conv1(x)) + h = self.pool1(h) + + h = self.relu(self.conv2(h)) + h = self.pool2(h) + + h = self.relu(self.conv3a(h)) + h = self.relu(self.conv3b(h)) + h = self.pool3(h) + + h = self.relu(self.conv4a(h)) + h = self.relu(self.conv4b(h)) + h = self.pool4(h) + + h = self.relu(self.conv5a(h)) + h = self.relu(self.conv5b(h)) + h = self.pool5(h) + + h = h.view(-1, 8192) + + h = self.relu(self.fc6(h)) + h = self.dropout(h) + h = self.relu(self.fc7(h)) + h = self.dropout(h) + return h + + logits = self.fc8(h) + probs = self.softmax(logits) + + return probs + +""" +References +---------- +[1] Tran, Du, et al. "Learning spatiotemporal features with 3d convolutional networks." 
+Proceedings of the IEEE international conference on computer vision. 2015. +""" \ No newline at end of file diff --git a/clip_embeddings_extraction/get_clip_embeddings_activitynet.py b/clip_embeddings_extraction/get_clip_embeddings_activitynet.py index 618f210..c7e57ea 100644 --- a/clip_embeddings_extraction/get_clip_embeddings_activitynet.py +++ b/clip_embeddings_extraction/get_clip_embeddings_activitynet.py @@ -10,11 +10,18 @@ # from prompt_toolkit import prompt import pandas as pd from tqdm import tqdm + +# 解决pycharm有时索引不到文件 +import os, sys +# sys.path.append(os.getcwd()) +base_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) +sys.path.append(base_dir) + from WavCaps.retrieval.models.ase_model import ASE from ruamel import yaml import argparse from src.args import str_to_bool - +from datetime import datetime def zeroshot_classifier(classnames, templates, device): with torch.no_grad(): @@ -30,10 +37,45 @@ def zeroshot_classifier(classnames, templates, device): # zeroshot_weights = torch.stack(zeroshot_weights, dim=1).to(device) return zeroshot_weights +# Load the ActivityNet class descriptions from the CSV file +df2 = pd.read_csv('../avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/ActivityNet.csv') +descriptions = { + "description_1": df2['description_1'].tolist(), + "description_2": df2['description_2'].tolist(), + "description_3": df2['description_3'].tolist(), +} +# 将类别名称、模板和描述组合在一起时,生成的文本太长,超过了CLIP模型的上下文长度限制(77个token) +def zeroshot_classifier_with_descriptions(classnames, templates, descriptions, device): + with torch.no_grad(): + zeroshot_weights = {} + for idx, classname in enumerate(tqdm(classnames)): + all_embeddings = [] + + # 处理每个模板 + for template in templates: + base_text = template.format(classname) + # 方案2: 如果需要使用所有描述,可以分别处理每个描述 + for desc_key in ["description_1", "description_2", "description_3"]: + desc = descriptions[desc_key][idx] + text = f"{base_text} {desc}" + tokens = clip.tokenize(text).to(device) + embedding = model.encode_text(tokens) + embedding 
/= embedding.norm(dim=-1, keepdim=True) + all_embeddings.append(embedding) + + # 合并所有嵌入 + all_embeddings = torch.cat(all_embeddings, dim=0) + class_embedding = all_embeddings.mean(dim=0) + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + + return zeroshot_weights -df = pd.read_csv('/home/aoq234/akata-shared/aoq234/avzsl/clip_original/avgzsl_benchmark_datasets/ActivityNet/class-split/activitynet_w2v_class_names.csv') + +# df = pd.read_csv('/home/aoq234/akata-shared/aoq234/avzsl/clip_original/avgzsl_benchmark_datasets/ActivityNet/class-split/activitynet_w2v_class_names.csv') +df = pd.read_csv('../avgzsl_benchmark_non_averaged_datasets/ActivityNet/class-split/activitynet_w2v_class_names.csv') activitynet_classes = df['manual'].tolist() @@ -90,7 +132,8 @@ def zeroshot_classifier(classnames, templates, device): -device = 'cuda:3' +# device = 'cuda:3' +device = 'cuda:0' model, preprocess = clip.load("ViT-B/32", device=device) @@ -106,20 +149,27 @@ def zeroshot_classifier(classnames, templates, device): print("Context length:", context_length) print("Vocab size:", vocab_size) - model_version = 'clip_original' -zeroshot_weights = zeroshot_classifier(activitynet_classes, activitynet_templates, device) -print(zeroshot_weights.keys()) +# zeroshot_weights = zeroshot_classifier(activitynet_classes, activitynet_templates, device) +zeroshot_weights = zeroshot_classifier_with_descriptions(activitynet_classes, activitynet_templates, descriptions, device) + -data_root_path = f'/home/aoq234/akata-shared/aoq234/avzsl/{model_version}/avgzsl_benchmark_datasets/ActivityNet/features/cls_features_non_averaged' +print(zeroshot_weights.keys()) +# data_root_path = '/home/wh/clip_original/avgzsl_benchmark_datasets/UCF/features/cls_features_non_averaged' +data_root_path = f'/home/wh/{model_version}/avgzsl_benchmark_datasets/ActivityNet/features/cls_features_non_averaged' data_path = os.path.join(data_root_path, 
'text') if not(os.path.exists(data_path)): os.makedirs(data_path) -filename = os.path.join(data_path, 'word_embeddings_activitynet_normed.npy') +# filename = os.path.join(data_path, 'word_embeddings_activitynet_normed.npy') +word_embedding = 'word_embeddings_activitynet_description_normed' +file_extension = '.npy' +current_time = datetime.now().strftime("%Y%m%d_%H%M%S") +new_filename = f"{word_embedding}_{current_time}{file_extension}" +filename = os.path.join(data_path, new_filename) np.save(filename, zeroshot_weights) @@ -149,6 +199,25 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) return zeroshot_weights +def wavcaps_zeroshot_classifier_with_descriptions(classnames, templates, descriptions, device): + with torch.no_grad(): + zeroshot_weights = {} + for idx, classname in enumerate(tqdm(classnames)): + texts = [] + for template in templates: + base_text = template.format(classname) + for desc_key in ["description_1", "description_2", "description_3"]: + desc = descriptions[desc_key][idx] + text = f"{base_text} {desc}" + embedding = wavcaps_model.encode_text([text]) + embedding /= embedding.norm(dim=-1, keepdim=True) + texts.append(embedding) + class_embeddings = torch.cat(texts, dim=0) + class_embedding = class_embeddings.mean(dim=0) + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + return zeroshot_weights + @@ -187,22 +256,26 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): ] -with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +# with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +with open("../WavCaps/retrieval/settings/inference.yaml", "r") as f: config = yaml.safe_load(f) -device = 'cuda:3' +# device = 'cuda:3' +device = 'cuda:0' wavcaps_model = ASE(config) 
wavcaps_model.to(device) -cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' +# cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' +cp_path = '/home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/pretrained_models/HTSAT_BERT_zero_shot.pt' state_dict_key = 'model' cp = torch.load(cp_path) wavcaps_model.load_state_dict(cp[state_dict_key]) wavcaps_model.eval() print("Model weights loaded from {}".format(cp_path)) -wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier(activitynet_classes, activitynet_audio_templates, device) +# wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier(activitynet_classes, activitynet_audio_templates, device) +wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier_with_descriptions(activitynet_classes, activitynet_audio_templates, descriptions, device) print(wavecaps_zeroshot_weights.keys()) @@ -210,8 +283,12 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): if not(os.path.exists(data_path)): os.makedirs(data_path) -filename = os.path.join(data_path, 'wavcaps_word_embeddings_activitynet_normed.npy') +# filename = os.path.join(data_path, 'wavcaps_word_embeddings_activitynet_normed.npy') +wavcaps_word_embedding = 'wavcaps_word_embeddings_activitynet_description_normed' +current_time = datetime.now().strftime("%Y%m%d_%H%M%S") +new_filename = f"{wavcaps_word_embedding}_{current_time}{file_extension}" +filename = os.path.join(data_path, new_filename) np.save(filename, wavecaps_zeroshot_weights) diff --git a/clip_embeddings_extraction/get_clip_embeddings_ucf.py b/clip_embeddings_extraction/get_clip_embeddings_ucf.py index 1307149..78aaa32 100644 --- a/clip_embeddings_extraction/get_clip_embeddings_ucf.py +++ b/clip_embeddings_extraction/get_clip_embeddings_ucf.py @@ -10,26 +10,217 @@ # from prompt_toolkit import prompt import pandas as pd from tqdm import tqdm +# from 
ClipClap-GZSL.WavCaps.retrieval.models.ase_model import ASE +import os, sys +# sys.path.append(os.getcwd()) +base_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) +sys.path.append(base_dir) from WavCaps.retrieval.models.ase_model import ASE +# from /home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/models/ase_model.py from ruamel import yaml +from datetime import datetime +# 从CSV文件中加载UCF类别描述 +df2 = pd.read_csv('../avgzsl_benchmark_non_averaged_datasets/UCF/class-split/UCF.csv') + +# 加载动作名称的最大补充描述 +# ucf_classes = df2['name'].tolist() +descriptions = { + "description_1": df2['description_1'].tolist(), + "description_2": df2['description_2'].tolist(), + "description_3": df2['description_3'].tolist(), +} + +# 传入零样本分类器 +# zeroshot_weights = zeroshot_classifier_with_descriptions(ucf_classes, ucf_templates, descriptions, device) + + +# 根据提示模板使用CLIP对类别标签进行嵌入 def zeroshot_classifier(classnames, templates, device): with torch.no_grad(): zeroshot_weights = {} for classname in tqdm(classnames): - texts = [template.format(classname) for template in templates] #format with class - texts = clip.tokenize(texts).to(device) #tokenize - class_embeddings = model.encode_text(texts) #embed with text encoder + texts = [template.format(classname) for template in templates] #format with class根据模板生成具体文本 + + texts = clip.tokenize(texts).to(device) #tokenize 将文本转换为模型可处理的输入 + class_embeddings = model.encode_text(texts) #embed with text encoder 使用 CLIP 模型生成文本嵌入 + class_embeddings /= class_embeddings.norm(dim=-1, keepdim=True) # 每个嵌入向量归一化 + class_embedding = class_embeddings.mean(dim=0)# 对模板生成的所有嵌入取平均值 + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + # zeroshot_weights = torch.stack(zeroshot_weights, dim=1).to(device) + return zeroshot_weights + + +# 在类别文本模板后添加补充描述 +def zeroshot_classifier_with_descriptions(classnames, templates, descriptions, device): + + with torch.no_grad(): + 
zeroshot_weights = {} + + # 遍历每个类别的动作名称 + for idx, classname in enumerate(tqdm(classnames)): + texts = [] + + # 处理每个模板,将补充描述添加到动作文本中 + for template in templates: + # 获取对应类别的补充描述 + description_1 = descriptions["description_1"][idx] + description_2 = descriptions["description_2"][idx] + description_3 = descriptions["description_3"][idx] + + # 拼接描述到模板后面 + text_with_descriptions = f"{template.format(classname)} {description_1} {description_2} {description_3}" + texts.append(text_with_descriptions) + + # Tokenize模板+描述 + tokens = clip.tokenize(texts).to(device) + + # 生成嵌入向量 + class_embeddings = model.encode_text(tokens) class_embeddings /= class_embeddings.norm(dim=-1, keepdim=True) + + # 对所有模板的嵌入取均值归一化,生成该类别的权重 class_embedding = class_embeddings.mean(dim=0) class_embedding /= class_embedding.norm() + + # 保存到字典 zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) - # zeroshot_weights = torch.stack(zeroshot_weights, dim=1).to(device) + return zeroshot_weights +# 将类别名称、模板和描述组合在一起时,生成的文本太长,超过了CLIP模型的上下文长度限制(77个token) +def zeroshot_classifier_with_descriptions2(classnames, templates, descriptions, device): + with torch.no_grad(): + zeroshot_weights = {} + + for idx, classname in enumerate(tqdm(classnames)): + all_embeddings = [] + + # 处理每个模板 + for template in templates: + base_text = template.format(classname) + + # 方案1: 只使用第一个描述,避免文本过长 + # description_1 = descriptions["description_1"][idx] + # text = f"{base_text} {description_1}" + # + # # 确保文本不会太长 + # if len(text.split()) > 50: # 粗略估计token数量 + # text = " ".join(text.split()[:50]) + # + # tokens = clip.tokenize([text]).to(device) + # embedding = model.encode_text(tokens) + # embedding /= embedding.norm(dim=-1, keepdim=True) + # all_embeddings.append(embedding) + + # 方案2: 如果需要使用所有描述,可以分别处理每个描述 + for desc_key in ["description_1", "description_2", "description_3"]: + desc = descriptions[desc_key][idx] + text = f"{base_text} {desc}" + # if len(text.split()) > 50: + # text = " 
".join(text.split()[:50]) + tokens = clip.tokenize(text).to(device) + embedding = model.encode_text(tokens) + embedding /= embedding.norm(dim=-1, keepdim=True) + all_embeddings.append(embedding) + + # 合并所有嵌入 + all_embeddings = torch.cat(all_embeddings, dim=0) + class_embedding = all_embeddings.mean(dim=0) + class_embedding /= class_embedding.norm() + + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + + return zeroshot_weights -df = pd.read_csv('/home/aoq234/thesis/ClipClap-GZSL/avgzsl_benchmark_non_averaged_datasets/UCF/class-split/ucf_clip_class_names.csv') +#KDA方式实现 +def generate_zeroshot_weights(classnames): + """ + 生成零样本分类的权重字典,键为类名,值为嵌入向量 + + Args: + attributes_ids: 需要处理的类别ID列表 + + Returns: + zeroshot_weights: 字典,键为类名,值为嵌入向量 + """ + zeroshot_weights = {} + act_name = df2["name"].tolist() + act_1 = df2["description_1"].tolist() + act_2 = df2["description_2"].tolist() + act_3 = df2["description_3"].tolist() + + # 确保索引在有效范围内 + # valid_ids = [i for i in attributes_ids if i < len(act_name)] + + for class_id, classname in enumerate(tqdm(classnames)): + class_name = act_name[class_id] + + # 获取该类别的所有描述 + descriptions = [ + # act_name[class_id], # 类名本身 + act_1[class_id], # 描述1 + act_2[class_id], # 描述2 + act_3[class_id] # 描述3 + ] + + # 使用CLIP模型处理所有描述 + with torch.no_grad(): + # 对每个描述进行编码 + text_embeds_list = [] + for desc in descriptions: + # 确保描述不为空 + if not isinstance(desc, str) or not desc.strip(): + continue + + # 使用CLIP tokenizer和模型处理文本 + inputs = clip.tokenize([desc], return_tensors="pt") + inputs = {key: value.to(device) for key, value in inputs.items()} + + # 获取文本嵌入 + text_embed = clip(**inputs).text_embeds + + # 归一化嵌入向量 + text_embed = text_embed / text_embed.norm(dim=-1, keepdim=True) + text_embeds_list.append(text_embed) + + # 如果有有效的描述 + if text_embeds_list: + # 堆叠所有嵌入并取平均值 + all_embeds = torch.cat(text_embeds_list, dim=0) + class_embedding = all_embeds.mean(dim=0) + + # 再次归一化 + class_embedding = class_embedding / 
class_embedding.norm() + + # 存储到字典中 + zeroshot_weights[class_name] = class_embedding.cpu().detach().numpy().astype(np.float32) + + return zeroshot_weights + + +def zeroshot_classifier_descriptions_non_templates(classnames, templates, descriptions, device): + with torch.no_grad(): + zeroshot_weights = {} + texts = [] + for idx, classname in enumerate(tqdm(classnames)): + description_1 = descriptions["description_1"][idx] + text = f"{description_1}" + texts.append(text) + + # 合并所有嵌入 + texts = clip.tokenize(texts).to(device) # tokenize 将文本转换为模型可处理的输入 + class_embeddings = model.encode_text(texts) # embed with text encoder 使用 CLIP 模型生成文本嵌入 + class_embeddings /= class_embeddings.norm(dim=-1, keepdim=True) # 每个嵌入向量归一化 + class_embedding = class_embeddings.mean(dim=0) # 对模板生成的所有嵌入取平均值 + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + return zeroshot_weights + +# df = pd.read_csv('/home/aoq234/thesis/ClipClap-GZSL/avgzsl_benchmark_non_averaged_datasets/UCF/class-split/ucf_clip_class_names.csv') +df = pd.read_csv('../avgzsl_benchmark_non_averaged_datasets/UCF/class-split/ucf_clip_class_names.csv') ucf_classes = df['clip_class_name'].tolist() ucf_templates = [ @@ -85,7 +276,8 @@ def zeroshot_classifier(classnames, templates, device): -device = 'cuda:3' +# device = 'cuda:3' +device = 'cuda:0' model, preprocess = clip.load("ViT-B/32", device=device) @@ -105,14 +297,27 @@ def zeroshot_classifier(classnames, templates, device): -zeroshot_weights = zeroshot_classifier(ucf_classes, ucf_templates, device) +# zeroshot_weights = zeroshot_classifier(ucf_classes, ucf_templates, device) +# 将对类别的文本描述加入到文本嵌入当中 +# zeroshot_weights = zeroshot_classifier_with_descriptions(ucf_classes, ucf_templates, descriptions, device) +zeroshot_weights = zeroshot_classifier_with_descriptions2(ucf_classes, ucf_templates, descriptions, device) +# zeroshot_weights = zeroshot_classifier_descriptions_non_templates(ucf_classes, 
ucf_templates, descriptions, device) +# zeroshot_weights = generate_zeroshot_weights(ucf_classes) + print(zeroshot_weights.keys()) -data_root_path = '/home/aoq234/akata-shared/aoq234/avzsl/clip_original/avgzsl_benchmark_datasets/UCF/features/cls_features_non_averaged' +# data_root_path = '/home/aoq234/akata-shared/aoq234/avzsl/clip_original/avgzsl_benchmark_datasets/UCF/features/cls_features_non_averaged' +data_root_path = '/home/wh/clip_original/avgzsl_benchmark_datasets/UCF/features/cls_features_non_averaged' data_path = os.path.join(data_root_path, 'text') if not(os.path.exists(data_path)): os.makedirs(data_path) -filename = os.path.join(data_path, 'word_embeddings_ucf_normed.npy') +# filename = os.path.join(data_path, 'word_embeddings_ucf_normed.npy') +word_embedding = 'word_embeddings_ucf_description_normed' +file_extension = '.npy' +current_time = datetime.now().strftime("%Y%m%d_%H%M%S") +new_filename = f"{word_embedding}_{current_time}{file_extension}" +filename = os.path.join(data_path, new_filename) +# filename = os.path.join(data_path, 'word_embeddings_ucf_description_normed.npy') np.save(filename, zeroshot_weights) @@ -143,6 +348,70 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) return zeroshot_weights +# 在类别文本模板后添加补充描述 +def wavcaps_zeroshot_classifier_with_descriptions(classnames, templates, descriptions, device): + + with torch.no_grad(): + zeroshot_weights = {} + + # 遍历每个类别的动作名称 + for idx, classname in enumerate(tqdm(classnames)): + texts = [] + + # 处理每个模板,将补充描述添加到动作文本中 + for template in templates: + # 获取对应类别的补充描述 + description_1 = descriptions["description_1"][idx] + description_2 = descriptions["description_2"][idx] + description_3 = descriptions["description_3"][idx] + + # 拼接描述到模板后面 + text_with_descriptions = f"{template.format(classname)} {description_1} {description_2} {description_3}" + texts.append(text_with_descriptions) + + 
class_embeddings = wavcaps_model.encode_text(texts) # embed with text encoder + class_embedding = class_embeddings.mean(dim=0) + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + return zeroshot_weights + + +def wavcaps_zeroshot_classifier_with_descriptions2(classnames, templates, descriptions, device): + with torch.no_grad(): + zeroshot_weights = {} + + for idx, classname in enumerate(tqdm(classnames)): + texts = [] + + for template in templates: + base_text = template.format(classname) + + # 只使用第一个描述 + # description_1 = descriptions["description_1"][idx] + # text = f"{base_text} {description_1}" + # + # # 确保文本不会太长 + # if len(text.split()) > 50: + # text = " ".join(text.split()[:50]) + # embedding = wavcaps_model.encode_text([text]) + # embedding /= embedding.norm(dim=-1, keepdim=True) + # texts.append(embedding) + for desc_key in ["description_1", "description_2", "description_3"]: + desc = descriptions[desc_key][idx] + text = f"{base_text} {desc}" + # if len(text.split()) > 50: + # text = " ".join(text.split()[:50]) + + embedding = wavcaps_model.encode_text([text]) + embedding /= embedding.norm(dim=-1, keepdim=True) + texts.append(embedding) + + class_embeddings = torch.cat(texts, dim=0) + class_embedding = class_embeddings.mean(dim=0) + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + + return zeroshot_weights @@ -181,20 +450,25 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): ] -with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +# with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +with open("/home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: config = yaml.safe_load(f) -device = 'cuda:3' +# device = 'cuda:3' +device = 'cuda:0' wavcaps_model = 
ASE(config) wavcaps_model.to(device) -cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' +# cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' +cp_path = '/home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/pretrained_models/HTSAT_BERT_zero_shot.pt' state_dict_key = 'model' cp = torch.load(cp_path) wavcaps_model.load_state_dict(cp[state_dict_key]) wavcaps_model.eval() print("Model weights loaded from {}".format(cp_path)) -wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier(ucf_classes, ucf_audio_templates, device) +# wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier(ucf_classes, ucf_audio_templates, device) +# wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier_with_descriptions(ucf_classes, ucf_audio_templates,descriptions, device) +wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier_with_descriptions2(ucf_classes, ucf_audio_templates,descriptions, device) print(wavecaps_zeroshot_weights.keys()) @@ -202,8 +476,13 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): if not(os.path.exists(data_path)): os.makedirs(data_path) -filename = os.path.join(data_path, 'wavcaps_word_embeddings_ucf_normed.npy') - +# filename = os.path.join(data_path, 'wavcaps_word_embeddings_ucf_normed.npy') +# filename = os.path.join(data_path, 'wavcaps_word_embeddings_ucf_description_normed.npy') +wavcaps_word_embedding = 'wavcaps_word_embeddings_ucf_description_normed' +# file_extension = '.npy' +current_time = datetime.now().strftime("%Y%m%d_%H%M%S") +new_filename = f"{wavcaps_word_embedding}_{current_time}{file_extension}" +filename = os.path.join(data_path, new_filename) np.save(filename, wavecaps_zeroshot_weights) diff --git a/clip_embeddings_extraction/get_clip_embeddings_vggsound.py b/clip_embeddings_extraction/get_clip_embeddings_vggsound.py index 4fccec3..eda08c2 100644 --- 
a/clip_embeddings_extraction/get_clip_embeddings_vggsound.py +++ b/clip_embeddings_extraction/get_clip_embeddings_vggsound.py @@ -10,11 +10,18 @@ # from prompt_toolkit import prompt import pandas as pd from tqdm import tqdm + +# 解决pycharm有时索引不到文件 +import os, sys +# sys.path.append(os.getcwd()) +base_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) +sys.path.append(base_dir) + from WavCaps.retrieval.models.ase_model import ASE from ruamel import yaml import argparse from src.args import str_to_bool - +from datetime import datetime def zeroshot_classifier(classnames, templates, device): with torch.no_grad(): @@ -30,11 +37,47 @@ def zeroshot_classifier(classnames, templates, device): # zeroshot_weights = torch.stack(zeroshot_weights, dim=1).to(device) return zeroshot_weights +# 从CSV文件中加载UCF类别描述 +df2 = pd.read_csv('../avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/VGGSound.csv') +descriptions = { + "description_1": df2['description_1'].tolist(), + "description_2": df2['description_2'].tolist(), + "description_3": df2['description_3'].tolist(), +} +# 将类别名称、模板和描述组合在一起时,生成的文本太长,超过了CLIP模型的上下文长度限制(77个token) +def zeroshot_classifier_with_descriptions(classnames, templates, descriptions, device): + with torch.no_grad(): + zeroshot_weights = {} + + for idx, classname in enumerate(tqdm(classnames)): + all_embeddings = [] + + # 处理每个模板 + for template in templates: + base_text = template.format(classname) + # 方案2: 如果需要使用所有描述,可以分别处理每个描述 + for desc_key in ["description_1", "description_2", "description_3"]: + desc = descriptions[desc_key][idx] + text = f"{base_text} {desc}" + tokens = clip.tokenize(text).to(device) + embedding = model.encode_text(tokens) + embedding /= embedding.norm(dim=-1, keepdim=True) + all_embeddings.append(embedding) + + # 合并所有嵌入 + all_embeddings = torch.cat(all_embeddings, dim=0) + class_embedding = all_embeddings.mean(dim=0) + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = 
class_embedding.cpu().detach().numpy().astype(np.float32) + + return zeroshot_weights -df = pd.read_csv('/home/aoq234/akata-shared/aoq234/avzsl/clip_original/avgzsl_benchmark_datasets/VGGSound/class-split/vggsound_w2v_class_names.csv') -vggsound_classes = df['manual'].tolist() +# df = pd.read_csv('../avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/vggsound_w2v_class_names.csv') +# df = pd.read_csv('../avgzsl_benchmark_non_averaged_datasets/VGGSound/class-split/vggsound_w2v_class_names.csv') +# vggsound_classes = df['manual'].tolist() +vggsound_classes = df2['name'].tolist() # vggsound_templates = [ @@ -102,7 +145,8 @@ def zeroshot_classifier(classnames, templates, device): -device = 'cuda:3' +# device = 'cuda:3' +device = 'cuda:0' model, preprocess = clip.load("ViT-B/32", device=device) @@ -122,15 +166,23 @@ def zeroshot_classifier(classnames, templates, device): model_version = 'clip_original' -zeroshot_weights = zeroshot_classifier(vggsound_classes, vggsound_templates, device) +# zeroshot_weights = zeroshot_classifier(vggsound_classes, vggsound_templates, device) +zeroshot_weights = zeroshot_classifier_with_descriptions(vggsound_classes, vggsound_templates, descriptions, device) + print(zeroshot_weights.keys()) -data_root_path = f'/home/aoq234/akata-shared/aoq234/avzsl/{model_version}/avgzsl_benchmark_datasets/VGGSound/features/cls_features_non_averaged' +data_root_path = f'/home/wh/{model_version}/avgzsl_benchmark_datasets/VGGSound/features/cls_features_non_averaged' data_path = os.path.join(data_root_path, 'text') if not(os.path.exists(data_path)): os.makedirs(data_path) -filename = os.path.join(data_path, 'word_embeddings_vggsound_normed.npy') +# filename = os.path.join(data_path, 'word_embeddings_vggsound_normed.npy') + +word_embedding = 'word_embeddings_vggsound_description_normed' +file_extension = '.npy' +current_time = datetime.now().strftime("%Y%m%d_%H%M%S") +new_filename = f"{word_embedding}_{current_time}{file_extension}" +filename = 
os.path.join(data_path, new_filename) np.save(filename, zeroshot_weights) @@ -160,7 +212,24 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) return zeroshot_weights - +def wavcaps_zeroshot_classifier_with_descriptions(classnames, templates, descriptions, device): + with torch.no_grad(): + zeroshot_weights = {} + for idx, classname in enumerate(tqdm(classnames)): + texts = [] + for template in templates: + base_text = template.format(classname) + for desc_key in ["description_1", "description_2", "description_3"]: + desc = descriptions[desc_key][idx] + text = f"{base_text} {desc}" + embedding = wavcaps_model.encode_text([text]) + embedding /= embedding.norm(dim=-1, keepdim=True) + texts.append(embedding) + class_embeddings = torch.cat(texts, dim=0) + class_embedding = class_embeddings.mean(dim=0) + class_embedding /= class_embedding.norm() + zeroshot_weights[classname] = class_embedding.cpu().detach().numpy().astype(np.float32) + return zeroshot_weights @@ -211,22 +280,32 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): ] -with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +# with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +with open("../WavCaps/retrieval/settings/inference.yaml", "r") as f: config = yaml.safe_load(f) -device = 'cuda:3' +# device = 'cuda:3' +device = 'cuda:0' wavcaps_model = ASE(config) wavcaps_model.to(device) -cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' +# cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' +cp_path = '/home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/pretrained_models/HTSAT_BERT_zero_shot.pt' state_dict_key = 'model' cp = torch.load(cp_path) 
wavcaps_model.load_state_dict(cp[state_dict_key]) wavcaps_model.eval() print("Model weights loaded from {}".format(cp_path)) -wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier(vggsound_classes, vggsound_audio_templates, device) +df3 = pd.read_csv('/home/wh/PycharmProjects/KDA/avgzsl_benchmark_datasets/VGGSound/class-split/VGGSound.csv') +descriptions = { + "description_1": df3['description_1'].tolist(), + "description_2": df3['description_2'].tolist(), + "description_3": df3['description_3'].tolist(), +} +# wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier(vggsound_classes, vggsound_audio_templates, device) +wavecaps_zeroshot_weights = wavcaps_zeroshot_classifier_with_descriptions(vggsound_classes, vggsound_audio_templates, descriptions, device) print(wavecaps_zeroshot_weights.keys()) @@ -234,8 +313,12 @@ def wavcaps_zeroshot_classifier(classnames, templates, device): if not(os.path.exists(data_path)): os.makedirs(data_path) -filename = os.path.join(data_path, 'wavcaps_word_embeddings_vggsound_normed.npy') +# filename = os.path.join(data_path, 'wavcaps_word_embeddings_vggsound_normed.npy') +wavcaps_word_embedding = 'wavcaps_word_embeddings_vggsound_description_normed' +current_time = datetime.now().strftime("%Y%m%d_%H%M%S") +new_filename = f"{wavcaps_word_embedding}_{current_time}{file_extension}" +filename = os.path.join(data_path, new_filename) np.save(filename, wavecaps_zeroshot_weights) diff --git a/clip_feature_extraction/get_clip_features_ucf.py b/clip_feature_extraction/get_clip_features_ucf.py index 1bff342..93e8731 100644 --- a/clip_feature_extraction/get_clip_features_ucf.py +++ b/clip_feature_extraction/get_clip_features_ucf.py @@ -7,6 +7,9 @@ sys.path.append("..") from tqdm import tqdm import torch +import os, sys +base_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) +sys.path.append(base_dir) from c3d.c3d import C3D import torchvision import csv @@ -23,6 +26,9 @@ import soundfile as sf import librosa import 
torch.nn.functional as F + + + from WavCaps.retrieval.models.ase_model import ASE import argparse from src.args import str_to_bool @@ -54,8 +60,10 @@ def read_prepare_audio(audio_path, device): -device = 'cuda:4' +# device = 'cuda:4' +device = 'cuda:0' model, preprocess = clip.load("ViT-B/32", device=device) +# 作者自己对特征提取模型进行了微调,但论文中并没有对其进行微调,可以忽略 if args.finetuned_model == True: model_path = '/home/aoq234/dev/ClipClap/logs/clip_finetuning/second_try_Aug25_19-53-14_475888_callisto/checkpoints/clip_finetuned.pt' save_path = '/home/aoq234/akata-shared/aoq234/mnt/ucf_features_finetuned_clip_wavcaps' @@ -63,7 +71,8 @@ def read_prepare_audio(audio_path, device): model.load_state_dict(checkpoint['model_state_dict']) else: model_path = "ViT-B/32" - save_path = '/home/aoq234/akata-shared/aoq234/mnt/ucf_features_original_clip_wavcaps' + # save_path = '/home/aoq234/akata-shared/aoq234/mnt/ucf_features_original_clip_wavcaps' + save_path = '/home/wh/clip_original/ucf_features_original_clip_wavcaps' model = model.to(device) @@ -86,7 +95,8 @@ def read_prepare_audio(audio_path, device): output_list_no_average=[] -path=Path("/home/aoq234/akata-shared/datasets/UCF101/UCF-101") # path to search for videos +# path=Path("/home/aoq234/akata-shared/datasets/UCF101/UCF-101") # path to search for videos +path=Path("/home/wh/work/dataset/UCF101/UCF-101") # path to search for videos dict_csv={} list_classes=[] @@ -106,7 +116,8 @@ def read_prepare_audio(audio_path, device): -with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +# with open("/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: +with open("/home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/settings/inference.yaml", "r") as f: config = yaml.safe_load(f) @@ -118,7 +129,8 @@ def read_prepare_audio(audio_path, device): cp_path = '/home/aoq234/dev/ClipClap/logs/wavcaps_finetuning/first_try_Aug29_07-25-05_613403_callisto/checkpoints/WavCaps_finetuned.pt' 
state_dict_key = 'model_state_dict' else: - cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' + # cp_path = '/home/aoq234/dev/CLIP-GZSL/WavCaps/retrieval/pretrained_models/audio_encoders/HTSAT_BERT_zero_shot.pt' + cp_path = '/home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/WavCaps/retrieval/pretrained_models/HTSAT_BERT_zero_shot.pt' state_dict_key = 'model' cp = torch.load(cp_path) @@ -142,8 +154,10 @@ def read_prepare_audio(audio_path, device): try: # audio mp4_version = AudioSegment.from_file(str(f), "avi") - mp4_version.export("/home/aoq234/akata-shared/aoq234/mnt/ucf_dummy_tmp.wav", format="wav") - audio = read_prepare_audio("/home/aoq234/akata-shared/aoq234/mnt/ucf_dummy_tmp.wav", device) + # mp4_version.export("/home/aoq234/akata-shared/aoq234/mnt/ucf_dummy_tmp.wav", format="wav") + mp4_version.export("/home/wh/clip_original/ucf_dummy_tmp.wav", format="wav") + # audio = read_prepare_audio("/home/aoq234/akata-shared/aoq234/mnt/ucf_dummy_tmp.wav", device) + audio = read_prepare_audio("/home/wh/clip_original/ucf_dummy_tmp.wav", device) with torch.no_grad(): audio_emb = wavcaps_model.encode_audio(audio).squeeze() diff --git a/clipclap.yml b/clipclap.yml index dcf33d0..f9e5392 100644 --- a/clipclap.yml +++ b/clipclap.yml @@ -170,7 +170,7 @@ dependencies: - antlr4-python3-runtime==4.8 - click==8.1.3 - configargparse==1.5.3 - - docker-pycreds==0.4.0 + - docker-pycreds==0.4.0k - efficientnet-pytorch==0.7.1 - filelock==3.0.12 - gdown==3.13.0 diff --git a/clipclap_feature_extraction.yml b/clipclap_feature_extraction.yml index 767147b..c117339 100644 --- a/clipclap_feature_extraction.yml +++ b/clipclap_feature_extraction.yml @@ -99,7 +99,6 @@ dependencies: - cachetools==5.2.0 - charset-normalizer==2.1.1 - click==8.1.3 - - clip==1.0 - configargparse==1.7 - cycler==0.11.0 - decorator==4.4.2 @@ -196,3 +195,4 @@ dependencies: - werkzeug==2.2.2 - yarl==1.8.2 - zipp==3.11.0 + - clip==1.0 diff --git a/commands.sh 
b/commands.sh index d6701c7..681d5f0 100644 --- a/commands.sh +++ b/commands.sh @@ -1,4 +1,14 @@ - +# UCF +python3 main.py --cfg config/clipclap.yaml + --root_dir /home/wh/work/data/clipclap/UCF + --log_dir /home/wh/.ssh/ClipClap-GZSL/ClipClap-GZSL/logs/ClipClap_UCF + --dataset_name UCF + --epochs 20 + --lr 0.00007 + --use_wavcaps_embeddings True + --modality both + --word_embeddings both + --run all diff --git a/splitting_scripts_cls/create_pkl_files_cls.py b/splitting_scripts_cls/create_pkl_files_cls.py index 81367d1..ea48d95 100644 --- a/splitting_scripts_cls/create_pkl_files_cls.py +++ b/splitting_scripts_cls/create_pkl_files_cls.py @@ -137,6 +137,7 @@ def save_pickle_files(which_dataset, use_audio, root_path, original_dataset_path # call for UCF # python splitting_scripts_cls/create_pkl_files_cls.py --dataset_name UCF --path_original_dataset /home/aoq234/akata-shared/aoq234/mnt/ucf_features_original_clip_wavcaps --path_splitted_dataset /home/aoq234/akata-shared/aoq234/avzsl/clip_original +# python splitting_scripts_cls/create_pkl_files_cls.py --dataset_name UCF --path_original_dataset /home/wh/clip_original/ucf_features_original_clip_wavcaps --path_splitted_dataset /home/wh/avzsl/clip_original diff --git a/src/clipclap_model.py b/src/clipclap_model.py index f5f9e71..c3834f3 100644 --- a/src/clipclap_model.py +++ b/src/clipclap_model.py @@ -14,7 +14,7 @@ # user defined from src.optimizer import SAM - +from einops.layers.torch import Rearrange torch.set_printoptions(threshold=10_000) def disable_running_stats(model): def _disable(module): @@ -68,45 +68,143 @@ def get_embedding(self, x): +class PreNorm(nn.Module): + def __init__(self, dim, fn): + super().__init__() + self.norm = nn.LayerNorm(dim) + self.fn = fn + def forward(self, x, **kwargs): + return self.fn(self.norm(x), **kwargs) +class FeedForward(nn.Module): + def __init__(self, dim, hidden_dim, dropout = 0.): + super().__init__() + self.net = nn.Sequential( + nn.Linear(dim, hidden_dim), + nn.GELU(), + 
nn.Dropout(dropout), + nn.Linear(hidden_dim, dim), + nn.Dropout(dropout) + ) + def forward(self, x): + return self.net(x) +class Attention(nn.Module): + def __init__(self, dim, heads = 8, dim_head = 64, dropout = 0.): + super().__init__() + inner_dim = dim_head * heads + project_out = not (heads == 1 and dim_head == dim) + self.heads = heads + self.scale = dim_head ** -0.5 + self.attend = nn.Softmax(dim = -1) + self.to_qkv = nn.Linear(dim, inner_dim * 3, bias = False) + self.to_out = nn.Sequential( + nn.Linear(inner_dim, dim), + nn.Dropout(dropout) + ) if project_out else nn.Identity() + def forward(self, x): + qkv = self.to_qkv(x).chunk(3, dim = -1) + q, k, v = map(lambda t: rearrange(t, 'b n (h d) -> b h n d', h = self.heads), qkv) + dots = torch.matmul(q, k.transpose(-1, -2)) * self.scale + attn = self.attend(dots) + out = torch.matmul(attn, v) + out = rearrange(out, 'b h n d -> b n (h d)') + return self.to_out(out) +class Transformer(nn.Module): + def __init__(self, dim, depth, heads, dim_head, mlp_dim, dropout = 0.): + super().__init__() + self.layers = nn.ModuleList([]) + for _ in range(depth): + self.layers.append(nn.ModuleList([ + PreNorm(dim, Attention(dim, heads = heads, dim_head = dim_head, dropout = dropout)), + PreNorm(dim, FeedForward(dim, mlp_dim, dropout = dropout)) + ])) + def forward(self, x): + for attn, ff in self.layers: + x = attn(x) + x + x = ff(x) + x + return x + + +class AutoFusion(nn.Module): + """docstring for AutoFusion""" + def __init__(self, dim, hidden_dim): + super(AutoFusion, self).__init__() + + self.fuse_in = nn.Sequential( + nn.Linear(dim, hidden_dim//2), + nn.Tanh(), + nn.Linear(hidden_dim//2, dim), + nn.ReLU() + ) + self.fuse_out = nn.Sequential( + nn.Linear(dim, hidden_dim//2), + nn.ReLU(), + nn.Linear(hidden_dim//2, dim) + ) + self.criterion = nn.MSELoss() + + def forward(self, z): + compressed_z = self.fuse_in(z) + loss = self.criterion(self.fuse_out(compressed_z), z) + return compressed_z,loss + +class 
CosineSimilarityLoss(nn.Module): + def __init__(self): + super(CosineSimilarityLoss, self).__init__() + + def forward(self, input_vectors, target_vectors): + # 计算余弦相似度 + cosine_similarity = F.cosine_similarity(input_vectors, target_vectors) + + # 构建损失函数,使余弦相似度接近1 + loss = 1 - cosine_similarity + + return loss.mean() + +class MLP_block(nn.Module): + def __init__(self, input_size, hidden_size, dropout=0.5): + super().__init__() + self.net = nn.Sequential( + nn.Linear(input_size, hidden_size), + nn.GELU(), + nn.Dropout(dropout), + nn.Linear(hidden_size, input_size), + nn.Dropout(dropout) + ) + def forward(self, x): + x = self.net(x) + return x + + +class MLP_Communicator(nn.Module): + def __init__(self, token, channel, hidden_size, depth=1): + super(MLP_Communicator, self).__init__() + self.depth = depth + self.token_mixer = nn.Sequential( + Rearrange('b n d -> b d n'), + MLP_block(input_size=channel, hidden_size=hidden_size), + Rearrange('b n d -> b d n') + ) + self.channel_mixer = nn.Sequential( + MLP_block(input_size=token, hidden_size=hidden_size) + ) - - - - - - - - - - - - - - - - - - - - - - - - - - + def forward(self, x): + for _ in range(self.depth): + x = x + self.token_mixer(x) + x = x + self.channel_mixer(x) + return x class ClipClap_model(nn.Module): @@ -217,6 +315,18 @@ def __init__(self, params_model, input_size_audio, input_size_video): dropout=self.drop_proj_w, use_bn=params_model['embeddings_batch_norm'] ) + self.cross_attention = Transformer(512, 6, 8, 64, 512, dropout=0.2) + self.pos_emb1D = torch.nn.Parameter(torch.randn(1, 512)) + self.fu = AutoFusion( + dim=512, + hidden_dim=512, + ) + self.mlp = MLP_Communicator( + token=512, # token 的大小 + channel=1, # 通道的大小 + hidden_size=64, # 隐藏层的大小 + depth=1 # 深度 + ) @@ -282,6 +392,18 @@ def forward(self, a, v, w, masks, timesteps): o = self.O_enc(model_input) + # o = o.unsqueeze(1) + # #print(o.shape) + # o = self.mlp(o).squeeze(1) + + m, l = self.fu(o) + m = m + self.pos_emb1D[0, :] + m = m.unsqueeze(1) + 
#print(m.shape) + o = self.cross_attention(m).squeeze(1) + o = o.unsqueeze(1) + # print(o.shape)s + o = self.mlp(o).squeeze(1) w = self.W_enc(w) @@ -431,7 +553,16 @@ def get_embeddings(self, a, v, w, masks, timesteps): o = self.O_enc(model_input) - + # o = o.unsqueeze(1) + # #print(o.shape)s + # o = self.mlp(o).squeeze(1) + m, l = self.fu(o) + m = m + self.pos_emb1D[0, :] + m = m.unsqueeze(1) + o = self.cross_attention(m).squeeze(1) + o = o.unsqueeze(1) + # print(o.shape)s + o = self.mlp(o).squeeze(1) w = self.W_enc(w) diff --git a/src/dataset.py b/src/dataset.py index 8e26a08..06a60dd 100644 --- a/src/dataset.py +++ b/src/dataset.py @@ -110,11 +110,20 @@ def classes(self): @property def class_to_idx(self): - return {_class: i for i, _class in enumerate(sorted(self.all_class_names))} - + # 检查 self.all_class_names 是否已经被计算过 + if not hasattr(self, '_all_class_names_cache'): + self._all_class_names_cache = self.all_class_names + # return {_class: i for i, _class in enumerate(sorted(self.all_class_names))} + return {_class: i for i, _class in enumerate(sorted(self._all_class_names_cache))} @property def all_class_names(self): - return get_class_names(self.root / "class-split/all_class.txt") + # return get_class_names(self.root / "class-split/all_class.txt") + + if isinstance(self.root, Path): + path = self.root.joinpath("class-split", "all_class.txt") + else: + path = Path(self.root).joinpath("class-split", "all_class.txt") + return get_class_names(path) @property def seen_class_names(self): @@ -958,7 +967,16 @@ def class_to_idx(self): @property def all_class_names(self): - return get_class_names(self.root / "class-split/all_class.txt") + # return get_class_names(self.root / "class-split/all_class.txt") + # return get_class_names(self.root / "class-split" / "all_class.txt") + # return get_class_names(Path(self.root) / "class-split" / "all_class.txt") + # return get_class_names(Path(self.root).joinpath("class-split", "all_class.txt")) + + if isinstance(self.root, Path): 
+ path = self.root.joinpath("class-split", "all_class.txt") + else: + path = Path(self.root).joinpath("class-split", "all_class.txt") + return get_class_names(path) @property def seen_class_names(self): @@ -1275,7 +1293,14 @@ def class_to_idx(self): @property def all_class_names(self): - return get_class_names(self.root / "class-split/all_class.txt") + # return get_class_names(self.root / "class-split/all_class.txt") + return get_class_names(Path(self.root).joinpath("class-split", "all_class.txt")) + + # if isinstance(self.root, Path): + # path = self.root.joinpath("class-split", "all_class.txt") + # else: + # path = Path(self.root).joinpath("class-split", "all_class.txt") + # return get_class_names(path) @property def seen_class_names(self): diff --git a/src/utils.py b/src/utils.py index 99470ac..4ef7cf2 100644 --- a/src/utils.py +++ b/src/utils.py @@ -80,8 +80,8 @@ def log_hparams(writer, args, metrics): args_dict[k] = v.as_posix() del metrics["recall"] metrics = {"Eval/"+k: v for k,v in metrics.items()} - del args_dict['audio_hip_blocks'] - del args_dict['video_hip_blocks'] + # del args_dict['audio_hip_blocks'] + # del args_dict['video_hip_blocks'] writer.add_hparams(args_dict, metrics)