CovidSpeechChallenge_2021/vggish/vggish_params.py


# Copyright 2017 The TensorFlow Authors All Rights Reserved.

#

# Licensed under the Apache License, Version 2.0 (the "License");

# you may not use this file except in compliance with the License.

# You may obtain a copy of the License at

#

#     http://www.apache.org/licenses/LICENSE-2.0

#

# Unless required by applicable law or agreed to in writing, software

# distributed under the License is distributed on an "AS IS" BASIS,

# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

# See the License for the specific language governing permissions and

# limitations under the License.

# ==============================================================================


"""Global parameters for the VGGish model.


See vggish_slim.py for more information.

"""


# Architectural constants.

NUM_FRAMES = 96  # Frames in input mel-spectrogram patch.

NUM_BANDS = 64  # Frequency bands in input mel-spectrogram patch.

EMBEDDING_SIZE = 128  # Size of embedding layer.


# Hyperparameters used in feature and example generation.

SAMPLE_RATE = 16000

STFT_WINDOW_LENGTH_SECONDS = 0.025

STFT_HOP_LENGTH_SECONDS = 0.010

NUM_MEL_BINS = NUM_BANDS

MEL_MIN_HZ = 125

MEL_MAX_HZ = 7500

LOG_OFFSET = 0.01  # Offset used for stabilized log of input mel-spectrogram.

EXAMPLE_WINDOW_SECONDS = 0.96  # Each example contains 96 10ms frames

EXAMPLE_HOP_SECONDS = 0.96     # with zero overlap.


# Parameters used for embedding postprocessing.

PCA_EIGEN_VECTORS_NAME = 'pca_eigen_vectors'

PCA_MEANS_NAME = 'pca_means'

QUANTIZE_MIN_VAL = -2.0

QUANTIZE_MAX_VAL = +2.0


# Hyperparameters used in training.

INIT_STDDEV = 0.01  # Standard deviation used to initialize weights.

LEARNING_RATE = 1e-4  # Learning rate for the Adam optimizer.

ADAM_EPSILON = 1e-8  # Epsilon for the Adam optimizer.


# Names of ops, tensors, and features.

INPUT_OP_NAME = 'vggish/input_features'

INPUT_TENSOR_NAME = INPUT_OP_NAME + ':0'

OUTPUT_OP_NAME = 'vggish/embedding'

OUTPUT_TENSOR_NAME = OUTPUT_OP_NAME + ':0'

AUDIO_EMBEDDING_FEATURE_NAME = 'audio_embedding'
add VGGSH tool 2021-08-19 07:06:30 +00:00
			`# Copyright 2017 The TensorFlow Authors All Rights Reserved.`

			`#`

			`# Licensed under the Apache License, Version 2.0 (the "License");`

			`# you may not use this file except in compliance with the License.`

			`# You may obtain a copy of the License at`

			`#`

			`# http://www.apache.org/licenses/LICENSE-2.0`

			`#`

			`# Unless required by applicable law or agreed to in writing, software`

			`# distributed under the License is distributed on an "AS IS" BASIS,`

			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`

			`# See the License for the specific language governing permissions and`

			`# limitations under the License.`

			`# ==============================================================================`



			`"""Global parameters for the VGGish model.`



			`See vggish_slim.py for more information.`

			`"""`



			`# Architectural constants.`

			`NUM_FRAMES = 96 # Frames in input mel-spectrogram patch.`

			`NUM_BANDS = 64 # Frequency bands in input mel-spectrogram patch.`

			`EMBEDDING_SIZE = 128 # Size of embedding layer.`



			`# Hyperparameters used in feature and example generation.`

			`SAMPLE_RATE = 16000`

			`STFT_WINDOW_LENGTH_SECONDS = 0.025`

			`STFT_HOP_LENGTH_SECONDS = 0.010`

			`NUM_MEL_BINS = NUM_BANDS`

			`MEL_MIN_HZ = 125`

			`MEL_MAX_HZ = 7500`

			`LOG_OFFSET = 0.01 # Offset used for stabilized log of input mel-spectrogram.`

			`EXAMPLE_WINDOW_SECONDS = 0.96 # Each example contains 96 10ms frames`

			`EXAMPLE_HOP_SECONDS = 0.96 # with zero overlap.`



			`# Parameters used for embedding postprocessing.`

			`PCA_EIGEN_VECTORS_NAME = 'pca_eigen_vectors'`

			`PCA_MEANS_NAME = 'pca_means'`

			`QUANTIZE_MIN_VAL = -2.0`

			`QUANTIZE_MAX_VAL = +2.0`



			`# Hyperparameters used in training.`

			`INIT_STDDEV = 0.01 # Standard deviation used to initialize weights.`

			`LEARNING_RATE = 1e-4 # Learning rate for the Adam optimizer.`

			`ADAM_EPSILON = 1e-8 # Epsilon for the Adam optimizer.`



			`# Names of ops, tensors, and features.`

			`INPUT_OP_NAME = 'vggish/input_features'`

			`INPUT_TENSOR_NAME = INPUT_OP_NAME + ':0'`

			`OUTPUT_OP_NAME = 'vggish/embedding'`

			`OUTPUT_TENSOR_NAME = OUTPUT_OP_NAME + ':0'`

			`AUDIO_EMBEDDING_FEATURE_NAME = 'audio_embedding'`