88 lines
3.0 KiB
JSON
88 lines
3.0 KiB
JSON
{
|
|
"name": "mood acoustic",
|
|
"type": "multi-class classifier",
|
|
"link": "https://essentia.upf.edu/models/classifiers/mood_acoustic/mood_acoustic-musicnn-mtt-2.pb",
|
|
"version": "1",
|
|
"description": "classification of music by type of sound (acoustic/non-acoustic)",
|
|
"author": "Pablo Alonso",
|
|
"email": "pablo.alonso@upf.edu",
|
|
"release_date": "2020-07-07",
|
|
"framework": "tensorflow",
|
|
"framework_version": "1.15.0",
|
|
"classes": [
|
|
"acoustic",
|
|
"non_acoustic"
|
|
],
|
|
"model_types": [
|
|
"frozen_model"
|
|
],
|
|
"dataset": {
|
|
"name": "In-house MTG collection",
|
|
"citation": "@inproceedings{laurier2009music,\n title={Music mood annotator design and integration},\n author={Laurier, Cyril and Meyers, Owen and Serra, Joan and Blech, Martin and Herrera, Perfecto},\n booktitle={2009 Seventh International Workshop on Content-Based Multimedia Indexing},\n pages={156--161},\n year={2009},\n organization={IEEE}\n}",
|
|
"size": "321 full tracks + excerpts, 193/128 per class",
|
|
"metrics": {
|
|
"5-fold_cross_validation_normalized_accuracy": 0.93
|
|
}
|
|
},
|
|
"schema": {
|
|
"inputs": [
|
|
{
|
|
"name": "model/Placeholder",
|
|
"type": "float",
|
|
"shape": [
|
|
187,
|
|
96
|
|
]
|
|
}
|
|
],
|
|
"outputs": [
|
|
{
|
|
"name": "model/Sigmoid",
|
|
"type": "float",
|
|
"shape": [
|
|
1,
|
|
2
|
|
],
|
|
"op": "Sigmoid",
|
|
"output_purpose": "predictions"
|
|
},
|
|
{
|
|
"name": "model/dense_2/BiasAdd",
|
|
"type": "float",
|
|
"shape": [
|
|
1,
|
|
2
|
|
],
|
|
"op": "fully connected",
|
|
"description": "logits",
|
|
"output_purpose": ""
|
|
},
|
|
{
|
|
"name": "model/dense_1/BiasAdd",
|
|
"type": "float",
|
|
"shape": [
|
|
1,
|
|
100
|
|
],
|
|
"op": "fully connected",
|
|
"description": "penultimate layer",
|
|
"output_purpose": ""
|
|
},
|
|
{
|
|
"name": "model/dense/BiasAdd",
|
|
"type": "float",
|
|
"shape": [
|
|
1,
|
|
200
|
|
],
|
|
"op": "fully connected",
|
|
"output_purpose": "embeddings"
|
|
}
|
|
]
|
|
},
|
|
"citation": "@inproceedings{alonso2020tensorflow,\n title={Tensorflow Audio Models in Essentia},\n author={Alonso-Jim{\\'e}nez, Pablo and Bogdanov, Dmitry and Pons, Jordi and Serra, Xavier},\n booktitle={IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},\n year={2020}\n}",
|
|
"inference": {
|
|
"sample_rate": 16000,
|
|
"algorithm": "TensorflowPredictMusiCNN"
|
|
}
|
|
} |