Upload folder using huggingface_hub
Browse files- README.md +9 -0
 - config.json +139 -0
 - onnx/model.onnx +3 -0
 - onnx/model_bnb4.onnx +3 -0
 - onnx/model_fp16.onnx +3 -0
 - onnx/model_int8.onnx +3 -0
 - onnx/model_q4.onnx +3 -0
 - onnx/model_q4f16.onnx +3 -0
 - onnx/model_quantized.onnx +3 -0
 - onnx/model_uint8.onnx +3 -0
 - preprocessor_config.json +9 -0
 - quantize_config.json +18 -0
 
    	
        README.md
    ADDED
    
    | 
         @@ -0,0 +1,9 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            ---
         
     | 
| 2 | 
         
            +
            library_name: transformers.js
         
     | 
| 3 | 
         
            +
            base_model:
         
     | 
| 4 | 
         
            +
            - prithivMLmods/Speech-Emotion-Classification
         
     | 
| 5 | 
         
            +
            ---
         
     | 
| 6 | 
         
            +
             
     | 
| 7 | 
         
            +
            # Speech-Emotion-Classification (ONNX)
         
     | 
| 8 | 
         
            +
             
     | 
| 9 | 
         
            +
            This is an ONNX version of [prithivMLmods/Speech-Emotion-Classification](https://huggingface.co/prithivMLmods/Speech-Emotion-Classification). It was automatically converted and uploaded using [this space](https://huggingface.co/spaces/onnx-community/convert-to-onnx).
         
     | 
    	
        config.json
    ADDED
    
    | 
         @@ -0,0 +1,139 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            {
         
     | 
| 2 | 
         
            +
              "_attn_implementation_autoset": true,
         
     | 
| 3 | 
         
            +
              "_name_or_path": "prithivMLmods/Speech-Emotion-Classification",
         
     | 
| 4 | 
         
            +
              "activation_dropout": 0.0,
         
     | 
| 5 | 
         
            +
              "adapter_attn_dim": null,
         
     | 
| 6 | 
         
            +
              "adapter_kernel_size": 3,
         
     | 
| 7 | 
         
            +
              "adapter_stride": 2,
         
     | 
| 8 | 
         
            +
              "add_adapter": false,
         
     | 
| 9 | 
         
            +
              "apply_spec_augment": true,
         
     | 
| 10 | 
         
            +
              "architectures": [
         
     | 
| 11 | 
         
            +
                "Wav2Vec2ForSequenceClassification"
         
     | 
| 12 | 
         
            +
              ],
         
     | 
| 13 | 
         
            +
              "attention_dropout": 0.1,
         
     | 
| 14 | 
         
            +
              "bos_token_id": 1,
         
     | 
| 15 | 
         
            +
              "classifier_proj_size": 256,
         
     | 
| 16 | 
         
            +
              "codevector_dim": 256,
         
     | 
| 17 | 
         
            +
              "contrastive_logits_temperature": 0.1,
         
     | 
| 18 | 
         
            +
              "conv_bias": false,
         
     | 
| 19 | 
         
            +
              "conv_dim": [
         
     | 
| 20 | 
         
            +
                512,
         
     | 
| 21 | 
         
            +
                512,
         
     | 
| 22 | 
         
            +
                512,
         
     | 
| 23 | 
         
            +
                512,
         
     | 
| 24 | 
         
            +
                512,
         
     | 
| 25 | 
         
            +
                512,
         
     | 
| 26 | 
         
            +
                512
         
     | 
| 27 | 
         
            +
              ],
         
     | 
| 28 | 
         
            +
              "conv_kernel": [
         
     | 
| 29 | 
         
            +
                10,
         
     | 
| 30 | 
         
            +
                3,
         
     | 
| 31 | 
         
            +
                3,
         
     | 
| 32 | 
         
            +
                3,
         
     | 
| 33 | 
         
            +
                3,
         
     | 
| 34 | 
         
            +
                2,
         
     | 
| 35 | 
         
            +
                2
         
     | 
| 36 | 
         
            +
              ],
         
     | 
| 37 | 
         
            +
              "conv_stride": [
         
     | 
| 38 | 
         
            +
                5,
         
     | 
| 39 | 
         
            +
                2,
         
     | 
| 40 | 
         
            +
                2,
         
     | 
| 41 | 
         
            +
                2,
         
     | 
| 42 | 
         
            +
                2,
         
     | 
| 43 | 
         
            +
                2,
         
     | 
| 44 | 
         
            +
                2
         
     | 
| 45 | 
         
            +
              ],
         
     | 
| 46 | 
         
            +
              "ctc_loss_reduction": "sum",
         
     | 
| 47 | 
         
            +
              "ctc_zero_infinity": false,
         
     | 
| 48 | 
         
            +
              "diversity_loss_weight": 0.1,
         
     | 
| 49 | 
         
            +
              "do_stable_layer_norm": false,
         
     | 
| 50 | 
         
            +
              "eos_token_id": 2,
         
     | 
| 51 | 
         
            +
              "feat_extract_activation": "gelu",
         
     | 
| 52 | 
         
            +
              "feat_extract_norm": "group",
         
     | 
| 53 | 
         
            +
              "feat_proj_dropout": 0.1,
         
     | 
| 54 | 
         
            +
              "feat_quantizer_dropout": 0.0,
         
     | 
| 55 | 
         
            +
              "final_dropout": 0.0,
         
     | 
| 56 | 
         
            +
              "freeze_feat_extract_train": true,
         
     | 
| 57 | 
         
            +
              "hidden_act": "gelu",
         
     | 
| 58 | 
         
            +
              "hidden_dropout": 0.1,
         
     | 
| 59 | 
         
            +
              "hidden_size": 768,
         
     | 
| 60 | 
         
            +
              "id2label": {
         
     | 
| 61 | 
         
            +
                "0": "ANG",
         
     | 
| 62 | 
         
            +
                "1": "CAL",
         
     | 
| 63 | 
         
            +
                "2": "DIS",
         
     | 
| 64 | 
         
            +
                "3": "FEA",
         
     | 
| 65 | 
         
            +
                "4": "HAP",
         
     | 
| 66 | 
         
            +
                "5": "NEU",
         
     | 
| 67 | 
         
            +
                "6": "SAD",
         
     | 
| 68 | 
         
            +
                "7": "SUR"
         
     | 
| 69 | 
         
            +
              },
         
     | 
| 70 | 
         
            +
              "initializer_range": 0.02,
         
     | 
| 71 | 
         
            +
              "intermediate_size": 3072,
         
     | 
| 72 | 
         
            +
              "label2id": {
         
     | 
| 73 | 
         
            +
                "ANG": 0,
         
     | 
| 74 | 
         
            +
                "CAL": 1,
         
     | 
| 75 | 
         
            +
                "DIS": 2,
         
     | 
| 76 | 
         
            +
                "FEA": 3,
         
     | 
| 77 | 
         
            +
                "HAP": 4,
         
     | 
| 78 | 
         
            +
                "NEU": 5,
         
     | 
| 79 | 
         
            +
                "SAD": 6,
         
     | 
| 80 | 
         
            +
                "SUR": 7
         
     | 
| 81 | 
         
            +
              },
         
     | 
| 82 | 
         
            +
              "layer_norm_eps": 1e-05,
         
     | 
| 83 | 
         
            +
              "layerdrop": 0.0,
         
     | 
| 84 | 
         
            +
              "mask_channel_length": 10,
         
     | 
| 85 | 
         
            +
              "mask_channel_min_space": 1,
         
     | 
| 86 | 
         
            +
              "mask_channel_other": 0.0,
         
     | 
| 87 | 
         
            +
              "mask_channel_prob": 0.0,
         
     | 
| 88 | 
         
            +
              "mask_channel_selection": "static",
         
     | 
| 89 | 
         
            +
              "mask_feature_length": 10,
         
     | 
| 90 | 
         
            +
              "mask_feature_min_masks": 0,
         
     | 
| 91 | 
         
            +
              "mask_feature_prob": 0.0,
         
     | 
| 92 | 
         
            +
              "mask_time_length": 10,
         
     | 
| 93 | 
         
            +
              "mask_time_min_masks": 2,
         
     | 
| 94 | 
         
            +
              "mask_time_min_space": 1,
         
     | 
| 95 | 
         
            +
              "mask_time_other": 0.0,
         
     | 
| 96 | 
         
            +
              "mask_time_prob": 0.05,
         
     | 
| 97 | 
         
            +
              "mask_time_selection": "static",
         
     | 
| 98 | 
         
            +
              "model_type": "wav2vec2",
         
     | 
| 99 | 
         
            +
              "no_mask_channel_overlap": false,
         
     | 
| 100 | 
         
            +
              "no_mask_time_overlap": false,
         
     | 
| 101 | 
         
            +
              "num_adapter_layers": 3,
         
     | 
| 102 | 
         
            +
              "num_attention_heads": 12,
         
     | 
| 103 | 
         
            +
              "num_codevector_groups": 2,
         
     | 
| 104 | 
         
            +
              "num_codevectors_per_group": 320,
         
     | 
| 105 | 
         
            +
              "num_conv_pos_embedding_groups": 16,
         
     | 
| 106 | 
         
            +
              "num_conv_pos_embeddings": 128,
         
     | 
| 107 | 
         
            +
              "num_feat_extract_layers": 7,
         
     | 
| 108 | 
         
            +
              "num_hidden_layers": 12,
         
     | 
| 109 | 
         
            +
              "num_negatives": 100,
         
     | 
| 110 | 
         
            +
              "output_hidden_size": 768,
         
     | 
| 111 | 
         
            +
              "pad_token_id": 0,
         
     | 
| 112 | 
         
            +
              "proj_codevector_dim": 256,
         
     | 
| 113 | 
         
            +
              "tdnn_dilation": [
         
     | 
| 114 | 
         
            +
                1,
         
     | 
| 115 | 
         
            +
                2,
         
     | 
| 116 | 
         
            +
                3,
         
     | 
| 117 | 
         
            +
                1,
         
     | 
| 118 | 
         
            +
                1
         
     | 
| 119 | 
         
            +
              ],
         
     | 
| 120 | 
         
            +
              "tdnn_dim": [
         
     | 
| 121 | 
         
            +
                512,
         
     | 
| 122 | 
         
            +
                512,
         
     | 
| 123 | 
         
            +
                512,
         
     | 
| 124 | 
         
            +
                512,
         
     | 
| 125 | 
         
            +
                1500
         
     | 
| 126 | 
         
            +
              ],
         
     | 
| 127 | 
         
            +
              "tdnn_kernel": [
         
     | 
| 128 | 
         
            +
                5,
         
     | 
| 129 | 
         
            +
                3,
         
     | 
| 130 | 
         
            +
                3,
         
     | 
| 131 | 
         
            +
                1,
         
     | 
| 132 | 
         
            +
                1
         
     | 
| 133 | 
         
            +
              ],
         
     | 
| 134 | 
         
            +
              "torch_dtype": "float32",
         
     | 
| 135 | 
         
            +
              "transformers_version": "4.49.0",
         
     | 
| 136 | 
         
            +
              "use_weighted_layer_sum": false,
         
     | 
| 137 | 
         
            +
              "vocab_size": 32,
         
     | 
| 138 | 
         
            +
              "xvector_output_dim": 512
         
     | 
| 139 | 
         
            +
            }
         
     | 
    	
        onnx/model.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:5e29cab15162f74f42c1afc3d5577497861758c7acd6e4da3d1f70977bd9e1b7
         
     | 
| 3 | 
         
            +
            size 378609481
         
     | 
    	
        onnx/model_bnb4.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:ea8a44e6e742997cc6f5ae3a193b483629d0159e705cda23afff240bb17b4000
         
     | 
| 3 | 
         
            +
            size 84630595
         
     | 
    	
        onnx/model_fp16.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:60fa5e9f3d9f1796607bb430c9ce932b3c1e9bc14f9e7d0d270d3af66a18db84
         
     | 
| 3 | 
         
            +
            size 189468010
         
     | 
    	
        onnx/model_int8.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:1720a40017ecd8d71bc41988b115bd9d96cfdf796c127268b2afa1302473632f
         
     | 
| 3 | 
         
            +
            size 95389021
         
     | 
    	
        onnx/model_q4.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:03b3ef1347f1ebdd9154d7f851d6edb81c8361cb9e962749a75406668d87ea34
         
     | 
| 3 | 
         
            +
            size 89975333
         
     | 
    	
        onnx/model_q4f16.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:c9668908ebbb87fb9996bec8a8d2b60f5df95d307e107949aba1a8537ebafce3
         
     | 
| 3 | 
         
            +
            size 66537637
         
     | 
    	
        onnx/model_quantized.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:3217e95e4b28d53913fbe94cd9650b520f8e7ecf2bd643b9e45fc5b8b93b8aab
         
     | 
| 3 | 
         
            +
            size 95389059
         
     | 
    	
        onnx/model_uint8.onnx
    ADDED
    
    | 
         @@ -0,0 +1,3 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            version https://git-lfs.github.com/spec/v1
         
     | 
| 2 | 
         
            +
            oid sha256:3217e95e4b28d53913fbe94cd9650b520f8e7ecf2bd643b9e45fc5b8b93b8aab
         
     | 
| 3 | 
         
            +
            size 95389059
         
     | 
    	
        preprocessor_config.json
    ADDED
    
    | 
         @@ -0,0 +1,9 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            {
         
     | 
| 2 | 
         
            +
              "do_normalize": true,
         
     | 
| 3 | 
         
            +
              "feature_extractor_type": "Wav2Vec2FeatureExtractor",
         
     | 
| 4 | 
         
            +
              "feature_size": 1,
         
     | 
| 5 | 
         
            +
              "padding_side": "right",
         
     | 
| 6 | 
         
            +
              "padding_value": 0.0,
         
     | 
| 7 | 
         
            +
              "return_attention_mask": false,
         
     | 
| 8 | 
         
            +
              "sampling_rate": 16000
         
     | 
| 9 | 
         
            +
            }
         
     | 
    	
        quantize_config.json
    ADDED
    
    | 
         @@ -0,0 +1,18 @@ 
     | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
|
| 
         | 
| 
         | 
|
| 1 | 
         
            +
            {
         
     | 
| 2 | 
         
            +
                "modes": [
         
     | 
| 3 | 
         
            +
                    "fp16",
         
     | 
| 4 | 
         
            +
                    "q8",
         
     | 
| 5 | 
         
            +
                    "int8",
         
     | 
| 6 | 
         
            +
                    "uint8",
         
     | 
| 7 | 
         
            +
                    "q4",
         
     | 
| 8 | 
         
            +
                    "q4f16",
         
     | 
| 9 | 
         
            +
                    "bnb4"
         
     | 
| 10 | 
         
            +
                ],
         
     | 
| 11 | 
         
            +
                "per_channel": false,
         
     | 
| 12 | 
         
            +
                "reduce_range": false,
         
     | 
| 13 | 
         
            +
                "block_size": null,
         
     | 
| 14 | 
         
            +
                "is_symmetric": true,
         
     | 
| 15 | 
         
            +
                "accuracy_level": null,
         
     | 
| 16 | 
         
            +
                "quant_type": 1,
         
     | 
| 17 | 
         
            +
                "op_block_list": null
         
     | 
| 18 | 
         
            +
            }
         
     |