Add files using upload-large-folder tool

Browse files

Files changed (2)

README.md +1 -79
tokenizer/tokenizer_config.json +8 -1

README.md CHANGED Viewed

@@ -68,85 +68,7 @@ The compression configuration of the model is stored in the `smash_config.json`
 The configuration of the model is stored in the `config.json` file.
 ```bash
-{
-    "config": {
-        "architectures": [
-            "Llama4ForCausalLM"
-        ],
-        "attention_bias": false,
-        "attention_chunk_size": 8192,
-        "attention_dropout": 0.0,
-        "attn_scale": 0.1,
-        "attn_temperature_tuning": 4,
-        "bos_token_id": 200000,
-        "cache_implementation": "hybrid",
-        "eos_token_id": [
-            200001,
-            200007,
-            200008
-        ],
-        "floor_scale": 8192,
-        "for_llm_compressor": false,
-        "head_dim": 8,
-        "hidden_act": "silu",
-        "hidden_size": 16,
-        "initializer_range": 0.02,
-        "interleave_moe_layer_step": 1,
-        "intermediate_size": 32,
-        "intermediate_size_mlp": 64,
-        "max_position_embeddings": 10485760,
-        "model_type": "llama4_text",
-        "moe_layers": [
-            0,
-            1,
-            2,
-            3,
-            4
-        ],
-        "no_rope_layers": [
-            1,
-            1,
-            1,
-            0,
-            1
-        ],
-        "num_attention_heads": 10,
-        "num_experts_per_tok": 1,
-        "num_hidden_layers": 5,
-        "num_key_value_heads": 2,
-        "num_local_experts": 4,
-        "output_router_logits": false,
-        "pad_token_id": 200018,
-        "rms_norm_eps": 1e-05,
-        "rope_scaling": {
-            "factor": 8.0,
-            "high_freq_factor": 4.0,
-            "low_freq_factor": 1.0,
-            "original_max_position_embeddings": 8192,
-            "rope_type": "llama3"
-        },
-        "rope_theta": 500000.0,
-        "router_aux_loss_coef": 0.001,
-        "router_jitter_noise": 0.0,
-        "tie_word_embeddings": false,
-        "torch_dtype": "bfloat16",
-        "transformers_version": "4.51.3",
-        "use_cache": true,
-        "use_qk_norm": true,
-        "vocab_size": 202048
-    },
-    "generation_config": {
-        "_from_model_config": true,
-        "bos_token_id": 200000,
-        "eos_token_id": [
-            200001,
-            200007,
-            200008
-        ],
-        "pad_token_id": 200018,
-        "transformers_version": "4.51.3"
-    }
-}
 ```
 ## 🌍 Join the Pruna AI community!

 The configuration of the model is stored in the `config.json` file.
 ```bash
+{}
 ```
 ## 🌍 Join the Pruna AI community!

tokenizer/tokenizer_config.json CHANGED Viewed

@@ -9086,12 +9086,19 @@
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|eot|>",
   "extra_special_tokens": {},
   "model_input_names": [
     "input_ids",
     "attention_mask"
   ],
   "model_max_length": 10485760,
   "pad_token": "<|finetune_right_pad_id|>",
   "processor_class": "Llama4Processor",
-  "tokenizer_class": "PreTrainedTokenizer"
 }

   "clean_up_tokenization_spaces": false,
   "eos_token": "<|eot|>",
   "extra_special_tokens": {},
+  "max_length": 10485760,
   "model_input_names": [
     "input_ids",
     "attention_mask"
   ],
   "model_max_length": 10485760,
+  "pad_to_multiple_of": null,
   "pad_token": "<|finetune_right_pad_id|>",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
   "processor_class": "Llama4Processor",
+  "stride": 0,
+  "tokenizer_class": "PreTrainedTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first"
 }