| """
|
| Vortex-13B model configuration.
|
| Optimized for 16GB VRAM (4060 Ti laptop) and MacBook Pro M3 Max.
|
| """
|
|
|
# Vortex-13B hyperparameters. Built with keyword arguments; dict() keeps
# keyword order, so the key order matches the declaration order below.
VORTEX_13B_CONFIG = dict(
    # Width / depth: num_heads * head_dim equals d_model (40 * 128 == 5120).
    d_model=5120,
    num_layers=40,
    num_heads=40,
    head_dim=128,
    # NOTE(review): d_state / d_conv look like state-space (SSM) settings,
    # given the ssm_ratio key further down -- confirm against the consumer.
    d_state=32,
    d_conv=4,
    window_size=512,
    use_flash_attention=True,
    ffn_expansion=4,
    num_domains=7,  # same count as the entries in domain_tags
    vocab_size=50000,
    max_seq_len=16384,
    ssm_ratio=0.5,
    dtype="bfloat16",
    # Token ids are positional: the tuple is written in id order, so
    # enumerate() assigns "[PAD]" -> 0 through "[ZOO]" -> 18.
    special_tokens={
        token: token_id
        for token_id, token in enumerate((
            "[PAD]",
            "[UNK]",
            "[BOS]",
            "[EOS]",
            "[EQUATION]",
            "[/EQUATION]",
            "[CITATION]",
            "[/CITATION]",
            "[MOLECULE]",
            "[/MOLECULE]",
            "[FIGURE]",
            "[TABLE]",
            "[MATH]",
            "[CHEM]",
            "[BIO]",
            "[PHYS]",
            "[EARTH]",
            "[SPACE]",
            "[ZOO]",
        ))
    },
    # Every tag listed here also appears as a key of special_tokens.
    domain_tags=[
        "[MATH]",
        "[CHEM]",
        "[BIO]",
        "[PHYS]",
        "[EARTH]",
        "[SPACE]",
        "[ZOO]",
    ],
    enable_equation_module=True,
    enable_numerical_module=True,
    enable_citation_module=True,
    enable_molecular_module=True,
)
|
|
|
|
|
def get_config():
    """Return the Vortex-13B configuration.

    The module-level ``VORTEX_13B_CONFIG`` dict is handed back as-is, not
    a copy, so any mutation made by a caller is visible to every other
    user of this module.
    """
    config = VORTEX_13B_CONFIG
    return config
|
|
|