{
  "architectures": [
    "GPTNeoCodebookModel"
  ],
  "codebook_at": [
    "attn",
    "mlp"
  ],
  "codebook_kwargs": {},
  "codebook_type": [
    "vanilla",
    "vanilla"
  ],
  "k_codebook": [
    16,
    16
  ],
  "kmeans_init": false,
  "kmeans_init_examples": 1000,
  "kmeans_kwargs": {
    "batch_size": 24576,
    "n_init": "auto"
  },
  "kmeans_path": "/.cache/cb_volume/huggingface/kmeans_embeddings.pt",
  "layers_to_snap": [
    0
  ],
  "loss": "aeloss",
  "model_type": "codebook",
  "num_codebooks": [
    1,
    1
  ],
  "num_codes": [
    10000,
    10000
  ],
  "replace_codes": false,
  "similarity_metric": "inner_product",
  "torch_dtype": "float32",
  "transformers_version": "4.35.2"
}