{
  "architectures": [
    "GPTNeoXCodebookModel"
  ],
  "codebook_at": [
    "attn_preproj"
  ],
  "codebook_type": "group",
  "k_codebook": 8,
  "kmeans_init": false,
  "kmeans_init_examples": 1000,
  "kmeans_kwargs": {
    "batch_size": 24576,
    "n_init": "auto"
  },
  "kmeans_path": "/.cache/cb_volume/huggingface/kmeans_embeddings.pt",
  "layers_to_snap": [
    0,
    1,
    2,
    3,
    4,
    5,
    6,
    7,
    8,
    9,
    10,
    11,
    12,
    13,
    14,
    15,
    16,
    17,
    18,
    19,
    20,
    21,
    22,
    23
  ],
  "loss": "aeloss",
  "model_type": "codebook",
  "num_codebooks": 16,
  "num_codes": 10000,
  "similarity_metric": "inner_product",
  "torch_dtype": "float32",
  "transformers_version": "4.27.3"
}