lowlorenz
/

vit-sae-acae9988-openai_clip_vit_b_32

Model card Files Files and versions Community

vit-sae-acae9988-openai_clip_vit_b_32 / config.json

lowlorenz

Upload folder using huggingface_hub

87413bd verified about 2 months ago

raw

history blame contribute delete

1.82 kB

	{
	"model_class_name": "HookedViT",
	"model_name": "openai/clip-vit-base-patch32",
	"vit_model_cfg": null,
	"model_path": null,
	"hook_point_layer": 11,
	"layer_subtype": "hook_resid_post",
	"hook_point_head_index": null,
	"context_size": 50,
	"use_cached_activations": false,
	"use_patches_only": false,
	"cached_activations_path": "activations/_datasets_imagenet1k/openai_clip-vit-base-patch32/blocks.11.hook_resid_post",
	"image_size": 224,
	"architecture": "standard",
	"b_dec_init_method": "geometric_median",
	"expansion_factor": 64,
	"from_pretrained_path": null,
	"seed": 42,
	"d_in": 768,
	"activation_fn_str": "topk",
	"activation_fn_kwargs": {
	"k": 64
	},
	"cls_token_only": true,
	"max_grad_norm": 1.0,
	"initialization_method": "encoder_transpose_decoder",
	"normalize_activations": null,
	"n_batches_in_buffer": 20,
	"store_batch_size": 256,
	"num_workers": 32,
	"num_epochs": 2,
	"verbose": false,
	"l1_coefficient": 3e-05,
	"lp_norm": 1,
	"lr": 0.005,
	"lr_scheduler_name": "constantwithwarmup",
	"lr_warm_up_steps": 200,
	"train_batch_size": 4096,
	"dataset_name": "imagenet1k",
	"dataset_path": "/datasets/imagenet1k",
	"dataset_train_path": "/datasets/imagenet1k/ILSVRC/Data/CLS-LOC/train",
	"dataset_val_path": "/datasets/imagenet1k/ILSVRC/Data/CLS-LOC/val",
	"use_ghost_grads": true,
	"feature_sampling_window": 1000,
	"dead_feature_window": 5000,
	"dead_feature_threshold": 1e-08,
	"log_to_wandb": true,
	"wandb_project": "openai_clip_vit_b_32",
	"wandb_entity": "perceptual-alignment",
	"wandb_log_frequency": 100,
	"n_validation_runs": 4,
	"n_checkpoints": 2,
	"checkpoint_path": "models/sae/openai/topk/acae9988-openai_clip_vit_b_32"
	}