mirror of
				https://github.com/comfyanonymous/ComfyUI.git
				synced 2025-10-25 07:54:30 +00:00 
			
		
		
		
	support clip-vit-large-patch14-336 (#4042)
* support clip-vit-large-patch14-336 * support clip-vit-large-patch14-336
This commit is contained in:
		| @@ -94,7 +94,10 @@ def load_clipvision_from_sd(sd, prefix="", convert_keys=False): | ||||
|     elif "vision_model.encoder.layers.30.layer_norm1.weight" in sd: | ||||
|         json_config = os.path.join(os.path.dirname(os.path.realpath(__file__)), "clip_vision_config_h.json") | ||||
|     elif "vision_model.encoder.layers.22.layer_norm1.weight" in sd: | ||||
|         json_config = os.path.join(os.path.dirname(os.path.realpath(__file__)), "clip_vision_config_vitl.json") | ||||
|         if sd["vision_model.embeddings.position_embedding.weight"].shape[0] == 577: | ||||
|             json_config = os.path.join(os.path.dirname(os.path.realpath(__file__)), "clip_vision_config_vitl_336.json") | ||||
|         else: | ||||
|             json_config = os.path.join(os.path.dirname(os.path.realpath(__file__)), "clip_vision_config_vitl.json") | ||||
|     else: | ||||
|         return None | ||||
|  | ||||
|   | ||||
							
								
								
									
										18
									
								
								comfy/clip_vision_config_vitl_336.json
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										18
									
								
								comfy/clip_vision_config_vitl_336.json
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,18 @@ | ||||
| { | ||||
|   "attention_dropout": 0.0, | ||||
|   "dropout": 0.0, | ||||
|   "hidden_act": "quick_gelu", | ||||
|   "hidden_size": 1024, | ||||
|   "image_size": 336, | ||||
|   "initializer_factor": 1.0, | ||||
|   "initializer_range": 0.02, | ||||
|   "intermediate_size": 4096, | ||||
|   "layer_norm_eps": 1e-5, | ||||
|   "model_type": "clip_vision_model", | ||||
|   "num_attention_heads": 16, | ||||
|   "num_channels": 3, | ||||
|   "num_hidden_layers": 24, | ||||
|   "patch_size": 14, | ||||
|   "projection_dim": 768, | ||||
|   "torch_dtype": "float32" | ||||
| } | ||||
		Reference in New Issue
	
	Block a user