badaoui (HF Staff) committed · Commit 6bb235f (verified) · 1 parent: 133a221

Adding Neuron-optimized model files


🤖 Neuron Export Bot: On behalf of [badaoui](https://huggingface.co/badaoui), adding AWS Neuron-optimized model files.
Neuron-optimized models can achieve high-performance inference on AWS Inferentia and Trainium chips. Learn more:
- [AWS Neuron Documentation](https://awsdocs-neuron.readthedocs-hosted.com)
- [🤗 Optimum Neuron Guide](https://huggingface.co/docs/optimum-neuron/index)
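For orientation, here is a minimal usage sketch (not part of this commit) showing how such precompiled artifacts are typically loaded with `optimum-neuron` on an Inferentia2 instance. The repository id and the `subfolder` argument are assumptions for illustration, not values taken from this commit:

```python
# Hedged sketch: loading the exported pipeline with optimum-neuron.
# `repo_id` is a placeholder; the compiled files in this commit live under
# the `neuron/` subfolder, which is assumed to be addressable as shown.
from optimum.neuron import NeuronStableDiffusionPipeline

repo_id = "badaoui/stable-diffusion-v1-4-neuron"  # hypothetical id

pipe = NeuronStableDiffusionPipeline.from_pretrained(repo_id, subfolder="neuron")

# Shapes are fixed at compile time (batch_size=1, 512x512), so the pipeline
# serves one prompt at a time at exactly that resolution.
image = pipe("A high tech solarpunk utopia in the Amazon rainforest").images[0]
image.save("solarpunk.png")
```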

.gitattributes CHANGED
@@ -29,4 +29,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
  *.zip filter=lfs diff=lfs merge=lfs -text
  *.zst filter=lfs diff=lfs merge=lfs -text
  *tfevents* filter=lfs diff=lfs merge=lfs -text
- *.safetensors filter=lfs diff=lfs merge=lfs -text
+ *.safetensors filter=lfs diff=lfs merge=lfs -textneuron/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
+ neuron/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
+ neuron/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
+ neuron/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text

(Note that in the new file the `*.safetensors` rule and the first `neuron/...` rule are fused on one line, apparently because the previous file lacked a trailing newline when the bot appended its entries.)
README.md CHANGED
@@ -4,26 +4,29 @@ tags:
  - stable-diffusion
  - stable-diffusion-diffusers
  - text-to-image
+ - neuron
  widget:
- - text: "A high tech solarpunk utopia in the Amazon rainforest"
+ - text: A high tech solarpunk utopia in the Amazon rainforest
    example_title: Amazon rainforest
- - text: "A pikachu fine dining with a view to the Eiffel Tower"
+ - text: A pikachu fine dining with a view to the Eiffel Tower
    example_title: Pikachu in Paris
- - text: "A mecha robot in a favela in expressionist style"
+ - text: A mecha robot in a favela in expressionist style
    example_title: Expressionist robot
- - text: "an insect robot preparing a delicious meal"
+ - text: an insect robot preparing a delicious meal
    example_title: Insect robot
- - text: "A small cabin on top of a snowy mountain in the style of Disney, artstation"
+ - text: A small cabin on top of a snowy mountain in the style of Disney, artstation
    example_title: Snowy disney cabin
- extra_gated_prompt: |-
-   This model is open access and available to all, with a CreativeML OpenRAIL-M license further specifying rights and usage.
-   The CreativeML OpenRAIL License specifies:
-
-   1. You can't use the model to deliberately produce nor share illegal or harmful outputs or content
-   2. The authors claim no rights on the outputs you generate, you are free to use them and are accountable for their use which must not go against the provisions set in the license
-   3. You may re-distribute the weights and use the model commercially and/or as a service. If you do, please be aware you have to include the same use restrictions as the ones in the license and share a copy of the CreativeML OpenRAIL-M to all your users (please read the license entirely and carefully)
-   Please read the full license carefully here: https://huggingface.co/spaces/CompVis/stable-diffusion-license
-
+ extra_gated_prompt: "This model is open access and available to all, with a CreativeML\
+   \ OpenRAIL-M license further specifying rights and usage.\nThe CreativeML OpenRAIL\
+   \ License specifies: \n\n1. You can't use the model to deliberately produce nor\
+   \ share illegal or harmful outputs or content \n2. The authors claim no rights on\
+   \ the outputs you generate, you are free to use them and are accountable for their\
+   \ use which must not go against the provisions set in the license\n3. You may re-distribute\
+   \ the weights and use the model commercially and/or as a service. If you do, please\
+   \ be aware you have to include the same use restrictions as the ones in the license\
+   \ and share a copy of the CreativeML OpenRAIL-M to all your users (please read the\
+   \ license entirely and carefully)\nPlease read the full license carefully here:\
+   \ https://huggingface.co/spaces/CompVis/stable-diffusion-license\n "
  extra_gated_heading: Please read the LICENSE to access this model
  ---
neuron/feature_extractor/preprocessor_config.json ADDED
@@ -0,0 +1,27 @@
+ {
+   "crop_size": {
+     "height": 224,
+     "width": 224
+   },
+   "do_center_crop": true,
+   "do_convert_rgb": true,
+   "do_normalize": true,
+   "do_rescale": true,
+   "do_resize": true,
+   "image_mean": [
+     0.48145466,
+     0.4578275,
+     0.40821073
+   ],
+   "image_processor_type": "CLIPImageProcessor",
+   "image_std": [
+     0.26862954,
+     0.26130258,
+     0.27577711
+   ],
+   "resample": 3,
+   "rescale_factor": 0.00392156862745098,
+   "size": {
+     "shortest_edge": 224
+   }
+ }
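In plain terms, this config resizes to a 224-pixel shortest edge, center-crops to 224x224, rescales by 1/255, and normalizes with the CLIP channel statistics. A small sketch of the rescale-and-normalize step (my own illustration, not code from the commit):

```python
import numpy as np

# CLIP channel statistics and rescale factor copied from the config above.
IMAGE_MEAN = np.array([0.48145466, 0.4578275, 0.40821073])
IMAGE_STD = np.array([0.26862954, 0.26130258, 0.27577711])
RESCALE_FACTOR = 0.00392156862745098  # exactly 1 / 255

def normalize(pixels_uint8: np.ndarray) -> np.ndarray:
    """pixels_uint8: a 224x224x3 center crop with values in [0, 255]."""
    x = pixels_uint8 * RESCALE_FACTOR    # rescale to [0, 1]
    return (x - IMAGE_MEAN) / IMAGE_STD  # per-channel normalization

print(normalize(np.full((224, 224, 3), 255, dtype=np.uint8))[0, 0])
```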
neuron/model_index.json ADDED
@@ -0,0 +1,39 @@
+ {
+   "_class_name": "NeuronStableDiffusionPipeline",
+   "_diffusers_version": "0.34.0",
+   "feature_extractor": [
+     "transformers",
+     "CLIPImageProcessor"
+   ],
+   "force_zeros_for_empty_prompt": true,
+   "image_encoder": [
+     null,
+     null
+   ],
+   "requires_aesthetics_score": false,
+   "requires_safety_checker": true,
+   "safety_checker": [
+     null,
+     null
+   ],
+   "scheduler": [
+     "diffusers",
+     "PNDMScheduler"
+   ],
+   "text_encoder": [
+     "optimum.neuron.modeling_diffusion",
+     "NeuronModelTextEncoder"
+   ],
+   "tokenizer": [
+     "transformers",
+     "CLIPTokenizer"
+   ],
+   "unet": [
+     "optimum.neuron.modeling_diffusion",
+     "NeuronModelUnet"
+   ],
+   "vae": [
+     "optimum.neuron.modeling_diffusion",
+     "NeuronModelVae"
+   ]
+ }
neuron/scheduler/scheduler_config.json ADDED
@@ -0,0 +1,15 @@
+ {
+   "_class_name": "PNDMScheduler",
+   "_diffusers_version": "0.34.0",
+   "beta_end": 0.012,
+   "beta_schedule": "scaled_linear",
+   "beta_start": 0.00085,
+   "clip_sample": false,
+   "num_train_timesteps": 1000,
+   "prediction_type": "epsilon",
+   "set_alpha_to_one": false,
+   "skip_prk_steps": true,
+   "steps_offset": 1,
+   "timestep_spacing": "leading",
+   "trained_betas": null
+ }
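The scheduler is plain `diffusers` and carries no compiled code, so it can be rebuilt directly from this config. A short sketch (parameter values copied from the file above):

```python
from diffusers import PNDMScheduler

# Reconstruct the scheduler from the exported config values.
scheduler = PNDMScheduler(
    beta_start=0.00085,
    beta_end=0.012,
    beta_schedule="scaled_linear",
    num_train_timesteps=1000,
    skip_prk_steps=True,
    steps_offset=1,
)
scheduler.set_timesteps(50)  # e.g. 50 denoising steps at inference
print(scheduler.timesteps[:5])
```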
neuron/text_encoder/config.json ADDED
@@ -0,0 +1,50 @@
+ {
+   "_attn_implementation_autoset": true,
+   "_name_or_path": "/home/user/.cache/huggingface/hub/models--CompVis--stable-diffusion-v1-4/snapshots/133a221b8aa7292a167afc5127cb63fb5005638b/text_encoder",
+   "architectures": [
+     "CLIPTextModel"
+   ],
+   "attention_dropout": 0.0,
+   "bos_token_id": 0,
+   "dropout": 0.0,
+   "eos_token_id": 2,
+   "hidden_act": "quick_gelu",
+   "hidden_size": 768,
+   "initializer_factor": 1.0,
+   "initializer_range": 0.02,
+   "intermediate_size": 3072,
+   "layer_norm_eps": 1e-05,
+   "max_position_embeddings": 77,
+   "model_type": "clip_text_model",
+   "neuron": {
+     "auto_cast": "matmul",
+     "auto_cast_type": "bf16",
+     "compiler_type": "neuronx-cc",
+     "compiler_version": "2.15.143.0+e39249ad",
+     "dynamic_batch_size": false,
+     "inline_weights_to_neff": true,
+     "input_names": [
+       "input_ids"
+     ],
+     "model_type": "clip-text-model",
+     "optlevel": "2",
+     "output_attentions": false,
+     "output_hidden_states": false,
+     "output_names": [
+       "last_hidden_state",
+       "pooler_output"
+     ],
+     "static_batch_size": 1,
+     "static_sequence_length": 77,
+     "tensor_parallel_size": 1
+   },
+   "num_attention_heads": 12,
+   "num_hidden_layers": 12,
+   "pad_token_id": 1,
+   "projection_dim": 512,
+   "task": "feature-extraction",
+   "torch_dtype": "float32",
+   "torchscript": true,
+   "transformers_version": "4.48.3",
+   "vocab_size": 49408
+ }
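The `neuron` block above records the compilation settings. A hedged sketch of the kind of export call that produces such blocks (the exact keyword arguments vary across `optimum-neuron` versions, so treat them as assumptions rather than this bot's actual invocation):

```python
from optimum.neuron import NeuronStableDiffusionPipeline

# Exporting the base model recompiles every submodel with neuronx-cc and
# records a "neuron" section like the one above in each submodel's config.
pipe = NeuronStableDiffusionPipeline.from_pretrained(
    "CompVis/stable-diffusion-v1-4",
    export=True,
    batch_size=1,           # -> "static_batch_size": 1
    height=512,             # pixel size; stored as 64 in latent space
    width=512,
    auto_cast="matmul",     # -> "auto_cast": "matmul"
    auto_cast_type="bf16",  # -> "auto_cast_type": "bf16"
)
pipe.save_pretrained("sd14_neuron/")
```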
neuron/text_encoder/model.neuron ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:0317993ca77ba8658bb9cb3e6acf8de57b98b862fbe51fa11d499bd53194d896
+ size 375660151
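These three lines are a Git LFS pointer, not the model itself; the roughly 375 MB compiled artifact is fetched by LFS on checkout. A tiny sketch of reading the pointer format (spec v1 stores one `key value` pair per line):

```python
def parse_lfs_pointer(text: str) -> dict:
    """Parse a Git LFS pointer file into its oid and size."""
    fields = dict(line.split(" ", 1) for line in text.strip().splitlines())
    assert fields["version"].endswith("/spec/v1")
    return {"oid": fields["oid"], "size_bytes": int(fields["size"])}

pointer = (
    "version https://git-lfs.github.com/spec/v1\n"
    "oid sha256:0317993ca77ba8658bb9cb3e6acf8de57b98b862fbe51fa11d499bd53194d896\n"
    "size 375660151\n"
)
print(parse_lfs_pointer(pointer))  # ~375.7 MB text encoder artifact
```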
neuron/tokenizer/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
neuron/tokenizer/special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
+ {
+   "bos_token": {
+     "content": "<|startoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   },
+   "unk_token": {
+     "content": "<|endoftext|>",
+     "lstrip": false,
+     "normalized": true,
+     "rstrip": false,
+     "single_word": false
+   }
+ }
neuron/tokenizer/tokenizer_config.json ADDED
@@ -0,0 +1,31 @@
+ {
+   "add_prefix_space": false,
+   "added_tokens_decoder": {
+     "49406": {
+       "content": "<|startoftext|>",
+       "lstrip": false,
+       "normalized": true,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "49407": {
+       "content": "<|endoftext|>",
+       "lstrip": false,
+       "normalized": true,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<|startoftext|>",
+   "clean_up_tokenization_spaces": false,
+   "do_lower_case": true,
+   "eos_token": "<|endoftext|>",
+   "errors": "replace",
+   "extra_special_tokens": {},
+   "model_max_length": 77,
+   "pad_token": "<|endoftext|>",
+   "tokenizer_class": "CLIPTokenizer",
+   "unk_token": "<|endoftext|>"
+ }
neuron/tokenizer/vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
neuron/unet/config.json ADDED
@@ -0,0 +1,131 @@
+ {
+   "_class_name": "UNet2DConditionModel",
+   "_commit_hash": null,
+   "_diffusers_version": "0.34.0",
+   "_name_or_path": "/home/user/.cache/huggingface/hub/models--CompVis--stable-diffusion-v1-4/snapshots/133a221b8aa7292a167afc5127cb63fb5005638b/unet",
+   "_use_default_values": [
+     "num_attention_heads",
+     "num_class_embeds",
+     "time_embedding_type",
+     "only_cross_attention",
+     "class_embeddings_concat",
+     "resnet_out_scale_factor",
+     "dual_cross_attention",
+     "time_cond_proj_dim",
+     "conv_in_kernel",
+     "time_embedding_act_fn",
+     "reverse_transformer_layers_per_block",
+     "resnet_skip_time_act",
+     "cross_attention_norm",
+     "resnet_time_scale_shift",
+     "conv_out_kernel",
+     "addition_time_embed_dim",
+     "addition_embed_type",
+     "mid_block_only_cross_attention",
+     "mid_block_type",
+     "projection_class_embeddings_input_dim",
+     "encoder_hid_dim",
+     "transformer_layers_per_block",
+     "upcast_attention",
+     "attention_type",
+     "use_linear_projection",
+     "dropout",
+     "addition_embed_type_num_heads",
+     "time_embedding_dim",
+     "timestep_post_act",
+     "encoder_hid_dim_type",
+     "class_embed_type"
+   ],
+   "act_fn": "silu",
+   "addition_embed_type": null,
+   "addition_embed_type_num_heads": 64,
+   "addition_time_embed_dim": null,
+   "attention_head_dim": 8,
+   "attention_type": "default",
+   "block_out_channels": [
+     320,
+     640,
+     1280,
+     1280
+   ],
+   "center_input_sample": false,
+   "class_embed_type": null,
+   "class_embeddings_concat": false,
+   "conv_in_kernel": 3,
+   "conv_out_kernel": 3,
+   "cross_attention_dim": 768,
+   "cross_attention_norm": null,
+   "down_block_types": [
+     "CrossAttnDownBlock2D",
+     "CrossAttnDownBlock2D",
+     "CrossAttnDownBlock2D",
+     "DownBlock2D"
+   ],
+   "downsample_padding": 1,
+   "dropout": 0.0,
+   "dual_cross_attention": false,
+   "encoder_hid_dim": null,
+   "encoder_hid_dim_type": null,
+   "flip_sin_to_cos": true,
+   "freq_shift": 0,
+   "in_channels": 4,
+   "layers_per_block": 2,
+   "mid_block_only_cross_attention": null,
+   "mid_block_scale_factor": 1,
+   "mid_block_type": "UNetMidBlock2DCrossAttn",
+   "neuron": {
+     "auto_cast": "matmul",
+     "auto_cast_type": "bf16",
+     "compiler_type": "neuronx-cc",
+     "compiler_version": "2.15.143.0+e39249ad",
+     "dynamic_batch_size": false,
+     "inline_weights_to_neff": true,
+     "input_names": [
+       "sample",
+       "timestep",
+       "encoder_hidden_states"
+     ],
+     "model_type": "unet",
+     "optlevel": "2",
+     "output_attentions": false,
+     "output_hidden_states": false,
+     "output_names": [
+       "sample"
+     ],
+     "static_batch_size": 1,
+     "static_height": 64,
+     "static_num_channels": 4,
+     "static_sequence_length": 77,
+     "static_vae_scale_factor": 8,
+     "static_width": 64,
+     "tensor_parallel_size": 1
+   },
+   "norm_eps": 1e-05,
+   "norm_num_groups": 32,
+   "num_attention_heads": null,
+   "num_class_embeds": null,
+   "only_cross_attention": false,
+   "out_channels": 4,
+   "projection_class_embeddings_input_dim": null,
+   "resnet_out_scale_factor": 1.0,
+   "resnet_skip_time_act": false,
+   "resnet_time_scale_shift": "default",
+   "reverse_transformer_layers_per_block": null,
+   "sample_size": 64,
+   "task": "semantic-segmentation",
+   "time_cond_proj_dim": null,
+   "time_embedding_act_fn": null,
+   "time_embedding_dim": null,
+   "time_embedding_type": "positional",
+   "timestep_post_act": null,
+   "transformer_layers_per_block": 1,
+   "transformers_version": null,
+   "up_block_types": [
+     "UpBlock2D",
+     "CrossAttnUpBlock2D",
+     "CrossAttnUpBlock2D",
+     "CrossAttnUpBlock2D"
+   ],
+   "upcast_attention": false,
+   "use_linear_projection": false
+ }
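Note how the static shapes above relate to pixel space: the UNet runs on latents downscaled by the VAE factor. A small arithmetic sketch (my own illustration, not from the commit):

```python
# The UNet was compiled for 64x64 latents; the VAE scale factor of 8 maps
# that back to the 512x512 pixel resolution the pipeline generates.
static_height = 64      # "static_height" above (latent space)
static_width = 64       # "static_width"
vae_scale_factor = 8    # "static_vae_scale_factor"

pixel_height = static_height * vae_scale_factor  # 512
pixel_width = static_width * vae_scale_factor    # 512
print(f"compiled for {pixel_width}x{pixel_height} images at batch_size=1")
```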
neuron/unet/model.neuron ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:a5d2ea7e8f9e69a2c4625cee3286e40c07168ece969951a9ea71b28c5e5d9fd6
+ size 1900028915
neuron/vae_decoder/config.json ADDED
@@ -0,0 +1,74 @@
+ {
+   "_class_name": "AutoencoderKL",
+   "_commit_hash": null,
+   "_diffusers_version": "0.34.0",
+   "_name_or_path": "/home/user/.cache/huggingface/hub/models--CompVis--stable-diffusion-v1-4/snapshots/133a221b8aa7292a167afc5127cb63fb5005638b/vae",
+   "_use_default_values": [
+     "use_post_quant_conv",
+     "mid_block_add_attention",
+     "shift_factor",
+     "latents_std",
+     "use_quant_conv",
+     "latents_mean",
+     "norm_num_groups",
+     "force_upcast"
+   ],
+   "act_fn": "silu",
+   "block_out_channels": [
+     128,
+     256,
+     512,
+     512
+   ],
+   "down_block_types": [
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D"
+   ],
+   "force_upcast": true,
+   "in_channels": 3,
+   "latent_channels": 4,
+   "latents_mean": null,
+   "latents_std": null,
+   "layers_per_block": 2,
+   "mid_block_add_attention": true,
+   "neuron": {
+     "auto_cast": "matmul",
+     "auto_cast_type": "bf16",
+     "compiler_type": "neuronx-cc",
+     "compiler_version": "2.15.143.0+e39249ad",
+     "dynamic_batch_size": false,
+     "inline_weights_to_neff": true,
+     "input_names": [
+       "latent_sample"
+     ],
+     "model_type": "vae-decoder",
+     "optlevel": "2",
+     "output_attentions": false,
+     "output_hidden_states": false,
+     "output_names": [
+       "sample"
+     ],
+     "static_batch_size": 1,
+     "static_height": 64,
+     "static_num_channels": 4,
+     "static_width": 64,
+     "tensor_parallel_size": 1
+   },
+   "norm_num_groups": 32,
+   "out_channels": 3,
+   "sample_size": 512,
+   "scaling_factor": 0.18215,
+   "shift_factor": null,
+   "task": "semantic-segmentation",
+   "transformers_version": null,
+   "up_block_types": [
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D"
+   ],
+   "use_post_quant_conv": true,
+   "use_quant_conv": true
+ }
neuron/vae_decoder/model.neuron ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:7e34b73737a49dbadfae2e5bc5d21fdbdc35441fe5935d81926366d5905d5585
+ size 247896819
neuron/vae_encoder/config.json ADDED
@@ -0,0 +1,74 @@
+ {
+   "_class_name": "AutoencoderKL",
+   "_commit_hash": null,
+   "_diffusers_version": "0.34.0",
+   "_name_or_path": "/home/user/.cache/huggingface/hub/models--CompVis--stable-diffusion-v1-4/snapshots/133a221b8aa7292a167afc5127cb63fb5005638b/vae",
+   "_use_default_values": [
+     "use_post_quant_conv",
+     "mid_block_add_attention",
+     "shift_factor",
+     "latents_std",
+     "use_quant_conv",
+     "latents_mean",
+     "norm_num_groups",
+     "force_upcast"
+   ],
+   "act_fn": "silu",
+   "block_out_channels": [
+     128,
+     256,
+     512,
+     512
+   ],
+   "down_block_types": [
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D",
+     "DownEncoderBlock2D"
+   ],
+   "force_upcast": true,
+   "in_channels": 3,
+   "latent_channels": 4,
+   "latents_mean": null,
+   "latents_std": null,
+   "layers_per_block": 2,
+   "mid_block_add_attention": true,
+   "neuron": {
+     "auto_cast": "matmul",
+     "auto_cast_type": "bf16",
+     "compiler_type": "neuronx-cc",
+     "compiler_version": "2.15.143.0+e39249ad",
+     "dynamic_batch_size": false,
+     "inline_weights_to_neff": true,
+     "input_names": [
+       "sample"
+     ],
+     "model_type": "vae-encoder",
+     "optlevel": "2",
+     "output_attentions": false,
+     "output_hidden_states": false,
+     "output_names": [
+       "latent_parameters"
+     ],
+     "static_batch_size": 1,
+     "static_height": 512,
+     "static_num_channels": 3,
+     "static_width": 512,
+     "tensor_parallel_size": 1
+   },
+   "norm_num_groups": 32,
+   "out_channels": 3,
+   "sample_size": 512,
+   "scaling_factor": 0.18215,
+   "shift_factor": null,
+   "task": "semantic-segmentation",
+   "transformers_version": null,
+   "up_block_types": [
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D",
+     "UpDecoderBlock2D"
+   ],
+   "use_post_quant_conv": true,
+   "use_quant_conv": true
+ }
neuron/vae_encoder/model.neuron ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d3851ce0e1548466616908a111352321f080a5fd7672e09f91a28cab0eb7103c
+ size 155910897