Upload 2 files

Browse files

Files changed (2) hide show

SplatFusion_PONY_XL_V5.safetensors +3 -0
SplatFusion_PONY_XL_V5.yaml +100 -0

SplatFusion_PONY_XL_V5.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0d94c5de65ba5f1b48483788a3d3f6f773a5ab59574efde4f7f9e2389678a8e6
+size 13875783240

SplatFusion_PONY_XL_V5.yaml ADDED Viewed

	@@ -0,0 +1,100 @@

+model:
+  params:
+    conditioner_config:
+      params:
+        emb_models:
+        - input_key: txt
+          is_trainable: false
+          params:
+            layer: hidden
+            layer_idx: 11
+          target: sgm.modules.encoders.modules.FrozenCLIPEmbedder
+        - input_key: txt
+          is_trainable: false
+          params:
+            always_return_pooled: true
+            arch: ViT-bigG-14
+            freeze: true
+            layer: penultimate
+            legacy: false
+            version: laion2b_s39b_b160k
+          target: sgm.modules.encoders.modules.FrozenOpenCLIPEmbedder2
+        - input_key: original_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: crop_coords_top_left
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+        - input_key: target_size_as_tuple
+          is_trainable: false
+          params:
+            outdim: 256
+          target: sgm.modules.encoders.modules.ConcatTimestepEmbedderND
+      target: sgm.modules.GeneralConditioner
+    denoiser_config:
+      params:
+        discretization_config:
+          target: sgm.modules.diffusionmodules.discretizer.LegacyDDPMDiscretization
+        num_idx: 1000
+        scaling_config:
+          target: sgm.modules.diffusionmodules.denoiser_scaling.EpsScaling
+        weighting_config:
+          target: sgm.modules.diffusionmodules.denoiser_weighting.EpsWeighting
+      target: sgm.modules.diffusionmodules.denoiser.DiscreteDenoiser
+    disable_first_stage_autocast: true
+    first_stage_config:
+      params:
+        ddconfig:
+          attn_resolutions: []
+          attn_type: vanilla-xformers
+          ch: 128
+          ch_mult:
+          - 1
+          - 2
+          - 4
+          - 4
+          double_z: true
+          dropout: 0.0
+          in_channels: 3
+          num_res_blocks: 2
+          out_ch: 3
+          resolution: 256
+          z_channels: 4
+        embed_dim: 4
+        lossconfig:
+          target: torch.nn.Identity
+        monitor: val/rec_loss
+      target: sgm.models.autoencoder.AutoencoderKLInferenceWrapper
+    network_config:
+      params:
+        adm_in_channels: 2816
+        attention_resolutions:
+        - 4
+        - 2
+        channel_mult:
+        - 1
+        - 2
+        - 4
+        context_dim: 2048
+        in_channels: 4
+        legacy: false
+        model_channels: 320
+        num_classes: sequential
+        num_head_channels: 64
+        num_res_blocks: 2
+        out_channels: 4
+        spatial_transformer_attn_type: softmax-xformers
+        transformer_depth:
+        - 1
+        - 2
+        - 10
+        use_checkpoint: true
+        use_linear_in_transformer: true
+        use_spatial_transformer: true
+      target: sgm.modules.diffusionmodules.openaimodel.UNetModel
+    scale_factor: 0.13025
+  target: sgm.models.diffusion.DiffusionEngine