SwinV23D

pydantic model vision_architectures.nets.swinv2_3d.SwinV23DPatchMergingConfig

Bases: Swin3DPatchMergingConfig

JSON schema:
{
   "title": "SwinV23DPatchMergingConfig",
   "type": "object",
   "properties": {
      "in_dim": {
         "description": "Input dimension before merging",
         "title": "In Dim",
         "type": "integer"
      },
      "out_dim": {
         "description": "Output dimension after merging",
         "title": "Out Dim",
         "type": "integer"
      },
      "merge_window_size": {
         "description": "Size of the window for merging patches",
         "maxItems": 3,
         "minItems": 3,
         "prefixItems": [
            {
               "type": "integer"
            },
            {
               "type": "integer"
            },
            {
               "type": "integer"
            }
         ],
         "title": "Merge Window Size",
         "type": "array"
      }
   },
   "required": [
      "in_dim",
      "out_dim",
      "merge_window_size"
   ]
}

Config:
  • arbitrary_types_allowed: bool = True

  • extra: str = ignore

  • validate_default: bool = True

  • validate_assignment: bool = True

  • validate_return: bool = True

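Per the schema above, all three fields are required. A minimal sketch of a valid payload (the values are illustrative assumptions, and the library itself is not imported here):

```python
# Illustrative payload for SwinV23DPatchMergingConfig (values are assumptions,
# not taken from the library). Merging a 2x2x2 window of 96-dim patches into
# a single 192-dim patch halves each spatial axis.
patch_merging = {
    "in_dim": 96,                    # dimension before merging
    "out_dim": 192,                  # dimension after merging
    "merge_window_size": (2, 2, 2),  # (D, H, W) window, exactly 3 ints
}

# The schema marks all three keys as required:
assert {"in_dim", "out_dim", "merge_window_size"} <= patch_merging.keys()
assert len(patch_merging["merge_window_size"]) == 3
```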

pydantic model vision_architectures.nets.swinv2_3d.SwinV23DPatchSplittingConfig

Bases: Swin3DPatchSplittingConfig

JSON schema:
{
   "title": "SwinV23DPatchSplittingConfig",
   "type": "object",
   "properties": {
      "in_dim": {
         "description": "Input dimension before splitting",
         "title": "In Dim",
         "type": "integer"
      },
      "out_dim": {
         "description": "Output dimension after splitting",
         "title": "Out Dim",
         "type": "integer"
      },
      "final_window_size": {
         "description": "Size of the window to split patches into",
         "maxItems": 3,
         "minItems": 3,
         "prefixItems": [
            {
               "type": "integer"
            },
            {
               "type": "integer"
            },
            {
               "type": "integer"
            }
         ],
         "title": "Final Window Size",
         "type": "array"
      }
   },
   "required": [
      "in_dim",
      "out_dim",
      "final_window_size"
   ]
}

Config:
  • arbitrary_types_allowed: bool = True

  • extra: str = ignore

  • validate_default: bool = True

  • validate_assignment: bool = True

  • validate_return: bool = True

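Splitting mirrors merging on the decoder side: each patch is split into a `final_window_size` window of lower-dimensional patches. A sketch of a valid payload (illustrative values, not taken from the library):

```python
# Illustrative payload for SwinV23DPatchSplittingConfig (assumed values).
# The inverse of a 96 -> 192 merge: 192-dim patches are split back into
# 2x2x2 windows of 96-dim patches, doubling each spatial axis.
patch_splitting = {
    "in_dim": 192,                   # dimension before splitting
    "out_dim": 96,                   # dimension after splitting
    "final_window_size": (2, 2, 2),  # (D, H, W) window to split into
}
assert {"in_dim", "out_dim", "final_window_size"} <= patch_splitting.keys()
```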

pydantic model vision_architectures.nets.swinv2_3d.SwinV23DBlockConfig

Bases: Swin3DBlockConfig

JSON schema:
{
   "title": "SwinV23DBlockConfig",
   "type": "object",
   "properties": {
      "dim": {
         "description": "Dim at which attention is performed",
         "title": "Dim",
         "type": "integer"
      },
      "num_heads": {
         "description": "Number of query heads",
         "title": "Num Heads",
         "type": "integer"
      },
      "ratio_q_to_kv_heads": {
         "default": 1,
         "description": "Ratio of query heads to key/value heads. Useful for MQA/GQA.",
         "title": "Ratio Q To Kv Heads",
         "type": "integer"
      },
      "logit_scale_learnable": {
         "default": false,
         "description": "Whether the logit scale is learnable.",
         "title": "Logit Scale Learnable",
         "type": "boolean"
      },
      "attn_drop_prob": {
         "default": 0.0,
         "description": "Dropout probability for attention weights.",
         "title": "Attn Drop Prob",
         "type": "number"
      },
      "proj_drop_prob": {
         "default": 0.0,
         "description": "Dropout probability for the projection layer.",
         "title": "Proj Drop Prob",
         "type": "number"
      },
      "max_attention_batch_size": {
         "default": -1,
         "description": "Runs attention by splitting the inputs into chunks of this size. 0 means no chunking. Useful for large inputs during inference. (This happens along batch dimension).",
         "title": "Max Attention Batch Size",
         "type": "integer"
      },
      "rotary_position_embeddings_config": {
         "anyOf": [
            {
               "$ref": "#/$defs/RotaryPositionEmbeddings3DConfig"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Config for rotary position embeddings"
      },
      "mlp_ratio": {
         "default": 4,
         "description": "Ratio of the hidden dimension in the MLP to the input dimension.",
         "title": "Mlp Ratio",
         "type": "integer"
      },
      "activation": {
         "default": "gelu",
         "description": "Activation function for the MLP.",
         "title": "Activation",
         "type": "string"
      },
      "mlp_drop_prob": {
         "default": 0.0,
         "description": "Dropout probability for the MLP.",
         "title": "Mlp Drop Prob",
         "type": "number"
      },
      "norm_location": {
         "default": "post",
         "description": "Location of the normalization layer in the attention block. Pre-normalization implies normalization before the attention operation, while post-normalization applies it after.",
         "enum": [
            "pre",
            "post"
         ],
         "title": "Norm Location",
         "type": "string"
      },
      "layer_norm_eps": {
         "default": 1e-06,
         "description": "Epsilon value for the layer normalization.",
         "title": "Layer Norm Eps",
         "type": "number"
      },
      "window_size": {
         "description": "Size of the window to apply attention over",
         "maxItems": 3,
         "minItems": 3,
         "prefixItems": [
            {
               "type": "integer"
            },
            {
               "type": "integer"
            },
            {
               "type": "integer"
            }
         ],
         "title": "Window Size",
         "type": "array"
      },
      "use_relative_position_bias": {
         "default": false,
         "description": "Whether to use relative position bias",
         "title": "Use Relative Position Bias",
         "type": "boolean"
      },
      "patch_merging": {
         "anyOf": [
            {
               "$ref": "#/$defs/SwinV23DPatchMergingConfig"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Patch merging config if desired. Patch merging is applied before attention."
      },
      "patch_splitting": {
         "anyOf": [
            {
               "$ref": "#/$defs/SwinV23DPatchSplittingConfig"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Patch splitting config if desired. Patch splitting is applied after attention."
      },
      "in_dim": {
         "anyOf": [
            {
               "type": "integer"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Input dimension of the stage. Useful if ``patch_merging`` is used.",
         "title": "In Dim"
      },
      "out_dim": {
         "anyOf": [
            {
               "type": "integer"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Output dimension of the stage. Useful if ``patch_splitting`` is used.",
         "title": "Out Dim"
      }
   },
   "$defs": {
      "RotaryPositionEmbeddings3DConfig": {
         "properties": {
            "dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Dimension of the position embeddings",
               "title": "Dim"
            },
            "base": {
               "default": 10000.0,
               "description": "Base value for the exponent.",
               "title": "Base",
               "type": "number"
            },
            "split": {
               "anyOf": [
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        }
                     ],
                     "type": "array"
                  },
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        }
                     ],
                     "type": "array"
                  }
               ],
               "default": [
                  0.3333333333333333,
                  0.3333333333333333,
                  0.3333333333333333
               ],
               "description": "Split of the position embeddings. If float, converted to int based on self.dim",
               "title": "Split"
            }
         },
         "title": "RotaryPositionEmbeddings3DConfig",
         "type": "object"
      },
      "SwinV23DPatchMergingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before merging",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after merging",
               "title": "Out Dim",
               "type": "integer"
            },
            "merge_window_size": {
               "description": "Size of the window for merging patches",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Merge Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "merge_window_size"
         ],
         "title": "SwinV23DPatchMergingConfig",
         "type": "object"
      },
      "SwinV23DPatchSplittingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before splitting",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after splitting",
               "title": "Out Dim",
               "type": "integer"
            },
            "final_window_size": {
               "description": "Size of the window to split patches into",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Final Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "final_window_size"
         ],
         "title": "SwinV23DPatchSplittingConfig",
         "type": "object"
      }
   },
   "required": [
      "dim",
      "num_heads",
      "window_size"
   ]
}

Config:
  • arbitrary_types_allowed: bool = True

  • extra: str = ignore

  • validate_default: bool = True

  • validate_assignment: bool = True

  • validate_return: bool = True

Fields:
field patch_merging: SwinV23DPatchMergingConfig | None = None

Patch merging config if desired. Patch merging is applied before attention.
field patch_splitting: SwinV23DPatchSplittingConfig | None = None

Patch splitting config if desired. Patch splitting is applied after attention.
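Only `dim`, `num_heads`, and `window_size` are required; everything else falls back to the defaults shown in the schema (post-norm, GELU MLP with ratio 4, no dropout, no relative position bias). A sketch of a block payload with optional patch merging (values are illustrative assumptions):

```python
# Illustrative SwinV23DBlockConfig payload (assumed values).
block = {
    "dim": 192,               # dim at which attention is performed
    "num_heads": 6,           # number of query heads
    "window_size": (4, 4, 4), # (D, H, W) attention window
    # Optional: merge patches before attention. When patch_merging is used,
    # "in_dim" describes the dimension entering the block (96 -> 192 here).
    "in_dim": 96,
    "patch_merging": {
        "in_dim": 96,
        "out_dim": 192,
        "merge_window_size": (2, 2, 2),
    },
}

# The merge's output dimension must line up with the attention dim:
assert block["patch_merging"]["out_dim"] == block["dim"]
```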
pydantic model vision_architectures.nets.swinv2_3d.SwinV23DStageConfig

Bases: SwinV23DBlockConfig, Swin3DStageConfig

JSON schema:
{
   "title": "SwinV23DStageConfig",
   "type": "object",
   "properties": {
      "dim": {
         "description": "Dim at which attention is performed",
         "title": "Dim",
         "type": "integer"
      },
      "num_heads": {
         "description": "Number of query heads",
         "title": "Num Heads",
         "type": "integer"
      },
      "ratio_q_to_kv_heads": {
         "default": 1,
         "description": "Ratio of query heads to key/value heads. Useful for MQA/GQA.",
         "title": "Ratio Q To Kv Heads",
         "type": "integer"
      },
      "logit_scale_learnable": {
         "default": false,
         "description": "Whether the logit scale is learnable.",
         "title": "Logit Scale Learnable",
         "type": "boolean"
      },
      "attn_drop_prob": {
         "default": 0.0,
         "description": "Dropout probability for attention weights.",
         "title": "Attn Drop Prob",
         "type": "number"
      },
      "proj_drop_prob": {
         "default": 0.0,
         "description": "Dropout probability for the projection layer.",
         "title": "Proj Drop Prob",
         "type": "number"
      },
      "max_attention_batch_size": {
         "default": -1,
         "description": "Runs attention by splitting the inputs into chunks of this size. 0 means no chunking. Useful for large inputs during inference. (This happens along batch dimension).",
         "title": "Max Attention Batch Size",
         "type": "integer"
      },
      "rotary_position_embeddings_config": {
         "anyOf": [
            {
               "$ref": "#/$defs/RotaryPositionEmbeddings3DConfig"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Config for rotary position embeddings"
      },
      "mlp_ratio": {
         "default": 4,
         "description": "Ratio of the hidden dimension in the MLP to the input dimension.",
         "title": "Mlp Ratio",
         "type": "integer"
      },
      "activation": {
         "default": "gelu",
         "description": "Activation function for the MLP.",
         "title": "Activation",
         "type": "string"
      },
      "mlp_drop_prob": {
         "default": 0.0,
         "description": "Dropout probability for the MLP.",
         "title": "Mlp Drop Prob",
         "type": "number"
      },
      "norm_location": {
         "default": "post",
         "description": "Location of the normalization layer in the attention block. Pre-normalization implies normalization before the attention operation, while post-normalization applies it after.",
         "enum": [
            "pre",
            "post"
         ],
         "title": "Norm Location",
         "type": "string"
      },
      "layer_norm_eps": {
         "default": 1e-06,
         "description": "Epsilon value for the layer normalization.",
         "title": "Layer Norm Eps",
         "type": "number"
      },
      "window_size": {
         "description": "Size of the window to apply attention over",
         "maxItems": 3,
         "minItems": 3,
         "prefixItems": [
            {
               "type": "integer"
            },
            {
               "type": "integer"
            },
            {
               "type": "integer"
            }
         ],
         "title": "Window Size",
         "type": "array"
      },
      "use_relative_position_bias": {
         "default": false,
         "description": "Whether to use relative position bias",
         "title": "Use Relative Position Bias",
         "type": "boolean"
      },
      "patch_merging": {
         "anyOf": [
            {
               "$ref": "#/$defs/SwinV23DPatchMergingConfig"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Patch merging config if desired. Patch merging is applied before attention."
      },
      "patch_splitting": {
         "anyOf": [
            {
               "$ref": "#/$defs/SwinV23DPatchSplittingConfig"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Patch splitting config if desired. Patch splitting is applied after attention."
      },
      "in_dim": {
         "anyOf": [
            {
               "type": "integer"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Input dimension of the stage. Useful if ``patch_merging`` is used.",
         "title": "In Dim"
      },
      "out_dim": {
         "anyOf": [
            {
               "type": "integer"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Output dimension of the stage. Useful if ``patch_splitting`` is used.",
         "title": "Out Dim"
      },
      "depth": {
         "description": "Number of transformer blocks in this stage",
         "title": "Depth",
         "type": "integer"
      }
   },
   "$defs": {
      "RotaryPositionEmbeddings3DConfig": {
         "properties": {
            "dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Dimension of the position embeddings",
               "title": "Dim"
            },
            "base": {
               "default": 10000.0,
               "description": "Base value for the exponent.",
               "title": "Base",
               "type": "number"
            },
            "split": {
               "anyOf": [
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        }
                     ],
                     "type": "array"
                  },
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        }
                     ],
                     "type": "array"
                  }
               ],
               "default": [
                  0.3333333333333333,
                  0.3333333333333333,
                  0.3333333333333333
               ],
               "description": "Split of the position embeddings. If float, converted to int based on self.dim",
               "title": "Split"
            }
         },
         "title": "RotaryPositionEmbeddings3DConfig",
         "type": "object"
      },
      "SwinV23DPatchMergingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before merging",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after merging",
               "title": "Out Dim",
               "type": "integer"
            },
            "merge_window_size": {
               "description": "Size of the window for merging patches",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Merge Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "merge_window_size"
         ],
         "title": "SwinV23DPatchMergingConfig",
         "type": "object"
      },
      "SwinV23DPatchSplittingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before splitting",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after splitting",
               "title": "Out Dim",
               "type": "integer"
            },
            "final_window_size": {
               "description": "Size of the window to split patches into",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Final Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "final_window_size"
         ],
         "title": "SwinV23DPatchSplittingConfig",
         "type": "object"
      }
   },
   "required": [
      "dim",
      "num_heads",
      "window_size",
      "depth"
   ]
}

Config:
  • arbitrary_types_allowed: bool = True

  • extra: str = ignore

  • validate_default: bool = True

  • validate_assignment: bool = True

  • validate_return: bool = True

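A stage is a block config plus `depth`, the number of transformer blocks stacked in the stage, so `depth` joins `dim`, `num_heads`, and `window_size` in the required set. A minimal sketch (illustrative values):

```python
# Illustrative SwinV23DStageConfig payload (assumed values): a stage of two
# transformer blocks attending over 4x4x4 windows at dim 96.
stage = {
    "dim": 96,
    "num_heads": 3,
    "window_size": (4, 4, 4),
    "depth": 2,  # number of transformer blocks in this stage
}
assert {"dim", "num_heads", "window_size", "depth"} <= stage.keys()
```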

pydantic model vision_architectures.nets.swinv2_3d.SwinV23DEncoderDecoderConfig

Bases: Swin3DEncoderDecoderConfig

JSON schema:
{
   "title": "SwinV23DEncoderDecoderConfig",
   "type": "object",
   "properties": {
      "stages": {
         "items": {
            "$ref": "#/$defs/SwinV23DStageConfig"
         },
         "title": "Stages",
         "type": "array"
      }
   },
   "$defs": {
      "RotaryPositionEmbeddings3DConfig": {
         "properties": {
            "dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Dimension of the position embeddings",
               "title": "Dim"
            },
            "base": {
               "default": 10000.0,
               "description": "Base value for the exponent.",
               "title": "Base",
               "type": "number"
            },
            "split": {
               "anyOf": [
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        }
                     ],
                     "type": "array"
                  },
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        }
                     ],
                     "type": "array"
                  }
               ],
               "default": [
                  0.3333333333333333,
                  0.3333333333333333,
                  0.3333333333333333
               ],
               "description": "Split of the position embeddings. If float, converted to int based on self.dim",
               "title": "Split"
            }
         },
         "title": "RotaryPositionEmbeddings3DConfig",
         "type": "object"
      },
      "SwinV23DPatchMergingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before merging",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after merging",
               "title": "Out Dim",
               "type": "integer"
            },
            "merge_window_size": {
               "description": "Size of the window for merging patches",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Merge Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "merge_window_size"
         ],
         "title": "SwinV23DPatchMergingConfig",
         "type": "object"
      },
      "SwinV23DPatchSplittingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before splitting",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after splitting",
               "title": "Out Dim",
               "type": "integer"
            },
            "final_window_size": {
               "description": "Size of the window to split patches into",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Final Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "final_window_size"
         ],
         "title": "SwinV23DPatchSplittingConfig",
         "type": "object"
      },
      "SwinV23DStageConfig": {
         "properties": {
            "dim": {
               "description": "Dim at which attention is performed",
               "title": "Dim",
               "type": "integer"
            },
            "num_heads": {
               "description": "Number of query heads",
               "title": "Num Heads",
               "type": "integer"
            },
            "ratio_q_to_kv_heads": {
               "default": 1,
               "description": "Ratio of query heads to key/value heads. Useful for MQA/GQA.",
               "title": "Ratio Q To Kv Heads",
               "type": "integer"
            },
            "logit_scale_learnable": {
               "default": false,
               "description": "Whether the logit scale is learnable.",
               "title": "Logit Scale Learnable",
               "type": "boolean"
            },
            "attn_drop_prob": {
               "default": 0.0,
               "description": "Dropout probability for attention weights.",
               "title": "Attn Drop Prob",
               "type": "number"
            },
            "proj_drop_prob": {
               "default": 0.0,
               "description": "Dropout probability for the projection layer.",
               "title": "Proj Drop Prob",
               "type": "number"
            },
            "max_attention_batch_size": {
               "default": -1,
               "description": "Runs attention by splitting the inputs into chunks of this size. 0 means no chunking. Useful for large inputs during inference. (This happens along batch dimension).",
               "title": "Max Attention Batch Size",
               "type": "integer"
            },
            "rotary_position_embeddings_config": {
               "anyOf": [
                  {
                     "$ref": "#/$defs/RotaryPositionEmbeddings3DConfig"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Config for rotary position embeddings"
            },
            "mlp_ratio": {
               "default": 4,
               "description": "Ratio of the hidden dimension in the MLP to the input dimension.",
               "title": "Mlp Ratio",
               "type": "integer"
            },
            "activation": {
               "default": "gelu",
               "description": "Activation function for the MLP.",
               "title": "Activation",
               "type": "string"
            },
            "mlp_drop_prob": {
               "default": 0.0,
               "description": "Dropout probability for the MLP.",
               "title": "Mlp Drop Prob",
               "type": "number"
            },
            "norm_location": {
               "default": "post",
               "description": "Location of the normalization layer in the attention block. Pre-normalization implies normalization before the attention operation, while post-normalization applies it after.",
               "enum": [
                  "pre",
                  "post"
               ],
               "title": "Norm Location",
               "type": "string"
            },
            "layer_norm_eps": {
               "default": 1e-06,
               "description": "Epsilon value for the layer normalization.",
               "title": "Layer Norm Eps",
               "type": "number"
            },
            "window_size": {
               "description": "Size of the window to apply attention over",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Window Size",
               "type": "array"
            },
            "use_relative_position_bias": {
               "default": false,
               "description": "Whether to use relative position bias",
               "title": "Use Relative Position Bias",
               "type": "boolean"
            },
            "patch_merging": {
               "anyOf": [
                  {
                     "$ref": "#/$defs/SwinV23DPatchMergingConfig"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Patch merging config if desired. Patch merging is applied before attention."
            },
            "patch_splitting": {
               "anyOf": [
                  {
                     "$ref": "#/$defs/SwinV23DPatchSplittingConfig"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Patch splitting config if desired. Patch splitting is applied after attention."
            },
            "in_dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Input dimension of the stage. Useful if ``patch_merging`` is used.",
               "title": "In Dim"
            },
            "out_dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Output dimension of the stage. Useful if ``patch_splitting`` is used.",
               "title": "Out Dim"
            },
            "depth": {
               "description": "Number of transformer blocks in this stage",
               "title": "Depth",
               "type": "integer"
            }
         },
         "required": [
            "dim",
            "num_heads",
            "window_size",
            "depth"
         ],
         "title": "SwinV23DStageConfig",
         "type": "object"
      }
   },
   "required": [
      "stages"
   ]
}

Config:
  • arbitrary_types_allowed: bool = True

  • extra: str = ignore

  • validate_default: bool = True

  • validate_assignment: bool = True

  • validate_return: bool = True

Fields:
Validators:

field stages: list[SwinV23DStageConfig] [Required]#
Validated by:
pydantic model vision_architectures.nets.swinv2_3d.SwinV23DEncoderWithPatchEmbeddingsConfig[source]#

Bases: SwinV23DEncoderDecoderConfig, Swin3DEncoderWithPatchEmbeddingsConfig

Show JSON schema
{
   "title": "SwinV23DEncoderWithPatchEmbeddingsConfig",
   "type": "object",
   "properties": {
      "stages": {
         "items": {
            "$ref": "#/$defs/SwinV23DStageConfig"
         },
         "title": "Stages",
         "type": "array"
      },
      "in_channels": {
         "description": "Number of input channels in the input image/video",
         "title": "In Channels",
         "type": "integer"
      },
      "patch_size": {
         "description": "Size of the patches to be extracted from the input image/video",
         "maxItems": 3,
         "minItems": 3,
         "prefixItems": [
            {
               "type": "integer"
            },
            {
               "type": "integer"
            },
            {
               "type": "integer"
            }
         ],
         "title": "Patch Size",
         "type": "array"
      },
      "image_size": {
         "anyOf": [
            {
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "type": "array"
            },
            {
               "type": "null"
            }
         ],
         "default": null,
         "description": "Size of the input image/video. Required if absolute position embeddings are learnable.",
         "title": "Image Size"
      },
      "use_absolute_position_embeddings": {
         "default": true,
         "description": "Whether to use absolute position embeddings.",
         "title": "Use Absolute Position Embeddings",
         "type": "boolean"
      },
      "learnable_absolute_position_embeddings": {
         "default": false,
         "description": "Whether to use learnable absolute position embeddings.",
         "title": "Learnable Absolute Position Embeddings",
         "type": "boolean"
      }
   },
   "$defs": {
      "RotaryPositionEmbeddings3DConfig": {
         "properties": {
            "dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Dimension of the position embeddings",
               "title": "Dim"
            },
            "base": {
               "default": 10000.0,
               "description": "Base value for the exponent.",
               "title": "Base",
               "type": "number"
            },
            "split": {
               "anyOf": [
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        },
                        {
                           "type": "number"
                        }
                     ],
                     "type": "array"
                  },
                  {
                     "maxItems": 3,
                     "minItems": 3,
                     "prefixItems": [
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        },
                        {
                           "type": "integer"
                        }
                     ],
                     "type": "array"
                  }
               ],
               "default": [
                  0.3333333333333333,
                  0.3333333333333333,
                  0.3333333333333333
               ],
               "description": "Split of the position embeddings. If float, converted to int based on self.dim",
               "title": "Split"
            }
         },
         "title": "RotaryPositionEmbeddings3DConfig",
         "type": "object"
      },
      "SwinV23DPatchMergingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before merging",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after merging",
               "title": "Out Dim",
               "type": "integer"
            },
            "merge_window_size": {
               "description": "Size of the window for merging patches",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Merge Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "merge_window_size"
         ],
         "title": "SwinV23DPatchMergingConfig",
         "type": "object"
      },
      "SwinV23DPatchSplittingConfig": {
         "properties": {
            "in_dim": {
               "description": "Input dimension before splitting",
               "title": "In Dim",
               "type": "integer"
            },
            "out_dim": {
               "description": "Output dimension after splitting",
               "title": "Out Dim",
               "type": "integer"
            },
            "final_window_size": {
               "description": "Size of the window to split patches into",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Final Window Size",
               "type": "array"
            }
         },
         "required": [
            "in_dim",
            "out_dim",
            "final_window_size"
         ],
         "title": "SwinV23DPatchSplittingConfig",
         "type": "object"
      },
      "SwinV23DStageConfig": {
         "properties": {
            "dim": {
               "description": "Dim at which attention is performed",
               "title": "Dim",
               "type": "integer"
            },
            "num_heads": {
               "description": "Number of query heads",
               "title": "Num Heads",
               "type": "integer"
            },
            "ratio_q_to_kv_heads": {
               "default": 1,
               "description": "Ratio of query heads to key/value heads. Useful for MQA/GQA.",
               "title": "Ratio Q To Kv Heads",
               "type": "integer"
            },
            "logit_scale_learnable": {
               "default": false,
               "description": "Whether the logit scale is learnable.",
               "title": "Logit Scale Learnable",
               "type": "boolean"
            },
            "attn_drop_prob": {
               "default": 0.0,
               "description": "Dropout probability for attention weights.",
               "title": "Attn Drop Prob",
               "type": "number"
            },
            "proj_drop_prob": {
               "default": 0.0,
               "description": "Dropout probability for the projection layer.",
               "title": "Proj Drop Prob",
               "type": "number"
            },
            "max_attention_batch_size": {
               "default": -1,
               "description": "Runs attention by splitting the inputs into chunks of this size. 0 means no chunking. Useful for large inputs during inference. (This happens along batch dimension).",
               "title": "Max Attention Batch Size",
               "type": "integer"
            },
            "rotary_position_embeddings_config": {
               "anyOf": [
                  {
                     "$ref": "#/$defs/RotaryPositionEmbeddings3DConfig"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Config for rotary position embeddings"
            },
            "mlp_ratio": {
               "default": 4,
               "description": "Ratio of the hidden dimension in the MLP to the input dimension.",
               "title": "Mlp Ratio",
               "type": "integer"
            },
            "activation": {
               "default": "gelu",
               "description": "Activation function for the MLP.",
               "title": "Activation",
               "type": "string"
            },
            "mlp_drop_prob": {
               "default": 0.0,
               "description": "Dropout probability for the MLP.",
               "title": "Mlp Drop Prob",
               "type": "number"
            },
            "norm_location": {
               "default": "post",
               "description": "Location of the normalization layer in the attention block. Pre-normalization implies normalization before the attention operation, while post-normalization applies it after.",
               "enum": [
                  "pre",
                  "post"
               ],
               "title": "Norm Location",
               "type": "string"
            },
            "layer_norm_eps": {
               "default": 1e-06,
               "description": "Epsilon value for the layer normalization.",
               "title": "Layer Norm Eps",
               "type": "number"
            },
            "window_size": {
               "description": "Size of the window to apply attention over",
               "maxItems": 3,
               "minItems": 3,
               "prefixItems": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  },
                  {
                     "type": "integer"
                  }
               ],
               "title": "Window Size",
               "type": "array"
            },
            "use_relative_position_bias": {
               "default": false,
               "description": "Whether to use relative position bias",
               "title": "Use Relative Position Bias",
               "type": "boolean"
            },
            "patch_merging": {
               "anyOf": [
                  {
                     "$ref": "#/$defs/SwinV23DPatchMergingConfig"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Patch merging config if desired. Patch merging is applied before attention."
            },
            "patch_splitting": {
               "anyOf": [
                  {
                     "$ref": "#/$defs/SwinV23DPatchSplittingConfig"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Patch splitting config if desired. Patch splitting is applied after attention."
            },
            "in_dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Input dimension of the stage. Useful if ``patch_merging`` is used.",
               "title": "In Dim"
            },
            "out_dim": {
               "anyOf": [
                  {
                     "type": "integer"
                  },
                  {
                     "type": "null"
                  }
               ],
               "default": null,
               "description": "Output dimension of the stage. Useful if ``patch_splitting`` is used.",
               "title": "Out Dim"
            },
            "depth": {
               "description": "Number of transformer blocks in this stage",
               "title": "Depth",
               "type": "integer"
            }
         },
         "required": [
            "dim",
            "num_heads",
            "window_size",
            "depth"
         ],
         "title": "SwinV23DStageConfig",
         "type": "object"
      }
   },
   "required": [
      "stages",
      "in_channels",
      "patch_size"
   ]
}

Config:
  • arbitrary_types_allowed: bool = True

  • extra: str = ignore

  • validate_default: bool = True

  • validate_assignment: bool = True

  • validate_return: bool = True

Fields:

Validators:
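
The `patch_size` and `image_size` fields above imply simple shape arithmetic: patchification divides each spatial axis of the input by the corresponding patch size. The helper below is a hypothetical stdlib-only sketch of that arithmetic, not part of `vision_architectures` itself.

```python
# Hypothetical helper illustrating the patchification arithmetic implied by
# the schema above; it is NOT part of vision_architectures.

def token_grid(image_size, patch_size):
    """Elementwise image_size // patch_size for a 3D input (D, H, W)."""
    for i, p in zip(image_size, patch_size):
        if i % p != 0:
            raise ValueError(f"image size {i} is not divisible by patch size {p}")
    return tuple(i // p for i, p in zip(image_size, patch_size))

# A 96^3 volume split into 4x4x4 patches yields a 24^3 token grid.
print(token_grid((96, 96, 96), (4, 4, 4)))  # (24, 24, 24)
```

This is also why `image_size` is required when absolute position embeddings are learnable: the number of embeddings equals the product of the token grid dimensions.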

class vision_architectures.nets.swinv2_3d.SwinV23DLayerLogitScale(num_heads)[source]#

Bases: Module

__init__(num_heads)[source]#

Initialize internal Module state, shared by both nn.Module and ScriptModule.

forward()[source]#

Define the computation performed at every call.

Should be overridden by all subclasses.

Note

Although the recipe for forward pass needs to be defined within this function, one should call the Module instance afterwards instead of this since the former takes care of running the registered hooks while the latter silently ignores them.
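
SwinV2 replaces the fixed 1/sqrt(d) attention scaling with a learnable per-head logit scale applied to cosine similarities, clamped so that the effective multiplier never exceeds 100. The sketch below illustrates only that clamping behaviour with stdlib code; the parameter name and initial value are illustrative assumptions, not read from this module's source.

```python
import math

# Illustrative sketch of SwinV2-style logit scaling (NOT this module's code):
# the learnable per-head parameter lives in log space and is clamped so that
# the effective multiplier exp(param) never exceeds 100.
MAX_LOGIT_SCALE = math.log(100.0)

def effective_logit_scale(log_scale: float) -> float:
    return math.exp(min(log_scale, MAX_LOGIT_SCALE))

# An initial value of log(10) gives a multiplier of 10 ...
print(round(effective_logit_scale(math.log(10.0)), 6))  # 10.0
# ... while any larger parameter value saturates at 100.
print(round(effective_logit_scale(20.0), 6))  # 100.0
```

When `logit_scale_learnable` is enabled in the stage config, this scale is trained alongside the attention weights; otherwise it stays at its initial value.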

class vision_architectures.nets.swinv2_3d.SwinV23DLayer(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: Swin3DLayer

SwinV2 3D layer applying windowed attention with optional relative position embeddings. This class is designed for 3D inputs, e.g. medical images, videos, etc.


__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initializes the SwinV23DLayer.

Parameters:
  • config (RelativePositionEmbeddings3DConfig | Attention3DWithMLPConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.

class vision_architectures.nets.swinv2_3d.SwinV23DBlock(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: Swin3DBlock

SwinV2 3D block consisting of two SwinV23DLayers: one with regular windows and one with shifted windows. This class is designed for 3D inputs, e.g. medical images, videos, etc.

__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initializes the SwinV23DBlock.

Parameters:
  • config (SwinV23DBlockConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.

class vision_architectures.nets.swinv2_3d.SwinV23DPatchMerging(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: Swin3DPatchMerging

Patch merging layer for SwinV23D. This class is designed for 3D inputs, e.g. medical images, videos, etc.

__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initialize the SwinV23DPatchMerging layer.

Parameters:
  • config (SwinV23DPatchMergingConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.
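
Per the `SwinV23DPatchMergingConfig` fields above, merging with a `merge_window_size` reduces each spatial axis by that factor, concatenating the merged tokens (so channels grow to `in_dim * prod(merge_window_size)`) before projecting down to `out_dim`. The function below is a hypothetical shape-bookkeeping sketch under that reading, not the module's implementation.

```python
from math import prod

# Hypothetical shape bookkeeping for patch merging; illustrates the config
# fields (in_dim, out_dim, merge_window_size), NOT the module's code.
def merged_shape(grid, in_dim, out_dim, merge_window_size):
    for g, w in zip(grid, merge_window_size):
        if g % w != 0:
            raise ValueError(f"grid size {g} is not divisible by window {w}")
    new_grid = tuple(g // w for g, w in zip(grid, merge_window_size))
    concat_dim = in_dim * prod(merge_window_size)  # channels before projection
    return new_grid, concat_dim, out_dim

# Merging a 24^3 grid of 96-dim tokens with a (2, 2, 2) window:
print(merged_shape((24, 24, 24), 96, 192, (2, 2, 2)))
# ((12, 12, 12), 768, 192)
```

Patch splitting (below) is the mirror operation, expanding the grid by `final_window_size` instead.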

class vision_architectures.nets.swinv2_3d.SwinV23DPatchSplitting(config, checkpointing_level=0, **kwargs)[source]#

Bases: Swin3DPatchSplitting

Patch splitting layer for SwinV23D. This class is designed for 3D inputs, e.g. medical images, videos, etc.

This is a self-implemented class and is not part of the paper.

__init__(config, checkpointing_level=0, **kwargs)[source]#

Initialize the SwinV23DPatchSplitting layer.

Parameters:
  • config (SwinV23DPatchSplittingConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.

class vision_architectures.nets.swinv2_3d.SwinV23DStage(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: Swin3DStage

A single stage of the SwinV23D architecture, composed of SwinV23DBlocks with optional patch merging/splitting. This class is designed for 3D inputs, e.g. medical images, videos, etc.

__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initialize the SwinV23DStage.

Parameters:
  • config (SwinV23DStageConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.
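
A stage's `depth` counts transformer blocks, and each SwinV23DBlock (described above) pairs a regular-window layer with a shifted-window layer; each layer partitions the token grid into non-overlapping windows. Assuming that two-layers-per-block structure, the hypothetical helper below tallies the resulting bookkeeping with stdlib code only.

```python
from math import prod

# Hedged bookkeeping for a stage (hypothetical helper, NOT the module's code):
# with `depth` blocks, each holding a regular- and a shifted-window layer,
# a stage runs 2 * depth attention layers. Each layer partitions the token
# grid into prod(grid_i // window_i) windows of prod(window_size) tokens.
def stage_stats(grid, window_size, depth):
    num_windows = prod(g // w for g, w in zip(grid, window_size))
    return {
        "layers": 2 * depth,
        "windows": num_windows,
        "tokens_per_window": prod(window_size),
    }

# A 24^3 token grid with (6, 6, 6) windows and depth 2:
print(stage_stats((24, 24, 24), (6, 6, 6), 2))
# {'layers': 4, 'windows': 64, 'tokens_per_window': 216}
```

Because attention cost is quadratic only within each window, larger grids increase the window count rather than the per-window cost.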

class vision_architectures.nets.swinv2_3d.SwinV23DEncoderDecoderBase(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: Swin3DEncoderDecoderBase, PyTorchModelHubMixin

__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initializes the SwinV23DEncoder/SwinV23DDecoder.

Parameters:
  • config (SwinV23DEncoderDecoderConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.

class vision_architectures.nets.swinv2_3d.SwinV23DEncoder(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: SwinV23DEncoderDecoderBase

3D SwinV2 transformer encoder. Assumes input has already been patchified/tokenized. This class is designed for 3D inputs, e.g. medical images, videos, etc.

__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initializes the SwinV23DEncoder/SwinV23DDecoder.

Parameters:
  • config (SwinV23DEncoderDecoderConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.

class vision_architectures.nets.swinv2_3d.SwinV23DDecoder(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: SwinV23DEncoderDecoderBase

3D SwinV2 transformer decoder. Assumes input has already been patchified/tokenized. This class is designed for 3D inputs, e.g. medical images, videos, etc.

__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initializes the SwinV23DEncoder/SwinV23DDecoder.

Parameters:
  • config (SwinV23DEncoderDecoderConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.

class vision_architectures.nets.swinv2_3d.SwinV23DEncoderWithPatchEmbeddings(config={}, checkpointing_level=0, **kwargs)[source]#

Bases: Swin3DEncoderWithPatchEmbeddings, PyTorchModelHubMixin

3D SwinV2 transformer with 3D patch embeddings. This class is designed for 3D inputs, e.g. medical images, videos, etc.

__init__(config={}, checkpointing_level=0, **kwargs)[source]#

Initializes the SwinV23DEncoderWithPatchEmbeddings.

Parameters:
  • config (SwinV23DEncoderWithPatchEmbeddingsConfig) – An instance of the Config class that contains all the configuration parameters. It can also be passed as a dictionary and the instance will be created automatically.

  • checkpointing_level (int) – The level of checkpointing to use for activation checkpointing. Refer to ActivationCheckpointing for more details.

  • **kwargs – Additional keyword arguments for configuration.