in pytorchvideo/models/resnet.py [0:0]
def create_acoustic_resnet(
*,
# Input clip configs.
input_channel: int = 1,
# Model configs.
model_depth: int = 50,
model_num_class: int = 400,
dropout_rate: float = 0.5,
# Normalization configs.
norm: Callable = nn.BatchNorm3d,
# Activation configs.
activation: Callable = nn.ReLU,
# Stem configs.
stem_dim_out: int = 64,
stem_conv_kernel_size: Tuple[int] = (9, 1, 9),
stem_conv_stride: Tuple[int] = (1, 1, 3),
stem_pool: Callable = None,
stem_pool_kernel_size: Tuple[int] = (3, 1, 3),
stem_pool_stride: Tuple[int] = (2, 1, 2),
stem: Callable = create_acoustic_res_basic_stem,
# Stage configs.
stage1_pool: Callable = None,
stage1_pool_kernel_size: Tuple[int] = (2, 1, 1),
stage_conv_a_kernel_size: Union[Tuple[int], Tuple[Tuple[int]]] = (3, 1, 1),
stage_conv_b_kernel_size: Union[Tuple[int], Tuple[Tuple[int]]] = (3, 1, 3),
stage_conv_b_num_groups: Tuple[int] = (1, 1, 1, 1),
stage_conv_b_dilation: Union[Tuple[int], Tuple[Tuple[int]]] = (1, 1, 1),
stage_spatial_h_stride: Tuple[int] = (1, 1, 1, 1),
stage_spatial_w_stride: Tuple[int] = (1, 2, 2, 2),
stage_temporal_stride: Tuple[int] = (1, 2, 2, 2),
bottleneck: Union[Tuple[Callable], Callable] = (
create_acoustic_bottleneck_block,
create_acoustic_bottleneck_block,
create_bottleneck_block,
create_bottleneck_block,
),
# Head configs.
head_pool: Callable = nn.AvgPool3d,
head_pool_kernel_size: Tuple[int] = (4, 1, 2),
head_output_size: Tuple[int] = (1, 1, 1),
head_activation: Callable = None,
head_output_with_global_average: bool = True,