---
# Model configuration: one top-level key per line.
# NOTE(review): key meanings are inferred from their names only; confirm
# against the code that consumes this file.

# Model identifier string.
name: ViT-B/16

layers: 12
pretrained: true
num_classes: 1000
hidden_dim: 768
num_heads: 12
patch_size: 16