concat_type: Literal["feature", "sequence", "add", "tuple"] = "tuple", **ignore_kwargs, ): super().__init__() self.vision_tower_high = CLIPVisionTower(**high_res_cfg) self.vision_tower_low = CLIPVisionTower(**low_res_cfg) self.low_res_size = low_res_cfg["image_size"] ...