| |
| from transformers import PretrainedConfig |
|
|
|
|
class DownsamplerConfig(PretrainedConfig):
    """Configuration object registered under the ``'downsampler'`` model type.

    The constructor copies its named arguments onto the instance as
    attributes of the same name and then hands every remaining keyword
    argument to ``PretrainedConfig.__init__``.

    Args:
        kernel_size: Stored as ``self.kernel_size``. Defaults to ``1``.
            NOTE(review): presumably the downsampling window size; confirm
            against the model that consumes this config.
        stride: Stored as ``self.stride``. Defaults to ``1``.
            NOTE(review): presumably the downsampling step; confirm.
        visual_hidden_size: Stored as ``self.visual_hidden_size``.
            Defaults to ``4096``.
        llm_hidden_size: Stored as ``self.llm_hidden_size``.
            Defaults to ``4096``.
        depth: Stored as ``self.depth``. Defaults to ``2``.
        hidden_act: Stored as ``self.hidden_act``. Defaults to ``'gelu'``.
        bias: Stored as ``self.bias``. Defaults to ``False``.
        **kwargs: Forwarded unchanged to ``PretrainedConfig.__init__``.
    """

    model_type = 'downsampler'
    _auto_class = 'AutoConfig'

    def __init__(
        self,
        kernel_size=1,
        stride=1,
        visual_hidden_size=4096,
        llm_hidden_size=4096,
        depth=2,
        hidden_act='gelu',
        bias=False,
        **kwargs,
    ):
        # The config's own fields are written before the base-class
        # initializer runs, in this fixed order.
        own_fields = (
            ('visual_hidden_size', visual_hidden_size),
            ('llm_hidden_size', llm_hidden_size),
            ('depth', depth),
            ('hidden_act', hidden_act),
            ('bias', bias),
            ('kernel_size', kernel_size),
            ('stride', stride),
        )
        for field_name, field_value in own_fields:
            setattr(self, field_name, field_value)

        # Everything not consumed above is handled by the base class.
        super().__init__(**kwargs)
|
|