|
695 | 695 | "Pix2StructVisionConfig", |
696 | 696 | ], |
697 | 697 | "models.pixtral": ["PixtralProcessor", "PixtralVisionConfig"], |
| 698 | + "models.internvl": ["InternVLProcessor", "InternVLConfig"], |
698 | 699 | "models.plbart": ["PLBartConfig"], |
699 | 700 | "models.poolformer": ["PoolFormerConfig"], |
700 | 701 | "models.pop2piano": ["Pop2PianoConfig"], |
|
1266 | 1267 | _import_structure["models.perceiver"].extend(["PerceiverFeatureExtractor", "PerceiverImageProcessor"]) |
1267 | 1268 | _import_structure["models.pix2struct"].extend(["Pix2StructImageProcessor"]) |
1268 | 1269 | _import_structure["models.pixtral"].append("PixtralImageProcessor") |
| 1270 | + _import_structure["models.internvl"].append("InternVLImageProcessor") |
1269 | 1271 | _import_structure["models.poolformer"].extend(["PoolFormerFeatureExtractor", "PoolFormerImageProcessor"]) |
1270 | 1272 | _import_structure["models.pvt"].extend(["PvtImageProcessor"]) |
1271 | 1273 | _import_structure["models.qwen2_5_vl"].extend(["Qwen2_5_VLImageProcessor"]) |
|
1304 | 1306 | _import_structure["models.deformable_detr"].append("DeformableDetrImageProcessorFast") |
1305 | 1307 | _import_structure["models.detr"].append("DetrImageProcessorFast") |
1306 | 1308 | _import_structure["models.pixtral"].append("PixtralImageProcessorFast") |
| 1309 | + _import_structure["models.internvl"].append("InternVLImageProcessorFast") |
1307 | 1310 | _import_structure["models.qwen2_vl"].append("Qwen2VLImageProcessorFast") |
1308 | 1311 | _import_structure["models.rt_detr"].append("RTDetrImageProcessorFast") |
1309 | 1312 | _import_structure["models.vit"].append("ViTImageProcessorFast") |
|
3225 | 3228 | ] |
3226 | 3229 | ) |
3227 | 3230 | _import_structure["models.pixtral"].extend(["PixtralPreTrainedModel", "PixtralVisionModel"]) |
| 3231 | + _import_structure["models.internvl"].extend(["InternVLPreTrainedModel", "InternVLModel"]) |
3228 | 3232 | _import_structure["models.plbart"].extend( |
3229 | 3233 | [ |
3230 | 3234 | "PLBartForCausalLM", |
|
5589 | 5593 | InstructBlipVideoQFormerConfig, |
5590 | 5594 | InstructBlipVideoVisionConfig, |
5591 | 5595 | ) |
| 5596 | + from .models.internvl import ( |
| 5597 | + InternVLConfig, |
| 5598 | + InternVLProcessor, |
| 5599 | + ) |
5592 | 5600 | from .models.jamba import JambaConfig |
5593 | 5601 | from .models.jetmoe import JetMoeConfig |
5594 | 5602 | from .models.kosmos2 import ( |
|
6348 | 6356 | from .models.idefics3 import Idefics3ImageProcessor |
6349 | 6357 | from .models.imagegpt import ImageGPTFeatureExtractor, ImageGPTImageProcessor |
6350 | 6358 | from .models.instructblipvideo import InstructBlipVideoImageProcessor |
| 6359 | + from .models.internvl import InternVLImageProcessor |
6351 | 6360 | from .models.layoutlmv2 import ( |
6352 | 6361 | LayoutLMv2FeatureExtractor, |
6353 | 6362 | LayoutLMv2ImageProcessor, |
|
6419 | 6428 | from .image_processing_utils_fast import BaseImageProcessorFast |
6420 | 6429 | from .models.deformable_detr import DeformableDetrImageProcessorFast |
6421 | 6430 | from .models.detr import DetrImageProcessorFast |
| 6431 | + from .models.internvl import InternVLImageProcessorFast |
6422 | 6432 | from .models.pixtral import PixtralImageProcessorFast |
6423 | 6433 | from .models.qwen2_vl import Qwen2VLImageProcessorFast |
6424 | 6434 | from .models.rt_detr import RTDetrImageProcessorFast |
|
7491 | 7501 | InstructBlipVideoQFormerModel, |
7492 | 7502 | InstructBlipVideoVisionModel, |
7493 | 7503 | ) |
| 7504 | + from .models.internvl import ( |
| 7505 | + InternVLModel, |
| 7506 | + InternVLPreTrainedModel, |
| 7507 | + ) |
7494 | 7508 | from .models.jamba import ( |
7495 | 7509 | JambaForCausalLM, |
7496 | 7510 | JambaForSequenceClassification, |
|
0 commit comments