We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
get_image_features
1 parent f5b6b66 commit 6a1904e (Copy full SHA for 6a1904e)
src/diffusers/pipelines/glm_image/pipeline_glm_image.py
@@ -407,8 +407,8 @@ def generate_prior_tokens(
407
408
if len(source_grids) > 0:
409
prior_token_image_embed = self.vision_language_encoder.get_image_features(
410
- inputs["pixel_values"], source_grids, return_dict=False
411
- )
+ inputs["pixel_values"], source_grids
+ ).pooler_output
412
prior_token_image_embed = torch.cat(prior_token_image_embed, dim=0)
413
prior_token_image_ids_d32 = self.vision_language_encoder.get_image_tokens(
414
prior_token_image_embed, source_grids
0 commit comments