{'input_ids': tensor([[49406,   320,  1125,   539,   550,  2619, 49407],
        [49406,   320,  1125,   539,   320,  5363, 49407]]), 'attention_mask': tensor([[1, 1, 1, 1, 1, 1, 1],
        [1, 1, 1, 1, 1, 1, 1]]), 'pixel_values': tensor([[[[-0.5222, -0.5514, -0.5514,  ..., -1.6901, -1.7047, -1.7047],
          [-0.5222, -0.5222, -0.5368,  ..., -1.6901, -1.7047, -1.7047],
          [-0.5076, -0.5222, -0.5222,  ..., -1.7047, -1.7193, -1.7047],
          ...,
          [-1.6317, -1.6755, -1.6901,  ..., -1.6901, -1.6755, -1.6901],
          [-1.6755, -1.6901, -1.6609,  ..., -1.6609, -1.6755, -1.6755],
          [-1.6609, -1.6609, -1.6317,  ..., -1.6025, -1.6463, -1.6609]],
         [[ 0.6191,  0.6041,  0.6041,  ..., -0.5365, -0.5365, -0.5515],
          [ 0.6191,  0.6041,  0.6041,  ..., -0.5215, -0.5365, -0.5365],
          [ 0.6191,  0.6191,  0.6191,  ..., -0.5065, -0.5215, -0.5215],
          ...,
          [-0.4914, -0.6415, -0.7016,  ..., -0.3114, -0.3564, -0.2363],
          [-0.6865, -0.7766, -0.6715,  ..., -0.3114, -0.3864, -0.3714],
          [-0.7316, -0.7016, -0.5815,  ..., -0.2213, -0.3414, -0.4164]],
         [[ 1.4776,  1.5060,  1.4918,  ...,  0.5106,  0.5106,  0.4821],
          [ 1.5060,  1.5060,  1.5060,  ...,  0.5390,  0.5248,  0.5248],
          [ 1.5060,  1.5202,  1.5202,  ...,  0.5675,  0.5675,  0.5390],
          ...,
          [-0.2715, -0.3711, -0.4137,  ..., -0.2431, -0.2431, -0.1578],
          [-0.4137, -0.4706, -0.3995,  ..., -0.2431, -0.2715, -0.2573],
          [-0.4564, -0.4279, -0.3284,  ..., -0.1435, -0.2289, -0.2857]]]])}