{'input_ids': tensor([[49406, 320, 1125, 539, 550, 2619, 49407],
[49406, 320, 1125, 539, 320, 5363, 49407]]), 'attention_mask': tensor([[1, 1, 1, 1, 1, 1, 1],
[1, 1, 1, 1, 1, 1, 1]]), 'pixel_values': tensor([[[[-0.5222, -0.5514, -0.5514, ..., -1.6901, -1.7047, -1.7047],
[-0.5222, -0.5222, -0.5368, ..., -1.6901, -1.7047, -1.7047],
[-0.5076, -0.5222, -0.5222, ..., -1.7047, -1.7193, -1.7047],
...,
[-1.6317, -1.6755, -1.6901, ..., -1.6901, -1.6755, -1.6901],
[-1.6755, -1.6901, -1.6609, ..., -1.6609, -1.6755, -1.6755],
[-1.6609, -1.6609, -1.6317, ..., -1.6025, -1.6463, -1.6609]],
[[ 0.6191, 0.6041, 0.6041, ..., -0.5365, -0.5365, -0.5515],
[ 0.6191, 0.6041, 0.6041, ..., -0.5215, -0.5365, -0.5365],
[ 0.6191, 0.6191, 0.6191, ..., -0.5065, -0.5215, -0.5215],
...,
[-0.4914, -0.6415, -0.7016, ..., -0.3114, -0.3564, -0.2363],
[-0.6865, -0.7766, -0.6715, ..., -0.3114, -0.3864, -0.3714],
[-0.7316, -0.7016, -0.5815, ..., -0.2213, -0.3414, -0.4164]],
[[ 1.4776, 1.5060, 1.4918, ..., 0.5106, 0.5106, 0.4821],
[ 1.5060, 1.5060, 1.5060, ..., 0.5390, 0.5248, 0.5248],
[ 1.5060, 1.5202, 1.5202, ..., 0.5675, 0.5675, 0.5390],
...,
[-0.2715, -0.3711, -0.4137, ..., -0.2431, -0.2431, -0.1578],
[-0.4137, -0.4706, -0.3995, ..., -0.2431, -0.2715, -0.2573],
[-0.4564, -0.4279, -0.3284, ..., -0.1435, -0.2289, -0.2857]]]])}