>>> train_set[2]
(
  <PIL.JpegImagePlugin.JpegImageFile image mode=RGB size=500x330 at 0x7F98AD088220>,
  Target(
    annotations=FrameAnnotations(
      tags=[
        {
          'attributes': [],
          'frame': 2,
          'group': None,
          'id': 426657,
          'label_id': 431496,
          'source': 'manual'
        }
      ],
      shapes=[
        {
          'attributes': [],
          'elements': [],
          'frame': 2,
          'group': 0,
          'id': 41000665,
          'label_id': 431496,
          'occluded': False,
          'outside': False,
          'points': [
            170.1162758827213,
            158.9655911445625,
            349.43134126663244,
            329.23956079483105
          ],
          'rotation': 0.0,
          'source': 'manual',
          'type': 'rectangle',
          'z_order': 0
        },
        [...snipped...]
      ]
    ),
    label_id_to_index=mappingproxy({431492: 0, 431493: 1, 431494: 2, 431495: 3, 431496: 4})
  )
)