A medium-long shot of green water flowing through an area that has two rock and dirt hillsides along the sides of it. Along the dirt hillsides, there are tire tracks that run horizontally. To the left of the water and on the hillside, a gray tube can be seen. Covering the tube is the dirt hill. Sticking out of the hillside on the near side of the river is another tube that can barely be seen. On the river, the reflection of the blue sky and trees can be seen. On the other side of the hillside, on the left, there are multiple trees and a cut-grass field. On the grass and along its center, there is an orange umbrella. It is daytime, as the sun is shining brightly in the area.
def execute_command(scene_graph):
    """Return the color of the first flowing water entity.

    Walks ``scene_graph.get_entities()`` and picks the first entity for
    which ``'water' in entity`` holds and whose ``'state'`` attribute
    contains ``'flow'``.

    Returns:
        The entity's ``'color'`` attribute (``''`` when the attribute is
        absent), or ``None`` when no entity qualifies.
    """
    for entity in scene_graph.get_entities():
        if 'water' not in entity:
            continue
        # Fetch the attribute mapping once; it is read for both keys.
        attributes = scene_graph.get_attributes(entity)
        if 'flow' in attributes.get('state', ''):
            return attributes.get('color', '')
    return None

def execute_command(scene_graph):
    """Describe the count and texture of the hillsides entity.

    Uses the first entity for which ``'hillsides' in entity`` holds.

    Returns:
        A sentence built from the entity's ``'count'`` (default ``'0'``)
        and ``'texture'`` (default ``''``) attributes, or ``None`` when no
        such entity exists.
    """
    for entity in scene_graph.get_entities():
        if 'hillsides' in entity:
            attributes = scene_graph.get_attributes(entity)
            count = attributes.get('count', '0')
            texture = attributes.get('texture', '')
            return f'There are {count} hillsides with a {texture} texture.'
    return None

def execute_command(scene_graph):
    """Return the ``'state'`` attribute of the first tire-tracks entity.

    Returns:
        The ``'state'`` value (``''`` when absent) of the first entity for
        which ``'tire tracks' in entity`` holds, or ``None`` when there is
        no such entity.
    """
    for entity in scene_graph.get_entities():
        if 'tire tracks' in entity:
            return scene_graph.get_attributes(entity).get('state', '')
    return None

def execute_command(scene_graph):
    """Report whether a tube entity lies to the left of the water.

    For each entity matching ``'tube' in entity``, looks up its outgoing
    relation keyed ``'water'`` and checks that the relation's ``'spatial'``
    value contains ``'left of'``.

    Returns:
        A fixed descriptive sentence for the first tube that satisfies the
        check, or ``None`` when none does.
    """
    for entity in scene_graph.get_entities():
        if 'tube' not in entity:
            continue
        relations = scene_graph.get_outgoing_relations(entity)
        # A missing 'water' relation falls back to an empty mapping, which
        # is equivalent to the explicit "'water' in relations" guard.
        if 'left of' in relations.get('water', {}).get('spatial', ''):
            # Plain literal: the sentence has no placeholders.
            return 'A gray tube is located to the left of the water.'
    return None

An outdoor angled up long shot view taken from the southwest corner of Central Park in New York City. Closer up and towards the left side is a gold statue of a person with one arm raised up, and a gold horse beneath them. The gold statue is on top of a thick and tall cement structure that has designs engraved and embossed onto its surface. To the left of the statue is a partial view of tree branches with green leaves, and to the bottom right of the statue are more partial views of tree branches with green leaves. Far behind the statue, and to the right of it, is a tall beige colored building that is many stories high and appears to be old. Behind the beige building and to the right of it, is an enormous silver colored skyscraper building. As the skyscraper goes up, it gets more narrow until reaching its pointed top. The sky is clear, and is a light blue color that gets slightly darker the higher up it goes.
def execute_command(scene_graph):
    """Describe the statue's material and the cement structure beneath it.

    Scans all entities, remembering the last one matching
    ``'statue' in entity`` and the last one matching
    ``'cement structure' in entity`` (an entity matching both counts only
    as the statue).

    Returns:
        A sentence combining the statue's ``'material'`` attribute and the
        cement structure's ``'state'`` attribute (each ``''`` when absent),
        or ``None`` unless both entities were found.
    """
    statue_entity = None
    cement_entity = None
    for entity in scene_graph.get_entities():
        if 'statue' in entity:
            statue_entity = entity
        elif 'cement structure' in entity:
            cement_entity = entity

    if statue_entity and cement_entity:
        statue_material = scene_graph.get_attributes(statue_entity).get('material', '')
        cement_description = scene_graph.get_attributes(cement_entity).get('state', '')
        # Adjacent literals are concatenated, so the sentence stays one string.
        return (
            f"The statue is made of {statue_material}, and it sits on "
            "top of a cement structure that is thick and tall with "
            f"{cement_description}."
        )
    return None

def execute_command(scene_graph):
    """Describe the two buildings in the photo in one sentence.

    Remembers the last entity matching ``'building_1' in entity`` and the
    last one matching ``'building_2' in entity``.

    Returns:
        A sentence built from the first building's ``'color'`` and
        ``'state'`` attributes and the second building's ``'color'`` and
        ``'shape'`` attributes (falling back to ``'beige'``, ``'old'``,
        ``'silver'`` and ``'a narrow top'`` respectively), or ``None``
        unless both entities were found.
    """
    building1_entity = None
    building2_entity = None
    for entity in scene_graph.get_entities():
        if 'building_1' in entity:
            building1_entity = entity
        elif 'building_2' in entity:
            building2_entity = entity

    if building1_entity and building2_entity:
        building1_attributes = scene_graph.get_attributes(building1_entity)
        building2_attributes = scene_graph.get_attributes(building2_entity)
        building1_description = (
            "a tall, "
            f"{building1_attributes.get('color', 'beige')}-colored, "
            f"{building1_attributes.get('state', 'old')} building"
        )
        building2_description = (
            "an enormous "
            f"{building2_attributes.get('color', 'silver')}-colored skyscraper with "
            f"{building2_attributes.get('shape', 'a narrow top')}"
        )
        return f"The photo features {building1_description}, and {building2_description}."
    return None

A top down 3/4 view of a Warhammer figure from the Age of Sigmar placed on top of a tabletop map meant to resemble a dungeon. The figure resembles a brown Tree Lord and is grasping a scythe with two hands. The figure’s base has fake grass and a brown edge all around. The scythe has a wooden handle made of light brown wood and the blade is green gray. Behind the figure, there is a modular dungeon set. The top and left of the frame has a gray dungeon fence. The upper left frame has a dungeon wall composed of bricks.
def execute_command(scene_graph):
    """Return the ``'state'`` of a figure-related target of the Warhammer figure.

    For the first entity matching ``'Warhammer figure' in entity``, iterates
    the keys of its outgoing relations and returns the ``'state'`` attribute
    of the first key matching ``'figure' in key``.

    Returns:
        The ``'state'`` value, ``''`` when the target has no such attribute
        (the other listings in this file use the same default instead of
        raising ``KeyError``), or ``None`` when nothing matches.
    """
    # Find the Warhammer figure
    for entity in scene_graph.get_entities():
        if 'Warhammer figure' in entity:
            part_entities = scene_graph.get_outgoing_relations(entity)
            for part_entity in part_entities:
                if 'figure' in part_entity:
                    return scene_graph.get_attributes(part_entity).get('state', '')
    return None

def execute_command(scene_graph):
    """Describe the fence and dungeon-wall entities that have an 'in' relation.

    An entity qualifies when ``'fence' in entity`` or
    ``'dungeon wall' in entity`` holds and at least one of its outgoing
    relations has a ``'spatial'`` value equal to ``'in'``.

    Each qualifying entity is described exactly once, even when several of
    its relations are ``'in'``; appending once per relation would repeat the
    same description. A relation without a ``'spatial'`` key is treated as
    non-matching rather than raising ``KeyError``.

    Returns:
        The descriptions joined with ``', '``; ``''`` when nothing qualifies.
    """
    frame_elements = []
    # Find the fence
    for entity in scene_graph.get_entities():
        if 'fence' in entity or 'dungeon wall' in entity:
            relations = scene_graph.get_outgoing_relations(entity)
            # Only the relation payloads matter here, not the target names.
            if any(data.get('spatial') == 'in' for data in relations.values()):
                subgraph = scene_graph.generate_subgraph([entity])
                frame_elements.append(scene_graph.describe(subgraph))
    return ', '.join(frame_elements)

def execute_command(scene_graph):
    """Return the ``'material'`` attribute of the scythe's handle.

    Returns:
        The ``'material'`` value of the first entity matching
        ``"scythe's handle" in entity``; ``''`` when that entity has no
        such attribute (matching the default used by the other listings
        in this file instead of raising ``KeyError``); ``None`` when no
        entity matches.
    """
    # Find the scythe's handle
    for entity in scene_graph.get_entities():
        if "scythe's handle" in entity:
            return scene_graph.get_attributes(entity).get('material', '')
    return None

def execute_command(scene_graph):
    """Return a description of the tabletop-map entity.

    Returns:
        ``scene_graph.describe(...)`` applied to the single-entity subgraph
        of the first entity matching ``'tabletop map' in entity``, or
        ``None`` when no entity matches.
    """
    # Find the tabletop map
    for entity in scene_graph.get_entities():
        if 'tabletop map' in entity:
            # The return value must share a line with `return`; a bare
            # `return` followed by the expression would yield None.
            return scene_graph.describe(scene_graph.generate_subgraph([entity]))
    return None

A nighttime view up at the Austin skyline with a large firework exploding over it on the left. The firework is a spherical explosion of red, white, and pink. It's filling the top left quadrant of the frame. To the right of the firework the prominent building is the Austin Google "Sail" tower. The tower is still under construction in this image with a crane still sticking up skyward on its right side. Beneath the firework, smoke from the explosion is drifting down and to the bottom left corner.
def execute_command(scene_graph):
    """Return the ``'shape'`` attribute of the first firework entity.

    Returns:
        The ``'shape'`` value (``''`` when absent) of the first entity
        matching ``'firework' in entity``, or ``None`` when none matches.
    """
    for entity in scene_graph.get_entities():
        if 'firework' in entity:
            return scene_graph.get_attributes(entity).get('shape', '')
    return None

A monster truck is in the air and jumping over a line of red crushed cars. The truck has a color scheme of red and blue. The words "BIG FOOT" are written on the side of the truck in big white letters. The grille of the truck is silver. An orange truck with black stripes is in the background behind the red and blue truck. The words "Hot Wheels" are inside a flame logo on the blue wall. The "H" is partially covered by the truck's shark fin design. An orange van is partially cut off from the right of the image next to a crushed blue car. An audience of people are in the background in the stands watching the trucks.
def execute_command(scene_graph):
    """Return the color of the truck that is behind the red-and-blue one.

    For every entity matching ``'truck' in entity``, inspects its outgoing
    relations. A relation qualifies when the target's ``'color'`` attribute
    contains ``"red and blue"`` and the relation's ``'spatial'`` value
    contains ``'behind'``.

    Returns:
        The ``'color'`` attribute (``""`` when absent) of the first truck
        with a qualifying relation, or ``None`` when there is none.
    """
    for entity in scene_graph.get_entities():
        if 'truck' in entity:
            relations = scene_graph.get_outgoing_relations(entity)
            # Keys of the relation mapping are the target entities.
            for target, details in relations.items():
                target_color = scene_graph.get_attributes(target).get('color', "")
                if "red and blue" in target_color and 'behind' in details.get('spatial', ""):
                    return scene_graph.get_attributes(entity).get('color', "")
    return None
def execute_command(scene_graph):
    """Report whether the "H" is partially covered by the shark fin design.

    For every entity matching ``"H" in entity``, looks for an outgoing
    relation whose target matches ``"shark fin design" in target`` and whose
    ``'spatial'`` value contains ``"partially covered by"``.

    Returns:
        A fixed descriptive sentence when such a relation exists, otherwise
        ``None``.
    """
    for entity in scene_graph.get_entities():
        # NOTE(review): if entities are name strings, this also matches any
        # name that merely contains a capital "H" - confirm this is intended.
        if "H" in entity:
            relations = scene_graph.get_outgoing_relations(entity)
            for target, details in relations.items():
                if "shark fin design" in target and "partially covered by" in details.get('spatial', ""):
                    return 'The "H" is partially covered by the truck’s shark fin design.'
    return None
A top-down, close-up of a black and white tabby cat sitting in a round, tall, rattan decorative basket with two stuffed animals. The cat is in the front side of the basket facing forward, angled to the left, with a white stuffed plush bear to the back right and a gray stuffed plush tiger to the back left. The black and white tabby cat is mostly white, with black on top of its head and ears and around the right eye. The iris of the eye is thin and yellow-green, with a large black pupil. The basket has handles. One is in the top right corner, and one is on the left side. The background is a white panel wall with white trim at the bottom. Similar-type baskets are slightly visible on the bottom left and top right. A shadow is visible on the wall behind the basket. Indoors. The lights are on.
def execute_command(scene_graph):
    """Return the ``'color'`` attribute of the first cat entity.

    Returns:
        The ``'color'`` value (``''`` when absent) of the first entity
        matching ``'cat' in entity``, or ``None`` when none matches.
    """
    for entity in scene_graph.get_entities():
        if 'cat' in entity:
            return scene_graph.get_attributes(entity).get('color', '')
    return None

def execute_command(scene_graph):
    """Return where the tiger sits relative to the basket.

    For each entity matching ``'tiger' in entity``, reads the ``'spatial'``
    value of its outgoing relation keyed exactly ``'basket'``.

    Returns:
        That spatial value when it contains ``'back left'``; ``None`` when
        no tiger entity has such a relation.
    """
    for entity in scene_graph.get_entities():
        if 'tiger' in entity:
            relations = scene_graph.get_outgoing_relations(entity)
            basket_relation = relations.get('basket', {}).get('spatial', '')
            if 'back left' in basket_relation:
                return basket_relation
    return None

def execute_command(scene_graph):
    """Infer the setting from the state of the ``'lights'`` entity.

    Unlike the per-entity scans in the other listings, this checks for an
    entity equal to ``'lights'`` via direct membership in
    ``scene_graph.get_entities()``.

    Returns:
        ``'indoors'`` when a ``'lights'`` entity exists and its ``'state'``
        attribute contains ``'on'``; ``'unknown'`` otherwise.
    """
    if 'lights' in scene_graph.get_entities():
        state = scene_graph.get_attributes('lights').get('state', '')
        if 'on' in state:
            return 'indoors'
    return 'unknown'

def execute_command(scene_graph):
    """Return the ``'material'`` attribute of the first basket entity.

    Returns:
        The ``'material'`` value (``''`` when absent) of the first entity
        matching ``'basket' in entity``, or ``None`` when none matches.
    """
    for entity in scene_graph.get_entities():
        if 'basket' in entity:
            return scene_graph.get_attributes(entity).get('material', '')
    return None

An outdoor top-down view of a gray brick pathway with an inlaid small metal manhole cover with the letters "A / W W" debossed in the center of the lid. The text and the lid are rotated about 45 degrees to the right. The bricks of the pathway are laid in a running pattern. A light shadow is covering the upper left half of the manhole cover and the brick pathway, as the sunlight appears and shines in the lower right corner.
def execute_command(scene_graph):
    """Return the ``'state'`` attribute of the first bricks entity.

    Returns:
        The ``'state'`` value (``''`` when absent) of the first entity
        matching ``'bricks' in entity``, or ``None`` when none matches.
    """
    for entity in scene_graph.get_entities():
        if 'bricks' in entity:
            return scene_graph.get_attributes(entity).get('state', '')
    return None

def execute_command(scene_graph):
    """Return the ``'color'`` attribute of the first pathway entity.

    Returns:
        The ``'color'`` value (``''`` when absent) of the first entity
        matching ``'pathway' in entity``, or ``None`` when none matches.
    """
    for entity in scene_graph.get_entities():
        if 'pathway' in entity:
            return scene_graph.get_attributes(entity).get('color', '')
    return None

def execute_command(scene_graph):
    """Return the text rendered on the first manhole-cover entity.

    Returns:
        The ``'text rendering'`` attribute (``''`` when absent) of the
        first entity matching ``'manhole cover' in entity``, or ``None``
        when none matches.
    """
    for entity in scene_graph.get_entities():
        if 'manhole cover' in entity:
            return scene_graph.get_attributes(entity).get('text rendering', '')
    return None

A top down view of a brown Labradoodle puppy standing on two hind legs leaning on a white wall. The puppy is trying to look over the edge of the wall. The floor is covered in a light blue wool rug. A blue stuffed animal and a purple strand of rope are to the right of the brown puppy. A black Labradoodle puppy with white paws is visible on the upper edge of the frame. Only the black puppy’s paws and nose are within the frame.
def execute_command(scene_graph):
    """Return the purple rope's spatial relation to the puppy.

    Considers every entity matching ``'rope' in entity`` whose ``'color'``
    attribute contains ``'purple'``, then searches its outgoing relations
    for a target matching ``'puppy' in target`` whose ``'spatial'`` value
    contains ``'to the right of'``.

    Returns:
        The matching ``'spatial'`` value, or ``None`` when nothing matches.
    """
    for entity in scene_graph.get_entities():
        if 'rope' not in entity:
            continue
        attributes = scene_graph.get_attributes(entity)
        if 'purple' not in attributes.get('color', ''):
            continue
        outgoing_relations = scene_graph.get_outgoing_relations(entity)
        for target, relation in outgoing_relations.items():
            if 'puppy' not in target:
                continue
            spatial = relation.get('spatial', '')  # looked up once, reused
            if 'to the right of' in spatial:
                return spatial
    return None

def execute_command(scene_graph):
    """Return a description of the blue stuffed-animal entity.

    Returns:
        ``scene_graph.describe(...)`` applied to the single-entity subgraph
        of the first entity matching ``'stuffed animal' in entity`` whose
        ``'color'`` attribute contains ``'blue'``; ``None`` when there is
        no such entity.
    """
    for entity in scene_graph.get_entities():
        if 'stuffed animal' in entity:
            attributes = scene_graph.get_attributes(entity)
            if 'blue' in attributes.get('color', ''):
                # Keep the value on the `return` line; a bare `return`
                # followed by the expression would yield None.
                return scene_graph.describe(scene_graph.generate_subgraph([entity]))
    return None

A front view of a sculpture of a man standing up on a pile of gray cement blocks on a sidewalk. He is looking to the right and has a pair of shoes in the right hand and a golf bag in the left with some clubs in it. He has a short-sleeve collared shirt on and slacks. The sun is hitting the right side of his forehead. A stone wall to a building is behind him. On the left are a tree, plants, and dried twigs and leaves on the ground. A parking lot is visible in the distance on the left, as is a building. Part of a white parked car is visible. On the right, on the cement, part of a gray sculpture is visible on a black platform.
def execute_command(scene_graph):
    """Return a description of the sculpture that stands on a platform.

    For each entity matching ``"sculpture" in entity``, looks for an
    outgoing relation whose target matches ``"platform" in target`` and
    whose ``'spatial'`` value contains ``"on"``.

    Returns:
        ``scene_graph.describe(...)`` applied to the single-entity subgraph
        of the first such sculpture, or ``None`` when there is none.
    """
    for entity in scene_graph.get_entities():
        if "sculpture" in entity:
            relations = scene_graph.get_outgoing_relations(entity)
            for target_entity, relation_info in relations.items():
                # NOTE(review): "on" is a substring test, so values such as
                # "in front of" also match - confirm this is intended.
                if "platform" in target_entity and "on" in relation_info.get('spatial', ''):
                    return scene_graph.describe(scene_graph.generate_subgraph([entity]))
    return None

An outdoor long shot view looking down a long railroad track that is straight, and curves slightly to the left. The railroad track is placed on top of a ground floor made up of white rocks. About twenty-five feet to the left of the railroad track are two gray electrical boxes that are placed side by side, parallel to the railroad track, with about seven feet between them. Behind the electrical boxes is a field made up of dry yellow grass. To the right of the railroad track is a large maroon colored building, and two more multi-colored buildings behind it. Further behind the buildings, and hovering above them, is a large rectangular billboard that is colored blue, and has white letters on it that read "Feeling Stuck?". Further in the distance, to the left and right of the railroad track is a tree line consisting of tall bushy green trees. The sky is partly cloudy, and is a light baby blue color.
def execute_command(scene_graph):
    """Return the color of the billboard that is above the buildings.

    For each entity matching ``'billboard' in entity``, reads the
    ``'spatial'`` value of its outgoing relation keyed exactly
    ``'buildings'`` and requires it to contain ``'above'``.

    Returns:
        The billboard's ``'color'`` attribute (``''`` when absent), or
        ``None`` when no billboard satisfies the check.
    """
    for entity in scene_graph.get_entities():
        if 'billboard' in entity:
            attributes = scene_graph.get_attributes(entity)
            relations = scene_graph.get_outgoing_relations(entity)
            if 'above' in relations.get('buildings', {}).get('spatial', ''):
                return attributes.get('color', '')
    return None

def execute_command(scene_graph):
    """Return a description of the electrical-boxes entity.

    Returns:
        ``scene_graph.describe(...)`` applied to the single-entity subgraph
        of the first entity matching ``'electrical boxes' in entity``, or
        ``None`` when no entity matches.
    """
    for entity in scene_graph.get_entities():
        if 'electrical boxes' in entity:
            return scene_graph.describe(scene_graph.generate_subgraph([entity]))
    return None

def execute_command(scene_graph):
    """Return the text shown by the billboard's letters, without quotes.

    Returns:
        The ``'text rendering'`` attribute of the first entity matching
        ``"billboard's letters" in entity``, with leading and trailing
        ``"`` characters stripped (``''`` when the attribute is absent);
        ``None`` when no entity matches.
    """
    for entity in scene_graph.get_entities():
        if "billboard's letters" in entity:
            text = scene_graph.get_attributes(entity).get('text rendering', '')
            return text.strip('"')
    return None

def execute_command(scene_graph):
    """Describe every building entity in the scene.

    Returns:
        The ``scene_graph.describe(...)`` output for the single-entity
        subgraph of each entity matching ``'building' in entity``, in
        iteration order and joined with single spaces; ``''`` when there
        are no such entities.
    """
    results = [
        scene_graph.describe(scene_graph.generate_subgraph([entity]))
        for entity in scene_graph.get_entities()
        if 'building' in entity
    ]
    return ' '.join(results)

def execute_command(scene_graph):
    """Return a description of the field related to the electrical boxes.

    Picks the first entity matching ``'field' in entity`` whose outgoing
    relations contain the key ``'electrical boxes'``.

    Returns:
        ``scene_graph.describe(...)`` applied to that entity's
        single-entity subgraph, or ``None`` when no field qualifies.
    """
    for entity in scene_graph.get_entities():
        if 'field' in entity:
            if 'electrical boxes' in scene_graph.get_outgoing_relations(entity):
                return scene_graph.describe(scene_graph.generate_subgraph([entity]))
    return None
