chunks = video[0.0:2.0].chunk(0.200) # VideoArray of 10 × 200mschunks[:, 0].numpy() # first frame of each → (10, H, W, 3)chunks[:, 0].tensor() # feed to model
TextTrack
Buffer time-aligned text entries, flush to server:
python
track = dl.text_track(prefix="/run-042/captions", project="robotics@alice")track.add("Robot picks up cup", source=clip)track.flush()
VectorIndex
Store and search embeddings:
python
index = dl.vec_index("my-experiment")index.add(vector=enc(clip[0]), caption="robot arm", source=clip)results = index.search("robot picking up cup", limit=10)
Prefix Context
python
with dl.Prefix(project="robotics@alice", prefix="/2026/04/run-042"): dl.upload("./video.mp4", path="camera/front") track = dl.text_track(path="captions/llava")