{
  "$type": "site.standard.document",
  "description": "A method for estimating a depth of an environment includes generating, via a cross-attention model, a cross-attention cost volume based on a current image of the environment and a previous image of the environment in a sequence of images. The method also includes generating, via the cross-attention…",
  "path": "/patents/1365849",
  "publishedAt": "2024-07-04T00:00:00.000Z",
  "site": "at://did:plc:oql6ds5vnff4ugar6rruliwd/site.standard.publication/3mn3ohu7oxx5w",
  "tags": [
    "B60W60/001",
    "TOYOTA RESEARCH INSTITUTE, INC."
  ],
  "textContent": "A method for estimating a depth of an environment includes generating, via a cross-attention model, a cross-attention cost volume based on a current image of the environment and a previous image of the environment in a sequence of images. The method also includes generating, via the cross-attention model, a depth estimate of the current image based on the cross-attention cost volume, the cross-attention model having been trained using a photometric loss associated with a single-frame depth estimation model. The method further includes controlling an action of the vehicle based on the depth estimate.",
  "title": "PHOTOMETRIC MASKS FOR SELF-SUPERVISED DEPTH LEARNING"
}