{
"$type": "site.standard.document",
"description": "A method for estimating a depth of an environment includes generating, via a cross-attention model, a cross-attention cost volume based on a current image of the environment and a previous image of the environment in a sequence of images. The method also includes generating, via the cross-attention…",
"path": "/patents/1365849",
"publishedAt": "2024-07-04T00:00:00.000Z",
"site": "at://did:plc:oql6ds5vnff4ugar6rruliwd/site.standard.publication/3mn3ohu7oxx5w",
"tags": [
"B60W60/001",
"TOYOTA RESEARCH INSTITUTE, INC."
],
"textContent": "A method for estimating a depth of an environment includes generating, via a cross-attention model, a cross-attention cost volume based on a current image of the environment and a previous image of the environment in a sequence of images. The method also includes generating, via the cross-attention model, a depth estimate of the current image based on the cross-attention cost volume, the cross-attention model having been trained using a photometric loss associated with a single-frame depth estimation model. The method further includes controlling an action of a vehicle based on the depth estimate.",
"title": "PHOTOMETRIC MASKS FOR SELF-SUPERVISED DEPTH LEARNING"
}