{
  "$type": "site.standard.document",
  "bskyPostRef": {
    "cid": "bafyreicagpvapqab43wxtiwoy5m4l5vdfywjpz4pmvocaf5w7tbuutfhpu",
    "uri": "at://did:plc:pgryn3ephfd2xgft23qokfzt/app.bsky.feed.post/3mmxnlx5w3lg2"
  },
  "path": "/t/construction-equipment-synthetic-dataset-coco-parquet/176329#post_1",
  "publishedAt": "2026-05-29T02:07:12.000Z",
  "site": "https://discuss.huggingface.co",
  "tags": [
    "https://huggingface.co/datasets/m2m-datasets/construction-equipment-sample"
  ],
  "textContent": "Excited to share the first dataset from **Synthetic M2M** — a series of niche-vertical synthetic ML training datasets.\n\nWe’re targeting verticals that are underrepresented on Roboflow Universe — construction, medical devices, HVAC, industrial machinery, retail products — at price points that work for solo ML engineers and small teams.\n\n**Dataset card:** https://huggingface.co/datasets/m2m-datasets/construction-equipment-sample\n\n**Construction Equipment Sample:**\n\n- 10 high-resolution images with COCO bounding-box annotations, captions, and category tags\n\n- Includes HF Parquet shard for one-line `datasets.load_dataset(…)` loading\n\n- Sample available via the dataset card linked above; the full 250-image pack drops later this week\n\nWhat other niches would you want to see? Happy to take requests.",
  "title": "Construction-equipment synthetic dataset (COCO + Parquet)"
}