{
  "$type": "site.standard.document",
  "bskyPostRef": {
    "cid": "bafyreidlkvb6jrejpjqi3gh6tuhmuw6d4yuistmvjcploodffzc2lcx6g4",
    "uri": "at://did:plc:lk3jfj3zq4k4wxnk474axylu/app.bsky.feed.post/3meiwd3tdvao2"
  },
  "path": "/t/finetuning-query-for-gpt-oss/1373859#post_1",
  "publishedAt": "2026-02-10T11:56:00.000Z",
  "site": "https://community.openai.com",
  "textContent": "We created our own medical dataset, and then prepare data with the help of openai harmony github after this i performed finetuning with unsloth and offload the model then with llama.cpp converted to gguf and after this quantize to q4_k_m and with pretrained model file available in ollama we upload the model to ollama for simpler query it is giving right output but as user context grows model is thinking only and not generating the response.\nWhy is this so and how to solve this what precautions to taken care of\nI added analysis samples as well in training set..",
  "title": "Finetuning Query for gpt-oss"
}