Add training type support for fine-tuning jobs (#44036)

jayesh-tanna · Jayesh Tanna · web-flow · commit 696d9d190c3d · 2025-11-14T23:24:51.000+05:30
* Add training type support for fine-tuning jobs

* updating readme.md

---------

Co-authored-by: Jayesh Tanna <jatanna@microsoft.com>
diff --git a/sdk/ai/azure-ai-projects/README.md b/sdk/ai/azure-ai-projects/README.md
@@ -737,9 +737,9 @@ print(f"Successfully deleted file: {deleted_file.id}")
 
 ### Fine-tuning operations
 
-The code below shows Fine-tuning operations using the OpenAI client, which allow you to create, retrieve, list, cancel, pause, resume, and manage fine-tuning jobs. These operations support various fine-tuning techniques like Supervised Fine-Tuning (SFT), Reinforcement Fine-Tuning (RFT), and Direct Performance Optimization (DPO). Full samples can be found under the "finetuning" folder in the [package samples][samples].
+The code below shows how to create fine-tuning jobs using the OpenAI client. These operations support various fine-tuning techniques like Supervised Fine-Tuning (SFT), Reinforcement Fine-Tuning (RFT), and Direct Preference Optimization (DPO). Full samples can be found under the "finetuning" folder in the [package samples][samples].
 
-<!-- SNIPPET:sample_finetuning_supervised_job.finetuning_supervised_job_sample-->
+<!-- SNIPPET:sample_finetuning_oss_models_supervised_job.finetuning_oss_model_supervised_job_sample-->
 
 ```python
 print("Uploading training file...")
@@ -752,8 +752,10 @@ with open(validation_file_path, "rb") as f:
     validation_file = openai_client.files.create(file=f, purpose="fine-tune")
 print(f"Uploaded validation file with ID: {validation_file.id}")
 
-# For OpenAI model supervised fine-tuning jobs, "Standard" is the default training type.
-# To use global standard training, uncomment the extra_body parameter below.
+print("Waits for the training and validation files to be processed...")
+openai_client.files.wait_for_processing(train_file.id)
+openai_client.files.wait_for_processing(validation_file.id)
+
 print("Creating supervised fine-tuning job")
 fine_tuning_job = openai_client.fine_tuning.jobs.create(
     training_file=train_file.id,
@@ -763,76 +765,13 @@ fine_tuning_job = openai_client.fine_tuning.jobs.create(
         "type": "supervised",
         "supervised": {"hyperparameters": {"n_epochs": 3, "batch_size": 1, "learning_rate_multiplier": 1.0}},
     },
-    # extra_body={"trainingType":"GlobalStandard"}
+    extra_body={
+        "trainingType": "GlobalStandard"
+    },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
+    # Preferred trainingType is GlobalStandard. Note: Global training offers cost savings, but copies data and weights outside the current resource region.
+    # Learn more - https://azure.microsoft.com/en-us/pricing/details/cognitive-services/openai-service/ and https://azure.microsoft.com/en-us/explore/global-infrastructure/data-residency/
 )
 print(fine_tuning_job)
-
-print(f"Getting fine-tuning job with ID: {fine_tuning_job.id}")
-retrieved_job = openai_client.fine_tuning.jobs.retrieve(fine_tuning_job.id)
-print(retrieved_job)
-
-print("Listing all fine-tuning jobs:")
-for job in openai_client.fine_tuning.jobs.list():
-    print(job)
-
-print("Listing only 10 fine-tuning jobs:")
-for job in openai_client.fine_tuning.jobs.list(limit=10):
-    print(job)
-
-print(f"Pausing fine-tuning job with ID: {fine_tuning_job.id}")
-paused_job = openai_client.fine_tuning.jobs.pause(fine_tuning_job.id)
-print(paused_job)
-
-print(f"Resuming fine-tuning job with ID: {fine_tuning_job.id}")
-resumed_job = openai_client.fine_tuning.jobs.resume(fine_tuning_job.id)
-print(resumed_job)
-
-print(f"Listing events of fine-tuning job: {fine_tuning_job.id}")
-for event in openai_client.fine_tuning.jobs.list_events(fine_tuning_job.id):
-    print(event)
-
-# Note that to retrieve the checkpoints, job needs to be in terminal state.
-print(f"Listing checkpoints of fine-tuning job: {fine_tuning_job.id}")
-for checkpoint in openai_client.fine_tuning.jobs.checkpoints.list(fine_tuning_job.id):
-    print(checkpoint)
-
-print(f"Cancelling fine-tuning job with ID: {fine_tuning_job.id}")
-cancelled_job = openai_client.fine_tuning.jobs.cancel(fine_tuning_job.id)
-print(f"Successfully cancelled fine-tuning job: {cancelled_job.id}, Status: {cancelled_job.status}")
-
-# Deploy model (using Azure Management SDK - azure-mgmt-cognitiveservices)
-# Note: Deployment can only be started after the fine-tuning job completes successfully.
-print(f"Getting fine-tuning job with ID: {fine_tuning_job.id}")
-fine_tuned_model_name = openai_client.fine_tuning.jobs.retrieve(fine_tuning_job.id).fine_tuned_model
-deployment_name = "gpt-4-1-fine-tuned"
-
-with CognitiveServicesManagementClient(credential=credential, subscription_id=subscription_id) as cogsvc_client:
-
-    deployment_model = DeploymentModel(format="OpenAI", name=fine_tuned_model_name, version="1")
-
-    deployment_properties = DeploymentProperties(model=deployment_model)
-
-    deployment_sku = Sku(name="GlobalStandard", capacity=100)
-
-    deployment_config = Deployment(properties=deployment_properties, sku=deployment_sku)
-
-    deployment = cogsvc_client.deployments.begin_create_or_update(
-        resource_group_name=resource_group,
-        account_name=account_name,
-        deployment_name=deployment_name,
-        deployment=deployment_config,
-    )
-
-    while deployment.status() not in ["Succeeded", "Failed"]:
-        time.sleep(30)
-        print(f"Status: {deployment.status()}")
-
-print(f"Testing fine-tuned model via deployment: {deployment_name}")
-
-response = openai_client.responses.create(
-    model=deployment_name, input=[{"role": "user", "content": "Who invented the telephone?"}]
-)
-print(f"Model response: {response.output_text}")
 ```
 
 <!-- END SNIPPET -->
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_dpo_job.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_dpo_job.py
@@ -56,8 +56,10 @@
         validation_file = openai_client.files.create(file=f, purpose="fine-tune")
     print(f"Uploaded validation file with ID: {validation_file.id}")
 
-    # For OpenAI model DPO fine-tuning jobs, "Standard" is the default training type.
-    # To use global standard training, uncomment the extra_body parameter below.
+    print("Waits for the training and validation files to be processed...")
+    openai_client.files.wait_for_processing(train_file.id)
+    openai_client.files.wait_for_processing(validation_file.id)
+
     print("Creating DPO fine-tuning job")
     fine_tuning_job = openai_client.fine_tuning.jobs.create(
         training_file=train_file.id,
@@ -67,6 +69,8 @@
             "type": "dpo",
             "dpo": {"hyperparameters": {"n_epochs": 3, "batch_size": 1, "learning_rate_multiplier": 1.0}},
         },
-        # extra_body={"trainingType":"GlobalStandard"}
+        extra_body={
+            "trainingType": "Standard"
+        },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
     )
     print(fine_tuning_job)
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_dpo_job_async.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_dpo_job_async.py
@@ -61,8 +61,10 @@ async def main():
             validation_file = await openai_client.files.create(file=f, purpose="fine-tune")
         print(f"Uploaded validation file with ID: {validation_file.id}")
 
-        # For OpenAI model DPO fine-tuning jobs, "Standard" is the default training type.
-        # To use global standard training, uncomment the extra_body parameter below.
+        print("Waits for the training and validation files to be processed...")
+        await openai_client.files.wait_for_processing(train_file.id)
+        await openai_client.files.wait_for_processing(validation_file.id)
+
         print("Creating DPO fine-tuning job")
         fine_tuning_job = await openai_client.fine_tuning.jobs.create(
             training_file=train_file.id,
@@ -78,7 +80,9 @@ async def main():
                     }
                 },
             },
-            # extra_body={"trainingType":"GlobalStandard"}
+            extra_body={
+                "trainingType": "Standard"
+            },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
         )
         print(fine_tuning_job)
 
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_oss_models_supervised_job.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_oss_models_supervised_job.py
@@ -58,6 +58,10 @@
         validation_file = openai_client.files.create(file=f, purpose="fine-tune")
     print(f"Uploaded validation file with ID: {validation_file.id}")
 
+    print("Waits for the training and validation files to be processed...")
+    openai_client.files.wait_for_processing(train_file.id)
+    openai_client.files.wait_for_processing(validation_file.id)
+
     print("Creating supervised fine-tuning job")
     fine_tuning_job = openai_client.fine_tuning.jobs.create(
         training_file=train_file.id,
@@ -67,6 +71,11 @@
             "type": "supervised",
             "supervised": {"hyperparameters": {"n_epochs": 3, "batch_size": 1, "learning_rate_multiplier": 1.0}},
         },
+        extra_body={
+            "trainingType": "GlobalStandard"
+        },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
+        # Preferred trainingType is GlobalStandard. Note: Global training offers cost savings, but copies data and weights outside the current resource region.
+        # Learn more - https://azure.microsoft.com/en-us/pricing/details/cognitive-services/openai-service/ and https://azure.microsoft.com/en-us/explore/global-infrastructure/data-residency/
     )
     print(fine_tuning_job)
     # [END finetuning_oss_model_supervised_job_sample]
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_oss_models_supervised_job_async.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_oss_models_supervised_job_async.py
@@ -61,6 +61,10 @@ async def main():
             validation_file = await openai_client.files.create(file=f, purpose="fine-tune")
         print(f"Uploaded validation file with ID: {validation_file.id}")
 
+        print("Waits for the training and validation files to be processed...")
+        await openai_client.files.wait_for_processing(train_file.id)
+        await openai_client.files.wait_for_processing(validation_file.id)
+
         print("Creating supervised fine-tuning job")
         fine_tuning_job = await openai_client.fine_tuning.jobs.create(
             training_file=train_file.id,
@@ -70,6 +74,11 @@ async def main():
                 "type": "supervised",
                 "supervised": {"hyperparameters": {"n_epochs": 3, "batch_size": 1, "learning_rate_multiplier": 1.0}},
             },
+            extra_body={
+                "trainingType": "GlobalStandard"
+            },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
+            # Preferred trainingType is GlobalStandard. Note: Global training offers cost savings, but copies data and weights outside the current resource region.
+            # Learn more - https://azure.microsoft.com/en-us/pricing/details/cognitive-services/openai-service/ and https://azure.microsoft.com/en-us/explore/global-infrastructure/data-residency/
         )
         print(fine_tuning_job)
 
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_reinforcement_job.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_reinforcement_job.py
@@ -58,6 +58,10 @@
         validation_file = openai_client.files.create(file=f, purpose="fine-tune")
     print(f"Uploaded validation file with ID: {validation_file.id}")
 
+    print("Waits for the training and validation files to be processed...")
+    openai_client.files.wait_for_processing(train_file.id)
+    openai_client.files.wait_for_processing(validation_file.id)
+
     grader: Dict[str, Any] = {
         "name": "Response Quality Grader",
         "type": "score_model",
@@ -71,8 +75,6 @@
         "range": [0.0, 10.0],
     }
 
-    # For OpenAI model RFT fine-tuning jobs, "Standard" is the default training type.
-    # To use global standard training, uncomment the extra_body parameter below.
     print("Creating reinforcement fine-tuning job")
     fine_tuning_job = openai_client.fine_tuning.jobs.create(
         training_file=train_file.id,
@@ -92,6 +94,8 @@
                 },
             },
         },
-        # extra_body={"trainingType":"GlobalStandard"}
+        extra_body={
+            "trainingType": "Standard"
+        },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
     )
     print(fine_tuning_job)
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_reinforcement_job_async.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_reinforcement_job_async.py
@@ -60,6 +60,10 @@ async def main():
             validation_file = await openai_client.files.create(file=f, purpose="fine-tune")
         print(f"Uploaded validation file with ID: {validation_file.id}")
 
+        print("Waits for the training and validation files to be processed...")
+        await openai_client.files.wait_for_processing(train_file.id)
+        await openai_client.files.wait_for_processing(validation_file.id)
+
         grader = {
             "name": "Response Quality Grader",
             "type": "score_model",
@@ -73,8 +77,6 @@ async def main():
             "range": [0.0, 10.0],
         }
 
-        # For OpenAI model RFT fine-tuning jobs, "Standard" is the default training type.
-        # To use global standard training, uncomment the extra_body parameter below.
         fine_tuning_job = await openai_client.fine_tuning.jobs.create(
             training_file=train_file.id,
             validation_file=validation_file.id,
@@ -93,7 +95,9 @@ async def main():
                     },
                 },
             },
-            # extra_body={"trainingType":"GlobalStandard"}
+            extra_body={
+                "trainingType": "Standard"
+            },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
         )
         print(fine_tuning_job)
 
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_supervised_job.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_supervised_job.py
@@ -72,8 +72,10 @@
         validation_file = openai_client.files.create(file=f, purpose="fine-tune")
     print(f"Uploaded validation file with ID: {validation_file.id}")
 
-    # For OpenAI model supervised fine-tuning jobs, "Standard" is the default training type.
-    # To use global standard training, uncomment the extra_body parameter below.
+    print("Waits for the training and validation files to be processed...")
+    openai_client.files.wait_for_processing(train_file.id)
+    openai_client.files.wait_for_processing(validation_file.id)
+
     print("Creating supervised fine-tuning job")
     fine_tuning_job = openai_client.fine_tuning.jobs.create(
         training_file=train_file.id,
@@ -83,7 +85,9 @@
             "type": "supervised",
             "supervised": {"hyperparameters": {"n_epochs": 3, "batch_size": 1, "learning_rate_multiplier": 1.0}},
         },
-        # extra_body={"trainingType":"GlobalStandard"}
+        extra_body={
+            "trainingType": "Standard"
+        },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
     )
     print(fine_tuning_job)
 
diff --git a/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_supervised_job_async.py b/sdk/ai/azure-ai-projects/samples/finetuning/sample_finetuning_supervised_job_async.py
@@ -75,8 +75,10 @@ async def main():
             validation_file = await openai_client.files.create(file=f, purpose="fine-tune")
         print(f"Uploaded validation file with ID: {validation_file.id}")
 
-        # For OpenAI model supervised fine-tuning jobs, "Standard" is the default training type.
-        # To use global standard training, uncomment the extra_body parameter below.
+        print("Waits for the training and validation files to be processed...")
+        await openai_client.files.wait_for_processing(train_file.id)
+        await openai_client.files.wait_for_processing(validation_file.id)
+
         print("Creating supervised fine-tuning job")
         fine_tuning_job = await openai_client.fine_tuning.jobs.create(
             training_file=train_file.id,
@@ -86,7 +88,9 @@ async def main():
                 "type": "supervised",
                 "supervised": {"hyperparameters": {"n_epochs": 3, "batch_size": 1, "learning_rate_multiplier": 1.0}},
             },
-            # extra_body={"trainingType":"GlobalStandard"}
+            extra_body={
+                "trainingType": "Standard"
+            },  # Recommended approach to set trainingType. Omitting this field may lead to unsupported behavior.
         )
         print(fine_tuning_job)
 
diff --git a/sdk/ai/azure-ai-projects/tests/finetuning/test_finetuning.py b/sdk/ai/azure-ai-projects/tests/finetuning/test_finetuning.py
@@ -15,7 +15,9 @@
 )
 class TestFineTuning(TestBase):
 
-    def _create_sft_finetuning_job(self, openai_client, train_file_id, validation_file_id, model_type="openai"):
+    def _create_sft_finetuning_job(
+        self, openai_client, train_file_id, validation_file_id, model_type="openai", training_type="Standard"
+    ):
         """Helper method to create a supervised fine-tuning job."""
         return openai_client.fine_tuning.jobs.create(
             training_file=train_file_id,
@@ -31,6 +33,7 @@ def _create_sft_finetuning_job(self, openai_client, train_file_id, validation_fi
                     }
                 },
             },
+            extra_body={"trainingType": training_type},
         )
 
     def _create_dpo_finetuning_job(self, openai_client, train_file_id, validation_file_id):
@@ -49,6 +52,7 @@ def _create_dpo_finetuning_job(self, openai_client, train_file_id, validation_fi
                     }
                 },
             },
+            extra_body={"trainingType": "Standard"},
         )
 
     def _create_rft_finetuning_job(self, openai_client, train_file_id, validation_file_id):
@@ -84,6 +88,7 @@ def _create_rft_finetuning_job(self, openai_client, train_file_id, validation_fi
                     },
                 },
             },
+            extra_body={"trainingType": "Standard"},
         )
 
     def _upload_test_files(self, openai_client, job_type="sft"):
@@ -323,7 +328,7 @@ def test_sft_finetuning_create_job_oss_model(self, **kwargs):
                 train_file, validation_file = self._upload_test_files(openai_client, "sft")
 
                 fine_tuning_job = self._create_sft_finetuning_job(
-                    openai_client, train_file.id, validation_file.id, "oss"
+                    openai_client, train_file.id, validation_file.id, "oss", "GlobalStandard"
                 )
                 print(f"[test_finetuning_sft_oss] Created fine-tuning job: {fine_tuning_job.id}")
 
diff --git a/sdk/ai/azure-ai-projects/tests/finetuning/test_finetuning_async.py b/sdk/ai/azure-ai-projects/tests/finetuning/test_finetuning_async.py
@@ -17,7 +17,7 @@
 class TestFineTuningAsync(TestBase):
 
     async def _create_sft_finetuning_job_async(
-        self, openai_client, train_file_id, validation_file_id, model_type="openai"
+        self, openai_client, train_file_id, validation_file_id, model_type="openai", training_type="Standard"
     ):
         """Helper method to create a supervised fine-tuning job asynchronously."""
         return await openai_client.fine_tuning.jobs.create(
@@ -34,6 +34,7 @@ async def _create_sft_finetuning_job_async(
                     }
                 },
             },
+            extra_body={"trainingType": training_type},
         )
 
     async def _create_dpo_finetuning_job_async(self, openai_client, train_file_id, validation_file_id):
@@ -52,6 +53,7 @@ async def _create_dpo_finetuning_job_async(self, openai_client, train_file_id, v
                     }
                 },
             },
+            extra_body={"trainingType": "Standard"},
         )
 
     async def _create_rft_finetuning_job_async(self, openai_client, train_file_id, validation_file_id):
@@ -87,6 +89,7 @@ async def _create_rft_finetuning_job_async(self, openai_client, train_file_id, v
                     },
                 },
             },
+            extra_body={"trainingType": "Standard"},
         )
 
     async def _upload_test_files_async(self, openai_client, job_type="sft"):
@@ -354,7 +357,7 @@ async def test_sft_finetuning_create_job_oss_model_async(self, **kwargs):
             train_file, validation_file = await self._upload_test_files_async(openai_client, "sft")
 
             fine_tuning_job = await self._create_sft_finetuning_job_async(
-                openai_client, train_file.id, validation_file.id, "oss"
+                openai_client, train_file.id, validation_file.id, "oss", "GlobalStandard"
             )
             print(f"[test_finetuning_sft_oss_async] Created fine-tuning job: {fine_tuning_job.id}")
             TestBase.validate_fine_tuning_job(

Original file line number	Diff line number	Diff line change
`@@ -15,7 +15,9 @@`
`15`	`15`	`)`
`16`	`16`	`class TestFineTuning(TestBase):`
`17`	`17`
`18`		`- def _create_sft_finetuning_job(self, openai_client, train_file_id, validation_file_id, model_type="openai"):`
	`18`	`+ def _create_sft_finetuning_job(`
	`19`	`+ self, openai_client, train_file_id, validation_file_id, model_type="openai", training_type="Standard"`
	`20`	`+ ):`
`19`	`21`	`"""Helper method to create a supervised fine-tuning job."""`
`20`	`22`	`return openai_client.fine_tuning.jobs.create(`
`21`	`23`	`training_file=train_file_id,`
`@@ -31,6 +33,7 @@ def _create_sft_finetuning_job(self, openai_client, train_file_id, validation_fi`
`31`	`33`	`}`
`32`	`34`	`},`
`33`	`35`	`},`
	`36`	`+ extra_body={"trainingType": training_type},`
`34`	`37`	`)`
`35`	`38`
`36`	`39`	`def _create_dpo_finetuning_job(self, openai_client, train_file_id, validation_file_id):`
`@@ -49,6 +52,7 @@ def _create_dpo_finetuning_job(self, openai_client, train_file_id, validation_fi`
`49`	`52`	`}`
`50`	`53`	`},`
`51`	`54`	`},`
	`55`	`+ extra_body={"trainingType": "Standard"},`
`52`	`56`	`)`
`53`	`57`
`54`	`58`	`def _create_rft_finetuning_job(self, openai_client, train_file_id, validation_file_id):`
`@@ -84,6 +88,7 @@ def _create_rft_finetuning_job(self, openai_client, train_file_id, validation_fi`
`84`	`88`	`},`
`85`	`89`	`},`
`86`	`90`	`},`
	`91`	`+ extra_body={"trainingType": "Standard"},`
`87`	`92`	`)`
`88`	`93`
`89`	`94`	`def _upload_test_files(self, openai_client, job_type="sft"):`
`@@ -323,7 +328,7 @@ def test_sft_finetuning_create_job_oss_model(self, **kwargs):`
`323`	`328`	`train_file, validation_file = self._upload_test_files(openai_client, "sft")`
`324`	`329`
`325`	`330`	`fine_tuning_job = self._create_sft_finetuning_job(`
`326`		`- openai_client, train_file.id, validation_file.id, "oss"`
	`331`	`+ openai_client, train_file.id, validation_file.id, "oss", "GlobalStandard"`
`327`	`332`	`)`
`328`	`333`	`print(f"[test_finetuning_sft_oss] Created fine-tuning job: {fine_tuning_job.id}")`
`329`	`334`