fix: add hf causal LM python tests, fix build (#2374)

JessicaXYWang · web-flow · commit 141039b45107 · 2025-05-22T22:38:38.000-04:00
* add hf causal python test

* add chat template example

* move causallm test

* fix typo

* use phi4 for hf causal lm test

* test db run

* test gpu run

* test onnx

* test run

* test run

* test run

* test run

* force reinstall protobuf

* test run

* test run

* test run

* test remove onnxmltools from adb

* test run

* remove install library when submit run

* test run

* test run

* update submit run

* add back dependency
diff --git a/core/src/test/scala/com/microsoft/azure/synapse/ml/nbtest/DatabricksUtilities.scala b/core/src/test/scala/com/microsoft/azure/synapse/ml/nbtest/DatabricksUtilities.scala
@@ -279,8 +279,7 @@ object DatabricksUtilities {
          |  "notebook_task": {
          |    "notebook_path": "$notebookPath",
          |    "base_parameters": []
-         |  },
-         |  "libraries": $Libraries
+         |  }
          |}
       """.stripMargin
     databricksPost("jobs/runs/submit", body).select[Long]("run_id")
diff --git a/deep-learning/src/test/python/synapsemltest/hf/test_HuggingFaceCausalLMTransform.py b/deep-learning/src/test/python/synapsemltest/hf/test_HuggingFaceCausalLMTransform.py
@@ -0,0 +1,75 @@
+# Copyright (C) Microsoft Corporation. All rights reserved.
+# Licensed under the MIT License. See LICENSE in project root for information.
+
+# Prepare training and test data.
+
+import unittest
+from synapse.ml.llm.HuggingFaceCausallmTransform import HuggingFaceCausalLM
+from pyspark.sql import SQLContext
+from synapse.ml.core.init_spark import *
+from synapse.ml.core import __spark_package_version__
+
+spark = init_spark()
+sc = SQLContext(spark.sparkContext)
+
+
+class HuggingFaceCausalLMTester(unittest.TestCase):
+    def __init__(self, *args, **kwargs):
+        super(HuggingFaceCausalLMTester, self).__init__(*args, **kwargs)
+        self.transformer = (
+            HuggingFaceCausalLM()
+            .setModelName("Qwen/Qwen2.5-0.5B-Instruct")
+            .setInputCol("messages")
+            .setOutputCol("result")
+            .setModelParam(max_new_tokens=10)
+        )
+        self.strDataFrame = (
+            spark.createDataFrame(
+                [
+                    (
+                        "positive",
+                        "output a single word (without quotes) of positive or negative in lower case to reflect their sentiment: I like SynapseML",
+                    ),
+                ]
+            )
+            .toDF("gt", "messages")
+            .repartition(1)
+        )
+        self.listDataFrame = (
+            spark.createDataFrame(
+                [
+                    (
+                        "positive",
+                        [
+                            {
+                                "role": "system",
+                                "content": "Your job is to detect the sentiment of user reviews. Given some text, output a single word (without quotes) of positive or negative to reflect their intent. Output only that single word in lower case: no explanations or complete sentences.",
+                            },
+                            {"role": "user", "content": "I like SynapseML"},
+                        ],
+                    ),
+                ]
+            )
+            .toDF("gt", "messages")
+            .repartition(1)
+        )
+
+    def _assert_output(self, transformer, input_df):
+        transformed_df = transformer.transform(input_df).collect()
+        gt_col_value = [row.gt for row in transformed_df]
+        output_col_value = [row.result for row in transformed_df]
+        input_col_value = [row.messages for row in transformed_df]
+        for i in range(len(gt_col_value)):
+            assert (
+                gt_col_value[i] == output_col_value[i]
+            ), f"model prediction {output_col_value[i]} does not match with ground truth {gt_col_value[i]}, input message is {input_col_value[i]}"
+
+    def test_str_df(self):
+        self._assert_output(self.transformer, self.strDataFrame)
+
+    def test_list_df(self):
+        self._assert_output(self.transformer, self.listDataFrame)
+
+
+if __name__ == "__main__":
+    result = unittest.main()
diff --git a/docs/Explore Algorithms/Deep Learning/Quickstart - Apply Phi Model with HuggingFace CausalLM.ipynb b/docs/Explore Algorithms/Deep Learning/Quickstart - Apply Phi Model with HuggingFace CausalLM.ipynb
@@ -82,6 +82,50 @@
     "display(result_df)"
    ]
   },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Apply Chat Template"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from pyspark.sql.functions import udf\n",
+    "from pyspark.sql.types import ArrayType, MapType, StringType\n",
+    "\n",
+    "reviews = [\n",
+    "    (1, \"I like SynapseML\"),\n",
+    "    (2, \"Contoso is awful\"),\n",
+    "]\n",
+    "reviews_df = spark.createDataFrame(reviews, [\"row_index\", \"content\"])\n",
+    "\n",
+    "PROMPT_1 = f\"\"\"You are an AI assistant that identifies the sentiment of a given text. Respond with only the single word “positive” or “negative.”\n",
+    "        \"\"\"\n",
+    "\n",
+    "\n",
+    "@udf\n",
+    "def make_template(s: str):\n",
+    "    return [{\"role\": \"system\", \"content\": PROMPT_1}, {\"role\": \"user\", \"content\": s}]\n",
+    "\n",
+    "\n",
+    "reviews_df = reviews_df.withColumn(\"messages\", make_template(\"content\"))\n",
+    "\n",
+    "phi3_transformer = (\n",
+    "    HuggingFaceCausalLM()\n",
+    "    .setModelName(\"microsoft/Phi-3-mini-4k-instruct\")\n",
+    "    .setInputCol(\"messages\")\n",
+    "    .setOutputCol(\"result\")\n",
+    "    .setModelParam(max_new_tokens=10)\n",
+    ")\n",
+    "result_df = phi3_transformer.transform(reviews_df).collect()\n",
+    "display(result_df)"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},
diff --git a/docs/Explore Algorithms/Deep Learning/Quickstart - Fine-tune a Text Classifier.ipynb b/docs/Explore Algorithms/Deep Learning/Quickstart - Fine-tune a Text Classifier.ipynb
@@ -16,24 +16,24 @@
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "### Environment Setup on databricks"
-   ],
    "metadata": {
     "collapsed": false
-   }
+   },
+   "source": [
+    "### Environment Setup on databricks"
+   ]
   },
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false
+   },
    "outputs": [],
    "source": [
     "# install cloudpickle 2.0.0 to add synapse module for usage of horovod\n",
     "%pip install cloudpickle==2.0.0 --force-reinstall --no-deps"
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
diff --git a/docs/Explore Algorithms/Deep Learning/Quickstart - Fine-tune a Vision Classifier.ipynb b/docs/Explore Algorithms/Deep Learning/Quickstart - Fine-tune a Vision Classifier.ipynb
@@ -70,6 +70,9 @@
   {
    "cell_type": "code",
    "execution_count": null,
+   "metadata": {
+    "collapsed": false
+   },
    "outputs": [],
    "source": [
     "folder_path = \"/tmp/flowers_prepped\"\n",
@@ -81,10 +84,7 @@
     "    with zipfile.ZipFile(zip_path, \"r\") as zip_ref:\n",
     "        zip_ref.extractall(\"/dbfs/tmp\")\n",
     "    os.remove(zip_path)"
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
diff --git a/docs/Explore Algorithms/Deep Learning/Quickstart - ONNX Model Inference.ipynb b/docs/Explore Algorithms/Deep Learning/Quickstart - ONNX Model Inference.ipynb
@@ -13,7 +13,8 @@
     "This example uses the following Python packages and versions:\n",
     "\n",
     "- `onnxmltools==1.7.0`\n",
-    "- `lightgbm==3.2.1`\n"
+    "- `lightgbm==3.2.1`\n",
+    "- `onnx==1.17.0`"
    ]
   },
   {
@@ -35,7 +36,7 @@
    },
    "outputs": [],
    "source": [
-    "%pip install lightgbm onnxmltools==1.7.0"
+    "%pip install --no-cache-dir lightgbm onnxmltools==1.7.0 onnx==1.17.0"
    ]
   },
   {

Original file line number	Diff line number	Diff line change
`@@ -13,7 +13,8 @@`
`13`	`13`	`"This example uses the following Python packages and versions:\n",`
`14`	`14`	`"\n",`
`15`	`15`	"- `onnxmltools==1.7.0`\n",
`16`		- "- `lightgbm==3.2.1`\n"
	`16`	+ "- `lightgbm==3.2.1`\n",
	`17`	+ "- `onnx==1.17.0`"
`17`	`18`	`]`
`18`	`19`	`},`
`19`	`20`	`{`
`@@ -35,7 +36,7 @@`
`35`	`36`	`},`
`36`	`37`	`"outputs": [],`
`37`	`38`	`"source": [`
`38`		`- "%pip install lightgbm onnxmltools==1.7.0"`
	`39`	`+ "%pip install --no-cache-dir lightgbm onnxmltools==1.7.0 onnx==1.17.0"`
`39`	`40`	`]`
`40`	`41`	`},`
`41`	`42`	`{`