Address CI and review comments

microsoft · Oct 21, 2024 · c48ff4c
1 parent bdd1938
commit c48ff4c
Show file tree

Hide file tree

Showing 10 changed files with 14 additions and 14 deletions.
diff --git a/src/csharp/Adapters.cs b/src/csharp/Adapters.cs
@@ -1,4 +1,7 @@
-using Microsoft.ML.OnnxRuntimeGenAI;
+// Copyright (c) Microsoft Corporation. All rights reserved.
+// Licensed under the MIT License.
+
+using Microsoft.ML.OnnxRuntimeGenAI;
 using System;
 using System.Runtime.InteropServices;
 

diff --git a/src/csharp/Exceptions.cs b/src/csharp/Exceptions.cs
@@ -2,7 +2,6 @@
 // Licensed under the MIT License.
 
 using System;
-using System.Collections.Generic;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI
 {

diff --git a/src/csharp/MultiModalProcessor.cs b/src/csharp/MultiModalProcessor.cs
@@ -2,7 +2,6 @@
 // Licensed under the MIT License.
 
 using System;
-using System.Runtime.InteropServices;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI
 {

diff --git a/src/csharp/Result.cs b/src/csharp/Result.cs
@@ -3,7 +3,6 @@
 
 using System;
 using System.Runtime.CompilerServices;
-using System.Runtime.InteropServices;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI
 {

diff --git a/src/csharp/Sequences.cs b/src/csharp/Sequences.cs
@@ -2,7 +2,6 @@
 // Licensed under the MIT License.
 
 using System;
-using System.Runtime.InteropServices;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI
 {

diff --git a/src/csharp/Tensor.cs b/src/csharp/Tensor.cs
@@ -3,7 +3,6 @@
 
 using System;
 using System.Diagnostics;
-using System.Runtime.InteropServices;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI
 {

diff --git a/src/csharp/Tokenizer.cs b/src/csharp/Tokenizer.cs
@@ -2,8 +2,6 @@
 // Licensed under the MIT License.
 
 using System;
-using System.Runtime.InteropServices;
-using System.Text;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI
 {

diff --git a/src/csharp/TokenizerStream.cs b/src/csharp/TokenizerStream.cs
@@ -2,7 +2,6 @@
 // Licensed under the MIT License.
 
 using System;
-using System.Runtime.InteropServices;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI
 {

diff --git a/src/csharp/Utils.cs b/src/csharp/Utils.cs
@@ -2,7 +2,6 @@
 // Licensed under the MIT License.
 
 using System;
-using System.Runtime.InteropServices;
 using System.Text;
 
 namespace Microsoft.ML.OnnxRuntimeGenAI

diff --git a/test/python/test_onnxruntime_genai_api.py b/test/python/test_onnxruntime_genai_api.py
@@ -434,14 +434,20 @@ def _prepare_adapter_model(test_data_path):
         model.graph.input.extend([adapter_a, adapter_b])
 
        # tensor proto for default lora parameter A
-        adapter_weight_a = np.zeros([vocab_size], dtype=np.float32)
+        adapter_weight_a = np.zeros([vocab_size], dtype=(np.float32 if device == "cpu" else np.float16))
         adapter_weight_a_tensor = onnx.helper.make_tensor(
-            "adapter_a", onnx.TensorProto.FLOAT, [vocab_size], adapter_weight_a.flatten()
+            "adapter_a", 
+            onnx.TensorProto.FLOAT if device == "cpu" else onnx.TensorProto.FLOAT16,
+            [vocab_size],
+            adapter_weight_a.flatten()
         )
 
-        adapter_weight_b = np.zeros([vocab_size], dtype=np.float32)
+        adapter_weight_b = np.zeros([vocab_size], dtype=(np.float32 if device == "cpu" else np.float16))
         adapter_weight_b_tensor = onnx.helper.make_tensor(
-            "adapter_b", onnx.TensorProto.FLOAT, [vocab_size], adapter_weight_b.flatten()
+            "adapter_b",
+            onnx.TensorProto.FLOAT if device == "cpu" else onnx.TensorProto.FLOAT16,
+            [vocab_size],
+            adapter_weight_b.flatten()
         )
 
         model.graph.initializer.extend([adapter_weight_a_tensor, adapter_weight_b_tensor])