Update app.py
app.py CHANGED
@@ -20,7 +20,7 @@ class Config:
 
     hf_token: str
     hf_username: str
-    transformers_version: str = "
+    transformers_version: str = "4.47.0"  # Updated to latest version
     hf_base_url: str = "https://huggingface.co"
     transformers_base_url: str = (
         "https://github.com/xenova/transformers.js/archive/refs"
@@ -95,6 +95,12 @@ class ModelConverter:
     def convert_model(self, input_model_id: str) -> Tuple[bool, Optional[str]]:
         """Convert the model to ONNX format."""
         try:
+            # Ensure accelerate is installed for weight deduplication
+            subprocess.run(
+                [sys.executable, "-m", "pip", "install", "accelerate"],
+                check=True,
+            )
+
             result = subprocess.run(
                 [
                     sys.executable,
@@ -103,6 +109,8 @@ class ModelConverter:
                     "--quantize",
                     "--model_id",
                     input_model_id,
+                    "--atol",  # Adjust tolerance for numerical precision
+                    "1e-04",  # Increased tolerance to 1e-04
                 ],
                 cwd=self.config.repo_path,
                 capture_output=True,
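For reference, a minimal standalone sketch of what the updated convert_model flow amounts to after this change. The converter entry point is elided in the diff, so the `scripts.convert` module name and the `convert(...)` wrapper below are assumptions for illustration; the real app.py passes self.config.repo_path and does its own result handling.

import subprocess
import sys

def convert(repo_path: str, input_model_id: str) -> None:
    # Ensure accelerate is installed for weight deduplication (added in this commit)
    subprocess.run(
        [sys.executable, "-m", "pip", "install", "accelerate"],
        check=True,
    )

    # Run the transformers.js conversion script with the relaxed tolerance
    result = subprocess.run(
        [
            sys.executable,
            "-m",
            "scripts.convert",  # assumed entry point; elided in the diff above
            "--quantize",
            "--model_id",
            input_model_id,
            "--atol",  # relax the numerical-precision check during ONNX export
            "1e-04",
        ],
        cwd=repo_path,
        capture_output=True,
        text=True,
    )
    if result.returncode != 0:
        raise RuntimeError(f"Conversion failed: {result.stderr}")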