Julien Simon committed
Commit 3fdf87c · 1 Parent(s): 75e81c7
Files changed (3)
  1. .pre-commit-config.yaml +77 -0
  2. .pylintrc +2 -0
  3. results.py +29 -6
.pre-commit-config.yaml ADDED
@@ -0,0 +1,77 @@
+ repos:
+   - repo: https://github.com/pre-commit/pre-commit-hooks
+     rev: v4.6.0
+     hooks:
+       - id: trailing-whitespace
+       - id: end-of-file-fixer
+       - id: check-added-large-files
+
+   - repo: https://github.com/psf/black
+     rev: 24.8.0
+     hooks:
+       - id: black
+         entry: bash -c 'black "$@"; git add -u' --
+
+   - repo: https://github.com/pycqa/isort
+     rev: 5.13.2
+     hooks:
+       - id: isort
+         args: ["--profile", "black"]
+         entry: bash -c 'isort "$@"; git add -u' --
+
+   - repo: https://github.com/PyCQA/flake8
+     rev: 7.1.1
+     hooks:
+       - id: flake8
+         args: [--max-line-length=120, "--extend-ignore=E501,E402"]
+
+   - repo: https://github.com/kynan/nbstripout
+     rev: 0.7.1
+     hooks:
+       - id: nbstripout
+
+   - repo: https://github.com/nbQA-dev/nbQA
+     rev: 1.8.7
+     hooks:
+       - id: nbqa-black
+         additional_dependencies: [black==23.3.0]
+         entry: bash -c 'nbqa-black "$@"; git add -u' --
+       - id: nbqa-isort
+         additional_dependencies: [isort==5.12.0]
+         entry: bash -c 'nbqa-isort "$@"; git add -u' --
+       - id: nbqa-flake8
+         additional_dependencies: [flake8==6.0.0]
+         args: [--max-line-length=120, "--extend-ignore=E501,E402,E231"]
+
+   - repo: https://github.com/mwouts/jupytext
+     rev: v1.16.4b
+     hooks:
+       - id: jupytext
+         args: [--sync, --pipe, black]
+         additional_dependencies:
+           - black==23.3.0
+
+   - repo: https://github.com/aws-cloudformation/cfn-lint
+     rev: v1.11.0 # Use the latest version available
+     hooks:
+       - id: cfn-lint
+         files: cloudformation/.*\.(json|yml|yaml)$
+
+   - repo: https://github.com/asottile/pyupgrade
+     rev: v3.17.0
+     hooks:
+       - id: pyupgrade
+         args: [--py310-plus]
+         entry: bash -c 'pyupgrade "$@"; git add -u' --
+
+   - repo: https://github.com/pre-commit/mirrors-mypy
+     rev: v1.11.2
+     hooks:
+       - id: mypy
+         entry: bash -c 'mypy "$@"; git add -u' --
+
+   - repo: https://github.com/PyCQA/pylint
+     rev: v3.2.6
+     hooks:
+       - id: pylint
+         args: [--rcfile=.pylintrc]
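For context, hooks declared in a .pre-commit-config.yaml like the one above are normally enabled through the standard pre-commit CLI; a minimal usage sketch (not part of this commit):

    pip install pre-commit        # install the framework
    pre-commit install            # register the git pre-commit hook in the local clone
    pre-commit run --all-files    # run every configured hook once across the repository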
.pylintrc ADDED
@@ -0,0 +1,2 @@
+ [MESSAGES CONTROL]
+ disable=C0301,E0401,R0914
results.py CHANGED
@@ -1,3 +1,5 @@
+ """Module containing model configuration results for various AI models and hardware setups."""
+
  results = {
      "models": [
          {
@@ -27,7 +29,7 @@ results = {
                      "status": "OK",
                      "tokensPerSecond": "38",
                      "notes": "",
-                 }
+                 },
              ],
          },
          {
@@ -57,7 +59,7 @@ results = {
                      "status": "OK",
                      "tokensPerSecond": "38",
                      "notes": "",
-                 }
+                 },
              ],
          },
          {
@@ -334,7 +336,7 @@ results = {
                      "quantization": "none",
                      "container": "SGLang 0.2.13",
                      "status": "OK",
-                     "tokensPerSecond": "45"
+                     "tokensPerSecond": "45",
                  },
                  {
                      "region": "AWS",
@@ -345,7 +347,7 @@ results = {
                      "quantization": "none",
                      "container": "vLLM 0.5.5",
                      "status": "OK",
-                     "tokensPerSecond": "43.4"
+                     "tokensPerSecond": "43.4",
                  },
                  {
                      "region": "AWS",
@@ -476,8 +478,7 @@ results = {
                  },
              ],
          },
-         {"name": "Arcee-Spark",
-             "modelType": "Qwen2 7B"},
+         {"name": "Arcee-Spark", "modelType": "Qwen2 7B"},
          {
              "name": "Arcee-Lite",
              "modelType": "Qwen2 1.5B distilled from phi-3-medium 14B",
@@ -577,6 +578,28 @@ results = {
                      "status": "OK",
                      "tokensPerSecond": "160",
                  },
+                 {
+                     "region": "us-west-2",
+                     "instanceType": "g6e.2xlarge",
+                     "cloud": "AWS",
+                     "gpu": "1xNVIDIA L40S",
+                     "gpuRAM": "48 GB",
+                     "quantization": "none",
+                     "container": "vLLM 0.5.5",
+                     "status": "OK",
+                     "tokensPerSecond": "146",
+                 },
+                 {
+                     "region": "us-west-2",
+                     "instanceType": "g6e.2xlarge",
+                     "cloud": "AWS",
+                     "gpu": "1xNVIDIA L40S",
+                     "gpuRAM": "48 GB",
+                     "quantization": "none",
+                     "container": "SGLang 0.2.13",
+                     "status": "OK",
+                     "tokensPerSecond": "167",
+                 },
              ],
          },
          {