English
John6666 committed on
Commit
750941c
·
verified ·
1 Parent(s): c47b141

Upload 2 files

Browse files
Files changed (2) hide show
  1. handler.py +3 -3
  2. requirements.txt +3 -3
handler.py CHANGED
@@ -15,10 +15,10 @@ import subprocess
15
  subprocess.run("pip list", shell=True)
16
 
17
  IS_NEW_GPU = False
18
- IS_COMPILE = True
19
- IS_TURBO = False
20
  IS_4BIT = True
21
- IS_AUTOQ = True
22
 
23
  # Set high precision for float32 matrix multiplications.
24
  # This setting optimizes performance on NVIDIA GPUs with Ampere architecture (e.g., A100, RTX 30 series) or newer.
 
15
  subprocess.run("pip list", shell=True)
16
 
17
  IS_NEW_GPU = False
18
+ IS_COMPILE = False
19
+ IS_TURBO = True
20
  IS_4BIT = True
21
+ IS_AUTOQ = False
22
 
23
  # Set high precision for float32 matrix multiplications.
24
  # This setting optimizes performance on NVIDIA GPUs with Ampere architecture (e.g., A100, RTX 30 series) or newer.
requirements.txt CHANGED
@@ -4,8 +4,7 @@ torchvision
4
  torchaudio
5
  huggingface_hub
6
  torchao>=0.9.0
7
- #diffusers==0.32.2
8
- git+https://github.com/huggingface/diffusers
9
  peft
10
  transformers==4.48.3
11
  numpy
@@ -13,4 +12,5 @@ scipy
13
  Pillow
14
  sentencepiece
15
  protobuf
16
- triton
 
 
4
  torchaudio
5
  huggingface_hub
6
  torchao>=0.9.0
7
+ diffusers==0.32.2
 
8
  peft
9
  transformers==4.48.3
10
  numpy
 
12
  Pillow
13
  sentencepiece
14
  protobuf
15
+ triton
16
+ gemlite