Add support for compiling the parallel quantization kernel on macOS (clang with OpenMP)
This commit is contained in:
parent
63d66b0572
commit
f6b88da8c1
|
@ -7,6 +7,7 @@ import bz2
|
||||||
import torch
|
import torch
|
||||||
import base64
|
import base64
|
||||||
import ctypes
|
import ctypes
|
||||||
|
import sys
|
||||||
from transformers.utils import logging
|
from transformers.utils import logging
|
||||||
|
|
||||||
from typing import List
|
from typing import List
|
||||||
|
@ -142,8 +143,12 @@ class CPUKernel:
|
||||||
kernel_file = source_code[:-2] + ".so"
|
kernel_file = source_code[:-2] + ".so"
|
||||||
|
|
||||||
if compile_parallel_kernel:
|
if compile_parallel_kernel:
|
||||||
compile_command = "gcc -O3 -fPIC -pthread -fopenmp -std=c99 {} -shared -o {}".format(
|
if sys.platform != 'darwin':
|
||||||
source_code, kernel_file)
|
compile_command = "gcc -O3 -fPIC -pthread -fopenmp -std=c99 {} -shared -o {}".format(
|
||||||
|
source_code, kernel_file)
|
||||||
|
else:
|
||||||
|
compile_command = "clang -O3 -fPIC -pthread -Xclang -fopenmp -lomp -std=c99 {} -shared -o {}".format(
|
||||||
|
source_code, kernel_file)
|
||||||
print("Compiling", compile_command)
|
print("Compiling", compile_command)
|
||||||
exit_state = os.system(compile_command)
|
exit_state = os.system(compile_command)
|
||||||
if not exit_state:
|
if not exit_state:
|
||||||
|
|
Loading…
Reference in New Issue