File tree 3 files changed +16
-1
lines changed
3 files changed +16
-1
lines changed Original file line number Diff line number Diff line change 16
16
17
17
jobs :
18
18
examples-cpu :
19
- name : Test exmaples CPU [${{ matrix.group }}/4 ]
19
+ name : Weight compression [${{ matrix.group }}/2 ]
20
20
runs-on : ubuntu-22.04-16-cores
21
21
strategy :
22
22
fail-fast : false
58
58
${{ github.event.inputs.pytest_args || '' }}
59
59
env :
60
60
TQDM_DISABLE : 1
61
+ HOME_HF: "/home/runner/hf_home"
61
62
- name : Upload artifact
62
63
uses : actions/upload-artifact@v4
63
64
if : ${{ !cancelled() }}
Original file line number Diff line number Diff line change 1
1
{
2
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_awq_backup_mode_none_backend_OV]": 269.111,
3
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_data_aware_awq_scale_estimation_backend_OV]": 421.082,
4
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_data_aware_awq_scale_estimation_stateful_backend_OV]": 374.507,
5
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_data_aware_awq_stateful_backend_OV]": 243.878,
6
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_data_aware_backend_OV]": 190.344,
7
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_data_aware_gptq_backend_OV]": 1261.154,
8
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_data_aware_lora_stateful_backend_OV]": 483.905,
9
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_data_free_backend_OV]": 196.905,
10
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_int8_data_free_backend_TORCH]": 154.724,
11
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_NF4_scale_estimation_stateful_per_channel_backend_OV]": 256.375,
12
+ "tests/post_training/test_quantize_conformance.py::test_weight_compression[tinyllama_scale_estimation_per_channel_backend_OV]": 258.622,
2
13
}
Original file line number Diff line number Diff line change 9
9
# See the License for the specific language governing permissions and
10
10
# limitations under the License.
11
11
12
+ import os
12
13
import re
13
14
import time
14
15
import traceback
30
31
from tests.post_training.pipelines.base import BaseTestPipeline
31
32
from tests.post_training.pipelines.base import RunInfo
32
33
34
+ os.environ["ONEDNN_MAX_CPU_ISA"] = "AVX2"
35
+
33
36
DATA_ROOT = Path(__file__).parent / "data"
34
37
35
38
You can’t perform that action at this time.
0 commit comments