louiscklaw
2025-01-31 22:10:02 +08:00
parent 97df42e0d5
commit 2627562070
2852 changed files with 748727 additions and 0 deletions


@@ -0,0 +1,9 @@
"""Tests for the CpuInfo utility."""
from neural_compressor.utils.utility import CpuInfo


class TestCPUInfo:
    def test_get_cpu_info(self):
        cpu_info = CpuInfo()
        assert cpu_info.cores >= 1
        assert cpu_info.sockets >= 1
        assert cpu_info.cores_per_socket >= 1
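
For reference, a minimal usage sketch of CpuInfo outside the test harness, assuming only the three attributes the test above exercises (cores, sockets, cores_per_socket):

# Sketch: query host CPU topology via the utility under test.
from neural_compressor.utils.utility import CpuInfo

cpu_info = CpuInfo()
print(
    f"{cpu_info.sockets} socket(s), "
    f"{cpu_info.cores_per_socket} core(s) per socket, "
    f"{cpu_info.cores} core(s) total"
)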


@@ -0,0 +1,50 @@
"""Tests for downloading int8 model from huggingface model hub."""
import shutil
import unittest
import torch
import transformers
from neural_compressor.model import Model
from neural_compressor.utils.load_huggingface import save_for_huggingface_upstream
class TestQuantization(unittest.TestCase):
@classmethod
def tearDownClass(self):
shutil.rmtree("./saved_results", ignore_errors=True)
def test_int8_huggingface_model(self):
from neural_compressor.utils.load_huggingface import OptimizedModel
model_name_or_path = "Intel/distilbert-base-uncased-finetuned-sst-2-english-int8-static"
tokenizer = transformers.AutoTokenizer.from_pretrained(model_name_or_path)
model = OptimizedModel.from_pretrained(
model_name_or_path,
from_tf=bool(".ckpt" in model_name_or_path),
config=None,
cache_dir=None,
revision=None,
use_auth_token=None,
)
stat = model.state_dict()
self.assertTrue(stat["classifier.module._packed_params.dtype"] == torch.qint8)
from huggingface_hub import hf_hub_download
resolved_weights_file = hf_hub_download(
repo_id=model_name_or_path,
filename="pytorch_model.bin",
)
q_config = torch.load(resolved_weights_file)["best_configure"]
inc_model = Model(model)
inc_model.q_config = q_config
save_for_huggingface_upstream(inc_model, tokenizer, "saved_results")
load_model = OptimizedModel.from_pretrained("saved_results")
if __name__ == "__main__":
unittest.main()
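
A hedged follow-up sketch, not part of the diff: once save_for_huggingface_upstream has written "saved_results", the directory should also be loadable with the standard transformers tokenizer API, so a smoke inference might look like this (the example sentence and label reading are assumptions):

# Sketch: reload the re-saved int8 model and run one classification.
import torch
import transformers
from neural_compressor.utils.load_huggingface import OptimizedModel

tokenizer = transformers.AutoTokenizer.from_pretrained("saved_results")
model = OptimizedModel.from_pretrained("saved_results")
model.eval()

inputs = tokenizer("A surprisingly delightful film.", return_tensors="pt")
with torch.no_grad():
    logits = model(**inputs).logits  # SST-2 head: [negative, positive]
print(logits.argmax(dim=-1).item())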


@@ -0,0 +1,124 @@
"""Tests for collecting layer histogram."""
import unittest
from collections import OrderedDict
import numpy as np
import torch
import torch.nn as nn
from neural_compressor.utils import logger
from neural_compressor.utils.collect_layer_histogram import LayerHistogramCollector
class InvertedResidual(nn.Module):
def __init__(self, inp, oup, stride, expand_ratio):
super().__init__()
self.stride = stride
assert stride in [1, 2]
hidden_dim = int(inp * expand_ratio)
self.use_res_connect = self.stride == 1 and inp == oup
if expand_ratio == 1:
self.conv = nn.Sequential(
nn.Conv2d(hidden_dim, hidden_dim, 3, stride, 1, groups=hidden_dim, bias=False),
nn.BatchNorm2d(hidden_dim),
nn.ReLU6(inplace=True),
nn.Conv2d(hidden_dim, oup, 1, 1, 0, bias=False),
nn.BatchNorm2d(oup),
)
else:
self.conv = nn.Sequential(
nn.Conv2d(inp, hidden_dim, 1, 1, 0, bias=False),
nn.BatchNorm2d(hidden_dim),
nn.ReLU6(inplace=True),
nn.Conv2d(hidden_dim, hidden_dim, 3, stride, 1, groups=hidden_dim, bias=False),
nn.BatchNorm2d(hidden_dim),
nn.ReLU6(inplace=True),
nn.Conv2d(hidden_dim, oup, 1, 1, 0, bias=False),
nn.BatchNorm2d(oup),
)
def forward(self, x):
if self.use_res_connect:
return x + self.conv(x)
else:
return self.conv(x)
class BuildFakeModel(nn.Module):
def conv_1x1_bn(self, inp, oup):
return nn.Sequential(nn.Conv2d(inp, oup, 1, 1, 0, bias=False), nn.BatchNorm2d(oup), nn.ReLU6(inplace=True))
def conv_bn(self, inp, oup, stride):
return nn.Sequential(nn.Conv2d(inp, oup, 3, stride, 1, bias=False), nn.BatchNorm2d(oup), nn.ReLU6(inplace=True))
def make_divisible(self, x, divisor=8):
return int(np.ceil(x * 1.0 / divisor) * divisor)
def __init__(self, n_class=1000, input_size=224, width_mult=1.0):
super().__init__()
block = InvertedResidual
input_channel = 32
last_channel = 1280
interverted_residual = [
[1, 16, 1, 1],
[6, 24, 2, 2],
[6, 32, 3, 2],
[6, 64, 4, 2],
[6, 96, 3, 1],
[6, 160, 3, 2],
[6, 320, 1, 1],
]
assert input_size % 32 == 0
self.last_channel = self.make_divisible(last_channel * width_mult) if width_mult > 1.0 else last_channel
self.features = [self.conv_bn(3, input_channel, 2)]
for t, c, n, s in interverted_residual:
output_channel = self.make_divisible(c * width_mult) if t > 1 else c
for i in range(n):
if i == 0:
self.features.append(block(input_channel, output_channel, s, expand_ratio=t))
else:
self.features.append(block(input_channel, output_channel, 1, expand_ratio=t))
input_channel = output_channel
self.features.append(self.conv_1x1_bn(input_channel, self.last_channel))
self.features = nn.Sequential(*self.features)
self.classifier = nn.Linear(self.last_channel, n_class)
def forward(self, x):
x = self.features(x)
x = torch.mean(x.view(x.size(0), x.size(1), -1), -1)
x = self.classifier(x)
return x
class CollectLayerHistogram(unittest.TestCase):
def setUp(self):
model = BuildFakeModel(width_mult=1)
layer_tensor, include_layer = OrderedDict(), OrderedDict()
i = 0
for key, value in model.state_dict().items():
if not value.ndim:
value = np.expand_dims(value, axis=0)
if i > 200:
pass
else:
include_layer[key] = np.array(value, dtype=np.float32)
layer_tensor[key] = np.array(value, dtype=np.float32)
i += 1
self.layer_histogram_collector = LayerHistogramCollector(
num_bins=8001, layer_tensor=layer_tensor, include_layer=include_layer, logger=logger
)
def test_layer_histogram(self):
self.layer_histogram_collector.collect()
self.assertEqual(
self.layer_histogram_collector.layer_tensor.keys() & self.layer_histogram_collector.include_layer.keys(),
self.layer_histogram_collector.hist_dict.keys(),
)
if __name__ == "__main__":
unittest.main()
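
As an aside, the collector's constructor can be exercised in isolation; a small sketch using the same API shown above (the single-layer dict and tensor shape are made up for illustration):

# Sketch: histogram a single fake weight tensor.
from collections import OrderedDict

import numpy as np

from neural_compressor.utils import logger
from neural_compressor.utils.collect_layer_histogram import LayerHistogramCollector

tensors = OrderedDict({"layer0.weight": np.random.randn(64, 32).astype(np.float32)})
collector = LayerHistogramCollector(
    num_bins=8001, layer_tensor=tensors, include_layer=tensors, logger=logger
)
collector.collect()
print(list(collector.hist_dict.keys()))  # expected: ['layer0.weight']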


@@ -0,0 +1,35 @@
"""Tests for logging utilities."""
import unittest
from neural_compressor.utils import logger
class TestLogger(unittest.TestCase):
def test_logger(self):
logger.log(0, "call logger log function.")
logger.log(1, {"msg": "call logger log function."})
logger.debug("call logger debug function.")
logger.debug({"msg": "call logger debug function."})
logger.error("call logger error function.")
logger.error({"msg": "call logger error function."})
logger.fatal("call logger fatal function")
logger.fatal({"msg": "call logger fatal function"})
logger.info("call logger info function")
logger.info({"msg": "call logger info function."})
logger.warn("call logger warn function")
logger.warn({"msg": "call logger warn function"})
logger.warning("call logger warning function")
logger.warning({"msg": "call logger warning function"})
logger.warning(["call logger warning function", "done"])
logger.warning(("call logger warning function", "done"))
logger.warning({"msg": {("bert", "embedding"): {"weight": {"dtype": ["unint8", "int8"]}}}})
logger.warning({"msg": {("bert", "embedding"): {"op": ("a", "b")}}})
# the following log will not be prettified
logger.warning([{"msg": "call logger warning function"}, {"msg2": "done"}])
logger.warning(({"msg": "call logger warning function"}, {"msg2": "done"}))
logger.warning(({"msg": [{"sub_msg": "call logger"}, {"sub_msg2": "call warning function"}]}, {"msg2": "done"}))
if __name__ == "__main__":
unittest.main()
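
One takeaway worth illustrating, inferred from the comments in the test rather than verified against the logger implementation: plain dict payloads are expected to be pretty-printed, while lists or tuples whose elements are dicts fall back to ordinary repr logging.

# Sketch: the two payload shapes the test distinguishes.
from neural_compressor.utils import logger

logger.info({"stage": "tuning", "trial": 1})      # expected to be prettified
logger.info([{"stage": "tuning"}, {"trial": 1}])  # expected to be logged as-is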