netrans/docs/html/_modules/quantize_hb.html

200 lines
15 KiB
HTML

<!DOCTYPE html>
<html lang="zh" data-content_root="../">
<head>
<meta charset="utf-8" />
<meta name="viewport" content="width=device-width, initial-scale=1.0" />
<title>quantize_hb &#8212; netrans 0.1 文档</title>
<link rel="stylesheet" type="text/css" href="../_static/pygments.css?v=5ecbeea2" />
<link rel="stylesheet" type="text/css" href="../_static/basic.css?v=b08954a9" />
<link rel="stylesheet" type="text/css" href="../_static/alabaster.css?v=27fed22d" />
<script src="../_static/documentation_options.js?v=52efc512"></script>
<script src="../_static/doctools.js?v=9bcbadda"></script>
<script src="../_static/sphinx_highlight.js?v=dc90522c"></script>
<link rel="index" title="索引" href="../genindex.html" />
<link rel="search" title="搜索" href="../search.html" />
<link rel="stylesheet" href="../_static/custom.css" type="text/css" />
</head><body>
<div class="document">
<div class="documentwrapper">
<div class="bodywrapper">
<div class="body" role="main">
<h1>quantize_hb 源代码</h1><div class="highlight"><pre>
<span></span><span class="kn">import</span><span class="w"> </span><span class="nn">os</span>
<span class="kn">import</span><span class="w"> </span><span class="nn">sys</span>
<span class="kn">from</span><span class="w"> </span><span class="nn">utils</span><span class="w"> </span><span class="kn">import</span> <span class="n">check_path</span><span class="p">,</span> <span class="n">AttributeCopier</span><span class="p">,</span> <span class="n">create_cls</span>
<div class="viewcode-block" id="Quantize">
<a class="viewcode-back" href="../quantize_hb.html#quantize_hb.Quantize">[文档]</a>
<span class="k">class</span><span class="w"> </span><span class="nc">Quantize</span><span class="p">(</span><span class="n">AttributeCopier</span><span class="p">):</span>
<span class="k">def</span><span class="w"> </span><span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">source_obj</span><span class="p">)</span> <span class="o">-&gt;</span> <span class="kc">None</span><span class="p">:</span>
<span class="nb">super</span><span class="p">()</span><span class="o">.</span><span class="fm">__init__</span><span class="p">(</span><span class="n">source_obj</span><span class="p">)</span>
<span class="nd">@check_path</span>
<span class="k">def</span><span class="w"> </span><span class="nf">quantize_network</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
<span class="n">netrans</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">netrans</span>
<span class="n">quantized_type</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">quantize_type</span>
<span class="n">name</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">model_name</span>
<span class="c1"># check_env(name)</span>
<span class="c1"># print(os.getcwd())</span>
<span class="n">netrans</span> <span class="o">+=</span> <span class="s2">&quot; quantize&quot;</span>
<span class="c1"># 根据量化类型设置量化参数</span>
<span class="k">if</span> <span class="n">quantized_type</span> <span class="o">==</span> <span class="s1">&#39;float&#39;</span><span class="p">:</span>
<span class="nb">print</span><span class="p">(</span><span class="s2">&quot;=========== do not need quantized===========&quot;</span><span class="p">)</span>
<span class="k">return</span>
<span class="k">elif</span> <span class="n">quantized_type</span> <span class="o">==</span> <span class="s1">&#39;uint8&#39;</span><span class="p">:</span>
<span class="n">quantization_type</span> <span class="o">=</span> <span class="s2">&quot;asymmetric_affine&quot;</span>
<span class="k">elif</span> <span class="n">quantized_type</span> <span class="o">==</span> <span class="s1">&#39;int8&#39;</span><span class="p">:</span>
<span class="n">quantization_type</span> <span class="o">=</span> <span class="s2">&quot;dynamic_fixed_point-8&quot;</span>
<span class="k">elif</span> <span class="n">quantized_type</span> <span class="o">==</span> <span class="s1">&#39;int16&#39;</span><span class="p">:</span>
<span class="n">quantization_type</span> <span class="o">=</span> <span class="s2">&quot;dynamic_fixed_point-16&quot;</span>
<span class="k">else</span><span class="p">:</span>
<span class="nb">print</span><span class="p">(</span><span class="s2">&quot;=========== wrong quantization_type ! ( uint8 / int8 / int16 )===========&quot;</span><span class="p">)</span>
<span class="k">return</span>
<span class="c1"># 输出量化信息</span>
<span class="nb">print</span><span class="p">(</span><span class="s2">&quot; =======================================================================&quot;</span><span class="p">)</span>
<span class="nb">print</span><span class="p">(</span><span class="sa">f</span><span class="s2">&quot; ==== Start Quantizing </span><span class="si">{</span><span class="n">name</span><span class="si">}</span><span class="s2"> model with type of </span><span class="si">{</span><span class="n">quantization_type</span><span class="si">}</span><span class="s2"> ===&quot;</span><span class="p">)</span>
<span class="nb">print</span><span class="p">(</span><span class="s2">&quot; =======================================================================&quot;</span><span class="p">)</span>
<span class="c1"># 移除已存在的量化文件</span>
<span class="n">quantize_file</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">&quot;</span><span class="si">{</span><span class="n">name</span><span class="si">}</span><span class="s2">_</span><span class="si">{</span><span class="n">quantization_type</span><span class="si">}</span><span class="s2">.quantize&quot;</span>
<span class="n">current_directory</span> <span class="o">=</span> <span class="n">os</span><span class="o">.</span><span class="n">getcwd</span><span class="p">()</span>
<span class="n">txt_path</span> <span class="o">=</span> <span class="n">current_directory</span><span class="o">+</span><span class="s2">&quot;/dataset.txt&quot;</span>
<span class="k">with</span> <span class="nb">open</span><span class="p">(</span><span class="n">txt_path</span><span class="p">,</span> <span class="s1">&#39;r&#39;</span><span class="p">,</span> <span class="n">encoding</span><span class="o">=</span><span class="s1">&#39;utf-8&#39;</span><span class="p">)</span> <span class="k">as</span> <span class="n">file</span><span class="p">:</span>
<span class="n">num_lines</span> <span class="o">=</span> <span class="nb">len</span><span class="p">(</span><span class="n">file</span><span class="o">.</span><span class="n">readlines</span><span class="p">())</span>
<span class="c1"># 构建并执行量化命令</span>
<span class="n">cmd</span> <span class="o">=</span> <span class="sa">f</span><span class="s2">&quot;</span><span class="si">{</span><span class="n">netrans</span><span class="si">}</span><span class="s2"> </span><span class="se">\</span>
<span class="s2"> --qtype </span><span class="si">{</span><span class="n">quantized_type</span><span class="si">}</span><span class="s2"> </span><span class="se">\</span>
<span class="s2"> --hybrid </span><span class="se">\</span>
<span class="s2"> --quantizer </span><span class="si">{</span><span class="n">quantization_type</span><span class="o">.</span><span class="n">split</span><span class="p">(</span><span class="s1">&#39;-&#39;</span><span class="p">)[</span><span class="mi">0</span><span class="p">]</span><span class="si">}</span><span class="s2"> </span><span class="se">\</span>
<span class="s2"> --model-quantize </span><span class="si">{</span><span class="n">quantize_file</span><span class="si">}</span><span class="s2"> </span><span class="se">\</span>
<span class="s2"> --model </span><span class="si">{</span><span class="n">name</span><span class="si">}</span><span class="s2">.json </span><span class="se">\</span>
<span class="s2"> --model-data </span><span class="si">{</span><span class="n">name</span><span class="si">}</span><span class="s2">.data </span><span class="se">\</span>
<span class="s2"> --with-input-meta </span><span class="si">{</span><span class="n">name</span><span class="si">}</span><span class="s2">_inputmeta.yml </span><span class="se">\</span>
<span class="s2"> --device CPU </span><span class="se">\</span>
<span class="s2"> --algorithm kl_divergence </span><span class="se">\</span>
<span class="s2"> --divergence-nbins 2048 </span><span class="se">\</span>
<span class="s2"> --iterations </span><span class="si">{</span><span class="n">num_lines</span><span class="si">}</span><span class="s2">&quot;</span>
<span class="n">os</span><span class="o">.</span><span class="n">system</span><span class="p">(</span><span class="n">cmd</span><span class="p">)</span>
<span class="c1"># 检查量化结果</span>
<span class="k">if</span> <span class="n">os</span><span class="o">.</span><span class="n">path</span><span class="o">.</span><span class="n">exists</span><span class="p">(</span><span class="n">quantize_file</span><span class="p">):</span>
<span class="nb">print</span><span class="p">(</span><span class="s2">&quot;</span><span class="se">\033</span><span class="s2">[31m QUANTIZED SUCCESS </span><span class="se">\033</span><span class="s2">[0m&quot;</span><span class="p">)</span>
<span class="k">else</span><span class="p">:</span>
<span class="nb">print</span><span class="p">(</span><span class="s2">&quot;</span><span class="se">\033</span><span class="s2">[31m ERROR ! </span><span class="se">\033</span><span class="s2">[0m&quot;</span><span class="p">)</span></div>
<div class="viewcode-block" id="main">
<a class="viewcode-back" href="../quantize_hb.html#quantize_hb.main">[文档]</a>
<span class="k">def</span><span class="w"> </span><span class="nf">main</span><span class="p">():</span>
<span class="c1"># 检查命令行参数数量</span>
<span class="k">if</span> <span class="nb">len</span><span class="p">(</span><span class="n">sys</span><span class="o">.</span><span class="n">argv</span><span class="p">)</span> <span class="o">&lt;</span> <span class="mi">3</span><span class="p">:</span>
<span class="nb">print</span><span class="p">(</span><span class="s2">&quot;Input a network name and quantized type ( uint8 / int8 / int16 )&quot;</span><span class="p">)</span>
<span class="n">sys</span><span class="o">.</span><span class="n">exit</span><span class="p">(</span><span class="o">-</span><span class="mi">1</span><span class="p">)</span>
<span class="c1"># 检查网络目录是否存在</span>
<span class="n">network_name</span> <span class="o">=</span> <span class="n">sys</span><span class="o">.</span><span class="n">argv</span><span class="p">[</span><span class="mi">1</span><span class="p">]</span>
<span class="c1"># 定义 netrans 路径</span>
<span class="c1"># netrans = os.path.join(os.environ[&#39;NETRANS_PATH&#39;], &#39;pnnacc&#39;)</span>
<span class="c1"># network_name = sys.argv[1]</span>
<span class="c1"># check_env(network_name)</span>
<span class="n">netrans_path</span> <span class="o">=</span> <span class="n">os</span><span class="o">.</span><span class="n">environ</span><span class="p">[</span><span class="s1">&#39;NETRANS_PATH&#39;</span><span class="p">]</span>
<span class="c1"># netrans = os.path.join(netrans_path, &#39;pnnacc&#39;)</span>
<span class="n">quantize_type</span> <span class="o">=</span> <span class="n">sys</span><span class="o">.</span><span class="n">argv</span><span class="p">[</span><span class="mi">2</span><span class="p">]</span>
<span class="n">cla</span> <span class="o">=</span> <span class="n">create_cls</span><span class="p">(</span><span class="n">netrans_path</span><span class="p">,</span> <span class="n">network_name</span><span class="p">,</span><span class="n">quantize_type</span><span class="p">)</span>
<span class="c1"># 调用量化函数</span>
<span class="n">run</span> <span class="o">=</span> <span class="n">Quantize</span><span class="p">(</span><span class="n">cla</span><span class="p">)</span>
<span class="n">run</span><span class="o">.</span><span class="n">quantize_network</span><span class="p">()</span></div>
<span class="k">if</span> <span class="vm">__name__</span> <span class="o">==</span> <span class="s2">&quot;__main__&quot;</span><span class="p">:</span>
<span class="n">main</span><span class="p">()</span>
</pre></div>
</div>
</div>
</div>
<div class="sphinxsidebar" role="navigation" aria-label="Main">
<div class="sphinxsidebarwrapper">
<h1 class="logo"><a href="../index.html">netrans</a></h1>
<search id="searchbox" style="display: none" role="search">
<div class="searchformwrapper">
<form class="search" action="../search.html" method="get">
<input type="text" name="q" aria-labelledby="searchlabel" autocomplete="off" autocorrect="off" autocapitalize="off" spellcheck="false" placeholder="Search"/>
<input type="submit" value="提交" />
</form>
</div>
</search>
<script>document.getElementById('searchbox').style.display = "block"</script><h3>导航</h3>
<p class="caption" role="heading"><span class="caption-text">Contents:</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../quick_start_guide.html">快速入门</a></li>
<li class="toctree-l1"><a class="reference internal" href="../netrans_cli.html">netrans_cli 使用</a></li>
<li class="toctree-l1"><a class="reference internal" href="../netrans_py.html">netrans_py 使用</a></li>
<li class="toctree-l1"><a class="reference internal" href="../appendix.html">附录</a></li>
</ul>
<div class="relations">
<h3>Related Topics</h3>
<ul>
<li><a href="../index.html">Documentation overview</a><ul>
<li><a href="index.html">模块代码</a><ul>
</ul></li>
</ul></li>
</ul>
</div>
</div>
</div>
<div class="clearer"></div>
</div>
<div class="footer">
&#169;2025, ccyh.
|
Powered by <a href="https://www.sphinx-doc.org/">Sphinx 8.2.3</a>
&amp; <a href="https://alabaster.readthedocs.io">Alabaster 1.0.0</a>
</div>
</body>
</html>