Nástroje používateľa

Nástroje správy stránok


blog:odborny:2019-06-28-unicode_normalization_tool

Rozdiely

Tu môžete vidieť rozdiely medzi vybranou verziou a aktuálnou verziou danej stránky.

Odkaz na tento prehľad zmien

Obojstranná predošlá revízia Predchádzajúca revízia
Nasledujúca revízia
Predchádzajúca revízia
Posledná revízia Obojstranná nasledujúca revízia
blog:odborny:2019-06-28-unicode_normalization_tool [2020/02/24 00:52]
Róbert Toth added word and char counting
blog:odborny:2019-06-28-unicode_normalization_tool [2022/03/03 12:22]
Róbert Toth stará verzia bola obnovená (2020/09/10 12:07)
Riadok 6: Riadok 6:
 ===== Source string ===== ===== Source string =====
  
-<php>?>+<html>
  
 <script type="text/javascript"> <script type="text/javascript">
Riadok 68: Riadok 68:
   var resultText = sourceText.normalize(requiredForm);   var resultText = sourceText.normalize(requiredForm);
   resultEl.value = resultText;   resultEl.value = resultText;
 +  
 +  // continue by doing UTF analysis
 +  utfAnalysis();
 } }
  
Riadok 92: Riadok 95:
   // count chars and words   // count chars and words
   analysisText += '<p><div>Characters: ' + sourceText.length + '</div>';   analysisText += '<p><div>Characters: ' + sourceText.length + '</div>';
-  analysisText += '<div>Words: ' + (sourceText.match(/[^\s]+/g) || new Array()).length + '</div>';+  analysisText += '<div>Words: ' + (sourceText.match(/[^\s]+/g) || new Array()).length + '</div></p>';
      
   let iterator = sourceText[Symbol.iterator]();   let iterator = sourceText[Symbol.iterator]();
Riadok 121: Riadok 124:
     var char = String.fromCodePoint(code);     var char = String.fromCodePoint(code);
     var name = (unicode[codeHex] || '[unknown]');     var name = (unicode[codeHex] || '[unknown]');
-    analysisChars += '<tr><td>'+char+'</td><td>0x'+codeHex+'</td><td>&amp;#'+code+';</td><td>'+name.escapeHtml()+'</td><td>'+positions.length+'</td><td>'+positions.join(" ")+'</td></tr>';+    analysisChars += '<tr><td>'+char+'</td><td>0x'+codeHex+'</td><td>&amp;#'+code+';</td><td>'+name.escapeHtml()+'</td><td>'+positions.length+'</td><td><div class="limitHeight">'+positions.join(" ")+'</div></td></tr>';
   }   }
      
Riadok 130: Riadok 133:
 </script> </script>
  
-<textarea id='utfSource' oninput='utfRecalculate();utfAnalysis();' style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:11px;' rows='15' cols='120'></textarea>+<textarea id='utfSource' oninput='utfRecalculate()' style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:11px;' rows='15' cols='120'></textarea>
  
 <div id='utfSourceForm'><b>Source text encoding:</b> undetermined</div> <div id='utfSourceForm'><b>Source text encoding:</b> undetermined</div>
  
-<?php</php>+</html>
  
  
 ===== Normalized text ===== ===== Normalized text =====
  
-<php>?>+<html>
  
-<dl>+<div style="float:left; width:49%;">
-  <dt><input type='radio' name='utfForm' onchange='utfRecalculate()' value='NFD'> NFD</dt> +  <dl> 
-  <dd>Canonical Decomposition</dd> +    <dt><input type="radio" name="utfForm" onchange="utfRecalculate()" value="NFD"> NFD</dt> 
-  <dt><input type='radio' name='utfForm' onchange='utfRecalculate()' value='NFC' checked='checked'> NFC</dt> +    <dd>Canonical Decomposition</dd> 
-  <dd>Canonical Decomposition, followed by Canonical Composition</br></dd> +    <dt><input type="radio" name="utfForm" onchange="utfRecalculate()" value="NFC" checked="checked"> NFC</dt> 
-  <dt><input type='radio' name='utfForm' onchange='utfRecalculate()' value='NFKD'> NFKD</dt> +    <dd>Canonical Decomposition, followed by Canonical Composition</dd> 
-  <dd>Compatibility Decomposition</dd> +  </dl> 
-  <dt><input type='radio' name='utfForm' onchange='utfRecalculate()' value='NFKC'> NFKC</dt> +</div> 
-  <dd>Compatibility Decomposition, followed by Canonical Composition</dd> +<div style="float:right; width:49%;">
-</dl>+  <dl> 
 +    <dt><input type="radio" name="utfForm" onchange="utfRecalculate()" value="NFKD"> NFKD</dt> 
 +    <dd>Compatibility Decomposition</dd> 
 +    <dt><input type="radio" name="utfForm" onchange="utfRecalculate()" value="NFKC"> NFKC</dt> 
 +    <dd>Compatibility Decomposition, followed by Canonical Composition</dd> 
 +  </dl>
 +</div>
  
-<textarea id='utfResult' style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:11px;' rows='10' cols='120'></textarea>+<textarea id='utfResult' style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:11px;' rows='10' cols='120' readonly="readonly"></textarea>
  
-<?php</php>+</html>
  
 ===== Text rundown ===== ===== Text rundown =====
  
-<php>?>+<html>
  
 <style type="text/css"> <style type="text/css">
Riadok 201: Riadok 210:
     text-align: left;     text-align: left;
     text-transform: capitalize;     text-transform: capitalize;
 +  }
 +  
 +  div.limitHeight {
 +    overflow: auto;
 +  }
 +  div.limitHeight:hover {
 +    max-height: fit-content !important;
 +  }
 +  #utfAnalysisCharacters div.limitHeight {
 +    max-height: 3.5em;
   }   }
 </style> </style>
Riadok 206: Riadok 225:
 <div id='utfAnalysisText' style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:11px;'></div> <div id='utfAnalysisText' style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:11px;'></div>
  
-<?php</php>+</html>
  
  
 ===== Analysis of Characters ===== ===== Analysis of Characters =====
  
-<php>?>+<html>
  
 <table id='utfAnalysisCharacters' class="inline" style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:10px;'></table> <table id='utfAnalysisCharacters' class="inline" style='width:100%; font-family:Consolas, "Andale Mono WT", "Andale Mono", "Bitstream Vera Sans Mono", "Nimbus Mono L", Monaco, "Courier New", monospace; font-size:10px;'></table>
  
-<?php</php>+</html>
  
  
Riadok 223: Riadok 242:
  
 ~~socialite~~ ~~socialite~~
-{{tag>tools}}+{{tag>tools Unicode UTF-8}}
  
  
Riadok 230: Riadok 249:
 ~~DISQUS~~ ~~DISQUS~~
  
-<php>?>+<html>
 <script type="text/javascript"> <script type="text/javascript">
  
Riadok 33081: Riadok 33100:
  
 </script> </script>
-<?php</php>+</html>
  
blog/odborny/2019-06-28-unicode_normalization_tool.txt · Posledná úprava: 2022/10/24 11:12 od Róbert Toth