quickgrid committed on
Commit
33ff8e6
·
verified ·
1 Parent(s): befbfc1
Files changed (1) hide show
  1. index.html +65 -10
index.html CHANGED
@@ -576,7 +576,7 @@
576
  <div class="logo">
577
  <div class="logo-hex">T</div>
578
  <span class="logo-name">TokenLens</span>
579
- <span class="logo-tag">v1.3</span>
580
  </div>
581
  <div class="header-divider"></div>
582
  <div class="header-controls">
@@ -747,21 +747,76 @@ Try special characters, code, emojis, or multi-lingual text to compare models.">
747
 
748
  <script type="module">
749
  import { AutoTokenizer, env }
750
- from 'https://cdn.jsdelivr.net/npm/@xenova/transformers@2.17.2';
751
 
752
  env.allowLocalModels = false;
753
  env.useBrowserCache = true;
754
 
755
  // ── Model Registry ─────────────────────────────────────────
756
  const MODELS = [
757
- { id:'Xenova/gpt2', name:'GPT-2', org:'OpenAI', color:'#10a37f', vocab:'50k', type:'BPE', desc:'Classic GPT-2 BPE tokenizer' },
758
- { id:'Xenova/gpt-4', name:'GPT-4', org:'OpenAI', color:'#10a37f', vocab:'100k', type:'tiktoken cl100k', desc:'Used by GPT-3.5 & GPT-4' },
759
- { id:'Xenova/llama-tokenizer', name:'LLaMA 2', org:'Meta', color:'#0466de', vocab:'32k', type:'SP-BPE', desc:'SentencePiece BPE — LLaMA / LLaMA-2' },
760
- { id:'Xenova/mistral-tokenizer-v1', name:'Mistral', org:'Mistral AI', color:'#ff7722', vocab:'32k', type:'SP-BPE', desc:'Mistral 7B v0.1 tokenizer' },
761
- { id:'Xenova/bert-base-uncased', name:'BERT', org:'Google', color:'#4285f4', vocab:'30k', type:'WordPiece', desc:'BERT-base uncased WordPiece' },
762
- { id:'Xenova/t5-base', name:'T5', org:'Google', color:'#34a853', vocab:'32k', type:'Unigram', desc:'T5 SentencePiece Unigram' },
763
- { id:'Xenova/claude-tokenizer', name:'Claude', org:'Anthropic', color:'#cc785c', vocab:'~100k', type:'BPE', desc:"Anthropic Claude's tokenizer" },
764
- { id:'Xenova/roberta-base', name:'RoBERTa', org:'Meta', color:'#1a73e8', vocab:'50k', type:'BPE', desc:'RoBERTa byte-level BPE' },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
765
  ];
766
 
767
  // ── Token Color Palettes ───────────────────────────────────
 
576
  <div class="logo">
577
  <div class="logo-hex">T</div>
578
  <span class="logo-name">TokenLens</span>
579
+ <span class="logo-tag">v1.4</span>
580
  </div>
581
  <div class="header-divider"></div>
582
  <div class="header-controls">
 
747
 
748
  <script type="module">
749
  import { AutoTokenizer, env }
750
+ from 'https://cdn.jsdelivr.net/npm/@huggingface/transformers@4.2.0';
751
 
752
  env.allowLocalModels = false;
753
  env.useBrowserCache = true;
754
 
755
  // ── Model Registry ─────────────────────────────────────────
756
  const MODELS = [
757
+ {
758
+ id:'Qwen/Qwen3.6-27B',
759
+ name:'Qwen 3.6 27B',
760
+ org:'Alibaba',
761
+ color:'#0466de',
762
+ vocab:'152k',
763
+ type:'BPE',
764
+ desc:'Qwen tokenizer optimized for multilingual coding and reasoning tasks'
765
+ },
766
+ {
767
+ id:'deepseek-ai/DeepSeek-V4-Pro',
768
+ name:'DeepSeek V4 Pro',
769
+ org:'DeepSeek',
770
+ color:'#4285f4',
771
+ vocab:'129k',
772
+ type:'BPE',
773
+ desc:'DeepSeek multilingual tokenizer designed for code-heavy workloads'
774
+ },
775
+ {
776
+ id:'MiniMaxAI/MiniMax-M2.7',
777
+ name:'MiniMax M2.7',
778
+ org:'MiniMax',
779
+ color:'#1a73e8',
780
+ vocab:'128k',
781
+ type:'SentencePiece',
782
+ desc:'Efficient multilingual tokenizer for long-context multimodal models'
783
+ },
784
+ {
785
+ id:'mistralai/Mistral-Medium-3.5-128B',
786
+ name:'Mistral Medium 3.5',
787
+ org:'Mistral AI',
788
+ color:'#ff7722',
789
+ vocab:'131k',
790
+ type:'Tekken BPE',
791
+ desc:'Mistral Tekken tokenizer with efficient multilingual compression'
792
+ },
793
+ {
794
+ id:'google/gemma-4-31B-it',
795
+ name:'Gemma 4 31B',
796
+ org:'Google',
797
+ color:'#34a853',
798
+ vocab:'256k',
799
+ type:'SentencePiece',
800
+ desc:'Gemma multilingual SentencePiece tokenizer with large vocabulary'
801
+ },
802
+ {
803
+ id:'zai-org/GLM-5.1',
804
+ name:'GLM-5.1',
805
+ org:'Z.ai',
806
+ color:'#10a37f',
807
+ vocab:'151k',
808
+ type:'SentencePiece',
809
+ desc:'GLM multilingual SentencePiece tokenizer with large bilingual vocabulary'
810
+ },
811
+ {
812
+ id:'XiaomiMiMo/MiMo-V2.5-Pro',
813
+ name:'MiMo V2.5 Pro',
814
+ org:'Xiaomi',
815
+ color:'#ff7722',
816
+ vocab:'128k',
817
+ type:'SentencePiece',
818
+ desc:'MoE tokenizer tuned for multilingual reasoning and code generation'
819
+ },
820
  ];
821
 
822
  // ── Token Color Palettes ───────────────────────────────────