// saya / tokenizer.js
// Hosting-page metadata captured alongside this file (not part of the program):
//   Dragonnext's picture · Upload 8 files · 3b877e1 verified · raw · history blame · 312 Bytes
// Tokenizer factory provided by the @anthropic-ai/tokenizer package.
const { getTokenizer } = require('@anthropic-ai/tokenizer');
// One tokenizer instance is created when the module loads and is reused by
// getTokenCount below.
// NOTE(review): this file never explicitly releases the instance — confirm
// whether the library expects a cleanup call for long-running use.
const tokenizer = getTokenizer();
/**
 * Counts the tokens produced for a piece of text.
 *
 * The text is first normalized to Unicode NFKC form, then handed to the
 * module-level `tokenizer`'s `encode` method with 'all' as the second
 * argument (presumably the special-token setting — confirm against the
 * tokenizer library's documentation).
 *
 * @param {string} text - Text to measure; must support `.normalize()`.
 * @returns {number} The `length` of the sequence returned by `tokenizer.encode`.
 */
function getTokenCount(text) {
  const { length } = tokenizer.encode(text.normalize('NFKC'), 'all');
  return length;
}
// Command-line entry point: prints the token count of the first CLI argument.
const text = process.argv[2];
if (text === undefined) {
  // No argument was supplied. Without this guard, getTokenCount(undefined)
  // fails with an opaque "Cannot read properties of undefined" TypeError.
  console.error('Usage: node tokenizer.js <text>');
  // Set the exit code instead of calling process.exit() so pending output
  // is flushed before the process ends.
  process.exitCode = 1;
} else {
  // An empty string is a valid argument and is counted like any other text.
  const tokenCount = getTokenCount(text);
  console.log(tokenCount);
}