Getting Started
🧰 Learn about individual Toolkits
Here's a quick start guide to help you get started with the Bangla Toolkit (BNTK).
Installation
Install the required packages for Bengali natural language processing:
- npm
- Bun
- Yarn
- pnpm
npm install @bntk/tokenization @bntk/stemming @bntk/pos @bntk/ner @bntk/transliteration
bun add @bntk/tokenization @bntk/stemming @bntk/pos @bntk/ner @bntk/transliteration
yarn add @bntk/tokenization @bntk/stemming @bntk/pos @bntk/ner @bntk/transliteration
pnpm add @bntk/tokenization @bntk/stemming @bntk/pos @bntk/ner @bntk/transliteration
Example Usage
import * as ner from "@bntk/ner";
import * as pos from "@bntk/pos";
import * as stemming from "@bntk/stemming";
import * as tokenization from "@bntk/tokenization";
import * as transliteration from "@bntk/transliteration";
// End-to-end walkthrough of the BNTK packages imported above: each section
// feeds the previous section's result into the next call and logs what it gets.
// The "// [...]" line after each console.log is the sample output given by the docs.
//
// NOTE(review): the Bengali text in this example was restored from a mis-encoded
// copy (UTF-8 bytes rendered as Latin-script characters). Every word is
// unambiguous from context except the fifth word of the first sentence
// ('ক্লিকই'), whose lost bytes were inferred — confirm against the upstream docs.
const contents = `আমি বাংলা লেখার জন্য ক্লিকই ব্যবহার করছি। আমার বন্ধু রহিম ঢাকায় থাকেন।`;

// ==== Tokenization ====
// Split the sample text into sentences.
const sentences = tokenization.tokenizeSentences(contents);
console.log(sentences);
// ['আমি বাংলা লেখার জন্য ক্লিকই ব্যবহার করছি', 'আমার বন্ধু রহিম ঢাকায় থাকেন']

// Split only the first sentence into words; these words drive the next two sections.
const words = tokenization.tokenizeWords(sentences[0]);
console.log(words);
// ['আমি', 'বাংলা', 'লেখার', 'জন্য', 'ক্লিকই', 'ব্যবহার', 'করছি']

// ==== Stemming ====
const stemmedWords = stemming.stemWords(words);
console.log(stemmedWords);
// ['আমি', 'বাংলা', 'লেখার', 'জন্য', 'ক্লিকই', 'ব্যবহার', 'করছি']

// ==== POS ====
// Note: the tagger is given the stemmed words, not the raw tokens.
const taggedWords = pos.tagWords(stemmedWords);
console.log(taggedWords);
// ['আমি/PRON', 'বাংলা/NOUN', 'লেখার/NOUN', 'জন্য/ADP', 'ক্লিকই/NOUN', 'ব্যবহার/VERB', 'করছি/VERB']

// ==== NER ====
// Entity extraction takes the second sentence as a plain string, not a word list.
const entities = ner.extractEntities(sentences[1]);
console.log(entities);
// [{type: 'PRONOUN', value: 'আমার', start: 0, end: 4}, {...}]

// ==== Transliteration ====
// Latin-script input in, Bengali-script output out.
const transliterated = transliteration.transliterate("amar name apon.");
console.log(transliterated);
// 'আমার নাম আপন।'