Posts

NLP manual

import nltk

# Download the Punkt tokenizer models required by nltk.word_tokenize.
nltk.download('punkt')


def count_lines(file_path):
    """Count the number of lines in the text file at *file_path*.

    Returns 0 (after printing a message) when the file does not exist.
    Counts lazily instead of materializing the whole file with
    readlines(), so large files are handled in constant memory.
    """
    try:
        with open(file_path, 'r') as file:
            return sum(1 for _ in file)
    except FileNotFoundError:
        print("File not found. Please check the file path.")
        return 0


def count_words(file_path):
    """Count the number of words in the text file at *file_path*.

    Uses NLTK's word_tokenize for accurate word tokenization.
    Returns 0 (after printing a message) when the file does not exist.
    """
    try:
        with open(file_path, 'r') as file:
            text = file.read()
        words = nltk.word_tokenize(text)  # tokenizes the text into words
        return len(words)
    except FileNotFoundError:
        print("File not found. Please check the file path.")
        return 0


def main():
    file_path = input("Enter the path of the text file: ")
    # Counting lines
    line_count = count_lines(file_path)
    # NOTE(review): the original source is truncated here
    # ("line_count = count_lines(file_..."); the remainder of main()
    # could not be recovered from this page and is not reproduced.

NLP

import nltk
from nltk.tokenize import word_tokenize
from nltk.stem import PorterStemmer, WordNetLemmatizer
from nltk import pos_tag, ne_chunk

nltk.download('punkt')

# Practical 1: tokenization, stemming, lemmatization and chunking demo.
text = "Dinesh puri sir kiti bhari HOD ahet."

# Tokenization
tokens = word_tokenize(text)
print("Tokens:", tokens)

# Stemming
stemmer = PorterStemmer()
print("Stemmed:", [stemmer.stem(w) for w in tokens])

# Lemmatization
lemmatizer = WordNetLemmatizer()
print("Lemmatized:", [lemmatizer.lemmatize(w) for w in tokens])

# Chunking (named-entity chunking over POS-tagged tokens)
chunks = ne_chunk(pos_tag(tokens))
print("Chunks:", chunks)


# Practical 2: count lines and words in a file.
def count_lines_words(file):
    """Print the number of lines and NLTK-tokenized words in *file*.

    Line count is text.count('\\n') + 1, so an empty file still reports
    one line — this mirrors the original behavior.
    """
    with open(file, 'r') as f:
        text = f.read()
    print("Lines:", text.count('\n') + 1)
    print("Words:", len(word_tokenize(text)))


count_lines_words("nlp5.txt")


# Practical 3: count articles.
# NOTE(review): the original source is truncated here — count_articles(file)
# is cut off after "with open(fi..." and its body could not be recovered
# from this page, so it is not reproduced.