All downloads are free. Search and download functionality uses the official Maven repository.

org.dizitart.no2.fulltext.languages.Bengali Maven / Gradle / Ivy

There is a newer version: 4.3.0
Show newest version
/*
 *
 * Copyright 2017-2018 Nitrite author or authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *        http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 */

package org.dizitart.no2.fulltext.languages;

import org.dizitart.no2.fulltext.Language;

import java.util.Arrays;
import java.util.HashSet;
import java.util.Set;

/**
 * Bengali stop words.
 *
 * <p>Supplies the Bengali stop-word list through the {@link Language} contract.
 * The words are held once in a private constant and copied into a new set on
 * each request.
 *
 * @since 2.1.0
 * @author Anindya Chatterjee
 */
public class Bengali implements Language {
    /**
     * The stop-word entries, kept in their original order.
     *
     * <p>Several entries look identical when rendered; exact duplicates are
     * collapsed when the array is copied into a set. NOTE(review): some of the
     * look-alike entries may be different Unicode encodings of the same word
     * (precomposed vs. decomposed letters) - confirm before removing any by hand.
     */
    private static final String[] STOP_WORDS = {
            "অতএব",
            "অথচ",
            "অথবা",
            "অনুযায়ী",
            "অনেক",
            "অনেকে",
            "অনেকেই",
            "অন্তত",
            "অন্য",
            "অবধি",
            "অবশ্য",
            "অর্থাত",
            "আই",
            "আগামী",
            "আগে",
            "আগেই",
            "আছে",
            "আজ",
            "আদ্যভাগে",
            "আপনার",
            "আপনি",
            "আবার",
            "আমরা",
            "আমাকে",
            "আমাদের",
            "আমার",
            "আমি",
            "আর",
            "আরও",
            "ই",
            "ইত্যাদি",
            "ইহা",
            "উচিত",
            "উত্তর",
            "উনি",
            "উপর",
            "উপরে",
            "এ",
            "এঁদের",
            "এঁরা",
            "এই",
            "একই",
            "একটি",
            "একবার",
            "একে",
            "এক্",
            "এখন",
            "এখনও",
            "এখানে",
            "এখানেই",
            "এটা",
            "এটাই",
            "এটি",
            "এত",
            "এতটাই",
            "এতে",
            "এদের",
            "এব",
            "এবং",
            "এবার",
            "এমন",
            "এমনকী",
            "এমনি",
            "এর",
            "এরা",
            "এল",
            "এস",
            "এসে",
            "ঐ",
            "ও",
            "ওঁদের",
            "ওঁর",
            "ওঁরা",
            "ওই",
            "ওকে",
            "ওখানে",
            "ওদের",
            "ওর",
            "ওরা",
            "কখনও",
            "কত",
            "কবে",
            "কমনে",
            "কয়েক",
            "কয়েকটি",
            "করছে",
            "করছেন",
            "করতে",
            "করবে",
            "করবেন",
            "করলে",
            "করলেন",
            "করা",
            "করাই",
            "করায়",
            "করার",
            "করি",
            "করিতে",
            "করিয়া",
            "করিয়ে",
            "করে",
            "করেই",
            "করেছিলেন",
            "করেছে",
            "করেছেন",
            "করেন",
            "কাউকে",
            "কাছ",
            "কাছে",
            "কাজ",
            "কাজে",
            "কারও",
            "কারণ",
            "কি",
            "কিংবা",
            "কিছু",
            "কিছুই",
            "কিন্তু",
            "কী",
            "কে",
            "কেউ",
            "কেউই",
            "কেখা",
            "কেন",
            "কোটি",
            "কোন",
            "কোনও",
            "কোনো",
            "ক্ষেত্রে",
            "কয়েক",
            "খুব",
            "গিয়ে",
            "গিয়েছে",
            "গিয়ে",
            "গুলি",
            "গেছে",
            "গেল",
            "গেলে",
            "গোটা",
            "চলে",
            "চান",
            "চায়",
            "চার",
            "চালু",
            "চেয়ে",
            "চেষ্টা",
            "ছাড়া",
            "ছাড়াও",
            "ছিল",
            "ছিলেন",
            "জন",
            "জনকে",
            "জনের",
            "জন্য",
            "জন্যওজে",
            "জানতে",
            "জানা",
            "জানানো",
            "জানায়",
            "জানিয়ে",
            "জানিয়েছে",
            "জে",
            "জ্নজন",
            "টি",
            "ঠিক",
            "তখন",
            "তত",
            "তথা",
            "তবু",
            "তবে",
            "তা",
            "তাঁকে",
            "তাঁদের",
            "তাঁর",
            "তাঁরা",
            "তাঁাহারা",
            "তাই",
            "তাও",
            "তাকে",
            "তাতে",
            "তাদের",
            "তার",
            "তারপর",
            "তারা",
            "তারৈ",
            "তাহলে",
            "তাহা",
            "তাহাতে",
            "তাহার",
            "তিনঐ",
            "তিনি",
            "তিনিও",
            "তুমি",
            "তুলে",
            "তেমন",
            "তো",
            "তোমার",
            "থাকবে",
            "থাকবেন",
            "থাকা",
            "থাকায়",
            "থাকে",
            "থাকেন",
            "থেকে",
            "থেকেই",
            "থেকেও",
            "দিকে",
            "দিতে",
            "দিন",
            "দিয়ে",
            "দিয়েছে",
            "দিয়েছেন",
            "দিলেন",
            "দু",
            "দুই",
            "দুটি",
            "দুটো",
            "দেওয়া",
            "দেওয়ার",
            "দেওয়া",
            "দেখতে",
            "দেখা",
            "দেখে",
            "দেন",
            "দেয়",
            "দ্বারা",
            "ধরা",
            "ধরে",
            "ধামার",
            "নতুন",
            "নয়",
            "না",
            "নাই",
            "নাকি",
            "নাগাদ",
            "নানা",
            "নিজে",
            "নিজেই",
            "নিজেদের",
            "নিজের",
            "নিতে",
            "নিয়ে",
            "নিয়ে",
            "নেই",
            "নেওয়া",
            "নেওয়ার",
            "নেওয়া",
            "নয়",
            "পক্ষে",
            "পর",
            "পরে",
            "পরেই",
            "পরেও",
            "পর্যন্ত",
            "পাওয়া",
            "পাচ",
            "পারি",
            "পারে",
            "পারেন",
            "পি",
            "পেয়ে",
            "পেয়্র্",
            "প্রতি",
            "প্রথম",
            "প্রভৃতি",
            "প্রযন্ত",
            "প্রাথমিক",
            "প্রায়",
            "প্রায়",
            "ফলে",
            "ফিরে",
            "ফের",
            "বক্তব্য",
            "বদলে",
            "বন",
            "বরং",
            "বলতে",
            "বলল",
            "বললেন",
            "বলা",
            "বলে",
            "বলেছেন",
            "বলেন",
            "বসে",
            "বহু",
            "বা",
            "বাদে",
            "বার",
            "বি",
            "বিনা",
            "বিভিন্ন",
            "বিশেষ",
            "বিষয়টি",
            "বেশ",
            "বেশি",
            "ব্যবহার",
            "ব্যাপারে",
            "ভাবে",
            "ভাবেই",
            "মতো",
            "মতোই",
            "মধ্যভাগে",
            "মধ্যে",
            "মধ্যেই",
            "মধ্যেও",
            "মনে",
            "মাত্র",
            "মাধ্যমে",
            "মোট",
            "মোটেই",
            "যখন",
            "যত",
            "যতটা",
            "যথেষ্ট",
            "যদি",
            "যদিও",
            "যা",
            "যাঁর",
            "যাঁরা",
            "যাওয়া",
            "যাওয়ার",
            "যাওয়া",
            "যাকে",
            "যাচ্ছে",
            "যাতে",
            "যাদের",
            "যান",
            "যাবে",
            "যায়",
            "যার",
            "যারা",
            "যিনি",
            "যে",
            "যেখানে",
            "যেতে",
            "যেন",
            "যেমন",
            "র",
            "রকম",
            "রয়েছে",
            "রাখা",
            "রেখে",
            "লক্ষ",
            "শুধু",
            "শুরু",
            "সঙ্গে",
            "সঙ্গেও",
            "সব",
            "সবার",
            "সমস্ত",
            "সম্প্রতি",
            "সহ",
            "সহিত",
            "সাধারণ",
            "সামনে",
            "সি",
            "সুতরাং",
            "সে",
            "সেই",
            "সেখান",
            "সেখানে",
            "সেটা",
            "সেটাই",
            "সেটাও",
            "সেটি",
            "স্পষ্ট",
            "স্বয়ং",
            "হইতে",
            "হইবে",
            "হইয়া",
            "হওয়া",
            "হওয়ায়",
            "হওয়ার",
            "হচ্ছে",
            "হত",
            "হতে",
            "হতেই",
            "হন",
            "হবে",
            "হবেন",
            "হয়",
            "হয়তো",
            "হয়নি",
            "হয়ে",
            "হয়েই",
            "হয়েছিল",
            "হয়েছে",
            "হয়েছেন",
            "হল",
            "হলে",
            "হলেই",
            "হলেও",
            "হলো",
            "হাজার",
            "হিসাবে",
            "হৈলে",
            "হোক",
            "হয়"
    };

    /**
     * Returns the Bengali stop words.
     *
     * <p>A new {@link HashSet} is built on every call, so the returned set is
     * independent of any previously returned one and may be modified by the
     * caller.
     *
     * @return a new mutable set containing every distinct stop-word entry
     */
    @Override
    public Set<String> stopWords() {
        // Copy into a fresh set so callers never share mutable state.
        return new HashSet<>(Arrays.asList(STOP_WORDS));
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy