From 583a203a42acd2f900fa6e7bc81fda7bf53e2ca7 Mon Sep 17 00:00:00 2001 From: Miniyahil Kebede <53700166+hmhard@users.noreply.github.com> Date: Sat, 22 Apr 2023 16:10:16 +0300 Subject: [PATCH 1/2] Added Ethiopian(Amharic) Stop Word --- dist/am.json | 1 + 1 file changed, 1 insertion(+) create mode 100644 dist/am.json diff --git a/dist/am.json b/dist/am.json new file mode 100644 index 0000000..90b781a --- /dev/null +++ b/dist/am.json @@ -0,0 +1 @@ +["የሚችል","ስለ","ከላይ","እንደገና","በመላ","እንደገና","መቃወም","አይደለም","የሚፈቅደው","እኔ","መካከል","መካከል","አንድ","እና","ሌላ","ማንም","ማንም","ሰው","በማንኛውም","መንገድ","ማንም","ማንኛውም","በየትኛውም","ቦታ","ለየት","ይታይ","አመስግኑት","ተገቢ","አይደለም","ዙሪያ","እንደ","ጎን","ጠይቅ","መጠየቅ","ተያይዟል","በ","ይገኛል","ራቅ","አስፈሪ","ለ","ሆነ","መሆን","በፊት","ከኋላ","ሁለቱም","አጭር","ግን","እንበል","መጣ","አይችልም","አይችልም","ምክንያት","በእርግጠኝነት","ማጤን","ማጤን","የያዘ","የያዘ","ይይዛል","የሚዛመደው","አይችልም","ኮርስ","አሁን","መ","በእርግጠኝነት","ይገለጻል","ቢሆንም","አልተደረገም","አልሆነም","የተለየ","አደረገ","አያደርግም","ወደታች","ወደታች","በጊዜው","እያንዳንዱ","ኢዱ","ለምሳሌ","ስምንት","ወይ","ቦታ","በቃ","ምሳሌ","በስተቀር","ሩቅ","ጥቂት","አምስተኛ","መጀመሪያ","አምስት","የተከተለ","መከተል","የሚከተለው","ለ","የቀድሞ","የቀድሞ","የሰጠ","ሂድ","ይሄዳል","ይሄዳል","ሄዷል","አግኝቷል","አደረሳችሁ","ሰላምታ","ሸ","ነበር","አልሆነም","ይከሰታል","በጭንቅ","አለው","የሌለው","የነበረው","የሌለው","ያለው","ሄሎ","እገዛ","ስለዚህ","እሷን","እዚህ","በተስፋ","እንዴት","ይሁን","እንጂ","ይሁን","እንጂ","እኔ","ከሆነ","ተናቆት","ወዲያው","ይልቅ","ወደ","አይደለም","ይሆናል","እራሱ","በቃ","አቆይ","ይጠብቃል","ይጠብቃል","አወቅ","የሚታወቅ","ያውቃል","የመጨረሻው","በቅርቡ","በኋላ","የኋለኛው","እንዳንል","እንወድ","ይመስላል","በዋነኛነት","ብዙ","ይችላል","ምናልባት","እኔ","ማለት","ነው","ይህ","በእንዲህ","እንዳለ","ብቻ","ይችላል","ተጨማሪ","ከዚህ","በላይ","በቅርብ","አስፈላጊ","ፍላጎት","ፍላጎት","አዲስ","ያልሆነ","የለም","ማንም","ጠፍቷል","ብዙውን ጊዜ","ኦህ","እሺ","እሺ","አሮጌው","ላይ","አንድ ጊዜ","አንድ","አንድ","ብቻ","ላይ","ወይም","ሌሎች","ካለበለዚያ","የእኛ","በተለይ","በተለይ","ምናልባትም","የተቀመጠ","እባክዎ","ፕላስ","ይቻላል","የሚገመተው","ምናልባት","ይሰጣል","በአንጻራዊነት","በቅደም","ተከተል","ትክክል","ስ","ተብሏል","ተመሳሳይ","አየው","ይላል","ሲል","ይላል","ሁለተኛ","ሁለተኛ","ማየት","ማየት","ይመስላል","ይመስላል","የሚመስል","ይመስላል","የታየ","እራስ","የላከ","ቁምነገር","ሰባት","በርካታ","ይኖሯታል","አለባት","ጀምሮ","አንድ","ሰው","አንድ","ነገር","አንዳንድ 
ጊዜ","አንዳንድ","ጊዜ","አንድ","ቦታ","በቅርቡ","ይቅርታ","የተገለጸ","ይግለጹ","የሚገልጽ","አሁንም","ንኡስ","እንደ","እርግጠኛ","ተወስዷል","አመሰግናለሁ","ተመስገን","እነሱ","ናቸው","አስበዋል","መሞከር","ሁለት ጊዜ","ሁለት","ስር","በሚያሳዝን","ሁኔታ","ካልሆነ","በስተቀር","ላይ","እኛ","ጥቅም","ላይ","የዋለ","ጠቃሚ","ይጠቀማል","ይጠቀማል","ይፈልጋል","ይፈልጋል","ነበር","እንሆናለን","እንኳን","ደህና","መጣችሁ","መቼ","የትኛው","እያለ","ወዴት","ሙሉ","ማን","ማን","የማን","ለምን","ይፈቅዳል","የሚፈልግ","የሚመኝ","ከ","አይገርምም","አንተ","ታደርጋለህ","ታደርጋለህ","አንተ","ነህ","አንተ","የራስህ","የራስህ","ራስህ","ራስህ","ዜሮ"] From 40db11e0a887a12ad49003ac53ded3291132fae4 Mon Sep 17 00:00:00 2001 From: Miniyahil Kebede <53700166+hmhard@users.noreply.github.com> Date: Sat, 22 Apr 2023 16:13:31 +0300 Subject: [PATCH 2/2] Updated readme added ethiopian amharic stop words --- README.md | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 38929ab..56e7ba4 100644 --- a/README.md +++ b/README.md @@ -7,7 +7,7 @@ Stopwords for various languages in JSON format. Per [Wikipedia](http://en.wikipe You can use all stopwords with [stopwords-all.json](stopwords-all.json) (keyed by language ISO 639-1 code), or see the below table for individual language stopword files. ## Languages -There are a total of 50 supported languages: +There are a total of 51 supported languages: Language | Stopword count | Filename --- | --- | --- @@ -24,6 +24,7 @@ Croatian | 179 | [hr.json](dist/hr.json) Czech | 346 | [cs.json](dist/cs.json) Danish | 101 | [da.json](dist/da.json) Dutch | 275 | [nl.json](dist/nl.json) +Amharic | 295 | [am.json](dist/am.json) English | 570 | [en.json](dist/en.json) Esperanto | 173 | [eo.json](dist/eo.json) Estonian | 35 | [et.json](dist/et.json)