aboutsummaryrefslogtreecommitdiff
path: root/nlp/corpora
diff options
context:
space:
mode:
authorHao Chen2020-04-13 23:53:46 -0500
committerHao Chen2020-04-13 23:53:46 -0500
commit60549a2fb71f4297b683b757926b19440eef8730 (patch)
tree6fb6fd164dd91fa819d0b9d14d256910083ce9de /nlp/corpora
parent62aec91c627ba33e42ba24790e664db53316c4db (diff)
downloadgenecup-60549a2fb71f4297b683b757926b19440eef8730.tar.gz
add eng stopwords
Diffstat (limited to 'nlp/corpora')
-rw-r--r--nlp/corpora/stopwords/english179
1 files changed, 179 insertions, 0 deletions
diff --git a/nlp/corpora/stopwords/english b/nlp/corpora/stopwords/english
new file mode 100644
index 0000000..1280aa3
--- /dev/null
+++ b/nlp/corpora/stopwords/english
@@ -0,0 +1,179 @@
+i
+me
+my
+myself
+we
+our
+ours
+ourselves
+you
+you're
+you've
+you'll
+you'd
+your
+yours
+yourself
+yourselves
+he
+him
+his
+himself
+she
+she's
+her
+hers
+herself
+it
+it's
+its
+itself
+they
+them
+their
+theirs
+themselves
+what
+which
+who
+whom
+this
+that
+that'll
+these
+those
+am
+is
+are
+was
+were
+be
+been
+being
+have
+has
+had
+having
+do
+does
+did
+doing
+a
+an
+the
+and
+but
+if
+or
+because
+as
+until
+while
+of
+at
+by
+for
+with
+about
+against
+between
+into
+through
+during
+before
+after
+above
+below
+to
+from
+up
+down
+in
+out
+on
+off
+over
+under
+again
+further
+then
+once
+here
+there
+when
+where
+why
+how
+all
+any
+both
+each
+few
+more
+most
+other
+some
+such
+no
+nor
+not
+only
+own
+same
+so
+than
+too
+very
+s
+t
+can
+will
+just
+don
+don't
+should
+should've
+now
+d
+ll
+m
+o
+re
+ve
+y
+ain
+aren
+aren't
+couldn
+couldn't
+didn
+didn't
+doesn
+doesn't
+hadn
+hadn't
+hasn
+hasn't
+haven
+haven't
+isn
+isn't
+ma
+mightn
+mightn't
+mustn
+mustn't
+needn
+needn't
+shan
+shan't
+shouldn
+shouldn't
+wasn
+wasn't
+weren
+weren't
+won
+won't
+wouldn
+wouldn't