💾 Archived View for godocs.io › github.com › afjoseph › RAKE.Go captured on 2024-06-16 at 17:10:35. Gemini links have been rewritten to link to archived content

View Raw

More Information

⬅️ Previous capture (2024-03-21)

➡️ Next capture (2024-08-19)

🚧 View Differences

-=-=-=-=-=-=-

package rake - github.com/afjoseph/RAKE.Go - godocs.io

import "github.com/afjoseph/RAKE.Go"

Variables

// StopWordsSlice is the stop-word list from SMART (Salton, 1971), available at
// ftp://ftp.cs.cornell.edu/pub/smart/english.stop.
//
// Every word is listed exactly once; the order of the entries is otherwise
// the same as in the original list.
var StopWordsSlice = []string{
	"a",
	"a's",
	"able",
	"about",
	"above",
	"according",
	"accordingly",
	"across",
	"actually",
	"after",
	"afterwards",
	"again",
	"against",
	"ain't",
	"all",
	"allow",
	"allows",
	"almost",
	"alone",
	"along",
	"already",
	"also",
	"although",
	"always",
	"am",
	"among",
	"amongst",
	"an",
	"and",
	"another",
	"any",
	"anybody",
	"anyhow",
	"anyone",
	"anything",
	"anyway",
	"anyways",
	"anywhere",
	"apart",
	"appear",
	"appreciate",
	"appropriate",
	"are",
	"aren't",
	"around",
	"as",
	"aside",
	"ask",
	"asking",
	"associated",
	"at",
	"available",
	"away",
	"awfully",
	"b",
	"be",
	"became",
	"because",
	"become",
	"becomes",
	"becoming",
	"been",
	"before",
	"beforehand",
	"behind",
	"being",
	"believe",
	"below",
	"beside",
	"besides",
	"best",
	"better",
	"between",
	"beyond",
	"both",
	"brief",
	"but",
	"by",
	"c",
	"c'mon",
	"c's",
	"came",
	"can",
	"can't",
	"cannot",
	"cant",
	"cause",
	"causes",
	"certain",
	"certainly",
	"changes",
	"clearly",
	"co",
	"com",
	"come",
	"comes",
	"concerning",
	"consequently",
	"consider",
	"considering",
	"contain",
	"containing",
	"contains",
	"corresponding",
	"could",
	"couldn't",
	"course",
	"currently",
	"d",
	"definitely",
	"described",
	"despite",
	"did",
	"didn't",
	"different",
	"do",
	"does",
	"doesn't",
	"doing",
	"don't",
	"done",
	"down",
	"downwards",
	"during",
	"e",
	"each",
	"edu",
	"eg",
	"eight",
	"either",
	"else",
	"elsewhere",
	"enough",
	"entirely",
	"especially",
	"et",
	"etc",
	"even",
	"ever",
	"every",
	"everybody",
	"everyone",
	"everything",
	"everywhere",
	"ex",
	"exactly",
	"example",
	"except",
	"f",
	"far",
	"few",
	"fifth",
	"first",
	"five",
	"followed",
	"following",
	"follows",
	"for",
	"former",
	"formerly",
	"forth",
	"four",
	"from",
	"further",
	"furthermore",
	"g",
	"get",
	"gets",
	"getting",
	"given",
	"gives",
	"go",
	"goes",
	"going",
	"gone",
	"got",
	"gotten",
	"greetings",
	"h",
	"had",
	"hadn't",
	"happens",
	"hardly",
	"has",
	"hasn't",
	"have",
	"haven't",
	"having",
	"he",
	"he's",
	"hello",
	"help",
	"hence",
	"her",
	"here",
	"here's",
	"hereafter",
	"hereby",
	"herein",
	"hereupon",
	"hers",
	"herself",
	"hi",
	"him",
	"himself",
	"his",
	"hither",
	"hopefully",
	"how",
	"howbeit",
	"however",
	"i",
	"i'd",
	"i'll",
	"i'm",
	"i've",
	"ie",
	"if",
	"ignored",
	"immediate",
	"in",
	"inasmuch",
	"inc",
	"indeed",
	"indicate",
	"indicated",
	"indicates",
	"inner",
	"insofar",
	"instead",
	"into",
	"inward",
	"is",
	"isn't",
	"it",
	"it'd",
	"it'll",
	"it's",
	"its",
	"itself",
	"j",
	"just",
	"k",
	"keep",
	"keeps",
	"kept",
	"know",
	"knows",
	"known",
	"l",
	"last",
	"lately",
	"later",
	"latter",
	"latterly",
	"least",
	"less",
	"lest",
	"let",
	"let's",
	"like",
	"liked",
	"likely",
	"little",
	"look",
	"looking",
	"looks",
	"ltd",
	"m",
	"mainly",
	"many",
	"may",
	"maybe",
	"me",
	"mean",
	"meanwhile",
	"merely",
	"might",
	"more",
	"moreover",
	"most",
	"mostly",
	"much",
	"must",
	"my",
	"myself",
	"n",
	"name",
	"namely",
	"nd",
	"near",
	"nearly",
	"necessary",
	"need",
	"needs",
	"neither",
	"never",
	"nevertheless",
	"new",
	"next",
	"nine",
	"no",
	"nobody",
	"non",
	"none",
	"noone",
	"nor",
	"normally",
	"not",
	"nothing",
	"novel",
	"now",
	"nowhere",
	"o",
	"obviously",
	"of",
	"off",
	"often",
	"oh",
	"ok",
	"okay",
	"old",
	"on",
	"once",
	"one",
	"ones",
	"only",
	"onto",
	"or",
	"other",
	"others",
	"otherwise",
	"ought",
	"our",
	"ours",
	"ourselves",
	"out",
	"outside",
	"over",
	"overall",
	"own",
	"p",
	"particular",
	"particularly",
	"per",
	"perhaps",
	"placed",
	"please",
	"plus",
	"possible",
	"presumably",
	"probably",
	"provides",
	"q",
	"que",
	"quite",
	"qv",
	"r",
	"rather",
	"rd",
	"re",
	"really",
	"reasonably",
	"regarding",
	"regardless",
	"regards",
	"relatively",
	"respectively",
	"right",
	"s",
	"said",
	"same",
	"saw",
	"say",
	"saying",
	"says",
	"second",
	"secondly",
	"see",
	"seeing",
	"seem",
	"seemed",
	"seeming",
	"seems",
	"seen",
	"self",
	"selves",
	"sensible",
	"sent",
	"serious",
	"seriously",
	"seven",
	"several",
	"shall",
	"she",
	"should",
	"shouldn't",
	"since",
	"six",
	"so",
	"some",
	"somebody",
	"somehow",
	"someone",
	"something",
	"sometime",
	"sometimes",
	"somewhat",
	"somewhere",
	"soon",
	"sorry",
	"specified",
	"specify",
	"specifying",
	"still",
	"sub",
	"such",
	"sup",
	"sure",
	"t",
	"t's",
	"take",
	"taken",
	"tell",
	"tends",
	"th",
	"than",
	"thank",
	"thanks",
	"thanx",
	"that",
	"that's",
	"thats",
	"the",
	"their",
	"theirs",
	"them",
	"themselves",
	"then",
	"thence",
	"there",
	"there's",
	"thereafter",
	"thereby",
	"therefore",
	"therein",
	"theres",
	"thereupon",
	"these",
	"they",
	"they'd",
	"they'll",
	"they're",
	"they've",
	"think",
	"third",
	"this",
	"thorough",
	"thoroughly",
	"those",
	"though",
	"three",
	"through",
	"throughout",
	"thru",
	"thus",
	"to",
	"together",
	"too",
	"took",
	"toward",
	"towards",
	"tried",
	"tries",
	"truly",
	"try",
	"trying",
	"twice",
	"two",
	"u",
	"un",
	"under",
	"unfortunately",
	"unless",
	"unlikely",
	"until",
	"unto",
	"up",
	"upon",
	"us",
	"use",
	"used",
	"useful",
	"uses",
	"using",
	"usually",
	"uucp",
	"v",
	"value",
	"various",
	"very",
	"via",
	"viz",
	"vs",
	"w",
	"want",
	"wants",
	"was",
	"wasn't",
	"way",
	"we",
	"we'd",
	"we'll",
	"we're",
	"we've",
	"welcome",
	"well",
	"went",
	"were",
	"weren't",
	"what",
	"what's",
	"whatever",
	"when",
	"whence",
	"whenever",
	"where",
	"where's",
	"whereafter",
	"whereas",
	"whereby",
	"wherein",
	"whereupon",
	"wherever",
	"whether",
	"which",
	"while",
	"whither",
	"who",
	"who's",
	"whoever",
	"whole",
	"whom",
	"whose",
	"why",
	"will",
	"willing",
	"wish",
	"with",
	"within",
	"without",
	"won't",
	"wonder",
	"would",
	"wouldn't",
	"x",
	"y",
	"yes",
	"yet",
	"you",
	"you'd",
	"you'll",
	"you're",
	"you've",
	"your",
	"yours",
	"yourself",
	"yourselves",
	"z",
	"zero",
}

StopWordsSlice is the stop-word list from SMART (Salton, 1971), available at ftp://ftp.cs.cornell.edu/pub/smart/english.stop

Functions

func CalculateWordScores

func CalculateWordScores(phraseList []string) map[string]float64

CalculateWordScores returns a map[string]float64 that maps each candidate word to its score in the text

func GenerateCandidateKeywordScores

func GenerateCandidateKeywordScores(phraseList []string, wordScore map[string]float64) map[string]float64

GenerateCandidateKeywordScores returns a map[string]float64 that maps each candidate keyword to its score in the text

func GenerateCandidateKeywords

func GenerateCandidateKeywords(sentenceList []string, stopWordPattern *regexp.Regexp) []string

GenerateCandidateKeywords returns a slice of candidate keywords from a slice of sentences and a stop-words regex

func IsNumber

func IsNumber(str string) bool

IsNumber returns true if the supplied string is a number

func RegexSplitSentences

func RegexSplitSentences() *regexp.Regexp

RegexSplitSentences returns a regexp object that detects punctuation marks

func RegexSplitWords

func RegexSplitWords() *regexp.Regexp

RegexSplitWords returns a regexp object that splits words

func RegexStopWords

func RegexStopWords(stopWordsSlice []string) *regexp.Regexp

RegexStopWords builds "stop-words" regex based on a slice of "stop-words"

func SeperateWords

func SeperateWords(text string) []string

SeperateWords returns a slice of all words that have a length greater than a specified number of characters.

func SetDefaultStringFloat64

func SetDefaultStringFloat64(h map[string]float64, k string, v float64) (set bool, r float64)

SetDefaultStringFloat64 is a utility function that serves as a Go replacement for Python's `dict.setdefault`: https://docs.python.org/2/library/stdtypes.html#dict.setdefault Basically, if the key k is in the map h, return its value. If not, insert k with the default value v and return v. Unlike the Python method, where the default falls back to None, the default v must always be supplied.

func SetDefaultStringInt

func SetDefaultStringInt(h map[string]int, k string, v int) (set bool, r int)

SetDefaultStringInt is a utility function that serves as a Go replacement for Python's `dict.setdefault`: https://docs.python.org/2/library/stdtypes.html#dict.setdefault Basically, if the key k is in the map h, return its value. If not, insert k with the default value v and return v. Unlike the Python method, where the default falls back to None, the default v must always be supplied.

func SplitSentences

func SplitSentences(text string) []string

SplitSentences returns a slice of sentences.

Types

type Pair

// Pair is a simple key-value pair of a string and a float64.
// RunRake and RunRakeI18N return these inside a PairList, one per keyword.
type Pair struct {
	// Key is the string half of the pair (the keyword in RAKE results).
	Key   string
	// Value is the float64 half of the pair (the keyword's score in RAKE results).
	Value float64
}

Pair is a simple struct for a key-value pair of string and float64

type PairList

// PairList is a slice of Pairs. Its Len, Less and Swap methods have the
// signatures required by sort.Interface.
type PairList []Pair

PairList is just a slice of Pairs

func RunRake

func RunRake(text string) PairList

RunRake wraps RunRakeI18N to preserve the existing API

func RunRakeI18N

func RunRakeI18N(text string, stopWords []string) PairList

RunRakeI18N returns a slice of key-value pairs (PairList) of a keyword and its score after running the RAKE algorithm on a given text

func (PairList) Len

func (p PairList) Len() int

func (PairList) Less

func (p PairList) Less(i, j int) bool

func (PairList) Swap

func (p PairList) Swap(i, j int)

Details

Platform: linux/amd64

Imports: 5 packages

Refresh now

Back to home

Search