Filter: Add more detailed documentation

Also remove the corresponding section of the DESIGN file. Signed-off-by: Anna Schumaker <Anna@OcarinaProject.net>
2014-11-08 11:25:13 -05:00 · 2014-11-08 11:25:13 -05:00 · 2a65fe8db0
parent e81f17360e
commit 2a65fe8db0
4 changed files with 35 additions and 46 deletions
--- a/34
+++ b/34
@ -66,40 +66,6 @@ Callbacks:



-Filter:
-	Filtering is used to generate a subset of songs displayed by the UI to
-	that users can choose from.  The inverted index is generated at startup
-	so there is no need for a remove() function, since it will be wiped
-	the next time the application starts.
-
- Parsing:
-	- Scan over the input text to create a list of words using the following
-	  characters as delimiters: \/,;()_-~+"
-	- While scanning, convert the string to lowercase and strip out any
-	  other special characters.
-
- API:
-	std::string filter :: add(const std::string &key, unsigned int track_id);
-		Parse the key into words following the "Parsing" section above.
-		Generate substrings for each word and add each (substring,
-		track_id) pair to the index.  Return the lowercased text to the
-		caller.
-
-		To generate substrings, iterate over the word starting from
-		the front.  For example: "goron" would contain the substrings
-		{g, go, gor, goro, goron}.
-
-	std::string filter :: lowercase(const std::string &text);
-		Parse the text into lowercased words following the "Parsing"
-		section above.  Return the lowercased string to the caller.
-
-	void filter :: search(const std::string &text, std::set<track_id> &res);
-		This function finds all track_ids matching the input text.
-		Parse the string into substrings and take the intersection of
-		all sets returned by the index for each substring.
-
-
-
 Idle queue:
 	The idle queue is used to schedule function calls that run at a later
 	time.
--- a/4
+++ b/4
@ -86,3 +86,7 @@ Future work:
 		- Show gcov graph
 		- Run cppcheck
 	- Read tags with gstreamer?
+	- Move search functions from filter to index code
+		- Move tag index into tagdb
+		- Rename filter.cpp -> text.cpp (or something to reflect
+		  that it is used for text processing)
--- a/core/filter.cpp
+++ b/core/filter.cpp
@ -58,12 +58,12 @@ static void parse_text(const std::string &text, std::list<std::string> &ret)
 		ret.push_back(word);
 }

-static void add_substrings(const std::string &text, unsigned int track_id)
+static void add_substrings(const std::string &text, unsigned int index)
 {
 	std::string substr;
 	for (unsigned int i = 1; i <= text.size(); i++) {
 		substr = text.substr(0, i);
-		filter_index.insert(substr, track_id);
+		filter_index.insert(substr, index);
 	}
 }

@ -81,14 +81,14 @@ static std::string reassemble_text(std::list<std::string> text)
 	return res;
 }

-std::string filter :: add(const std::string &text, unsigned int track_id)
+std::string filter :: add(const std::string &text, unsigned int index)
 {
 	std::list<std::string> parsed;
 	std::list<std::string>::iterator it;

 	parse_text(text, parsed);
 	for (it = parsed.begin(); it != parsed.end(); it++)
-		add_substrings(*it, track_id);
+		add_substrings(*it, index);
 	return reassemble_text(parsed);
 }

--- a/include/core/filter.h
+++ b/include/core/filter.h
@ -9,31 +9,50 @@
 #include <string>

 /**
- * Namespace for searching the tag database.
+ * The filter layer is used to find a subset of songs based on an input
+ * string.  Since this layer does text processing, it also provides a
+ * functions for converting strings to lowercase.
+ *
+ * The text processing is mostly interested in alphanumeric characters, so
+ * any special characters included in the input text will be stripped out.
+ * Tabs, spaces and the following characters are used to delimit words:
+ *
+ * 	\/,;()_-~+"
 */
 namespace filter {

 	/**
-	 * Break a string into words and add each word to an index.
+	 * Convert the key to lowercase and break into individual words.
+	 * Generate substrings for each word and add each (substring, index)
+	 * pair to the Index.
 	 *
-	 * @param  text  The text to parse.
-	 * @param  id    An identifier paired with the text.
+	 * To generate substrings: iterate over the word starting from the
+	 * first character, and append a character for every iteration.  For
+	 * example, the word "goron" would contain the substrings:
+	 * 	{ g, go, gor, goro, goron }.
+	 *
+	 * @param  text   The text to parse.
+	 * @param  index  The track index to pair with the text.
 	 * @return The lowercase form of the input text.
 	 */
 	std::string add(const std::string &, unsigned int);

 	/**
-	 * Search the entire index for identifiers paired with the input text.
+	 * Break the input text into lowercase words and search the Index
+	 * for matches.  The results set should be filled out with the
+	 * intersection of the IndexEntry for each word.  If any word does
+	 * not appear in the index, then the result set should be empty.
 	 *
 	 * @param  text  The text to search for.
-	 * @param  res   The results set will be filled in with the ids found.
+	 * @param  res   The results set to fill in with matching indexes.
 	 */
 	void search(const std::string &, std::set<unsigned int> &);

 	/**
-	 * Returns the lowercase version of the input text.
+	 * Converts the input text to lowercase and returns the result.
 	 *
-	 * @param  text  The text to be converted into lowercase.
+	 * @param  text  The text to be converted.
+	 * @return The lowercase form of the input text.
 	 */
 	std::string lowercase(const std::string &);