diff --git a/Doxyfile b/Doxyfile index 0cdd4af..757b53f 100644 --- a/Doxyfile +++ b/Doxyfile @@ -943,7 +943,7 @@ WARN_LOGFILE = # spaces. See also FILE_PATTERNS and EXTENSION_MAPPING # Note: If this tag is empty the current directory is searched. -INPUT = ./lib/src ./lib/include ./docs/Architecture_documentation +INPUT = ./lib/src ./lib/include ./docs/Architecture_documentation ./search_engine # This tag can be used to specify the character encoding of the source files # that doxygen parses. Internally doxygen uses the UTF-8 encoding. Doxygen uses diff --git a/docs/html/____init_____8py.html b/docs/html/____init_____8py.html new file mode 100644 index 0000000..e31b163 --- /dev/null +++ b/docs/html/____init_____8py.html @@ -0,0 +1,117 @@ + + + + + + + +Search Engine: search_engine/__init__.py File Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
__init__.py File Reference
+
+
+ + + + + + +

+Namespaces

namespace  search_engine
 
namespace  search_engine.search_engine
 
+
+
+ + + + diff --git a/docs/html/__hello_8cpp.html b/docs/html/__hello_8cpp.html new file mode 100644 index 0000000..a48f281 --- /dev/null +++ b/docs/html/__hello_8cpp.html @@ -0,0 +1,141 @@ + + + + + + + +Search Engine: lib/src/_hello.cpp File Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
_hello.cpp File Reference
+
+
+
#include "Python.h"
+
+Include dependency graph for _hello.cpp:
+
+
+ + + + + +
+
+ + + +

+Macros

#define PY_SSIZE_T_CLEAN
 
+

Macro Definition Documentation

+ +

◆ PY_SSIZE_T_CLEAN

+ +
+
+ + + + +
#define PY_SSIZE_T_CLEAN
+
+ +
+
+
+
+ + + + diff --git a/docs/html/__hello_8cpp.js b/docs/html/__hello_8cpp.js new file mode 100644 index 0000000..45adff6 --- /dev/null +++ b/docs/html/__hello_8cpp.js @@ -0,0 +1,4 @@ +var __hello_8cpp = +[ + [ "PY_SSIZE_T_CLEAN", "__hello_8cpp.html#ac9efdaac9411d0868b715edccca3269d", null ] +]; \ No newline at end of file diff --git a/docs/html/__hello_8cpp__incl.map b/docs/html/__hello_8cpp__incl.map new file mode 100644 index 0000000..0a0a8f3 --- /dev/null +++ b/docs/html/__hello_8cpp__incl.map @@ -0,0 +1,5 @@ + + + + + diff --git a/docs/html/__hello_8cpp__incl.md5 b/docs/html/__hello_8cpp__incl.md5 new file mode 100644 index 0000000..1328584 --- /dev/null +++ b/docs/html/__hello_8cpp__incl.md5 @@ -0,0 +1 @@ +73d361af636423ef27b7b5fff7296cee \ No newline at end of file diff --git a/docs/html/__hello_8cpp__incl.png b/docs/html/__hello_8cpp__incl.png new file mode 100644 index 0000000..22f82ae Binary files /dev/null and b/docs/html/__hello_8cpp__incl.png differ diff --git a/docs/html/__inverted__index_8cpp.html b/docs/html/__inverted__index_8cpp.html new file mode 100644 index 0000000..ed60da2 --- /dev/null +++ b/docs/html/__inverted__index_8cpp.html @@ -0,0 +1,141 @@ + + + + + + + +Search Engine: lib/src/_inverted_index.cpp File Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
_inverted_index.cpp File Reference
+
+
+
#include "Python.h"
+
+Include dependency graph for _inverted_index.cpp:
+
+
+ + + + + +
+
+ + + +

+Macros

#define PY_SSIZE_T_CLEAN
 
+

Macro Definition Documentation

+ +

◆ PY_SSIZE_T_CLEAN

+ +
+
+ + + + +
#define PY_SSIZE_T_CLEAN
+
+ +
+
+
+
+ + + + diff --git a/docs/html/__inverted__index_8cpp.js b/docs/html/__inverted__index_8cpp.js new file mode 100644 index 0000000..339b2ab --- /dev/null +++ b/docs/html/__inverted__index_8cpp.js @@ -0,0 +1,4 @@ +var __inverted__index_8cpp = +[ + [ "PY_SSIZE_T_CLEAN", "__inverted__index_8cpp.html#ac9efdaac9411d0868b715edccca3269d", null ] +]; \ No newline at end of file diff --git a/docs/html/__inverted__index_8cpp__incl.map b/docs/html/__inverted__index_8cpp__incl.map new file mode 100644 index 0000000..c3b0f96 --- /dev/null +++ b/docs/html/__inverted__index_8cpp__incl.map @@ -0,0 +1,5 @@ + + + + + diff --git a/docs/html/__inverted__index_8cpp__incl.md5 b/docs/html/__inverted__index_8cpp__incl.md5 new file mode 100644 index 0000000..99ea575 --- /dev/null +++ b/docs/html/__inverted__index_8cpp__incl.md5 @@ -0,0 +1 @@ +8f7e2f457eed733b785ca14972ad3f23 \ No newline at end of file diff --git a/docs/html/__inverted__index_8cpp__incl.png b/docs/html/__inverted__index_8cpp__incl.png new file mode 100644 index 0000000..2b956a0 Binary files /dev/null and b/docs/html/__inverted__index_8cpp__incl.png differ diff --git a/docs/html/annotated.html b/docs/html/annotated.html index 825fe6d..c431381 100644 --- a/docs/html/annotated.html +++ b/docs/html/annotated.html @@ -95,12 +95,21 @@
Here are the classes, structs, unions and interfaces with brief descriptions:
-
[detail level 12]
+
[detail level 12345]
- + + + + + + + + + +
 Ninverted_index
 CdocsStructure that stores information about a document
 Npage_rank
 CGraphRepresents a directed graph used to compute the PageRank algorithm
 CHello
 Nsearch_engine
 Nsearch_engine
 Ncrawler
 CCrawler
 Nexceptions
 CUrlError
 Nhelper
 Nconverter
 CStringToIntConverter
 CHello
diff --git a/docs/html/annotated_dup.js b/docs/html/annotated_dup.js index 489c26d..671a80a 100644 --- a/docs/html/annotated_dup.js +++ b/docs/html/annotated_dup.js @@ -6,5 +6,20 @@ var annotated_dup = [ "page_rank", "namespacepage__rank.html", [ [ "Graph", "classpage__rank_1_1Graph.html", "classpage__rank_1_1Graph" ] ] ], + [ "search_engine", "namespacesearch__engine.html", [ + [ "search_engine", "namespacesearch__engine_1_1search__engine.html", [ + [ "crawler", "namespacesearch__engine_1_1search__engine_1_1crawler.html", [ + [ "Crawler", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler" ] + ] ], + [ "exceptions", "namespacesearch__engine_1_1search__engine_1_1exceptions.html", [ + [ "UrlError", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError" ] + ] ], + [ "helper", "namespacesearch__engine_1_1search__engine_1_1helper.html", [ + [ "converter", "namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html", [ + [ "StringToIntConverter", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter" ] + ] ] + ] ] + ] ] + ] ], [ "Hello", "classHello.html", "classHello" ] ]; \ No newline at end of file diff --git a/docs/html/classes.html b/docs/html/classes.html index 4d2210f..048eb68 100644 --- a/docs/html/classes.html +++ b/docs/html/classes.html @@ -94,17 +94,26 @@
Class Index
-
D | G | H
+
C | D | G | H | S | U
+
C
+
Crawler (search_engine.search_engine.crawler)
+
D
docs (inverted_index)
-
+
G
Graph (page_rank)
-
+
H
Hello
+
+
S
+
StringToIntConverter (search_engine.search_engine.helper.converter)
+
+
U
+
UrlError (search_engine.search_engine.exceptions)
diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler-members.html b/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler-members.html new file mode 100644 index 0000000..58cd129 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler-members.html @@ -0,0 +1,122 @@ + + + + + + + +Search Engine: Member List + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
search_engine.search_engine.crawler.Crawler Member List
+
+
+ +

This is the complete list of members for search_engine.search_engine.crawler.Crawler, including all inherited members.

+ + + + + + + + + + + + + + +
__init__(self, str url_base, str page_name, str initial_page, list[str] remove_pages=[], bool test_mode=False)search_engine.search_engine.crawler.Crawler
_get_links(self, str current_page)search_engine.search_engine.crawler.Crawlerprotected
_get_paragraphs(self, str current_page)search_engine.search_engine.crawler.Crawlerprotected
_validate_url(self, str url)search_engine.search_engine.crawler.Crawlerprotected
convertersearch_engine.search_engine.crawler.Crawler
graphsearch_engine.search_engine.crawler.Crawler
initial_pagesearch_engine.search_engine.crawler.Crawler
page_namesearch_engine.search_engine.crawler.Crawler
REGEXsearch_engine.search_engine.crawler.Crawlerstatic
remove_pagessearch_engine.search_engine.crawler.Crawler
run(self, limit=2)search_engine.search_engine.crawler.Crawler
test_modesearch_engine.search_engine.crawler.Crawler
url_basesearch_engine.search_engine.crawler.Crawler
+
+ + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html b/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html new file mode 100644 index 0000000..d5f2cec --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html @@ -0,0 +1,525 @@ + + + + + + + +Search Engine: search_engine.search_engine.crawler.Crawler Class Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine.crawler.Crawler Class Reference
+
+
+ + + + + + +

+Public Member Functions

 __init__ (self, str url_base, str page_name, str initial_page, list[str] remove_pages=[], bool test_mode=False)
 
 run (self, limit=2)
 
+ + + + + + + + + + + + + + + +

+Public Attributes

 url_base
 
 page_name
 
 initial_page
 
 remove_pages
 
 test_mode
 
 graph
 
 converter
 
+ + + +

+Static Public Attributes

 REGEX
 
+ + + + + + + +

+Protected Member Functions

list _get_links (self, str current_page)
 
list _get_paragraphs (self, str current_page)
 
 _validate_url (self, str url)
 
+

Detailed Description

+
A web crawler that traverses a network of web pages, extracts links and paragraphs,
+and constructs a graph using the PageRank algorithm.
+
+This crawler starts from a given base URL and an initial page, and follows links within
+the website to collect data such as links and paragraphs. It constructs a graph based on
+the relationships between pages.
+
+@param url_base: The base URL from which the crawler starts.
+@param page_name: The initial page to start crawling.
+@param remove_pages: A list of pages to exclude from the crawl. (Optional, default is [])
+
+Attributes
+----------
+graph : PyGraph
+    A graph representation used for PageRank calculations.
+
+Examples
+--------
+>>> crawler = Crawler('https://example.com', '/home')
+>>> links, paragraphs = crawler.run()
+

Constructor & Destructor Documentation

+ +

◆ __init__()

+ +
+
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
search_engine.search_engine.crawler.Crawler.__init__ ( self,
str url_base,
str page_name,
str initial_page,
list[str]  remove_pages = [],
bool  test_mode = False 
)
+
+
Initialize the Crawler with a base URL, the starting page, and optionally,
+a list of pages to exclude.
+
+@param url_base: The base URL of the website to crawl.
+@param page_name: The starting page to begin crawling.
+@param remove_pages: Pages to exclude from the crawl (optional).
+@param test_mode: Flag to activate the test mode for crawling. (default: False)
+
+
+
+

Member Function Documentation

+ +

◆ _get_links()

+ +
+
+ + + + + +
+ + + + + + + + + + + + + + + + + + +
list search_engine.search_engine.crawler.Crawler._get_links ( self,
str current_page 
)
+
+protected
+
+
Retrieve all links from the specified page.
+
+@param current_page: The current page to fetch links from.
+
+@return: A list of valid links found on the current page.
+
+@raises UrlError: If the current page URL is invalid or inaccessible.
+
+
+
+ +

◆ _get_paragraphs()

+ +
+
+ + + + + +
+ + + + + + + + + + + + + + + + + + +
list search_engine.search_engine.crawler.Crawler._get_paragraphs ( self,
str current_page 
)
+
+protected
+
+
Retrieve all paragraphs from the specified page.
+
+@param current_page: The current page to fetch paragraphs from.
+
+@return: A list of paragraphs' text found on the current page.
+
+
+
+ +

◆ _validate_url()

+ +
+
+ + + + + +
+ + + + + + + + + + + + + + + + + + +
search_engine.search_engine.crawler.Crawler._validate_url ( self,
str url 
)
+
+protected
+
+
Validate the format of the given URL.
+
+@param url: The URL to validate.
+
+@raises UrlError: If the URL is not valid.
+
+
+
+ +

◆ run()

+ +
+
+ + + + + + + + + + + + + + + + + + +
search_engine.search_engine.crawler.Crawler.run ( self,
 limit = 2 
)
+
+
Run the crawler to collect links and paragraphs starting from the base page.
+It uses a queue to traverse the links in a breadth-first manner.
+
+@param limit: The maximum number of pages to crawl in test mode.
+
+@return: A graph representation of the pages and their links.
+
+
+
+

Member Data Documentation

+ +

◆ converter

+ +
+
+ + + + +
search_engine.search_engine.crawler.Crawler.converter
+
+ +
+
+ +

◆ graph

+ +
+
+ + + + +
search_engine.search_engine.crawler.Crawler.graph
+
+ +
+
+ +

◆ initial_page

+ +
+
+ + + + +
search_engine.search_engine.crawler.Crawler.initial_page
+
+ +
+
+ +

◆ page_name

+ +
+
+ + + + +
search_engine.search_engine.crawler.Crawler.page_name
+
+ +
+
+ +

◆ REGEX

+ +
+
+ + + + + +
+ + + + +
search_engine.search_engine.crawler.Crawler.REGEX
+
+static
+
+Initial value:
= re.compile(
+
r'^(?:http|https)://' # http or https protocol
+
r'(?:\S+(?::\S*)?@)?' # optional authentication
+
r'(?:[a-zA-Z0-9-]+\.)+[a-zA-Z]{2,6}' # domain
+
r'(?::\d{2,5})?' # optional port
+
r'(?:/\S*)?$', # optional path
+
re.IGNORECASE
+
)
+
+
+
+ +

◆ remove_pages

+ +
+
+ + + + +
search_engine.search_engine.crawler.Crawler.remove_pages
+
+ +
+
+ +

◆ test_mode

+ +
+
+ + + + +
search_engine.search_engine.crawler.Crawler.test_mode
+
+ +
+
+ +

◆ url_base

+ +
+
+ + + + +
search_engine.search_engine.crawler.Crawler.url_base
+
+ +
+
+
The documentation for this class was generated from the following file: +
+
+ + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.js b/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.js new file mode 100644 index 0000000..1cc3f33 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.js @@ -0,0 +1,15 @@ +var classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler = +[ + [ "__init__", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a3749cceadf503febd19be1a13c9a0fe9", null ], + [ "_get_links", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ada91bdbc6ff449d14a4b3435189080f9", null ], + [ "_get_paragraphs", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ace884d52406cb35a990f172fe49a40d5", null ], + [ "_validate_url", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a1f219db9f6b0dcd8c7f5b12afc8a0574", null ], + [ "run", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aa4018e5dcd1bac621932a2f70ae0d990", null ], + [ "converter", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a066cf036bc6b4178858f790e0d2625e7", null ], + [ "graph", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aecc008b6c522f033489506a4bb21bc52", null ], + [ "initial_page", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a6e0bc960b9ee2c29b8b75c66a275f570", null ], + [ "page_name", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a2926e956cbfbf24d9c99a1c0e80fae5e", null ], + [ "remove_pages", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a0d917081e91fe9067c457e791efec341", null ], + [ "test_mode", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ab1db7f6a00564e301a65a3560b00450a", null ], + [ "url_base", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#af2b2d5e8f62ba5661b4c87e15a9bc67e", null ] +]; \ No newline at end of file diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError-members.html b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError-members.html new file mode 100644 index 0000000..f8e76a4 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError-members.html @@ -0,0 +1,111 @@ + + + + + + + +Search Engine: Member List + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
search_engine.search_engine.exceptions.UrlError Member List
+
+
+ +

This is the complete list of members for search_engine.search_engine.exceptions.UrlError, including all inherited members.

+ + + +
__init__(self, message="Invalid URL")search_engine.search_engine.exceptions.UrlError
messagesearch_engine.search_engine.exceptions.UrlError
+
+ + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html new file mode 100644 index 0000000..139bc92 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html @@ -0,0 +1,210 @@ + + + + + + + +Search Engine: search_engine.search_engine.exceptions.UrlError Class Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine.exceptions.UrlError Class Reference
+
+
+
+Inheritance diagram for search_engine.search_engine.exceptions.UrlError:
+
+
Inheritance graph
+ + + + + +
[legend]
+
+Collaboration diagram for search_engine.search_engine.exceptions.UrlError:
+
+
Collaboration graph
+ + + + + +
[legend]
+ + + + +

+Public Member Functions

 __init__ (self, message="Invalid URL")
 
+ + + +

+Public Attributes

 message
 
+

Detailed Description

+
Exception raised when an invalid URL is provided.
+
+Inherits from the built-in `ValueError` class.
+
+Attributes
+----------
+message : str
+    The error message that describes the cause of the exception.
+    Defaults to "Invalid URL".
+
+Methods
+-------
+__init__(self, message: str = "Invalid URL")
+    Initializes the exception with a custom message or a default message.
+

Constructor & Destructor Documentation

+ +

◆ __init__()

+ +
+
+ + + + + + + + + + + + + + + + + + +
search_engine.search_engine.exceptions.UrlError.__init__ ( self,
 message = "Invalid URL" 
)
+
+
Initializes the UrlError exception with a custom error message.
+
+Parameters
+----------
+message : str, optional
+    The error message to describe the exception. Default is "Invalid URL".
+
+
+
+

Member Data Documentation

+ +

◆ message

+ +
+
+ + + + +
search_engine.search_engine.exceptions.UrlError.message
+
+ +
+
+
The documentation for this class was generated from the following file: +
+
+ + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.js b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.js new file mode 100644 index 0000000..d4b4711 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.js @@ -0,0 +1,5 @@ +var classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError = +[ + [ "__init__", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#aafc565a27959d46203642a601d5468da", null ], + [ "message", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#a40e2fd59c669daada4d42c4c76cee5cb", null ] +]; \ No newline at end of file diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.map b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.map new file mode 100644 index 0000000..551bf54 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.map @@ -0,0 +1,5 @@ + + + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.md5 b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.md5 new file mode 100644 index 0000000..1874dd4 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.md5 @@ -0,0 +1 @@ +39b10afe3a109ed2d5071d6bc683ccc4 \ No newline at end of file diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.png b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.png new file mode 100644 index 0000000..eb66f5f Binary files /dev/null and b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.png differ diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.map b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.map new file mode 100644 index 0000000..551bf54 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.map @@ -0,0 +1,5 @@ + + + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.md5 b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.md5 new file mode 100644 index 0000000..1874dd4 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.md5 @@ -0,0 +1 @@ +39b10afe3a109ed2d5071d6bc683ccc4 \ No newline at end of file diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.png b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.png new file mode 100644 index 0000000..eb66f5f Binary files /dev/null and b/docs/html/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.png differ diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter-members.html b/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter-members.html new file mode 100644 index 0000000..c8c2f73 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter-members.html @@ -0,0 +1,113 @@ + + + + + + + +Search Engine: Member List + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
search_engine.search_engine.helper.converter.StringToIntConverter Member List
+
+
+ +

This is the complete list of members for search_engine.search_engine.helper.converter.StringToIntConverter, including all inherited members.

+ + + + + +
__init__(self)search_engine.search_engine.helper.converter.StringToIntConverter
convert(self, str word)search_engine.search_engine.helper.converter.StringToIntConverter
next_intsearch_engine.search_engine.helper.converter.StringToIntConverter
string_to_intsearch_engine.search_engine.helper.converter.StringToIntConverter
+
+ + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html b/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html new file mode 100644 index 0000000..d4bb9f3 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html @@ -0,0 +1,246 @@ + + + + + + + +Search Engine: search_engine.search_engine.helper.converter.StringToIntConverter Class Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine.helper.converter.StringToIntConverter Class Reference
+
+
+ + + + + + +

+Public Member Functions

 __init__ (self)
 
int convert (self, str word)
 
+ + + + + +

+Public Attributes

 string_to_int
 
 next_int
 
+

Detailed Description

+
A class that converts strings to integers. If a string has already been converted,
+it returns the previously assigned integer. Otherwise, it assigns a new integer
+to the string and returns it.
+
+Attributes
+----------
+string_to_int : dict
+    A dictionary mapping strings to their corresponding integers.
+next_int : int
+    The next integer to be assigned to a string.
+
+Methods
+-------
+__init__()
+    Initializes the converter with an empty dictionary and sets the next integer to 0.
+convert(word: str) -> int
+    Converts a given string to an integer. If the string has been seen before,
+    it returns the corresponding integer, otherwise it assigns a new integer to the string.
+

Constructor & Destructor Documentation

+ +

◆ __init__()

+ +
+
+ + + + + + + + +
search_engine.search_engine.helper.converter.StringToIntConverter.__init__ ( self)
+
+
Initializes the StringToIntConverter with an empty dictionary and sets the next integer
+to 0 for string-to-integer mapping.
+
+Attributes
+----------
+string_to_int : dict
+    An empty dictionary to store the mapping of strings to integers.
+next_int : int
+    Initialized to 0, it represents the next available integer to be assigned to a string.
+
+
+
+

Member Function Documentation

+ +

◆ convert()

+ +
+
+ + + + + + + + + + + + + + + + + + +
int search_engine.search_engine.helper.converter.StringToIntConverter.convert ( self,
str word 
)
+
+
Convert a string to an integer. If the string has already been seen,
+return its corresponding integer. Otherwise, assign a new integer to it.
+
+Parameters
+----------
+word : str
+    The string to be converted.
+
+Returns
+-------
+int
+    The integer corresponding to the string.
+
+
+
+

Member Data Documentation

+ +

◆ next_int

+ +
+
+ + + + +
search_engine.search_engine.helper.converter.StringToIntConverter.next_int
+
+ +
+
+ +

◆ string_to_int

+ +
+
+ + + + +
search_engine.search_engine.helper.converter.StringToIntConverter.string_to_int
+
+ +
+
+
The documentation for this class was generated from the following file: +
+
+ + + + diff --git a/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.js b/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.js new file mode 100644 index 0000000..5aa11f9 --- /dev/null +++ b/docs/html/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.js @@ -0,0 +1,7 @@ +var classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter = +[ + [ "__init__", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a2d3bad61678c8f6cf075256b6fb411c7", null ], + [ "convert", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a562ba6756f1cc804678075a02d28eb9f", null ], + [ "next_int", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#af796cd59c12eba4822eb8f8b6bcfed8b", null ], + [ "string_to_int", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a583c2162f4a2a2c6bff496b034e30675", null ] +]; \ No newline at end of file diff --git a/docs/html/converter_8py.html b/docs/html/converter_8py.html new file mode 100644 index 0000000..3e9e641 --- /dev/null +++ b/docs/html/converter_8py.html @@ -0,0 +1,127 @@ + + + + + + + +Search Engine: search_engine/helper/converter.py File Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
converter.py File Reference
+
+
+ + + + +

+Classes

class  search_engine.search_engine.helper.converter.StringToIntConverter
 
+ + + + + + + + + +

+Namespaces

namespace  search_engine
 
namespace  search_engine.search_engine
 
namespace  search_engine.search_engine.helper
 
namespace  search_engine.search_engine.helper.converter
 
+
+
+ + + + diff --git a/docs/html/converter_8py.js b/docs/html/converter_8py.js new file mode 100644 index 0000000..fe2ad36 --- /dev/null +++ b/docs/html/converter_8py.js @@ -0,0 +1,4 @@ +var converter_8py = +[ + [ "search_engine.search_engine.helper.converter.StringToIntConverter", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter" ] +]; \ No newline at end of file diff --git a/docs/html/crawler_8py.html b/docs/html/crawler_8py.html new file mode 100644 index 0000000..aba6413 --- /dev/null +++ b/docs/html/crawler_8py.html @@ -0,0 +1,125 @@ + + + + + + + +Search Engine: search_engine/crawler.py File Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
crawler.py File Reference
+
+
+ + + + +

+Classes

class  search_engine.search_engine.crawler.Crawler
 
+ + + + + + + +

+Namespaces

namespace  search_engine
 
namespace  search_engine.search_engine
 
namespace  search_engine.search_engine.crawler
 
+
+
+ + + + diff --git a/docs/html/crawler_8py.js b/docs/html/crawler_8py.js new file mode 100644 index 0000000..6d5627c --- /dev/null +++ b/docs/html/crawler_8py.js @@ -0,0 +1,4 @@ +var crawler_8py = +[ + [ "search_engine.search_engine.crawler.Crawler", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler" ] +]; \ No newline at end of file diff --git a/docs/html/dir_000006_000003.html b/docs/html/dir_000006_000003.html new file mode 100644 index 0000000..7d842f7 --- /dev/null +++ b/docs/html/dir_000006_000003.html @@ -0,0 +1,104 @@ + + + + + + + +Search Engine: lib/src -> include Relation + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+

src → include Relation

File in lib/srcIncludes file in lib/include
hello.cpphello.h
inverted_index.cppinverted_index.h
page_rank.cpppage_rank.h
subtraction.cppsubtraction.h
sum.cppsum.h
+
+ + + + diff --git a/docs/html/dir_3077535539cd151b75f9ad358f5d25ba.html b/docs/html/dir_3077535539cd151b75f9ad358f5d25ba.html new file mode 100644 index 0000000..e4e664a --- /dev/null +++ b/docs/html/dir_3077535539cd151b75f9ad358f5d25ba.html @@ -0,0 +1,122 @@ + + + + + + + +Search Engine: search_engine Directory Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
search_engine Directory Reference
+
+
+ + + + +

+Directories

 helper
 
+ + + + + + + +

+Files

 __init__.py
 
 crawler.py
 
 exceptions.py
 
+
+
+ + + + diff --git a/docs/html/dir_3077535539cd151b75f9ad358f5d25ba.js b/docs/html/dir_3077535539cd151b75f9ad358f5d25ba.js new file mode 100644 index 0000000..17a4413 --- /dev/null +++ b/docs/html/dir_3077535539cd151b75f9ad358f5d25ba.js @@ -0,0 +1,7 @@ +var dir_3077535539cd151b75f9ad358f5d25ba = +[ + [ "helper", "dir_a288a6e2e3e1e96db5e8d1e18942be87.html", "dir_a288a6e2e3e1e96db5e8d1e18942be87" ], + [ "__init__.py", "____init_____8py.html", null ], + [ "crawler.py", "crawler_8py.html", "crawler_8py" ], + [ "exceptions.py", "exceptions_8py.html", "exceptions_8py" ] +]; \ No newline at end of file diff --git a/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9.html b/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9.html index 266e6d8..ee3b435 100644 --- a/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9.html +++ b/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9.html @@ -101,8 +101,8 @@ - - + + diff --git a/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.map b/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.map index 179003b..2b7f8a3 100644 --- a/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.map +++ b/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.map @@ -1,7 +1,7 @@ - - + + diff --git a/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 b/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 index 4c3c9fa..50162c4 100644 --- a/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 +++ b/docs/html/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 @@ -1 +1 @@ -bad757f7dc4a7d7c23e3997687d02419 \ No newline at end of file +36f81bcb7d6cafce558a22dbbf92d35d \ No newline at end of file diff --git a/docs/html/dir_a065c5f60305fee3569f887679366939.html b/docs/html/dir_a065c5f60305fee3569f887679366939.html index 74ba807..e1a541d 100644 --- a/docs/html/dir_a065c5f60305fee3569f887679366939.html +++ b/docs/html/dir_a065c5f60305fee3569f887679366939.html @@ -101,14 +101,18 @@ - - + + + + + + diff --git a/docs/html/dir_a065c5f60305fee3569f887679366939.js b/docs/html/dir_a065c5f60305fee3569f887679366939.js index 81bccf1..7d6993a 100644 --- a/docs/html/dir_a065c5f60305fee3569f887679366939.js +++ b/docs/html/dir_a065c5f60305fee3569f887679366939.js @@ -1,5 +1,7 @@ var dir_a065c5f60305fee3569f887679366939 = [ + [ "_hello.cpp", "__hello_8cpp.html", "__hello_8cpp" ], + [ "_inverted_index.cpp", "__inverted__index_8cpp.html", "__inverted__index_8cpp" ], [ "_page_rank.cpp", "__page__rank_8cpp.html", "__page__rank_8cpp" ], [ "hello.cpp", "hello_8cpp.html", null ], [ "inverted_index.cpp", "inverted__index_8cpp.html", null ], diff --git a/docs/html/dir_a065c5f60305fee3569f887679366939_dep.map b/docs/html/dir_a065c5f60305fee3569f887679366939_dep.map index 2e9e346..6a528f1 100644 --- a/docs/html/dir_a065c5f60305fee3569f887679366939_dep.map +++ b/docs/html/dir_a065c5f60305fee3569f887679366939_dep.map @@ -1,7 +1,7 @@ - - + + diff --git a/docs/html/dir_a065c5f60305fee3569f887679366939_dep.md5 b/docs/html/dir_a065c5f60305fee3569f887679366939_dep.md5 index e0c7f1c..7f93305 100644 --- a/docs/html/dir_a065c5f60305fee3569f887679366939_dep.md5 +++ b/docs/html/dir_a065c5f60305fee3569f887679366939_dep.md5 @@ -1 +1 @@ -584dd3f299555fc9d2e667b519e7dbe6 \ No newline at end of file +c9e11af2475bd2b65447242ba16929d0 \ No newline at end of file diff --git a/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87.html b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87.html new file mode 100644 index 0000000..4e10a65 --- /dev/null +++ b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87.html @@ -0,0 +1,124 @@ + + + + + + + +Search Engine: search_engine/helper Directory Reference + + + + + + + + + + + + + + + +
+
+

Files

 _hello.cpp
 
 _inverted_index.cpp
 
 _page_rank.cpp
 
 hello.cpp
+ + + + + +
+
Search Engine +
+
+ + + + + + + + + +
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
helper Directory Reference
+
+
+
+Directory dependency graph for helper:
+
+
search_engine/helper
+ + + + +
+ + + + + + +

+Files

 __init__.py
 
 converter.py
 
+
+
+ + + + diff --git a/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87.js b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87.js new file mode 100644 index 0000000..9317969 --- /dev/null +++ b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87.js @@ -0,0 +1,5 @@ +var dir_a288a6e2e3e1e96db5e8d1e18942be87 = +[ + [ "__init__.py", "helper_2____init_____8py.html", null ], + [ "converter.py", "converter_8py.html", "converter_8py" ] +]; \ No newline at end of file diff --git a/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.map b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.map new file mode 100644 index 0000000..f736f69 --- /dev/null +++ b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.map @@ -0,0 +1,4 @@ + + + + diff --git a/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.md5 b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.md5 new file mode 100644 index 0000000..63a0fc9 --- /dev/null +++ b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.md5 @@ -0,0 +1 @@ +e49a2cf62d6d8871cd3f8432ea3bc52a \ No newline at end of file diff --git a/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.png b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.png new file mode 100644 index 0000000..b70c464 Binary files /dev/null and b/docs/html/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.png differ diff --git a/docs/html/exceptions_8py.html b/docs/html/exceptions_8py.html new file mode 100644 index 0000000..c352b8d --- /dev/null +++ b/docs/html/exceptions_8py.html @@ -0,0 +1,125 @@ + + + + + + + +Search Engine: search_engine/exceptions.py File Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
exceptions.py File Reference
+
+
+ + + + +

+Classes

class  search_engine.search_engine.exceptions.UrlError
 
+ + + + + + + +

+Namespaces

namespace  search_engine
 
namespace  search_engine.search_engine
 
namespace  search_engine.search_engine.exceptions
 
+
+
+ + + + diff --git a/docs/html/exceptions_8py.js b/docs/html/exceptions_8py.js new file mode 100644 index 0000000..fc97e98 --- /dev/null +++ b/docs/html/exceptions_8py.js @@ -0,0 +1,4 @@ +var exceptions_8py = +[ + [ "search_engine.search_engine.exceptions.UrlError", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError" ] +]; \ No newline at end of file diff --git a/docs/html/files.html b/docs/html/files.html index dd456c4..4e7b754 100644 --- a/docs/html/files.html +++ b/docs/html/files.html @@ -106,12 +106,21 @@  subtraction.h  sum.h   src - _page_rank.cpp - hello.cpp - inverted_index.cpp - page_rank.cpp - subtraction.cpp - sum.cpp + _hello.cpp + _inverted_index.cpp + _page_rank.cpp + hello.cpp + inverted_index.cpp + page_rank.cpp + subtraction.cpp + sum.cpp +  search_engine +  helper + __init__.py + converter.py + __init__.py + crawler.py + exceptions.py diff --git a/docs/html/files_dup.js b/docs/html/files_dup.js index e4b5c41..f638b3c 100644 --- a/docs/html/files_dup.js +++ b/docs/html/files_dup.js @@ -1,5 +1,6 @@ var files_dup = [ [ "docs", "dir_49e56c817e5e54854c35e136979f97ca.html", "dir_49e56c817e5e54854c35e136979f97ca" ], - [ "lib", "dir_97aefd0d527b934f1d99a682da8fe6a9.html", "dir_97aefd0d527b934f1d99a682da8fe6a9" ] + [ "lib", "dir_97aefd0d527b934f1d99a682da8fe6a9.html", "dir_97aefd0d527b934f1d99a682da8fe6a9" ], + [ "search_engine", "dir_3077535539cd151b75f9ad358f5d25ba.html", "dir_3077535539cd151b75f9ad358f5d25ba" ] ]; \ No newline at end of file diff --git a/docs/html/functions.html b/docs/html/functions.html index d34bcd4..8df1906 100644 --- a/docs/html/functions.html +++ b/docs/html/functions.html @@ -91,21 +91,100 @@
-
Here is a list of all class members with links to the classes they belong to:
diff --git a/docs/html/functions_func.html b/docs/html/functions_func.html index 6f1586d..9b75b0c 100644 --- a/docs/html/functions_func.html +++ b/docs/html/functions_func.html @@ -92,8 +92,13 @@
Here is a list of all functions with links to the classes they belong to:
diff --git a/docs/html/functions_vars.html b/docs/html/functions_vars.html index f2b19de..ef16ca6 100644 --- a/docs/html/functions_vars.html +++ b/docs/html/functions_vars.html @@ -92,9 +92,20 @@
Here is a list of all variables with links to the classes they belong to:
diff --git a/docs/html/globals.html b/docs/html/globals.html index 585b49f..7c2eedc 100644 --- a/docs/html/globals.html +++ b/docs/html/globals.html @@ -93,7 +93,7 @@
Here is a list of all file members with links to the files they belong to:
diff --git a/docs/html/globals_defs.html b/docs/html/globals_defs.html index 7c58063..4313d8b 100644 --- a/docs/html/globals_defs.html +++ b/docs/html/globals_defs.html @@ -93,7 +93,7 @@
Here is a list of all macros with links to the files they belong to:
diff --git a/docs/html/helper_2____init_____8py.html b/docs/html/helper_2____init_____8py.html new file mode 100644 index 0000000..53c544f --- /dev/null +++ b/docs/html/helper_2____init_____8py.html @@ -0,0 +1,107 @@ + + + + + + + +Search Engine: search_engine/helper/__init__.py File Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
__init__.py File Reference
+
+
+
+
+ + + + diff --git a/docs/html/hierarchy.html b/docs/html/hierarchy.html new file mode 100644 index 0000000..aafe747 --- /dev/null +++ b/docs/html/hierarchy.html @@ -0,0 +1,119 @@ + + + + + + + +Search Engine: Class Hierarchy + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
Class Hierarchy
+
+
+
+

Go to the graphical class hierarchy

+This inheritance list is sorted roughly, but not completely, alphabetically:
+
[detail level 12]
+ + + + + + + +
 Csearch_engine.search_engine.crawler.Crawler
 Cinverted_index::docsStructure that stores information about a document
 Cpage_rank::GraphRepresents a directed graph used to compute the PageRank algorithm
 CHello
 Csearch_engine.search_engine.helper.converter.StringToIntConverter
 CValueError
 Csearch_engine.search_engine.exceptions.UrlError
+
+
+
+ + + + diff --git a/docs/html/hierarchy.js b/docs/html/hierarchy.js new file mode 100644 index 0000000..2b69fc1 --- /dev/null +++ b/docs/html/hierarchy.js @@ -0,0 +1,11 @@ +var hierarchy = +[ + [ "search_engine.search_engine.crawler.Crawler", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html", null ], + [ "inverted_index::docs", "structinverted__index_1_1docs.html", null ], + [ "page_rank::Graph", "classpage__rank_1_1Graph.html", null ], + [ "Hello", "classHello.html", null ], + [ "search_engine.search_engine.helper.converter.StringToIntConverter", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html", null ], + [ "ValueError", null, [ + [ "search_engine.search_engine.exceptions.UrlError", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html", null ] + ] ] +]; \ No newline at end of file diff --git a/docs/html/inherit_graph_0.map b/docs/html/inherit_graph_0.map new file mode 100644 index 0000000..2a82e85 --- /dev/null +++ b/docs/html/inherit_graph_0.map @@ -0,0 +1,3 @@ + + + diff --git a/docs/html/inherit_graph_0.md5 b/docs/html/inherit_graph_0.md5 new file mode 100644 index 0000000..4251112 --- /dev/null +++ b/docs/html/inherit_graph_0.md5 @@ -0,0 +1 @@ +e109474ed8a558adbae1d751c5ee6a0b \ No newline at end of file diff --git a/docs/html/inherit_graph_0.png b/docs/html/inherit_graph_0.png new file mode 100644 index 0000000..91fc672 Binary files /dev/null and b/docs/html/inherit_graph_0.png differ diff --git a/docs/html/inherit_graph_1.map b/docs/html/inherit_graph_1.map new file mode 100644 index 0000000..03c8e35 --- /dev/null +++ b/docs/html/inherit_graph_1.map @@ -0,0 +1,3 @@ + + + diff --git a/docs/html/inherit_graph_1.md5 b/docs/html/inherit_graph_1.md5 new file mode 100644 index 0000000..9008860 --- /dev/null +++ b/docs/html/inherit_graph_1.md5 @@ -0,0 +1 @@ +dee35dcb140f7a0d91140d2364fceab1 \ No newline at end of file diff --git a/docs/html/inherit_graph_1.png b/docs/html/inherit_graph_1.png new file mode 100644 index 0000000..ed63176 Binary files /dev/null and b/docs/html/inherit_graph_1.png differ diff --git a/docs/html/inherit_graph_2.map b/docs/html/inherit_graph_2.map new file mode 100644 index 0000000..4cc182e --- /dev/null +++ b/docs/html/inherit_graph_2.map @@ -0,0 +1,3 @@ + + + diff --git a/docs/html/inherit_graph_2.md5 b/docs/html/inherit_graph_2.md5 new file mode 100644 index 0000000..80ed6d6 --- /dev/null +++ b/docs/html/inherit_graph_2.md5 @@ -0,0 +1 @@ +048793f918c9f3695dd4bd2651ff7b92 \ No newline at end of file diff --git a/docs/html/inherit_graph_2.png b/docs/html/inherit_graph_2.png new file mode 100644 index 0000000..60129cb Binary files /dev/null and b/docs/html/inherit_graph_2.png differ diff --git a/docs/html/inherit_graph_3.map b/docs/html/inherit_graph_3.map new file mode 100644 index 0000000..e688dcb --- /dev/null +++ b/docs/html/inherit_graph_3.map @@ -0,0 +1,3 @@ + + + diff --git a/docs/html/inherit_graph_3.md5 b/docs/html/inherit_graph_3.md5 new file mode 100644 index 0000000..4d40a3a --- /dev/null +++ b/docs/html/inherit_graph_3.md5 @@ -0,0 +1 @@ +1d3b22495fb4c78ec54d27519f73a414 \ No newline at end of file diff --git a/docs/html/inherit_graph_3.png b/docs/html/inherit_graph_3.png new file mode 100644 index 0000000..0c6082e Binary files /dev/null and b/docs/html/inherit_graph_3.png differ diff --git a/docs/html/inherit_graph_4.map b/docs/html/inherit_graph_4.map new file mode 100644 index 0000000..7ed9a29 --- /dev/null +++ b/docs/html/inherit_graph_4.map @@ -0,0 +1,3 @@ + + + diff --git a/docs/html/inherit_graph_4.md5 b/docs/html/inherit_graph_4.md5 new file mode 100644 index 0000000..bd10f09 --- /dev/null +++ b/docs/html/inherit_graph_4.md5 @@ -0,0 +1 @@ +2b3649379905a6a09344d83f8de59ddb \ No newline at end of file diff --git a/docs/html/inherit_graph_4.png b/docs/html/inherit_graph_4.png new file mode 100644 index 0000000..953da25 Binary files /dev/null and b/docs/html/inherit_graph_4.png differ diff --git a/docs/html/inherit_graph_5.map b/docs/html/inherit_graph_5.map new file mode 100644 index 0000000..2c584ba --- /dev/null +++ b/docs/html/inherit_graph_5.map @@ -0,0 +1,5 @@ + + + + + diff --git a/docs/html/inherit_graph_5.md5 b/docs/html/inherit_graph_5.md5 new file mode 100644 index 0000000..59f6b67 --- /dev/null +++ b/docs/html/inherit_graph_5.md5 @@ -0,0 +1 @@ +3bf9addd485db522f8f5f416124eaa6d \ No newline at end of file diff --git a/docs/html/inherit_graph_5.png b/docs/html/inherit_graph_5.png new file mode 100644 index 0000000..11792f6 Binary files /dev/null and b/docs/html/inherit_graph_5.png differ diff --git a/docs/html/inherits.html b/docs/html/inherits.html new file mode 100644 index 0000000..7362c00 --- /dev/null +++ b/docs/html/inherits.html @@ -0,0 +1,142 @@ + + + + + + + +Search Engine: Class Hierarchy + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+
Class Hierarchy
+
+
+ + + + + + + +
+ + + +
+ + + +
+ + + +
+ + + +
+ + + +
+ + + + + +
+
+
+ + + + diff --git a/docs/html/menudata.js b/docs/html/menudata.js index cd9c973..9b91329 100644 --- a/docs/html/menudata.js +++ b/docs/html/menudata.js @@ -34,8 +34,25 @@ var menudata={children:[ {text:"Classes",url:"annotated.html",children:[ {text:"Class List",url:"annotated.html"}, {text:"Class Index",url:"classes.html"}, +{text:"Class Hierarchy",url:"inherits.html"}, {text:"Class Members",url:"functions.html",children:[ -{text:"All",url:"functions.html"}, +{text:"All",url:"functions.html",children:[ +{text:"_",url:"functions.html#index__5F"}, +{text:"a",url:"functions.html#index_a"}, +{text:"c",url:"functions.html#index_c"}, +{text:"f",url:"functions.html#index_f"}, +{text:"g",url:"functions.html#index_g"}, +{text:"h",url:"functions.html#index_h"}, +{text:"i",url:"functions.html#index_i"}, +{text:"l",url:"functions.html#index_l"}, +{text:"m",url:"functions.html#index_m"}, +{text:"n",url:"functions.html#index_n"}, +{text:"o",url:"functions.html#index_o"}, +{text:"p",url:"functions.html#index_p"}, +{text:"r",url:"functions.html#index_r"}, +{text:"s",url:"functions.html#index_s"}, +{text:"t",url:"functions.html#index_t"}, +{text:"u",url:"functions.html#index_u"}]}, {text:"Functions",url:"functions_func.html"}, {text:"Variables",url:"functions_vars.html"}, {text:"Related Symbols",url:"functions_rela.html"}]}]}, diff --git a/docs/html/namespaces.html b/docs/html/namespaces.html index 58e5165..065fc72 100644 --- a/docs/html/namespaces.html +++ b/docs/html/namespaces.html @@ -95,11 +95,20 @@
Here is a list of all namespaces with brief descriptions:
-
[detail level 12]
+
[detail level 12345]
+ + + + + + + + +
 Ninverted_index
 CdocsStructure that stores information about a document
 Npage_rank
 CGraphRepresents a directed graph used to compute the PageRank algorithm
 Nsearch_engine
 Nsearch_engine
 Ncrawler
 CCrawler
 Nexceptions
 CUrlError
 Nhelper
 Nconverter
 CStringToIntConverter
diff --git a/docs/html/namespaces_dup.js b/docs/html/namespaces_dup.js index f4db024..6b5f820 100644 --- a/docs/html/namespaces_dup.js +++ b/docs/html/namespaces_dup.js @@ -1,5 +1,6 @@ var namespaces_dup = [ [ "inverted_index", "namespaceinverted__index.html", "namespaceinverted__index" ], - [ "page_rank", "namespacepage__rank.html", "namespacepage__rank" ] + [ "page_rank", "namespacepage__rank.html", "namespacepage__rank" ], + [ "search_engine", "namespacesearch__engine.html", "namespacesearch__engine" ] ]; \ No newline at end of file diff --git a/docs/html/namespacesearch__engine.html b/docs/html/namespacesearch__engine.html new file mode 100644 index 0000000..fc98ece --- /dev/null +++ b/docs/html/namespacesearch__engine.html @@ -0,0 +1,115 @@ + + + + + + + +Search Engine: search_engine Namespace Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine Namespace Reference
+
+
+ + + + +

+Namespaces

namespace  search_engine
 
+
+
+ + + + diff --git a/docs/html/namespacesearch__engine.js b/docs/html/namespacesearch__engine.js new file mode 100644 index 0000000..dc3fd7c --- /dev/null +++ b/docs/html/namespacesearch__engine.js @@ -0,0 +1,4 @@ +var namespacesearch__engine = +[ + [ "search_engine", "namespacesearch__engine_1_1search__engine.html", "namespacesearch__engine_1_1search__engine" ] +]; \ No newline at end of file diff --git a/docs/html/namespacesearch__engine_1_1search__engine.html b/docs/html/namespacesearch__engine_1_1search__engine.html new file mode 100644 index 0000000..b1a549d --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine.html @@ -0,0 +1,119 @@ + + + + + + + +Search Engine: search_engine.search_engine Namespace Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine Namespace Reference
+
+
+ + + + + + + + +

+Namespaces

namespace  crawler
 
namespace  exceptions
 
namespace  helper
 
+
+
+ + + + diff --git a/docs/html/namespacesearch__engine_1_1search__engine.js b/docs/html/namespacesearch__engine_1_1search__engine.js new file mode 100644 index 0000000..10cef7d --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine.js @@ -0,0 +1,6 @@ +var namespacesearch__engine_1_1search__engine = +[ + [ "crawler", "namespacesearch__engine_1_1search__engine_1_1crawler.html", "namespacesearch__engine_1_1search__engine_1_1crawler" ], + [ "exceptions", "namespacesearch__engine_1_1search__engine_1_1exceptions.html", "namespacesearch__engine_1_1search__engine_1_1exceptions" ], + [ "helper", "namespacesearch__engine_1_1search__engine_1_1helper.html", "namespacesearch__engine_1_1search__engine_1_1helper" ] +]; \ No newline at end of file diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1crawler.html b/docs/html/namespacesearch__engine_1_1search__engine_1_1crawler.html new file mode 100644 index 0000000..e1d720e --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1crawler.html @@ -0,0 +1,115 @@ + + + + + + + +Search Engine: search_engine.search_engine.crawler Namespace Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine.crawler Namespace Reference
+
+
+ + + + +

+Classes

class  Crawler
 
+
+
+ + + + diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1crawler.js b/docs/html/namespacesearch__engine_1_1search__engine_1_1crawler.js new file mode 100644 index 0000000..055ab8e --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1crawler.js @@ -0,0 +1,4 @@ +var namespacesearch__engine_1_1search__engine_1_1crawler = +[ + [ "Crawler", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html", "classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler" ] +]; \ No newline at end of file diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1exceptions.html b/docs/html/namespacesearch__engine_1_1search__engine_1_1exceptions.html new file mode 100644 index 0000000..b88b5d9 --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1exceptions.html @@ -0,0 +1,115 @@ + + + + + + + +Search Engine: search_engine.search_engine.exceptions Namespace Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine.exceptions Namespace Reference
+
+
+ + + + +

+Classes

class  UrlError
 
+
+
+ + + + diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1exceptions.js b/docs/html/namespacesearch__engine_1_1search__engine_1_1exceptions.js new file mode 100644 index 0000000..b9b7c6a --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1exceptions.js @@ -0,0 +1,4 @@ +var namespacesearch__engine_1_1search__engine_1_1exceptions = +[ + [ "UrlError", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html", "classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError" ] +]; \ No newline at end of file diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1helper.html b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper.html new file mode 100644 index 0000000..dabe6b6 --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper.html @@ -0,0 +1,115 @@ + + + + + + + +Search Engine: search_engine.search_engine.helper Namespace Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine.helper Namespace Reference
+
+
+ + + + +

+Namespaces

namespace  converter
 
+
+
+ + + + diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1helper.js b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper.js new file mode 100644 index 0000000..50ece7b --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper.js @@ -0,0 +1,4 @@ +var namespacesearch__engine_1_1search__engine_1_1helper = +[ + [ "converter", "namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html", "namespacesearch__engine_1_1search__engine_1_1helper_1_1converter" ] +]; \ No newline at end of file diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html new file mode 100644 index 0000000..e4b6789 --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html @@ -0,0 +1,115 @@ + + + + + + + +Search Engine: search_engine.search_engine.helper.converter Namespace Reference + + + + + + + + + + + + + + + +
+
+ + + + + + +
+
Search Engine +
+
+
+ + + + + + + +
+
+ +
+
+
+ +
+ +
+
+ + +
+
+
+
+
+
Loading...
+
Searching...
+
No Matches
+
+
+
+
+ +
+ +
search_engine.search_engine.helper.converter Namespace Reference
+
+
+ + + + +

+Classes

class  StringToIntConverter
 
+
+
+ + + + diff --git a/docs/html/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.js b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.js new file mode 100644 index 0000000..8e08405 --- /dev/null +++ b/docs/html/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.js @@ -0,0 +1,4 @@ +var namespacesearch__engine_1_1search__engine_1_1helper_1_1converter = +[ + [ "StringToIntConverter", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html", "classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter" ] +]; \ No newline at end of file diff --git a/docs/html/navtreedata.js b/docs/html/navtreedata.js index 11339c9..7d1514c 100644 --- a/docs/html/navtreedata.js +++ b/docs/html/navtreedata.js @@ -87,6 +87,7 @@ var NAVTREE = [ "Classes", "annotated.html", [ [ "Class List", "annotated.html", "annotated_dup" ], [ "Class Index", "classes.html", null ], + [ "Class Hierarchy", "hierarchy.html", "hierarchy" ], [ "Class Members", "functions.html", [ [ "All", "functions.html", null ], [ "Functions", "functions_func.html", null ], diff --git a/docs/html/navtreeindex0.js b/docs/html/navtreeindex0.js index eb45fe3..a82d603 100644 --- a/docs/html/navtreeindex0.js +++ b/docs/html/navtreeindex0.js @@ -41,41 +41,95 @@ var NAVTREEINDEX0 = "Chap_11_Technical_risks.html#Chap_11_2_Technical_debt":[0,12,1], "Chap_12_Glossary.html":[0,13], "Chap_12_Glossary.html#References":[0,13,0], -"__page__rank_8cpp.html":[3,0,1,1,0], -"__page__rank_8cpp.html#ac9efdaac9411d0868b715edccca3269d":[3,0,1,1,0,0], +"____init_____8py.html":[3,0,2,1], +"__hello_8cpp.html":[3,0,1,1,0], +"__hello_8cpp.html#ac9efdaac9411d0868b715edccca3269d":[3,0,1,1,0,0], +"__inverted__index_8cpp.html":[3,0,1,1,1], +"__inverted__index_8cpp.html#ac9efdaac9411d0868b715edccca3269d":[3,0,1,1,1,0], +"__page__rank_8cpp.html":[3,0,1,1,2], +"__page__rank_8cpp.html#ac9efdaac9411d0868b715edccca3269d":[3,0,1,1,2,0], "annotated.html":[2,0], -"classHello.html":[2,0,2], -"classHello.html#a935f8ae8833c9cac314fce1a87907a08":[2,0,2,1], -"classHello.html#aaa8dc2cd664f8a83b9119a06b2f2790c":[2,0,2,0], +"classHello.html":[2,0,3], +"classHello.html#a935f8ae8833c9cac314fce1a87907a08":[2,0,3,1], +"classHello.html#aaa8dc2cd664f8a83b9119a06b2f2790c":[2,0,3,0], "classes.html":[2,1], -"classpage__rank_1_1Graph.html":[1,0,1,0], "classpage__rank_1_1Graph.html":[2,0,1,0], -"classpage__rank_1_1Graph.html#a4902e8e101899f05c2b1920c0b5ea9c0":[1,0,1,0,3], +"classpage__rank_1_1Graph.html":[1,0,1,0], "classpage__rank_1_1Graph.html#a4902e8e101899f05c2b1920c0b5ea9c0":[2,0,1,0,3], -"classpage__rank_1_1Graph.html#a740d64110326e1e6bf09351b37440460":[1,0,1,0,1], +"classpage__rank_1_1Graph.html#a4902e8e101899f05c2b1920c0b5ea9c0":[1,0,1,0,3], "classpage__rank_1_1Graph.html#a740d64110326e1e6bf09351b37440460":[2,0,1,0,1], +"classpage__rank_1_1Graph.html#a740d64110326e1e6bf09351b37440460":[1,0,1,0,1], "classpage__rank_1_1Graph.html#a83683b548468555d24ddfc58c268bab0":[1,0,1,0,0], "classpage__rank_1_1Graph.html#a83683b548468555d24ddfc58c268bab0":[2,0,1,0,0], -"classpage__rank_1_1Graph.html#ae87e6a531c87ecf28d4bd8739f69b61a":[2,0,1,0,2], "classpage__rank_1_1Graph.html#ae87e6a531c87ecf28d4bd8739f69b61a":[1,0,1,0,2], +"classpage__rank_1_1Graph.html#ae87e6a531c87ecf28d4bd8739f69b61a":[2,0,1,0,2], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html":[2,0,2,0,0,0], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html":[1,0,2,0,0,0], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a066cf036bc6b4178858f790e0d2625e7":[1,0,2,0,0,0,5], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a066cf036bc6b4178858f790e0d2625e7":[2,0,2,0,0,0,5], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a0d917081e91fe9067c457e791efec341":[2,0,2,0,0,0,9], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a0d917081e91fe9067c457e791efec341":[1,0,2,0,0,0,9], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a1f219db9f6b0dcd8c7f5b12afc8a0574":[2,0,2,0,0,0,3], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a1f219db9f6b0dcd8c7f5b12afc8a0574":[1,0,2,0,0,0,3], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a2926e956cbfbf24d9c99a1c0e80fae5e":[2,0,2,0,0,0,8], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a2926e956cbfbf24d9c99a1c0e80fae5e":[1,0,2,0,0,0,8], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a3749cceadf503febd19be1a13c9a0fe9":[1,0,2,0,0,0,0], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a3749cceadf503febd19be1a13c9a0fe9":[2,0,2,0,0,0,0], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a6e0bc960b9ee2c29b8b75c66a275f570":[2,0,2,0,0,0,7], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a6e0bc960b9ee2c29b8b75c66a275f570":[1,0,2,0,0,0,7], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aa4018e5dcd1bac621932a2f70ae0d990":[2,0,2,0,0,0,4], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aa4018e5dcd1bac621932a2f70ae0d990":[1,0,2,0,0,0,4], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ab1db7f6a00564e301a65a3560b00450a":[2,0,2,0,0,0,10], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ab1db7f6a00564e301a65a3560b00450a":[1,0,2,0,0,0,10], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ace884d52406cb35a990f172fe49a40d5":[2,0,2,0,0,0,2], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ace884d52406cb35a990f172fe49a40d5":[1,0,2,0,0,0,2], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ada91bdbc6ff449d14a4b3435189080f9":[2,0,2,0,0,0,1], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ada91bdbc6ff449d14a4b3435189080f9":[1,0,2,0,0,0,1], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aecc008b6c522f033489506a4bb21bc52":[1,0,2,0,0,0,6], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aecc008b6c522f033489506a4bb21bc52":[2,0,2,0,0,0,6], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#af2b2d5e8f62ba5661b4c87e15a9bc67e":[2,0,2,0,0,0,11], +"classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#af2b2d5e8f62ba5661b4c87e15a9bc67e":[1,0,2,0,0,0,11], +"classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html":[2,0,2,0,1,0], +"classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html":[1,0,2,0,1,0], +"classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#a40e2fd59c669daada4d42c4c76cee5cb":[1,0,2,0,1,0,1], +"classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#a40e2fd59c669daada4d42c4c76cee5cb":[2,0,2,0,1,0,1], +"classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#aafc565a27959d46203642a601d5468da":[2,0,2,0,1,0,0], +"classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#aafc565a27959d46203642a601d5468da":[1,0,2,0,1,0,0], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html":[1,0,2,0,2,0,0], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html":[2,0,2,0,2,0,0], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a2d3bad61678c8f6cf075256b6fb411c7":[1,0,2,0,2,0,0,0], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a2d3bad61678c8f6cf075256b6fb411c7":[2,0,2,0,2,0,0,0], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a562ba6756f1cc804678075a02d28eb9f":[1,0,2,0,2,0,0,1], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a562ba6756f1cc804678075a02d28eb9f":[2,0,2,0,2,0,0,1], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a583c2162f4a2a2c6bff496b034e30675":[1,0,2,0,2,0,0,3], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a583c2162f4a2a2c6bff496b034e30675":[2,0,2,0,2,0,0,3], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#af796cd59c12eba4822eb8f8b6bcfed8b":[1,0,2,0,2,0,0,2], +"classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#af796cd59c12eba4822eb8f8b6bcfed8b":[2,0,2,0,2,0,0,2], +"converter_8py.html":[3,0,2,0,1], +"crawler_8py.html":[3,0,2,2], +"dir_3077535539cd151b75f9ad358f5d25ba.html":[3,0,2], "dir_49e56c817e5e54854c35e136979f97ca.html":[3,0,0], "dir_5a30104352ef4255dc24354b02eb2d20.html":[3,0,1,0], "dir_6d7ee3ff6458c72ecda1e3d04d8690bc.html":[3,0,0,0], "dir_97aefd0d527b934f1d99a682da8fe6a9.html":[3,0,1], "dir_a065c5f60305fee3569f887679366939.html":[3,0,1,1], +"dir_a288a6e2e3e1e96db5e8d1e18942be87.html":[3,0,2,0], +"exceptions_8py.html":[3,0,2,3], "files.html":[3,0], -"functions.html":[2,2,0], -"functions_func.html":[2,2,1], -"functions_rela.html":[2,2,3], -"functions_vars.html":[2,2,2], +"functions.html":[2,3,0], +"functions_func.html":[2,3,1], +"functions_rela.html":[2,3,3], +"functions_vars.html":[2,3,2], "globals.html":[3,1,0], "globals_defs.html":[3,1,2], "globals_func.html":[3,1,1], -"hello_8cpp.html":[3,0,1,1,1], +"hello_8cpp.html":[3,0,1,1,3], "hello_8h.html":[3,0,1,0,0], "hello_8h_source.html":[3,0,1,0,0], +"helper_2____init_____8py.html":[3,0,2,0,0], +"hierarchy.html":[2,2], "index.html":[], -"inverted__index_8cpp.html":[3,0,1,1,2], +"inverted__index_8cpp.html":[3,0,1,1,4], "inverted__index_8h.html":[3,0,1,0,1], "inverted__index_8h.html#a12560c3b47a4f48755b32ad63cd8ccd1":[3,0,1,0,1,4], "inverted__index_8h.html#a13797fc328d8f34927c3f7368966ac48":[3,0,1,0,1,2], @@ -109,7 +163,13 @@ var NAVTREEINDEX0 = "namespacemembers_type.html":[1,1,2], "namespacepage__rank.html":[1,0,1], "namespaces.html":[1,0], -"page__rank_8cpp.html":[3,0,1,1,3], +"namespacesearch__engine.html":[1,0,2], +"namespacesearch__engine_1_1search__engine.html":[1,0,2,0], +"namespacesearch__engine_1_1search__engine_1_1crawler.html":[1,0,2,0,0], +"namespacesearch__engine_1_1search__engine_1_1exceptions.html":[1,0,2,0,1], +"namespacesearch__engine_1_1search__engine_1_1helper.html":[1,0,2,0,2], +"namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html":[1,0,2,0,2,0], +"page__rank_8cpp.html":[3,0,1,1,5], "page__rank_8h.html":[3,0,1,0,2], "page__rank_8h_source.html":[3,0,1,0,2], "pages.html":[], @@ -119,23 +179,23 @@ var NAVTREEINDEX0 = "structinverted__index_1_1docs.html#a0dee7a56613409b307976525f002f100":[1,0,0,0,6], "structinverted__index_1_1docs.html#a217103c61707d6e219fdac64eb4022c8":[2,0,0,0,5], "structinverted__index_1_1docs.html#a217103c61707d6e219fdac64eb4022c8":[1,0,0,0,5], -"structinverted__index_1_1docs.html#a8c50490f2708078748f15edd7628f721":[1,0,0,0,0], "structinverted__index_1_1docs.html#a8c50490f2708078748f15edd7628f721":[2,0,0,0,0], -"structinverted__index_1_1docs.html#abd578731f060f11c422137f2909d103b":[2,0,0,0,2], +"structinverted__index_1_1docs.html#a8c50490f2708078748f15edd7628f721":[1,0,0,0,0], "structinverted__index_1_1docs.html#abd578731f060f11c422137f2909d103b":[1,0,0,0,2], +"structinverted__index_1_1docs.html#abd578731f060f11c422137f2909d103b":[2,0,0,0,2], "structinverted__index_1_1docs.html#ad3f6c536dffb2b1a43e386b97ab8603d":[1,0,0,0,3], "structinverted__index_1_1docs.html#ad3f6c536dffb2b1a43e386b97ab8603d":[2,0,0,0,3], -"structinverted__index_1_1docs.html#ad40a502bb97dced4cd8c7634958df2f5":[2,0,0,0,4], "structinverted__index_1_1docs.html#ad40a502bb97dced4cd8c7634958df2f5":[1,0,0,0,4], -"structinverted__index_1_1docs.html#ae1cb30b20b66fae23666b68d45972ec6":[2,0,0,0,1], +"structinverted__index_1_1docs.html#ad40a502bb97dced4cd8c7634958df2f5":[2,0,0,0,4], "structinverted__index_1_1docs.html#ae1cb30b20b66fae23666b68d45972ec6":[1,0,0,0,1], -"subtraction_8cpp.html":[3,0,1,1,4], -"subtraction_8cpp.html#a5620e8715eb9f46a17fdd22f9485f2b0":[3,0,1,1,4,0], +"structinverted__index_1_1docs.html#ae1cb30b20b66fae23666b68d45972ec6":[2,0,0,0,1], +"subtraction_8cpp.html":[3,0,1,1,6], +"subtraction_8cpp.html#a5620e8715eb9f46a17fdd22f9485f2b0":[3,0,1,1,6,0], "subtraction_8h.html":[3,0,1,0,3], "subtraction_8h.html#a5620e8715eb9f46a17fdd22f9485f2b0":[3,0,1,0,3,0], "subtraction_8h_source.html":[3,0,1,0,3], -"sum_8cpp.html":[3,0,1,1,5], -"sum_8cpp.html#aed1f1c5da982a62827227c3c45b5fccb":[3,0,1,1,5,0], +"sum_8cpp.html":[3,0,1,1,7], +"sum_8cpp.html#aed1f1c5da982a62827227c3c45b5fccb":[3,0,1,1,7,0], "sum_8h.html":[3,0,1,0,4], "sum_8h.html#aed1f1c5da982a62827227c3c45b5fccb":[3,0,1,0,4,0], "sum_8h_source.html":[3,0,1,0,4] diff --git a/docs/html/search/all_11.js b/docs/html/search/all_11.js index 24d9e6c..4ba282b 100644 --- a/docs/html/search/all_11.js +++ b/docs/html/search/all_11.js @@ -3,6 +3,6 @@ var searchData= ['get_5fadjlist_0',['get_adjList',['../classpage__rank_1_1Graph.html#ae87e6a531c87ecf28d4bd8739f69b61a',1,'page_rank::Graph']]], ['glossary_1',['12 Glossary',['../Chap_12_Glossary.html',1,'Chap_00_Architecture_documentation']]], ['goals_2',['1.3 Quality goals',['../Chap_01_Introduction.html#Chap_01_03_Quality_goals',1,'']]], - ['graph_3',['Graph',['../classpage__rank_1_1Graph.html',1,'page_rank']]], + ['graph_3',['graph',['../classpage__rank_1_1Graph.html',1,'page_rank::Graph'],['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aecc008b6c522f033489506a4bb21bc52',1,'search_engine.search_engine.crawler.Crawler.graph']]], ['greet_4',['greet',['../classHello.html#a935f8ae8833c9cac314fce1a87907a08',1,'Hello']]] ]; diff --git a/docs/html/search/all_13.js b/docs/html/search/all_13.js index cfebe54..e9b2fa1 100644 --- a/docs/html/search/all_13.js +++ b/docs/html/search/all_13.js @@ -1,9 +1,10 @@ var searchData= [ - ['interface_0',['interface',['../Chap_08_Concepts.html#Chap_08_02_User_interface',1,'8.2 User Interface'],['../Chap_05_Building_block_view.html#Chap_05_01_01_02',1,'Interface']]], - ['internationalization_1',['8.6 Internationalization',['../Chap_08_Concepts.html#Chap_08_06_Internationalization',1,'']]], - ['introduction_2',['1 Introduction',['../Chap_01_Introduction.html',1,'Chap_00_Architecture_documentation']]], - ['inverted_5findex_3',['inverted_index',['../namespaceinverted__index.html',1,'']]], - ['inverted_5findex_2ecpp_4',['inverted_index.cpp',['../inverted__index_8cpp.html',1,'']]], - ['inverted_5findex_2eh_5',['inverted_index.h',['../inverted__index_8h.html',1,'']]] + ['initial_5fpage_0',['initial_page',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a6e0bc960b9ee2c29b8b75c66a275f570',1,'search_engine::search_engine::crawler::Crawler']]], + ['interface_1',['interface',['../Chap_08_Concepts.html#Chap_08_02_User_interface',1,'8.2 User Interface'],['../Chap_05_Building_block_view.html#Chap_05_01_01_02',1,'Interface']]], + ['internationalization_2',['8.6 Internationalization',['../Chap_08_Concepts.html#Chap_08_06_Internationalization',1,'']]], + ['introduction_3',['1 Introduction',['../Chap_01_Introduction.html',1,'Chap_00_Architecture_documentation']]], + ['inverted_5findex_4',['inverted_index',['../namespaceinverted__index.html',1,'']]], + ['inverted_5findex_2ecpp_5',['inverted_index.cpp',['../inverted__index_8cpp.html',1,'']]], + ['inverted_5findex_2eh_6',['inverted_index.h',['../inverted__index_8h.html',1,'']]] ]; diff --git a/docs/html/search/all_15.js b/docs/html/search/all_15.js index 6f56155..01a03a9 100644 --- a/docs/html/search/all_15.js +++ b/docs/html/search/all_15.js @@ -1,4 +1,5 @@ var searchData= [ - ['map_5fstr_5fdocs_0',['map_str_docs',['../namespaceinverted__index.html#a12560c3b47a4f48755b32ad63cd8ccd1',1,'inverted_index']]] + ['map_5fstr_5fdocs_0',['map_str_docs',['../namespaceinverted__index.html#a12560c3b47a4f48755b32ad63cd8ccd1',1,'inverted_index']]], + ['message_1',['message',['../classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#a40e2fd59c669daada4d42c4c76cee5cb',1,'search_engine::search_engine::exceptions::UrlError']]] ]; diff --git a/docs/html/search/all_16.js b/docs/html/search/all_16.js index 7efaa42..a3999f7 100644 --- a/docs/html/search/all_16.js +++ b/docs/html/search/all_16.js @@ -1,4 +1,5 @@ var searchData= [ - ['name_5fdoc_0',['name_doc',['../structinverted__index_1_1docs.html#a0dee7a56613409b307976525f002f100',1,'inverted_index::docs']]] + ['name_5fdoc_0',['name_doc',['../structinverted__index_1_1docs.html#a0dee7a56613409b307976525f002f100',1,'inverted_index::docs']]], + ['next_5fint_1',['next_int',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#af796cd59c12eba4822eb8f8b6bcfed8b',1,'search_engine::search_engine::helper::converter::StringToIntConverter']]] ]; diff --git a/docs/html/search/all_18.js b/docs/html/search/all_18.js index 41064fe..db69099 100644 --- a/docs/html/search/all_18.js +++ b/docs/html/search/all_18.js @@ -1,9 +1,10 @@ var searchData= [ - ['page_5frank_0',['page_rank',['../namespacepage__rank.html',1,'']]], - ['page_5frank_2ecpp_1',['page_rank.cpp',['../page__rank_8cpp.html',1,'']]], - ['page_5frank_2eh_2',['page_rank.h',['../page__rank_8h.html',1,'']]], - ['persistency_3',['8.1 Persistency',['../Chap_08_Concepts.html#Chap_08_01_Persistency',1,'']]], - ['print_4',['print',['../classpage__rank_1_1Graph.html#a4902e8e101899f05c2b1920c0b5ea9c0',1,'page_rank::Graph']]], - ['py_5fssize_5ft_5fclean_5',['PY_SSIZE_T_CLEAN',['../__page__rank_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'_page_rank.cpp']]] + ['page_5fname_0',['page_name',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a2926e956cbfbf24d9c99a1c0e80fae5e',1,'search_engine::search_engine::crawler::Crawler']]], + ['page_5frank_1',['page_rank',['../namespacepage__rank.html',1,'']]], + ['page_5frank_2ecpp_2',['page_rank.cpp',['../page__rank_8cpp.html',1,'']]], + ['page_5frank_2eh_3',['page_rank.h',['../page__rank_8h.html',1,'']]], + ['persistency_4',['8.1 Persistency',['../Chap_08_Concepts.html#Chap_08_01_Persistency',1,'']]], + ['print_5',['print',['../classpage__rank_1_1Graph.html#a4902e8e101899f05c2b1920c0b5ea9c0',1,'page_rank::Graph']]], + ['py_5fssize_5ft_5fclean_6',['py_ssize_t_clean',['../__hello_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'PY_SSIZE_T_CLEAN: _hello.cpp'],['../__inverted__index_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'PY_SSIZE_T_CLEAN: _inverted_index.cpp'],['../__page__rank_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'PY_SSIZE_T_CLEAN: _page_rank.cpp']]] ]; diff --git a/docs/html/search/all_1a.js b/docs/html/search/all_1a.js index 4d3de4b..9392c57 100644 --- a/docs/html/search/all_1a.js +++ b/docs/html/search/all_1a.js @@ -2,9 +2,12 @@ var searchData= [ ['reasons_20for_20decomposition_0',['Reasons for decomposition',['../Chap_05_Building_block_view.html#Chap_05_01_01_04',1,'']]], ['references_1',['1.2 References',['../Chap_01_Introduction.html#Chap_01_02_References',1,'']]], - ['requirements_20overview_2',['1.1 Requirements Overview',['../Chap_01_Introduction.html#Chap_01_01_Requirements_Overview',1,'']]], - ['responsibility_3',['Responsibility',['../Chap_05_Building_block_view.html#Chap_05_01_01_01',1,'']]], - ['reusability_4',['8.7 Reusability',['../Chap_08_Concepts.html#Chap_08_07_Reusability',1,'']]], - ['risks_5',['risks',['../Chap_11_Technical_risks.html',1,'11 Technical risks'],['../Chap_11_Technical_risks.html#Chap_11_1_Technical_risks',1,'11.1 Technical risks']]], - ['runtime_20view_6',['6 Runtime View',['../Chap_06_Runtime_View.html',1,'Chap_00_Architecture_documentation']]] + ['regex_2',['REGEX',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a9b7fdc122b15d78d9967e0a6a567cf9f',1,'search_engine::search_engine::crawler::Crawler']]], + ['remove_5fpages_3',['remove_pages',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a0d917081e91fe9067c457e791efec341',1,'search_engine::search_engine::crawler::Crawler']]], + ['requirements_20overview_4',['1.1 Requirements Overview',['../Chap_01_Introduction.html#Chap_01_01_Requirements_Overview',1,'']]], + ['responsibility_5',['Responsibility',['../Chap_05_Building_block_view.html#Chap_05_01_01_01',1,'']]], + ['reusability_6',['8.7 Reusability',['../Chap_08_Concepts.html#Chap_08_07_Reusability',1,'']]], + ['risks_7',['risks',['../Chap_11_Technical_risks.html',1,'11 Technical risks'],['../Chap_11_Technical_risks.html#Chap_11_1_Technical_risks',1,'11.1 Technical risks']]], + ['run_8',['run',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aa4018e5dcd1bac621932a2f70ae0d990',1,'search_engine::search_engine::crawler::Crawler']]], + ['runtime_20view_9',['6 Runtime View',['../Chap_06_Runtime_View.html',1,'Chap_00_Architecture_documentation']]] ]; diff --git a/docs/html/search/all_1b.js b/docs/html/search/all_1b.js index 3addd4b..e446c49 100644 --- a/docs/html/search/all_1b.js +++ b/docs/html/search/all_1b.js @@ -2,18 +2,26 @@ var searchData= [ ['scenarios_0',['10 Quality scenarios',['../Chap_10_Quality_scenarios.html',1,'Chap_00_Architecture_documentation']]], ['scope_20and_20context_1',['3 System Scope and Context',['../Chap_03_System_scope_and_context.html',1,'Chap_00_Architecture_documentation']]], - ['set_5fdocs_2',['set_docs',['../namespaceinverted__index.html#a173ab89b0eb7a4b54b7b6f7239edc51d',1,'inverted_index']]], - ['shrink_5fstring_3',['shrink_string',['../namespaceinverted__index.html#ac0c99343822e08b34bb0f874759b1c56',1,'inverted_index']]], - ['solution_20strategy_4',['4 Solution strategy',['../Chap_04_Solution_strategy.html',1,'Chap_00_Architecture_documentation']]], - ['split_5',['split',['../namespaceinverted__index.html#a35a9f1cb5d6ae865560f7eabb3def5c9',1,'inverted_index']]], - ['stakeholders_6',['1.4 Stakeholders',['../Chap_01_Introduction.html#Chap_01_04_Stakeholders',1,'']]], - ['str_7',['str',['../namespaceinverted__index.html#a7a967eb8fcbea5b66739ec4d4f05be39',1,'inverted_index']]], - ['strategy_8',['4 Solution strategy',['../Chap_04_Solution_strategy.html',1,'Chap_00_Architecture_documentation']]], - ['subtraction_9',['subtraction',['../subtraction_8h.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp'],['../subtraction_8cpp.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp']]], - ['subtraction_2ecpp_10',['subtraction.cpp',['../subtraction_8cpp.html',1,'']]], - ['subtraction_2eh_11',['subtraction.h',['../subtraction_8h.html',1,'']]], - ['sum_12',['sum',['../sum_8cpp.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp'],['../sum_8h.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp']]], - ['sum_2ecpp_13',['sum.cpp',['../sum_8cpp.html',1,'']]], - ['sum_2eh_14',['sum.h',['../sum_8h.html',1,'']]], - ['system_20scope_20and_20context_15',['3 System Scope and Context',['../Chap_03_System_scope_and_context.html',1,'Chap_00_Architecture_documentation']]] + ['search_5fengine_2',['search_engine',['../namespacesearch__engine.html',1,'']]], + ['search_5fengine_3a_3asearch_5fengine_3',['search_engine',['../namespacesearch__engine_1_1search__engine.html',1,'search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3acrawler_4',['crawler',['../namespacesearch__engine_1_1search__engine_1_1crawler.html',1,'search_engine::search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3aexceptions_5',['exceptions',['../namespacesearch__engine_1_1search__engine_1_1exceptions.html',1,'search_engine::search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3ahelper_6',['helper',['../namespacesearch__engine_1_1search__engine_1_1helper.html',1,'search_engine::search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3ahelper_3a_3aconverter_7',['converter',['../namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html',1,'search_engine::search_engine::helper']]], + ['set_5fdocs_8',['set_docs',['../namespaceinverted__index.html#a173ab89b0eb7a4b54b7b6f7239edc51d',1,'inverted_index']]], + ['shrink_5fstring_9',['shrink_string',['../namespaceinverted__index.html#ac0c99343822e08b34bb0f874759b1c56',1,'inverted_index']]], + ['solution_20strategy_10',['4 Solution strategy',['../Chap_04_Solution_strategy.html',1,'Chap_00_Architecture_documentation']]], + ['split_11',['split',['../namespaceinverted__index.html#a35a9f1cb5d6ae865560f7eabb3def5c9',1,'inverted_index']]], + ['stakeholders_12',['1.4 Stakeholders',['../Chap_01_Introduction.html#Chap_01_04_Stakeholders',1,'']]], + ['str_13',['str',['../namespaceinverted__index.html#a7a967eb8fcbea5b66739ec4d4f05be39',1,'inverted_index']]], + ['strategy_14',['4 Solution strategy',['../Chap_04_Solution_strategy.html',1,'Chap_00_Architecture_documentation']]], + ['string_5fto_5fint_15',['string_to_int',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a583c2162f4a2a2c6bff496b034e30675',1,'search_engine::search_engine::helper::converter::StringToIntConverter']]], + ['stringtointconverter_16',['StringToIntConverter',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html',1,'search_engine::search_engine::helper::converter']]], + ['subtraction_17',['subtraction',['../subtraction_8cpp.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp'],['../subtraction_8h.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp']]], + ['subtraction_2ecpp_18',['subtraction.cpp',['../subtraction_8cpp.html',1,'']]], + ['subtraction_2eh_19',['subtraction.h',['../subtraction_8h.html',1,'']]], + ['sum_20',['sum',['../sum_8cpp.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp'],['../sum_8h.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp']]], + ['sum_2ecpp_21',['sum.cpp',['../sum_8cpp.html',1,'']]], + ['sum_2eh_22',['sum.h',['../sum_8h.html',1,'']]], + ['system_20scope_20and_20context_23',['3 System Scope and Context',['../Chap_03_System_scope_and_context.html',1,'Chap_00_Architecture_documentation']]] ]; diff --git a/docs/html/search/all_1c.js b/docs/html/search/all_1c.js index 21099a6..995c892 100644 --- a/docs/html/search/all_1c.js +++ b/docs/html/search/all_1c.js @@ -6,7 +6,8 @@ var searchData= ['technical_20debt_3',['11.2 Technical debt',['../Chap_11_Technical_risks.html#Chap_11_2_Technical_debt',1,'']]], ['technical_20risks_4',['technical risks',['../Chap_11_Technical_risks.html',1,'11 Technical risks'],['../Chap_11_Technical_risks.html#Chap_11_1_Technical_risks',1,'11.1 Technical risks']]], ['template_20disclosure_5',['Template disclosure',['../Chap_00_Architecture_documentation.html#Template_disclosure',1,'']]], - ['testability_6',['8.8 Testability',['../Chap_08_Concepts.html#Chap_08_08_Testability',1,'']]], - ['to_5flowercase_7',['to_lowercase',['../namespaceinverted__index.html#a2caf9e19f6557b6fce93e8a555e55ae4',1,'inverted_index']]], - ['tracing_8',['8.4 Logging, tracing',['../Chap_08_Concepts.html#Chap_08_04_Logging_tracing',1,'']]] + ['test_5fmode_6',['test_mode',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ab1db7f6a00564e301a65a3560b00450a',1,'search_engine::search_engine::crawler::Crawler']]], + ['testability_7',['8.8 Testability',['../Chap_08_Concepts.html#Chap_08_08_Testability',1,'']]], + ['to_5flowercase_8',['to_lowercase',['../namespaceinverted__index.html#a2caf9e19f6557b6fce93e8a555e55ae4',1,'inverted_index']]], + ['tracing_9',['8.4 Logging, tracing',['../Chap_08_Concepts.html#Chap_08_04_Logging_tracing',1,'']]] ]; diff --git a/docs/html/search/all_1d.js b/docs/html/search/all_1d.js index c8dae73..7b0b87b 100644 --- a/docs/html/search/all_1d.js +++ b/docs/html/search/all_1d.js @@ -1,4 +1,6 @@ var searchData= [ - ['user_20interface_0',['8.2 User Interface',['../Chap_08_Concepts.html#Chap_08_02_User_interface',1,'']]] + ['url_5fbase_0',['url_base',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#af2b2d5e8f62ba5661b4c87e15a9bc67e',1,'search_engine::search_engine::crawler::Crawler']]], + ['urlerror_1',['UrlError',['../classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html',1,'search_engine::search_engine::exceptions']]], + ['user_20interface_2',['8.2 User Interface',['../Chap_08_Concepts.html#Chap_08_02_User_interface',1,'']]] ]; diff --git a/docs/html/search/all_a.js b/docs/html/search/all_a.js index 5d75d08..882a463 100644 --- a/docs/html/search/all_a.js +++ b/docs/html/search/all_a.js @@ -1,4 +1,11 @@ var searchData= [ - ['_5fpage_5frank_2ecpp_0',['_page_rank.cpp',['../__page__rank_8cpp.html',1,'']]] + ['_5f_5finit_5f_5f_0',['__init__',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a3749cceadf503febd19be1a13c9a0fe9',1,'search_engine.search_engine.crawler.Crawler.__init__()'],['../classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#aafc565a27959d46203642a601d5468da',1,'search_engine.search_engine.exceptions.UrlError.__init__()'],['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a2d3bad61678c8f6cf075256b6fb411c7',1,'search_engine.search_engine.helper.converter.StringToIntConverter.__init__()']]], + ['_5f_5finit_5f_5f_2epy_1',['__init__.py',['../____init_____8py.html',1,'(Global Namespace)'],['../helper_2____init_____8py.html',1,'(Global Namespace)']]], + ['_5fget_5flinks_2',['_get_links',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ada91bdbc6ff449d14a4b3435189080f9',1,'search_engine::search_engine::crawler::Crawler']]], + ['_5fget_5fparagraphs_3',['_get_paragraphs',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ace884d52406cb35a990f172fe49a40d5',1,'search_engine::search_engine::crawler::Crawler']]], + ['_5fhello_2ecpp_4',['_hello.cpp',['../__hello_8cpp.html',1,'']]], + ['_5finverted_5findex_2ecpp_5',['_inverted_index.cpp',['../__inverted__index_8cpp.html',1,'']]], + ['_5fpage_5frank_2ecpp_6',['_page_rank.cpp',['../__page__rank_8cpp.html',1,'']]], + ['_5fvalidate_5furl_7',['_validate_url',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a1f219db9f6b0dcd8c7f5b12afc8a0574',1,'search_engine::search_engine::crawler::Crawler']]] ]; diff --git a/docs/html/search/all_d.js b/docs/html/search/all_d.js index 8497997..f5dd40c 100644 --- a/docs/html/search/all_d.js +++ b/docs/html/search/all_d.js @@ -6,5 +6,10 @@ var searchData= ['constraints_3',['constraints',['../Chap_02_Architectural_constraints.html',1,'2 Architectural Constraints'],['../Chap_02_Architectural_constraints.html#Chap_02_01_Technical_constraints',1,'2.1 Technical constraints'],['../Chap_02_Architectural_constraints.html#Chap_02_02_Organisational_constraints',1,'2.2 Organisational constraints']]], ['contents_4',['Table of contents',['../Chap_00_Architecture_documentation.html#Table_of_contents',1,'']]], ['context_5',['context',['../Chap_03_System_scope_and_context.html',1,'3 System Scope and Context'],['../Chap_03_System_scope_and_context.html#Chap_03_01_Business_context',1,'3.1 Business context'],['../Chap_03_System_scope_and_context.html#Chap_03_02_Technical_context',1,'3.2 Technical context']]], - ['conventions_6',['2.3 Conventions',['../Chap_02_Architectural_constraints.html#Chap_02_03_Conventions',1,'']]] + ['conventions_6',['2.3 Conventions',['../Chap_02_Architectural_constraints.html#Chap_02_03_Conventions',1,'']]], + ['convert_7',['convert',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a562ba6756f1cc804678075a02d28eb9f',1,'search_engine::search_engine::helper::converter::StringToIntConverter']]], + ['converter_8',['converter',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a066cf036bc6b4178858f790e0d2625e7',1,'search_engine::search_engine::crawler::Crawler']]], + ['converter_2epy_9',['converter.py',['../converter_8py.html',1,'']]], + ['crawler_10',['Crawler',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html',1,'search_engine::search_engine::crawler']]], + ['crawler_2epy_11',['crawler.py',['../crawler_8py.html',1,'']]] ]; diff --git a/docs/html/search/all_f.js b/docs/html/search/all_f.js index 1b52c31..9004fea 100644 --- a/docs/html/search/all_f.js +++ b/docs/html/search/all_f.js @@ -1,5 +1,6 @@ var searchData= [ ['error_20handling_0',['8.3 Exception/Error Handling',['../Chap_08_Concepts.html#Chap_08_03_Exception_and_error_handling',1,'']]], - ['exception_20error_20handling_1',['8.3 Exception/Error Handling',['../Chap_08_Concepts.html#Chap_08_03_Exception_and_error_handling',1,'']]] + ['exception_20error_20handling_1',['8.3 Exception/Error Handling',['../Chap_08_Concepts.html#Chap_08_03_Exception_and_error_handling',1,'']]], + ['exceptions_2epy_2',['exceptions.py',['../exceptions_8py.html',1,'']]] ]; diff --git a/docs/html/search/classes_0.js b/docs/html/search/classes_0.js index b5a5840..065671d 100644 --- a/docs/html/search/classes_0.js +++ b/docs/html/search/classes_0.js @@ -1,4 +1,4 @@ var searchData= [ - ['docs_0',['docs',['../structinverted__index_1_1docs.html',1,'inverted_index']]] + ['crawler_0',['Crawler',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html',1,'search_engine::search_engine::crawler']]] ]; diff --git a/docs/html/search/classes_1.js b/docs/html/search/classes_1.js index 5e925f5..b5a5840 100644 --- a/docs/html/search/classes_1.js +++ b/docs/html/search/classes_1.js @@ -1,4 +1,4 @@ var searchData= [ - ['graph_0',['Graph',['../classpage__rank_1_1Graph.html',1,'page_rank']]] + ['docs_0',['docs',['../structinverted__index_1_1docs.html',1,'inverted_index']]] ]; diff --git a/docs/html/search/classes_2.js b/docs/html/search/classes_2.js index d6f079c..5e925f5 100644 --- a/docs/html/search/classes_2.js +++ b/docs/html/search/classes_2.js @@ -1,4 +1,4 @@ var searchData= [ - ['hello_0',['Hello',['../classHello.html',1,'']]] + ['graph_0',['Graph',['../classpage__rank_1_1Graph.html',1,'page_rank']]] ]; diff --git a/docs/html/search/classes_3.js b/docs/html/search/classes_3.js new file mode 100644 index 0000000..d6f079c --- /dev/null +++ b/docs/html/search/classes_3.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['hello_0',['Hello',['../classHello.html',1,'']]] +]; diff --git a/docs/html/search/classes_4.js b/docs/html/search/classes_4.js new file mode 100644 index 0000000..586d154 --- /dev/null +++ b/docs/html/search/classes_4.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['stringtointconverter_0',['StringToIntConverter',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html',1,'search_engine::search_engine::helper::converter']]] +]; diff --git a/docs/html/search/classes_5.js b/docs/html/search/classes_5.js new file mode 100644 index 0000000..73b3892 --- /dev/null +++ b/docs/html/search/classes_5.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['urlerror_0',['UrlError',['../classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html',1,'search_engine::search_engine::exceptions']]] +]; diff --git a/docs/html/search/defines_1.js b/docs/html/search/defines_1.js index a20ecf7..3dbc694 100644 --- a/docs/html/search/defines_1.js +++ b/docs/html/search/defines_1.js @@ -1,4 +1,4 @@ var searchData= [ - ['py_5fssize_5ft_5fclean_0',['PY_SSIZE_T_CLEAN',['../__page__rank_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'_page_rank.cpp']]] + ['py_5fssize_5ft_5fclean_0',['py_ssize_t_clean',['../__hello_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'PY_SSIZE_T_CLEAN: _hello.cpp'],['../__inverted__index_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'PY_SSIZE_T_CLEAN: _inverted_index.cpp'],['../__page__rank_8cpp.html#ac9efdaac9411d0868b715edccca3269d',1,'PY_SSIZE_T_CLEAN: _page_rank.cpp']]] ]; diff --git a/docs/html/search/files_2.js b/docs/html/search/files_2.js index 5d75d08..0cea5ed 100644 --- a/docs/html/search/files_2.js +++ b/docs/html/search/files_2.js @@ -1,4 +1,7 @@ var searchData= [ - ['_5fpage_5frank_2ecpp_0',['_page_rank.cpp',['../__page__rank_8cpp.html',1,'']]] + ['_5f_5finit_5f_5f_2epy_0',['__init__.py',['../____init_____8py.html',1,'(Global Namespace)'],['../helper_2____init_____8py.html',1,'(Global Namespace)']]], + ['_5fhello_2ecpp_1',['_hello.cpp',['../__hello_8cpp.html',1,'']]], + ['_5finverted_5findex_2ecpp_2',['_inverted_index.cpp',['../__inverted__index_8cpp.html',1,'']]], + ['_5fpage_5frank_2ecpp_3',['_page_rank.cpp',['../__page__rank_8cpp.html',1,'']]] ]; diff --git a/docs/html/search/files_3.js b/docs/html/search/files_3.js index 966deb6..1277a25 100644 --- a/docs/html/search/files_3.js +++ b/docs/html/search/files_3.js @@ -1,5 +1,5 @@ var searchData= [ - ['hello_2ecpp_0',['hello.cpp',['../hello_8cpp.html',1,'']]], - ['hello_2eh_1',['hello.h',['../hello_8h.html',1,'']]] + ['converter_2epy_0',['converter.py',['../converter_8py.html',1,'']]], + ['crawler_2epy_1',['crawler.py',['../crawler_8py.html',1,'']]] ]; diff --git a/docs/html/search/files_4.js b/docs/html/search/files_4.js index 708e4d2..25d080f 100644 --- a/docs/html/search/files_4.js +++ b/docs/html/search/files_4.js @@ -1,5 +1,4 @@ var searchData= [ - ['inverted_5findex_2ecpp_0',['inverted_index.cpp',['../inverted__index_8cpp.html',1,'']]], - ['inverted_5findex_2eh_1',['inverted_index.h',['../inverted__index_8h.html',1,'']]] + ['exceptions_2epy_0',['exceptions.py',['../exceptions_8py.html',1,'']]] ]; diff --git a/docs/html/search/files_5.js b/docs/html/search/files_5.js index 41d9f15..966deb6 100644 --- a/docs/html/search/files_5.js +++ b/docs/html/search/files_5.js @@ -1,5 +1,5 @@ var searchData= [ - ['page_5frank_2ecpp_0',['page_rank.cpp',['../page__rank_8cpp.html',1,'']]], - ['page_5frank_2eh_1',['page_rank.h',['../page__rank_8h.html',1,'']]] + ['hello_2ecpp_0',['hello.cpp',['../hello_8cpp.html',1,'']]], + ['hello_2eh_1',['hello.h',['../hello_8h.html',1,'']]] ]; diff --git a/docs/html/search/files_6.js b/docs/html/search/files_6.js index 1d15b42..708e4d2 100644 --- a/docs/html/search/files_6.js +++ b/docs/html/search/files_6.js @@ -1,7 +1,5 @@ var searchData= [ - ['subtraction_2ecpp_0',['subtraction.cpp',['../subtraction_8cpp.html',1,'']]], - ['subtraction_2eh_1',['subtraction.h',['../subtraction_8h.html',1,'']]], - ['sum_2ecpp_2',['sum.cpp',['../sum_8cpp.html',1,'']]], - ['sum_2eh_3',['sum.h',['../sum_8h.html',1,'']]] + ['inverted_5findex_2ecpp_0',['inverted_index.cpp',['../inverted__index_8cpp.html',1,'']]], + ['inverted_5findex_2eh_1',['inverted_index.h',['../inverted__index_8h.html',1,'']]] ]; diff --git a/docs/html/search/files_7.js b/docs/html/search/files_7.js new file mode 100644 index 0000000..41d9f15 --- /dev/null +++ b/docs/html/search/files_7.js @@ -0,0 +1,5 @@ +var searchData= +[ + ['page_5frank_2ecpp_0',['page_rank.cpp',['../page__rank_8cpp.html',1,'']]], + ['page_5frank_2eh_1',['page_rank.h',['../page__rank_8h.html',1,'']]] +]; diff --git a/docs/html/search/files_8.js b/docs/html/search/files_8.js new file mode 100644 index 0000000..1d15b42 --- /dev/null +++ b/docs/html/search/files_8.js @@ -0,0 +1,7 @@ +var searchData= +[ + ['subtraction_2ecpp_0',['subtraction.cpp',['../subtraction_8cpp.html',1,'']]], + ['subtraction_2eh_1',['subtraction.h',['../subtraction_8h.html',1,'']]], + ['sum_2ecpp_2',['sum.cpp',['../sum_8cpp.html',1,'']]], + ['sum_2eh_3',['sum.h',['../sum_8h.html',1,'']]] +]; diff --git a/docs/html/search/functions_0.js b/docs/html/search/functions_0.js index 8d2f9f4..681dbc7 100644 --- a/docs/html/search/functions_0.js +++ b/docs/html/search/functions_0.js @@ -1,5 +1,7 @@ var searchData= [ - ['add_5fdoc_0',['add_doc',['../namespaceinverted__index.html#acb018ece565f44fec205e85a42cfd34a',1,'inverted_index']]], - ['add_5fedge_1',['add_edge',['../classpage__rank_1_1Graph.html#a83683b548468555d24ddfc58c268bab0',1,'page_rank::Graph']]] + ['_5f_5finit_5f_5f_0',['__init__',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a3749cceadf503febd19be1a13c9a0fe9',1,'search_engine.search_engine.crawler.Crawler.__init__()'],['../classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#aafc565a27959d46203642a601d5468da',1,'search_engine.search_engine.exceptions.UrlError.__init__()'],['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a2d3bad61678c8f6cf075256b6fb411c7',1,'search_engine.search_engine.helper.converter.StringToIntConverter.__init__()']]], + ['_5fget_5flinks_1',['_get_links',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ada91bdbc6ff449d14a4b3435189080f9',1,'search_engine::search_engine::crawler::Crawler']]], + ['_5fget_5fparagraphs_2',['_get_paragraphs',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ace884d52406cb35a990f172fe49a40d5',1,'search_engine::search_engine::crawler::Crawler']]], + ['_5fvalidate_5furl_3',['_validate_url',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a1f219db9f6b0dcd8c7f5b12afc8a0574',1,'search_engine::search_engine::crawler::Crawler']]] ]; diff --git a/docs/html/search/functions_1.js b/docs/html/search/functions_1.js index 26b6563..8d2f9f4 100644 --- a/docs/html/search/functions_1.js +++ b/docs/html/search/functions_1.js @@ -1,4 +1,5 @@ var searchData= [ - ['compute_5fpage_5frank_0',['compute_page_rank',['../classpage__rank_1_1Graph.html#a740d64110326e1e6bf09351b37440460',1,'page_rank::Graph']]] + ['add_5fdoc_0',['add_doc',['../namespaceinverted__index.html#acb018ece565f44fec205e85a42cfd34a',1,'inverted_index']]], + ['add_5fedge_1',['add_edge',['../classpage__rank_1_1Graph.html#a83683b548468555d24ddfc58c268bab0',1,'page_rank::Graph']]] ]; diff --git a/docs/html/search/functions_2.js b/docs/html/search/functions_2.js index e305dcf..d4a830a 100644 --- a/docs/html/search/functions_2.js +++ b/docs/html/search/functions_2.js @@ -1,5 +1,5 @@ var searchData= [ - ['find_5fanswer_0',['find_answer',['../namespaceinverted__index.html#ace9195b82649cfae96566f56ea285f86',1,'inverted_index']]], - ['find_5fdoc_1',['find_doc',['../namespaceinverted__index.html#ab00d739725897ea7ab9e82fcaa7a9326',1,'inverted_index']]] + ['compute_5fpage_5frank_0',['compute_page_rank',['../classpage__rank_1_1Graph.html#a740d64110326e1e6bf09351b37440460',1,'page_rank::Graph']]], + ['convert_1',['convert',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a562ba6756f1cc804678075a02d28eb9f',1,'search_engine::search_engine::helper::converter::StringToIntConverter']]] ]; diff --git a/docs/html/search/functions_3.js b/docs/html/search/functions_3.js index 73f0dd8..e305dcf 100644 --- a/docs/html/search/functions_3.js +++ b/docs/html/search/functions_3.js @@ -1,5 +1,5 @@ var searchData= [ - ['get_5fadjlist_0',['get_adjList',['../classpage__rank_1_1Graph.html#ae87e6a531c87ecf28d4bd8739f69b61a',1,'page_rank::Graph']]], - ['greet_1',['greet',['../classHello.html#a935f8ae8833c9cac314fce1a87907a08',1,'Hello']]] + ['find_5fanswer_0',['find_answer',['../namespaceinverted__index.html#ace9195b82649cfae96566f56ea285f86',1,'inverted_index']]], + ['find_5fdoc_1',['find_doc',['../namespaceinverted__index.html#ab00d739725897ea7ab9e82fcaa7a9326',1,'inverted_index']]] ]; diff --git a/docs/html/search/functions_4.js b/docs/html/search/functions_4.js index 31dd61d..73f0dd8 100644 --- a/docs/html/search/functions_4.js +++ b/docs/html/search/functions_4.js @@ -1,4 +1,5 @@ var searchData= [ - ['hello_0',['Hello',['../classHello.html#aaa8dc2cd664f8a83b9119a06b2f2790c',1,'Hello']]] + ['get_5fadjlist_0',['get_adjList',['../classpage__rank_1_1Graph.html#ae87e6a531c87ecf28d4bd8739f69b61a',1,'page_rank::Graph']]], + ['greet_1',['greet',['../classHello.html#a935f8ae8833c9cac314fce1a87907a08',1,'Hello']]] ]; diff --git a/docs/html/search/functions_5.js b/docs/html/search/functions_5.js index 7c542a7..31dd61d 100644 --- a/docs/html/search/functions_5.js +++ b/docs/html/search/functions_5.js @@ -1,6 +1,4 @@ var searchData= [ - ['operator_2b_3d_0',['operator+=',['../structinverted__index_1_1docs.html#a8c50490f2708078748f15edd7628f721',1,'inverted_index::docs']]], - ['operator_3c_1',['operator<',['../structinverted__index_1_1docs.html#ae1cb30b20b66fae23666b68d45972ec6',1,'inverted_index::docs']]], - ['operator_3d_3d_2',['operator==',['../structinverted__index_1_1docs.html#abd578731f060f11c422137f2909d103b',1,'inverted_index::docs']]] + ['hello_0',['Hello',['../classHello.html#aaa8dc2cd664f8a83b9119a06b2f2790c',1,'Hello']]] ]; diff --git a/docs/html/search/functions_6.js b/docs/html/search/functions_6.js index 71f029a..7c542a7 100644 --- a/docs/html/search/functions_6.js +++ b/docs/html/search/functions_6.js @@ -1,4 +1,6 @@ var searchData= [ - ['print_0',['print',['../classpage__rank_1_1Graph.html#a4902e8e101899f05c2b1920c0b5ea9c0',1,'page_rank::Graph']]] + ['operator_2b_3d_0',['operator+=',['../structinverted__index_1_1docs.html#a8c50490f2708078748f15edd7628f721',1,'inverted_index::docs']]], + ['operator_3c_1',['operator<',['../structinverted__index_1_1docs.html#ae1cb30b20b66fae23666b68d45972ec6',1,'inverted_index::docs']]], + ['operator_3d_3d_2',['operator==',['../structinverted__index_1_1docs.html#abd578731f060f11c422137f2909d103b',1,'inverted_index::docs']]] ]; diff --git a/docs/html/search/functions_7.js b/docs/html/search/functions_7.js index 43b7396..71f029a 100644 --- a/docs/html/search/functions_7.js +++ b/docs/html/search/functions_7.js @@ -1,7 +1,4 @@ var searchData= [ - ['shrink_5fstring_0',['shrink_string',['../namespaceinverted__index.html#ac0c99343822e08b34bb0f874759b1c56',1,'inverted_index']]], - ['split_1',['split',['../namespaceinverted__index.html#a35a9f1cb5d6ae865560f7eabb3def5c9',1,'inverted_index']]], - ['subtraction_2',['subtraction',['../subtraction_8cpp.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp'],['../subtraction_8h.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp']]], - ['sum_3',['sum',['../sum_8cpp.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp'],['../sum_8h.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp']]] + ['print_0',['print',['../classpage__rank_1_1Graph.html#a4902e8e101899f05c2b1920c0b5ea9c0',1,'page_rank::Graph']]] ]; diff --git a/docs/html/search/functions_8.js b/docs/html/search/functions_8.js index 91d94c0..82fe806 100644 --- a/docs/html/search/functions_8.js +++ b/docs/html/search/functions_8.js @@ -1,4 +1,4 @@ var searchData= [ - ['to_5flowercase_0',['to_lowercase',['../namespaceinverted__index.html#a2caf9e19f6557b6fce93e8a555e55ae4',1,'inverted_index']]] + ['run_0',['run',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aa4018e5dcd1bac621932a2f70ae0d990',1,'search_engine::search_engine::crawler::Crawler']]] ]; diff --git a/docs/html/search/functions_9.js b/docs/html/search/functions_9.js new file mode 100644 index 0000000..43b7396 --- /dev/null +++ b/docs/html/search/functions_9.js @@ -0,0 +1,7 @@ +var searchData= +[ + ['shrink_5fstring_0',['shrink_string',['../namespaceinverted__index.html#ac0c99343822e08b34bb0f874759b1c56',1,'inverted_index']]], + ['split_1',['split',['../namespaceinverted__index.html#a35a9f1cb5d6ae865560f7eabb3def5c9',1,'inverted_index']]], + ['subtraction_2',['subtraction',['../subtraction_8cpp.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp'],['../subtraction_8h.html#a5620e8715eb9f46a17fdd22f9485f2b0',1,'Subtraction(double x, double y): subtraction.cpp']]], + ['sum_3',['sum',['../sum_8cpp.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp'],['../sum_8h.html#aed1f1c5da982a62827227c3c45b5fccb',1,'Sum(double x, double y): sum.cpp']]] +]; diff --git a/docs/html/search/functions_a.js b/docs/html/search/functions_a.js new file mode 100644 index 0000000..91d94c0 --- /dev/null +++ b/docs/html/search/functions_a.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['to_5flowercase_0',['to_lowercase',['../namespaceinverted__index.html#a2caf9e19f6557b6fce93e8a555e55ae4',1,'inverted_index']]] +]; diff --git a/docs/html/search/namespaces_2.js b/docs/html/search/namespaces_2.js new file mode 100644 index 0000000..7260025 --- /dev/null +++ b/docs/html/search/namespaces_2.js @@ -0,0 +1,9 @@ +var searchData= +[ + ['search_5fengine_0',['search_engine',['../namespacesearch__engine.html',1,'']]], + ['search_5fengine_3a_3asearch_5fengine_1',['search_engine',['../namespacesearch__engine_1_1search__engine.html',1,'search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3acrawler_2',['crawler',['../namespacesearch__engine_1_1search__engine_1_1crawler.html',1,'search_engine::search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3aexceptions_3',['exceptions',['../namespacesearch__engine_1_1search__engine_1_1exceptions.html',1,'search_engine::search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3ahelper_4',['helper',['../namespacesearch__engine_1_1search__engine_1_1helper.html',1,'search_engine::search_engine']]], + ['search_5fengine_3a_3asearch_5fengine_3a_3ahelper_3a_3aconverter_5',['converter',['../namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.html',1,'search_engine::search_engine::helper']]] +]; diff --git a/docs/html/search/searchdata.js b/docs/html/search/searchdata.js index 8d694e4..7a79c62 100644 --- a/docs/html/search/searchdata.js +++ b/docs/html/search/searchdata.js @@ -1,11 +1,11 @@ var indexSectionsWithContent = { 0: "0123456789_abcdefghilmnopqrstuvx", - 1: "dgh", - 2: "ip", - 3: "01_hips", - 4: "acfghopst", - 5: "fln", + 1: "cdghsu", + 2: "ips", + 3: "01_cehips", + 4: "_acfghoprst", + 5: "cfgilmnprstu", 6: "lmsv", 7: "o", 8: "dp", diff --git a/docs/html/search/variables_0.js b/docs/html/search/variables_0.js index c55340f..5399ee9 100644 --- a/docs/html/search/variables_0.js +++ b/docs/html/search/variables_0.js @@ -1,4 +1,4 @@ var searchData= [ - ['freq_0',['freq',['../structinverted__index_1_1docs.html#ad40a502bb97dced4cd8c7634958df2f5',1,'inverted_index::docs']]] + ['converter_0',['converter',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a066cf036bc6b4178858f790e0d2625e7',1,'search_engine::search_engine::crawler::Crawler']]] ]; diff --git a/docs/html/search/variables_1.js b/docs/html/search/variables_1.js index 1e07b36..c55340f 100644 --- a/docs/html/search/variables_1.js +++ b/docs/html/search/variables_1.js @@ -1,4 +1,4 @@ var searchData= [ - ['links_5fdocs_0',['links_docs',['../structinverted__index_1_1docs.html#a217103c61707d6e219fdac64eb4022c8',1,'inverted_index::docs']]] + ['freq_0',['freq',['../structinverted__index_1_1docs.html#ad40a502bb97dced4cd8c7634958df2f5',1,'inverted_index::docs']]] ]; diff --git a/docs/html/search/variables_2.js b/docs/html/search/variables_2.js index 7efaa42..5539c40 100644 --- a/docs/html/search/variables_2.js +++ b/docs/html/search/variables_2.js @@ -1,4 +1,4 @@ var searchData= [ - ['name_5fdoc_0',['name_doc',['../structinverted__index_1_1docs.html#a0dee7a56613409b307976525f002f100',1,'inverted_index::docs']]] + ['graph_0',['graph',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#aecc008b6c522f033489506a4bb21bc52',1,'search_engine::search_engine::crawler::Crawler']]] ]; diff --git a/docs/html/search/variables_3.js b/docs/html/search/variables_3.js new file mode 100644 index 0000000..ec884af --- /dev/null +++ b/docs/html/search/variables_3.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['initial_5fpage_0',['initial_page',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a6e0bc960b9ee2c29b8b75c66a275f570',1,'search_engine::search_engine::crawler::Crawler']]] +]; diff --git a/docs/html/search/variables_4.js b/docs/html/search/variables_4.js new file mode 100644 index 0000000..1e07b36 --- /dev/null +++ b/docs/html/search/variables_4.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['links_5fdocs_0',['links_docs',['../structinverted__index_1_1docs.html#a217103c61707d6e219fdac64eb4022c8',1,'inverted_index::docs']]] +]; diff --git a/docs/html/search/variables_5.js b/docs/html/search/variables_5.js new file mode 100644 index 0000000..f8bfdf6 --- /dev/null +++ b/docs/html/search/variables_5.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['message_0',['message',['../classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.html#a40e2fd59c669daada4d42c4c76cee5cb',1,'search_engine::search_engine::exceptions::UrlError']]] +]; diff --git a/docs/html/search/variables_6.js b/docs/html/search/variables_6.js new file mode 100644 index 0000000..a3999f7 --- /dev/null +++ b/docs/html/search/variables_6.js @@ -0,0 +1,5 @@ +var searchData= +[ + ['name_5fdoc_0',['name_doc',['../structinverted__index_1_1docs.html#a0dee7a56613409b307976525f002f100',1,'inverted_index::docs']]], + ['next_5fint_1',['next_int',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#af796cd59c12eba4822eb8f8b6bcfed8b',1,'search_engine::search_engine::helper::converter::StringToIntConverter']]] +]; diff --git a/docs/html/search/variables_7.js b/docs/html/search/variables_7.js new file mode 100644 index 0000000..a36cc55 --- /dev/null +++ b/docs/html/search/variables_7.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['page_5fname_0',['page_name',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a2926e956cbfbf24d9c99a1c0e80fae5e',1,'search_engine::search_engine::crawler::Crawler']]] +]; diff --git a/docs/html/search/variables_8.js b/docs/html/search/variables_8.js new file mode 100644 index 0000000..aad077d --- /dev/null +++ b/docs/html/search/variables_8.js @@ -0,0 +1,5 @@ +var searchData= +[ + ['regex_0',['REGEX',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a9b7fdc122b15d78d9967e0a6a567cf9f',1,'search_engine::search_engine::crawler::Crawler']]], + ['remove_5fpages_1',['remove_pages',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#a0d917081e91fe9067c457e791efec341',1,'search_engine::search_engine::crawler::Crawler']]] +]; diff --git a/docs/html/search/variables_9.js b/docs/html/search/variables_9.js new file mode 100644 index 0000000..600e010 --- /dev/null +++ b/docs/html/search/variables_9.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['string_5fto_5fint_0',['string_to_int',['../classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.html#a583c2162f4a2a2c6bff496b034e30675',1,'search_engine::search_engine::helper::converter::StringToIntConverter']]] +]; diff --git a/docs/html/search/variables_a.js b/docs/html/search/variables_a.js new file mode 100644 index 0000000..1baa5d1 --- /dev/null +++ b/docs/html/search/variables_a.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['test_5fmode_0',['test_mode',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#ab1db7f6a00564e301a65a3560b00450a',1,'search_engine::search_engine::crawler::Crawler']]] +]; diff --git a/docs/html/search/variables_b.js b/docs/html/search/variables_b.js new file mode 100644 index 0000000..fb09075 --- /dev/null +++ b/docs/html/search/variables_b.js @@ -0,0 +1,4 @@ +var searchData= +[ + ['url_5fbase_0',['url_base',['../classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.html#af2b2d5e8f62ba5661b4c87e15a9bc67e',1,'search_engine::search_engine::crawler::Crawler']]] +]; diff --git a/docs/latex/____init_____8py.tex b/docs/latex/____init_____8py.tex new file mode 100644 index 0000000..1679bed --- /dev/null +++ b/docs/latex/____init_____8py.tex @@ -0,0 +1,9 @@ +\doxysection{search\+\_\+engine/\+\_\+\+\_\+init\+\_\+\+\_\+.py File Reference} +\hypertarget{____init_____8py}{}\label{____init_____8py}\index{search\_engine/\_\_init\_\_.py@{search\_engine/\_\_init\_\_.py}} +\doxysubsubsection*{Namespaces} +\begin{DoxyCompactItemize} +\item +namespace \mbox{\hyperlink{namespacesearch__engine}{search\+\_\+engine}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine}{search\+\_\+engine.\+search\+\_\+engine}} +\end{DoxyCompactItemize} diff --git a/docs/latex/__hello_8cpp.tex b/docs/latex/__hello_8cpp.tex new file mode 100644 index 0000000..c76fdea --- /dev/null +++ b/docs/latex/__hello_8cpp.tex @@ -0,0 +1,24 @@ +\doxysection{lib/src/\+\_\+hello.cpp File Reference} +\hypertarget{__hello_8cpp}{}\label{__hello_8cpp}\index{lib/src/\_hello.cpp@{lib/src/\_hello.cpp}} +{\ttfamily \#include "{}Python.\+h"{}}\newline +Include dependency graph for \+\_\+hello.\+cpp\+:\nopagebreak +\begin{figure}[H] +\begin{center} +\leavevmode +\includegraphics[width=170pt]{__hello_8cpp__incl} +\end{center} +\end{figure} +\doxysubsubsection*{Macros} +\begin{DoxyCompactItemize} +\item +\#define \mbox{\hyperlink{__hello_8cpp_ac9efdaac9411d0868b715edccca3269d}{PY\+\_\+\+SSIZE\+\_\+\+T\+\_\+\+CLEAN}} +\end{DoxyCompactItemize} + + +\doxysubsection{Macro Definition Documentation} +\Hypertarget{__hello_8cpp_ac9efdaac9411d0868b715edccca3269d}\label{__hello_8cpp_ac9efdaac9411d0868b715edccca3269d} +\index{\_hello.cpp@{\_hello.cpp}!PY\_SSIZE\_T\_CLEAN@{PY\_SSIZE\_T\_CLEAN}} +\index{PY\_SSIZE\_T\_CLEAN@{PY\_SSIZE\_T\_CLEAN}!\_hello.cpp@{\_hello.cpp}} +\doxysubsubsection{\texorpdfstring{PY\_SSIZE\_T\_CLEAN}{PY\_SSIZE\_T\_CLEAN}} +{\footnotesize\ttfamily \#define PY\+\_\+\+SSIZE\+\_\+\+T\+\_\+\+CLEAN} + diff --git a/docs/latex/__hello_8cpp__incl.md5 b/docs/latex/__hello_8cpp__incl.md5 new file mode 100644 index 0000000..411b1fb --- /dev/null +++ b/docs/latex/__hello_8cpp__incl.md5 @@ -0,0 +1 @@ +084e34a6deb38c87b85a69503558240b \ No newline at end of file diff --git a/docs/latex/__hello_8cpp__incl.pdf b/docs/latex/__hello_8cpp__incl.pdf new file mode 100644 index 0000000..c9c2e15 Binary files /dev/null and b/docs/latex/__hello_8cpp__incl.pdf differ diff --git a/docs/latex/__inverted__index_8cpp.tex b/docs/latex/__inverted__index_8cpp.tex new file mode 100644 index 0000000..2796514 --- /dev/null +++ b/docs/latex/__inverted__index_8cpp.tex @@ -0,0 +1,24 @@ +\doxysection{lib/src/\+\_\+inverted\+\_\+index.cpp File Reference} +\hypertarget{__inverted__index_8cpp}{}\label{__inverted__index_8cpp}\index{lib/src/\_inverted\_index.cpp@{lib/src/\_inverted\_index.cpp}} +{\ttfamily \#include "{}Python.\+h"{}}\newline +Include dependency graph for \+\_\+inverted\+\_\+index.\+cpp\+:\nopagebreak +\begin{figure}[H] +\begin{center} +\leavevmode +\includegraphics[width=213pt]{__inverted__index_8cpp__incl} +\end{center} +\end{figure} +\doxysubsubsection*{Macros} +\begin{DoxyCompactItemize} +\item +\#define \mbox{\hyperlink{__inverted__index_8cpp_ac9efdaac9411d0868b715edccca3269d}{PY\+\_\+\+SSIZE\+\_\+\+T\+\_\+\+CLEAN}} +\end{DoxyCompactItemize} + + +\doxysubsection{Macro Definition Documentation} +\Hypertarget{__inverted__index_8cpp_ac9efdaac9411d0868b715edccca3269d}\label{__inverted__index_8cpp_ac9efdaac9411d0868b715edccca3269d} +\index{\_inverted\_index.cpp@{\_inverted\_index.cpp}!PY\_SSIZE\_T\_CLEAN@{PY\_SSIZE\_T\_CLEAN}} +\index{PY\_SSIZE\_T\_CLEAN@{PY\_SSIZE\_T\_CLEAN}!\_inverted\_index.cpp@{\_inverted\_index.cpp}} +\doxysubsubsection{\texorpdfstring{PY\_SSIZE\_T\_CLEAN}{PY\_SSIZE\_T\_CLEAN}} +{\footnotesize\ttfamily \#define PY\+\_\+\+SSIZE\+\_\+\+T\+\_\+\+CLEAN} + diff --git a/docs/latex/__inverted__index_8cpp__incl.md5 b/docs/latex/__inverted__index_8cpp__incl.md5 new file mode 100644 index 0000000..2ae4afc --- /dev/null +++ b/docs/latex/__inverted__index_8cpp__incl.md5 @@ -0,0 +1 @@ +d65ae21d99979c5c1fb55b0131cba8da \ No newline at end of file diff --git a/docs/latex/__inverted__index_8cpp__incl.pdf b/docs/latex/__inverted__index_8cpp__incl.pdf new file mode 100644 index 0000000..0d54590 Binary files /dev/null and b/docs/latex/__inverted__index_8cpp__incl.pdf differ diff --git a/docs/latex/annotated.tex b/docs/latex/annotated.tex index 25f3ff9..a275535 100644 --- a/docs/latex/annotated.tex +++ b/docs/latex/annotated.tex @@ -1,6 +1,9 @@ \doxysection{Class List} Here are the classes, structs, unions and interfaces with brief descriptions\+:\begin{DoxyCompactList} +\item\contentsline{section}{\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler}{search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler}} }{\pageref{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler}}{} \item\contentsline{section}{\mbox{\hyperlink{structinverted__index_1_1docs}{inverted\+\_\+index\+::docs}} \\*Structure that stores information about a document }{\pageref{structinverted__index_1_1docs}}{} \item\contentsline{section}{\mbox{\hyperlink{classpage__rank_1_1Graph}{page\+\_\+rank\+::\+Graph}} \\*Represents a directed graph used to compute the Page\+Rank algorithm }{\pageref{classpage__rank_1_1Graph}}{} \item\contentsline{section}{\mbox{\hyperlink{classHello}{Hello}} }{\pageref{classHello}}{} +\item\contentsline{section}{\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter}{search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter}} }{\pageref{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter}}{} +\item\contentsline{section}{\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError}{search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error}} }{\pageref{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError}}{} \end{DoxyCompactList} diff --git a/docs/latex/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.tex b/docs/latex/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.tex new file mode 100644 index 0000000..f12339a --- /dev/null +++ b/docs/latex/classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler.tex @@ -0,0 +1,203 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler Class Reference} +\hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler}{}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler}\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection*{Public Member Functions} +\begin{DoxyCompactItemize} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a3749cceadf503febd19be1a13c9a0fe9}{\+\_\+\+\_\+init\+\_\+\+\_\+}} (self, str \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_af2b2d5e8f62ba5661b4c87e15a9bc67e}{url\+\_\+base}}, str \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a2926e956cbfbf24d9c99a1c0e80fae5e}{page\+\_\+name}}, str \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a6e0bc960b9ee2c29b8b75c66a275f570}{initial\+\_\+page}}, list\mbox{[}str\mbox{]} \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a0d917081e91fe9067c457e791efec341}{remove\+\_\+pages}}=\mbox{[}$\,$\mbox{]}, bool \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ab1db7f6a00564e301a65a3560b00450a}{test\+\_\+mode}}=False) +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_aa4018e5dcd1bac621932a2f70ae0d990}{run}} (self, limit=2) +\end{DoxyCompactItemize} +\doxysubsubsection*{Public Attributes} +\begin{DoxyCompactItemize} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_af2b2d5e8f62ba5661b4c87e15a9bc67e}{url\+\_\+base}} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a2926e956cbfbf24d9c99a1c0e80fae5e}{page\+\_\+name}} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a6e0bc960b9ee2c29b8b75c66a275f570}{initial\+\_\+page}} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a0d917081e91fe9067c457e791efec341}{remove\+\_\+pages}} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ab1db7f6a00564e301a65a3560b00450a}{test\+\_\+mode}} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_aecc008b6c522f033489506a4bb21bc52}{graph}} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a066cf036bc6b4178858f790e0d2625e7}{converter}} +\end{DoxyCompactItemize} +\doxysubsubsection*{Static Public Attributes} +\begin{DoxyCompactItemize} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a9b7fdc122b15d78d9967e0a6a567cf9f}{REGEX}} +\end{DoxyCompactItemize} +\doxysubsubsection*{Protected Member Functions} +\begin{DoxyCompactItemize} +\item +list \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ada91bdbc6ff449d14a4b3435189080f9}{\+\_\+get\+\_\+links}} (self, str current\+\_\+page) +\item +list \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ace884d52406cb35a990f172fe49a40d5}{\+\_\+get\+\_\+paragraphs}} (self, str current\+\_\+page) +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a1f219db9f6b0dcd8c7f5b12afc8a0574}{\+\_\+validate\+\_\+url}} (self, str url) +\end{DoxyCompactItemize} + + +\doxysubsection{Detailed Description} +\begin{DoxyVerb}A web crawler that traverses a network of web pages, extracts links and paragraphs, +and constructs a graph using the PageRank algorithm. + +This crawler starts from a given base URL and an initial page, and follows links within +the website to collect data such as links and paragraphs. It constructs a graph based on +the relationships between pages. + +@param url_base: The base URL from which the crawler starts. +@param page_name: The initial page to start crawling. +@param remove_pages: A list of pages to exclude from the crawl. (Optional, default is []) + +Attributes +---------- +graph : PyGraph + A graph representation used for PageRank calculations. + +Examples +-------- +>>> crawler = Crawler('https://example.com', '/home') +>>> links, paragraphs = crawler.run() +\end{DoxyVerb} + + +\doxysubsection{Constructor \& Destructor Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a3749cceadf503febd19be1a13c9a0fe9}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a3749cceadf503febd19be1a13c9a0fe9} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!\_\_init\_\_@{\_\_init\_\_}} +\index{\_\_init\_\_@{\_\_init\_\_}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{\_\_init\_\_()}{\_\_init\_\_()}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+\_\+\+\_\+init\+\_\+\+\_\+ (\begin{DoxyParamCaption}\item[{}]{self, }\item[{str}]{url\+\_\+base, }\item[{str}]{page\+\_\+name, }\item[{str}]{initial\+\_\+page, }\item[{list\mbox{[}str\mbox{]} }]{remove\+\_\+pages = {\ttfamily \mbox{[}\mbox{]}}, }\item[{bool }]{test\+\_\+mode = {\ttfamily False} }\end{DoxyParamCaption})} + +\begin{DoxyVerb}Initialize the Crawler with a base URL, the starting page, and optionally, +a list of pages to exclude. + +@param url_base: The base URL of the website to crawl. +@param page_name: The starting page to begin crawling. +@param remove_pages: Pages to exclude from the crawl (optional). +@param test_mode: Flag to activate the test mode for crawling. (default: False) +\end{DoxyVerb} + + +\doxysubsection{Member Function Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ada91bdbc6ff449d14a4b3435189080f9}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ada91bdbc6ff449d14a4b3435189080f9} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!\_get\_links@{\_get\_links}} +\index{\_get\_links@{\_get\_links}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{\_get\_links()}{\_get\_links()}} +{\footnotesize\ttfamily list search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+\_\+get\+\_\+links (\begin{DoxyParamCaption}\item[{}]{self, }\item[{str}]{current\+\_\+page }\end{DoxyParamCaption})\hspace{0.3cm}{\ttfamily [protected]}} + +\begin{DoxyVerb}Retrieve all links from the specified page. + +@param current_page: The current page to fetch links from. + +@return: A list of valid links found on the current page. + +@raises UrlError: If the current page URL is invalid or inaccessible. +\end{DoxyVerb} + \Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ace884d52406cb35a990f172fe49a40d5}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ace884d52406cb35a990f172fe49a40d5} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!\_get\_paragraphs@{\_get\_paragraphs}} +\index{\_get\_paragraphs@{\_get\_paragraphs}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{\_get\_paragraphs()}{\_get\_paragraphs()}} +{\footnotesize\ttfamily list search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+\_\+get\+\_\+paragraphs (\begin{DoxyParamCaption}\item[{}]{self, }\item[{str}]{current\+\_\+page }\end{DoxyParamCaption})\hspace{0.3cm}{\ttfamily [protected]}} + +\begin{DoxyVerb}Retrieve all paragraphs from the specified page. + +@param current_page: The current page to fetch paragraphs from. + +@return: A list of paragraphs' text found on the current page. +\end{DoxyVerb} + \Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a1f219db9f6b0dcd8c7f5b12afc8a0574}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a1f219db9f6b0dcd8c7f5b12afc8a0574} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!\_validate\_url@{\_validate\_url}} +\index{\_validate\_url@{\_validate\_url}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{\_validate\_url()}{\_validate\_url()}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+\_\+validate\+\_\+url (\begin{DoxyParamCaption}\item[{}]{self, }\item[{str}]{url }\end{DoxyParamCaption})\hspace{0.3cm}{\ttfamily [protected]}} + +\begin{DoxyVerb}Validate the format of the given URL. + +@param url: The URL to validate. + +@raises UrlError: If the URL is not valid. +\end{DoxyVerb} + \Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_aa4018e5dcd1bac621932a2f70ae0d990}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_aa4018e5dcd1bac621932a2f70ae0d990} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!run@{run}} +\index{run@{run}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{run()}{run()}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+run (\begin{DoxyParamCaption}\item[{}]{self, }\item[{}]{limit = {\ttfamily 2} }\end{DoxyParamCaption})} + +\begin{DoxyVerb}Run the crawler to collect links and paragraphs starting from the base page. +It uses a queue to traverse the links in a breadth-first manner. + +@param limit: The maximum number of pages to crawl in test mode. + +@return: A graph representation of the pages and their links. +\end{DoxyVerb} + + +\doxysubsection{Member Data Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a066cf036bc6b4178858f790e0d2625e7}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a066cf036bc6b4178858f790e0d2625e7} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!converter@{converter}} +\index{converter@{converter}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{converter}{converter}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+converter} + +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_aecc008b6c522f033489506a4bb21bc52}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_aecc008b6c522f033489506a4bb21bc52} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!graph@{graph}} +\index{graph@{graph}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{graph}{graph}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+graph} + +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a6e0bc960b9ee2c29b8b75c66a275f570}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a6e0bc960b9ee2c29b8b75c66a275f570} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!initial\_page@{initial\_page}} +\index{initial\_page@{initial\_page}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{initial\_page}{initial\_page}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+initial\+\_\+page} + +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a2926e956cbfbf24d9c99a1c0e80fae5e}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a2926e956cbfbf24d9c99a1c0e80fae5e} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!page\_name@{page\_name}} +\index{page\_name@{page\_name}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{page\_name}{page\_name}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+page\+\_\+name} + +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a9b7fdc122b15d78d9967e0a6a567cf9f}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a9b7fdc122b15d78d9967e0a6a567cf9f} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!REGEX@{REGEX}} +\index{REGEX@{REGEX}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{REGEX}{REGEX}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+REGEX\hspace{0.3cm}{\ttfamily [static]}} + +{\bfseries Initial value\+:} +\begin{DoxyCode}{0} +\DoxyCodeLine{=\ \ re.compile(} +\DoxyCodeLine{\ \ \ \ \ \ \ \ \textcolor{stringliteral}{r'\string^(?:http|https)://'}\ \ \textcolor{comment}{\#\ http\ or\ https\ protocol}} +\DoxyCodeLine{\ \ \ \ \ \ \ \ \textcolor{stringliteral}{r'(?:\(\backslash\)S+(?::\(\backslash\)S*)?@)?'}\ \ \textcolor{comment}{\#\ optional\ authentication}} +\DoxyCodeLine{\ \ \ \ \ \ \ \ \textcolor{stringliteral}{r'(?:[a-\/zA-\/Z0-\/9-\/]+\(\backslash\).)+[a-\/zA-\/Z]\{2,6\}'}\ \ \textcolor{comment}{\#\ domain}} +\DoxyCodeLine{\ \ \ \ \ \ \ \ \textcolor{stringliteral}{r'(?::\(\backslash\)d\{2,5\})?'}\ \ \textcolor{comment}{\#\ optional\ port}} +\DoxyCodeLine{\ \ \ \ \ \ \ \ \textcolor{stringliteral}{r'(?:/\(\backslash\)S*)?\$'},\ \ \textcolor{comment}{\#\ optional\ path}} +\DoxyCodeLine{\ \ \ \ \ \ \ \ re.IGNORECASE} +\DoxyCodeLine{\ \ \ \ )} + +\end{DoxyCode} +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a0d917081e91fe9067c457e791efec341}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_a0d917081e91fe9067c457e791efec341} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!remove\_pages@{remove\_pages}} +\index{remove\_pages@{remove\_pages}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{remove\_pages}{remove\_pages}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+remove\+\_\+pages} + +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ab1db7f6a00564e301a65a3560b00450a}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_ab1db7f6a00564e301a65a3560b00450a} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!test\_mode@{test\_mode}} +\index{test\_mode@{test\_mode}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{test\_mode}{test\_mode}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+test\+\_\+mode} + +\Hypertarget{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_af2b2d5e8f62ba5661b4c87e15a9bc67e}\label{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler_af2b2d5e8f62ba5661b4c87e15a9bc67e} +\index{search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}!url\_base@{url\_base}} +\index{url\_base@{url\_base}!search\_engine.search\_engine.crawler.Crawler@{search\_engine.search\_engine.crawler.Crawler}} +\doxysubsubsection{\texorpdfstring{url\_base}{url\_base}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler.\+url\+\_\+base} + + + +The documentation for this class was generated from the following file\+:\begin{DoxyCompactItemize} +\item +search\+\_\+engine/\mbox{\hyperlink{crawler_8py}{crawler.\+py}}\end{DoxyCompactItemize} diff --git a/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.tex b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.tex new file mode 100644 index 0000000..1965ec4 --- /dev/null +++ b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError.tex @@ -0,0 +1,78 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error Class Reference} +\hypertarget{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError}{}\label{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError}\index{search\_engine.search\_engine.exceptions.UrlError@{search\_engine.search\_engine.exceptions.UrlError}} + + +Inheritance diagram for search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error\+:\nopagebreak +\begin{figure}[H] +\begin{center} +\leavevmode +\includegraphics[width=217pt]{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph} +\end{center} +\end{figure} + + +Collaboration diagram for search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error\+:\nopagebreak +\begin{figure}[H] +\begin{center} +\leavevmode +\includegraphics[width=217pt]{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph} +\end{center} +\end{figure} +\doxysubsubsection*{Public Member Functions} +\begin{DoxyCompactItemize} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError_aafc565a27959d46203642a601d5468da}{\+\_\+\+\_\+init\+\_\+\+\_\+}} (self, \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError_a40e2fd59c669daada4d42c4c76cee5cb}{message}}="{}Invalid URL"{}) +\end{DoxyCompactItemize} +\doxysubsubsection*{Public Attributes} +\begin{DoxyCompactItemize} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError_a40e2fd59c669daada4d42c4c76cee5cb}{message}} +\end{DoxyCompactItemize} + + +\doxysubsection{Detailed Description} +\begin{DoxyVerb}Exception raised when an invalid URL is provided. + +Inherits from the built-in `ValueError` class. + +Attributes +---------- +message : str + The error message that describes the cause of the exception. + Defaults to "Invalid URL". + +Methods +------- +__init__(self, message: str = "Invalid URL") + Initializes the exception with a custom message or a default message. +\end{DoxyVerb} + + +\doxysubsection{Constructor \& Destructor Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError_aafc565a27959d46203642a601d5468da}\label{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError_aafc565a27959d46203642a601d5468da} +\index{search\_engine.search\_engine.exceptions.UrlError@{search\_engine.search\_engine.exceptions.UrlError}!\_\_init\_\_@{\_\_init\_\_}} +\index{\_\_init\_\_@{\_\_init\_\_}!search\_engine.search\_engine.exceptions.UrlError@{search\_engine.search\_engine.exceptions.UrlError}} +\doxysubsubsection{\texorpdfstring{\_\_init\_\_()}{\_\_init\_\_()}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error.\+\_\+\+\_\+init\+\_\+\+\_\+ (\begin{DoxyParamCaption}\item[{}]{self, }\item[{}]{message = {\ttfamily "{}Invalid~URL"{}} }\end{DoxyParamCaption})} + +\begin{DoxyVerb}Initializes the UrlError exception with a custom error message. + +Parameters +---------- +message : str, optional + The error message to describe the exception. Default is "Invalid URL". +\end{DoxyVerb} + + +\doxysubsection{Member Data Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError_a40e2fd59c669daada4d42c4c76cee5cb}\label{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError_a40e2fd59c669daada4d42c4c76cee5cb} +\index{search\_engine.search\_engine.exceptions.UrlError@{search\_engine.search\_engine.exceptions.UrlError}!message@{message}} +\index{message@{message}!search\_engine.search\_engine.exceptions.UrlError@{search\_engine.search\_engine.exceptions.UrlError}} +\doxysubsubsection{\texorpdfstring{message}{message}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error.\+message} + + + +The documentation for this class was generated from the following file\+:\begin{DoxyCompactItemize} +\item +search\+\_\+engine/\mbox{\hyperlink{exceptions_8py}{exceptions.\+py}}\end{DoxyCompactItemize} diff --git a/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.md5 b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.md5 new file mode 100644 index 0000000..9fe7f4e --- /dev/null +++ b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.md5 @@ -0,0 +1 @@ +bb5c97d5c2ff4921366a9f0605bbeb8a \ No newline at end of file diff --git a/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.pdf b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.pdf new file mode 100644 index 0000000..e5f81cd Binary files /dev/null and b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__coll__graph.pdf differ diff --git a/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.md5 b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.md5 new file mode 100644 index 0000000..9fe7f4e --- /dev/null +++ b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.md5 @@ -0,0 +1 @@ +bb5c97d5c2ff4921366a9f0605bbeb8a \ No newline at end of file diff --git a/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.pdf b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.pdf new file mode 100644 index 0000000..e5f81cd Binary files /dev/null and b/docs/latex/classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError__inherit__graph.pdf differ diff --git a/docs/latex/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.tex b/docs/latex/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.tex new file mode 100644 index 0000000..2406a67 --- /dev/null +++ b/docs/latex/classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter.tex @@ -0,0 +1,99 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter Class Reference} +\hypertarget{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter}{}\label{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter}\index{search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}} +\doxysubsubsection*{Public Member Functions} +\begin{DoxyCompactItemize} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a2d3bad61678c8f6cf075256b6fb411c7}{\+\_\+\+\_\+init\+\_\+\+\_\+}} (self) +\item +int \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a562ba6756f1cc804678075a02d28eb9f}{convert}} (self, str word) +\end{DoxyCompactItemize} +\doxysubsubsection*{Public Attributes} +\begin{DoxyCompactItemize} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a583c2162f4a2a2c6bff496b034e30675}{string\+\_\+to\+\_\+int}} +\item +\mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_af796cd59c12eba4822eb8f8b6bcfed8b}{next\+\_\+int}} +\end{DoxyCompactItemize} + + +\doxysubsection{Detailed Description} +\begin{DoxyVerb}A class that converts strings to integers. If a string has already been converted, +it returns the previously assigned integer. Otherwise, it assigns a new integer +to the string and returns it. + +Attributes +---------- +string_to_int : dict + A dictionary mapping strings to their corresponding integers. +next_int : int + The next integer to be assigned to a string. + +Methods +------- +__init__() + Initializes the converter with an empty dictionary and sets the next integer to 0. +convert(word: str) -> int + Converts a given string to an integer. If the string has been seen before, + it returns the corresponding integer, otherwise it assigns a new integer to the string. +\end{DoxyVerb} + + +\doxysubsection{Constructor \& Destructor Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a2d3bad61678c8f6cf075256b6fb411c7}\label{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a2d3bad61678c8f6cf075256b6fb411c7} +\index{search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}!\_\_init\_\_@{\_\_init\_\_}} +\index{\_\_init\_\_@{\_\_init\_\_}!search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}} +\doxysubsubsection{\texorpdfstring{\_\_init\_\_()}{\_\_init\_\_()}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter.\+\_\+\+\_\+init\+\_\+\+\_\+ (\begin{DoxyParamCaption}\item[{}]{self }\end{DoxyParamCaption})} + +\begin{DoxyVerb}Initializes the StringToIntConverter with an empty dictionary and sets the next integer +to 0 for string-to-integer mapping. + +Attributes +---------- +string_to_int : dict + An empty dictionary to store the mapping of strings to integers. +next_int : int + Initialized to 0, it represents the next available integer to be assigned to a string. +\end{DoxyVerb} + + +\doxysubsection{Member Function Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a562ba6756f1cc804678075a02d28eb9f}\label{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a562ba6756f1cc804678075a02d28eb9f} +\index{search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}!convert@{convert}} +\index{convert@{convert}!search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}} +\doxysubsubsection{\texorpdfstring{convert()}{convert()}} +{\footnotesize\ttfamily int search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter.\+convert (\begin{DoxyParamCaption}\item[{}]{self, }\item[{str}]{word }\end{DoxyParamCaption})} + +\begin{DoxyVerb}Convert a string to an integer. If the string has already been seen, +return its corresponding integer. Otherwise, assign a new integer to it. + +Parameters +---------- +word : str + The string to be converted. + +Returns +------- +int + The integer corresponding to the string. +\end{DoxyVerb} + + +\doxysubsection{Member Data Documentation} +\Hypertarget{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_af796cd59c12eba4822eb8f8b6bcfed8b}\label{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_af796cd59c12eba4822eb8f8b6bcfed8b} +\index{search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}!next\_int@{next\_int}} +\index{next\_int@{next\_int}!search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}} +\doxysubsubsection{\texorpdfstring{next\_int}{next\_int}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter.\+next\+\_\+int} + +\Hypertarget{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a583c2162f4a2a2c6bff496b034e30675}\label{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter_a583c2162f4a2a2c6bff496b034e30675} +\index{search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}!string\_to\_int@{string\_to\_int}} +\index{string\_to\_int@{string\_to\_int}!search\_engine.search\_engine.helper.converter.StringToIntConverter@{search\_engine.search\_engine.helper.converter.StringToIntConverter}} +\doxysubsubsection{\texorpdfstring{string\_to\_int}{string\_to\_int}} +{\footnotesize\ttfamily search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter.\+string\+\_\+to\+\_\+int} + + + +The documentation for this class was generated from the following file\+:\begin{DoxyCompactItemize} +\item +search\+\_\+engine/helper/\mbox{\hyperlink{converter_8py}{converter.\+py}}\end{DoxyCompactItemize} diff --git a/docs/latex/converter_8py.tex b/docs/latex/converter_8py.tex new file mode 100644 index 0000000..ec41e78 --- /dev/null +++ b/docs/latex/converter_8py.tex @@ -0,0 +1,18 @@ +\doxysection{search\+\_\+engine/helper/converter.py File Reference} +\hypertarget{converter_8py}{}\label{converter_8py}\index{search\_engine/helper/converter.py@{search\_engine/helper/converter.py}} +\doxysubsubsection*{Classes} +\begin{DoxyCompactItemize} +\item +class \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter}{search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter}} +\end{DoxyCompactItemize} +\doxysubsubsection*{Namespaces} +\begin{DoxyCompactItemize} +\item +namespace \mbox{\hyperlink{namespacesearch__engine}{search\+\_\+engine}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine}{search\+\_\+engine.\+search\+\_\+engine}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1helper}{search\+\_\+engine.\+search\+\_\+engine.\+helper}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1helper_1_1converter}{search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter}} +\end{DoxyCompactItemize} diff --git a/docs/latex/crawler_8py.tex b/docs/latex/crawler_8py.tex new file mode 100644 index 0000000..897231b --- /dev/null +++ b/docs/latex/crawler_8py.tex @@ -0,0 +1,16 @@ +\doxysection{search\+\_\+engine/crawler.py File Reference} +\hypertarget{crawler_8py}{}\label{crawler_8py}\index{search\_engine/crawler.py@{search\_engine/crawler.py}} +\doxysubsubsection*{Classes} +\begin{DoxyCompactItemize} +\item +class \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler}{search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler}} +\end{DoxyCompactItemize} +\doxysubsubsection*{Namespaces} +\begin{DoxyCompactItemize} +\item +namespace \mbox{\hyperlink{namespacesearch__engine}{search\+\_\+engine}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine}{search\+\_\+engine.\+search\+\_\+engine}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1crawler}{search\+\_\+engine.\+search\+\_\+engine.\+crawler}} +\end{DoxyCompactItemize} diff --git a/docs/latex/dir_3077535539cd151b75f9ad358f5d25ba.tex b/docs/latex/dir_3077535539cd151b75f9ad358f5d25ba.tex new file mode 100644 index 0000000..0edf533 --- /dev/null +++ b/docs/latex/dir_3077535539cd151b75f9ad358f5d25ba.tex @@ -0,0 +1,16 @@ +\doxysection{search\+\_\+engine Directory Reference} +\hypertarget{dir_3077535539cd151b75f9ad358f5d25ba}{}\label{dir_3077535539cd151b75f9ad358f5d25ba}\index{search\_engine Directory Reference@{search\_engine Directory Reference}} +\doxysubsubsection*{Directories} +\begin{DoxyCompactItemize} +\item +directory \mbox{\hyperlink{dir_a288a6e2e3e1e96db5e8d1e18942be87}{helper}} +\end{DoxyCompactItemize} +\doxysubsubsection*{Files} +\begin{DoxyCompactItemize} +\item +file \mbox{\hyperlink{____init_____8py}{\+\_\+\+\_\+init\+\_\+\+\_\+.\+py}} +\item +file \mbox{\hyperlink{crawler_8py}{crawler.\+py}} +\item +file \mbox{\hyperlink{exceptions_8py}{exceptions.\+py}} +\end{DoxyCompactItemize} diff --git a/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 b/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 index 4c3c9fa..50162c4 100644 --- a/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 +++ b/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.md5 @@ -1 +1 @@ -bad757f7dc4a7d7c23e3997687d02419 \ No newline at end of file +36f81bcb7d6cafce558a22dbbf92d35d \ No newline at end of file diff --git a/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.pdf b/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.pdf index 5a5b67b..9c0fab7 100644 Binary files a/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.pdf and b/docs/latex/dir_97aefd0d527b934f1d99a682da8fe6a9_dep.pdf differ diff --git a/docs/latex/dir_a065c5f60305fee3569f887679366939.tex b/docs/latex/dir_a065c5f60305fee3569f887679366939.tex index 4f3063e..effc5ce 100644 --- a/docs/latex/dir_a065c5f60305fee3569f887679366939.tex +++ b/docs/latex/dir_a065c5f60305fee3569f887679366939.tex @@ -10,6 +10,10 @@ \doxysubsubsection*{Files} \begin{DoxyCompactItemize} \item +file \mbox{\hyperlink{__hello_8cpp}{\+\_\+hello.\+cpp}} +\item +file \mbox{\hyperlink{__inverted__index_8cpp}{\+\_\+inverted\+\_\+index.\+cpp}} +\item file \mbox{\hyperlink{__page__rank_8cpp}{\+\_\+page\+\_\+rank.\+cpp}} \item file \mbox{\hyperlink{hello_8cpp}{hello.\+cpp}} diff --git a/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.md5 b/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.md5 index e0c7f1c..7f93305 100644 --- a/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.md5 +++ b/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.md5 @@ -1 +1 @@ -584dd3f299555fc9d2e667b519e7dbe6 \ No newline at end of file +c9e11af2475bd2b65447242ba16929d0 \ No newline at end of file diff --git a/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.pdf b/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.pdf index bb245de..63d3e3e 100644 Binary files a/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.pdf and b/docs/latex/dir_a065c5f60305fee3569f887679366939_dep.pdf differ diff --git a/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87.tex b/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87.tex new file mode 100644 index 0000000..06fe645 --- /dev/null +++ b/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87.tex @@ -0,0 +1,16 @@ +\doxysection{search\+\_\+engine/helper Directory Reference} +\hypertarget{dir_a288a6e2e3e1e96db5e8d1e18942be87}{}\label{dir_a288a6e2e3e1e96db5e8d1e18942be87}\index{search\_engine/helper Directory Reference@{search\_engine/helper Directory Reference}} +Directory dependency graph for helper\+:\nopagebreak +\begin{figure}[H] +\begin{center} +\leavevmode +\includegraphics[width=176pt]{dir_a288a6e2e3e1e96db5e8d1e18942be87_dep} +\end{center} +\end{figure} +\doxysubsubsection*{Files} +\begin{DoxyCompactItemize} +\item +file \mbox{\hyperlink{helper_2____init_____8py}{\+\_\+\+\_\+init\+\_\+\+\_\+.\+py}} +\item +file \mbox{\hyperlink{converter_8py}{converter.\+py}} +\end{DoxyCompactItemize} diff --git a/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.md5 b/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.md5 new file mode 100644 index 0000000..63a0fc9 --- /dev/null +++ b/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.md5 @@ -0,0 +1 @@ +e49a2cf62d6d8871cd3f8432ea3bc52a \ No newline at end of file diff --git a/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.pdf b/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.pdf new file mode 100644 index 0000000..7a29c1f Binary files /dev/null and b/docs/latex/dir_a288a6e2e3e1e96db5e8d1e18942be87_dep.pdf differ diff --git a/docs/latex/exceptions_8py.tex b/docs/latex/exceptions_8py.tex new file mode 100644 index 0000000..4b21c5b --- /dev/null +++ b/docs/latex/exceptions_8py.tex @@ -0,0 +1,16 @@ +\doxysection{search\+\_\+engine/exceptions.py File Reference} +\hypertarget{exceptions_8py}{}\label{exceptions_8py}\index{search\_engine/exceptions.py@{search\_engine/exceptions.py}} +\doxysubsubsection*{Classes} +\begin{DoxyCompactItemize} +\item +class \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError}{search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error}} +\end{DoxyCompactItemize} +\doxysubsubsection*{Namespaces} +\begin{DoxyCompactItemize} +\item +namespace \mbox{\hyperlink{namespacesearch__engine}{search\+\_\+engine}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine}{search\+\_\+engine.\+search\+\_\+engine}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1exceptions}{search\+\_\+engine.\+search\+\_\+engine.\+exceptions}} +\end{DoxyCompactItemize} diff --git a/docs/latex/files.tex b/docs/latex/files.tex index 56ded4a..27e752e 100644 --- a/docs/latex/files.tex +++ b/docs/latex/files.tex @@ -5,10 +5,17 @@ \item\contentsline{section}{lib/include/\mbox{\hyperlink{page__rank_8h}{page\+\_\+rank.\+h}} }{\pageref{page__rank_8h}}{} \item\contentsline{section}{lib/include/\mbox{\hyperlink{subtraction_8h}{subtraction.\+h}} }{\pageref{subtraction_8h}}{} \item\contentsline{section}{lib/include/\mbox{\hyperlink{sum_8h}{sum.\+h}} }{\pageref{sum_8h}}{} +\item\contentsline{section}{lib/src/\mbox{\hyperlink{__hello_8cpp}{\+\_\+hello.\+cpp}} }{\pageref{__hello_8cpp}}{} +\item\contentsline{section}{lib/src/\mbox{\hyperlink{__inverted__index_8cpp}{\+\_\+inverted\+\_\+index.\+cpp}} }{\pageref{__inverted__index_8cpp}}{} \item\contentsline{section}{lib/src/\mbox{\hyperlink{__page__rank_8cpp}{\+\_\+page\+\_\+rank.\+cpp}} }{\pageref{__page__rank_8cpp}}{} \item\contentsline{section}{lib/src/\mbox{\hyperlink{hello_8cpp}{hello.\+cpp}} }{\pageref{hello_8cpp}}{} \item\contentsline{section}{lib/src/\mbox{\hyperlink{inverted__index_8cpp}{inverted\+\_\+index.\+cpp}} }{\pageref{inverted__index_8cpp}}{} \item\contentsline{section}{lib/src/\mbox{\hyperlink{page__rank_8cpp}{page\+\_\+rank.\+cpp}} }{\pageref{page__rank_8cpp}}{} \item\contentsline{section}{lib/src/\mbox{\hyperlink{subtraction_8cpp}{subtraction.\+cpp}} }{\pageref{subtraction_8cpp}}{} \item\contentsline{section}{lib/src/\mbox{\hyperlink{sum_8cpp}{sum.\+cpp}} }{\pageref{sum_8cpp}}{} +\item\contentsline{section}{search\+\_\+engine/\mbox{\hyperlink{____init_____8py}{\+\_\+\+\_\+init\+\_\+\+\_\+.\+py}} }{\pageref{____init_____8py}}{} +\item\contentsline{section}{search\+\_\+engine/\mbox{\hyperlink{crawler_8py}{crawler.\+py}} }{\pageref{crawler_8py}}{} +\item\contentsline{section}{search\+\_\+engine/\mbox{\hyperlink{exceptions_8py}{exceptions.\+py}} }{\pageref{exceptions_8py}}{} +\item\contentsline{section}{search\+\_\+engine/helper/\mbox{\hyperlink{helper_2____init_____8py}{\+\_\+\+\_\+init\+\_\+\+\_\+.\+py}} }{\pageref{helper_2____init_____8py}}{} +\item\contentsline{section}{search\+\_\+engine/helper/\mbox{\hyperlink{converter_8py}{converter.\+py}} }{\pageref{converter_8py}}{} \end{DoxyCompactList} diff --git a/docs/latex/helper_2____init_____8py.tex b/docs/latex/helper_2____init_____8py.tex new file mode 100644 index 0000000..06424b6 --- /dev/null +++ b/docs/latex/helper_2____init_____8py.tex @@ -0,0 +1,2 @@ +\doxysection{search\+\_\+engine/helper/\+\_\+\+\_\+init\+\_\+\+\_\+.py File Reference} +\hypertarget{helper_2____init_____8py}{}\label{helper_2____init_____8py}\index{search\_engine/helper/\_\_init\_\_.py@{search\_engine/helper/\_\_init\_\_.py}} diff --git a/docs/latex/hierarchy.tex b/docs/latex/hierarchy.tex new file mode 100644 index 0000000..f2a1591 --- /dev/null +++ b/docs/latex/hierarchy.tex @@ -0,0 +1,11 @@ +\doxysection{Class Hierarchy} +This inheritance list is sorted roughly, but not completely, alphabetically\+:\begin{DoxyCompactList} +\item \contentsline{section}{search\+\_\+engine.\+search\+\_\+engine.\+crawler.\+Crawler}{\pageref{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler}}{} +\item \contentsline{section}{inverted\+\_\+index\+::docs}{\pageref{structinverted__index_1_1docs}}{} +\item \contentsline{section}{page\+\_\+rank\+::Graph}{\pageref{classpage__rank_1_1Graph}}{} +\item \contentsline{section}{Hello}{\pageref{classHello}}{} +\item \contentsline{section}{search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter.\+String\+To\+Int\+Converter}{\pageref{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter}}{} +\item Value\+Error\begin{DoxyCompactList} +\item \contentsline{section}{search\+\_\+engine.\+search\+\_\+engine.\+exceptions.\+Url\+Error}{\pageref{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError}}{} +\end{DoxyCompactList} +\end{DoxyCompactList} diff --git a/docs/latex/namespaces.tex b/docs/latex/namespaces.tex index 7196a3b..0c31f84 100644 --- a/docs/latex/namespaces.tex +++ b/docs/latex/namespaces.tex @@ -2,4 +2,10 @@ Here is a list of all namespaces with brief descriptions\+:\begin{DoxyCompactList} \item\contentsline{section}{\mbox{\hyperlink{namespaceinverted__index}{inverted\+\_\+index}} }{\pageref{namespaceinverted__index}}{} \item\contentsline{section}{\mbox{\hyperlink{namespacepage__rank}{page\+\_\+rank}} }{\pageref{namespacepage__rank}}{} +\item\contentsline{section}{\mbox{\hyperlink{namespacesearch__engine}{search\+\_\+engine}} }{\pageref{namespacesearch__engine}}{} +\item\contentsline{section}{\mbox{\hyperlink{namespacesearch__engine_1_1search__engine}{search\+\_\+engine.\+search\+\_\+engine}} }{\pageref{namespacesearch__engine_1_1search__engine}}{} +\item\contentsline{section}{\mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1crawler}{search\+\_\+engine.\+search\+\_\+engine.\+crawler}} }{\pageref{namespacesearch__engine_1_1search__engine_1_1crawler}}{} +\item\contentsline{section}{\mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1exceptions}{search\+\_\+engine.\+search\+\_\+engine.\+exceptions}} }{\pageref{namespacesearch__engine_1_1search__engine_1_1exceptions}}{} +\item\contentsline{section}{\mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1helper}{search\+\_\+engine.\+search\+\_\+engine.\+helper}} }{\pageref{namespacesearch__engine_1_1search__engine_1_1helper}}{} +\item\contentsline{section}{\mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1helper_1_1converter}{search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter}} }{\pageref{namespacesearch__engine_1_1search__engine_1_1helper_1_1converter}}{} \end{DoxyCompactList} diff --git a/docs/latex/namespacesearch__engine.tex b/docs/latex/namespacesearch__engine.tex new file mode 100644 index 0000000..006274f --- /dev/null +++ b/docs/latex/namespacesearch__engine.tex @@ -0,0 +1,7 @@ +\doxysection{search\+\_\+engine Namespace Reference} +\hypertarget{namespacesearch__engine}{}\label{namespacesearch__engine}\index{search\_engine@{search\_engine}} +\doxysubsubsection*{Namespaces} +\begin{DoxyCompactItemize} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine}{search\+\_\+engine}} +\end{DoxyCompactItemize} diff --git a/docs/latex/namespacesearch__engine_1_1search__engine.tex b/docs/latex/namespacesearch__engine_1_1search__engine.tex new file mode 100644 index 0000000..52b246f --- /dev/null +++ b/docs/latex/namespacesearch__engine_1_1search__engine.tex @@ -0,0 +1,11 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine Namespace Reference} +\hypertarget{namespacesearch__engine_1_1search__engine}{}\label{namespacesearch__engine_1_1search__engine}\index{search\_engine.search\_engine@{search\_engine.search\_engine}} +\doxysubsubsection*{Namespaces} +\begin{DoxyCompactItemize} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1crawler}{crawler}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1exceptions}{exceptions}} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1helper}{helper}} +\end{DoxyCompactItemize} diff --git a/docs/latex/namespacesearch__engine_1_1search__engine_1_1crawler.tex b/docs/latex/namespacesearch__engine_1_1search__engine_1_1crawler.tex new file mode 100644 index 0000000..1f2dcf2 --- /dev/null +++ b/docs/latex/namespacesearch__engine_1_1search__engine_1_1crawler.tex @@ -0,0 +1,7 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine.\+crawler Namespace Reference} +\hypertarget{namespacesearch__engine_1_1search__engine_1_1crawler}{}\label{namespacesearch__engine_1_1search__engine_1_1crawler}\index{search\_engine.search\_engine.crawler@{search\_engine.search\_engine.crawler}} +\doxysubsubsection*{Classes} +\begin{DoxyCompactItemize} +\item +class \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler}{Crawler}} +\end{DoxyCompactItemize} diff --git a/docs/latex/namespacesearch__engine_1_1search__engine_1_1exceptions.tex b/docs/latex/namespacesearch__engine_1_1search__engine_1_1exceptions.tex new file mode 100644 index 0000000..3222b39 --- /dev/null +++ b/docs/latex/namespacesearch__engine_1_1search__engine_1_1exceptions.tex @@ -0,0 +1,7 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine.\+exceptions Namespace Reference} +\hypertarget{namespacesearch__engine_1_1search__engine_1_1exceptions}{}\label{namespacesearch__engine_1_1search__engine_1_1exceptions}\index{search\_engine.search\_engine.exceptions@{search\_engine.search\_engine.exceptions}} +\doxysubsubsection*{Classes} +\begin{DoxyCompactItemize} +\item +class \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError}{Url\+Error}} +\end{DoxyCompactItemize} diff --git a/docs/latex/namespacesearch__engine_1_1search__engine_1_1helper.tex b/docs/latex/namespacesearch__engine_1_1search__engine_1_1helper.tex new file mode 100644 index 0000000..bc8c130 --- /dev/null +++ b/docs/latex/namespacesearch__engine_1_1search__engine_1_1helper.tex @@ -0,0 +1,7 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine.\+helper Namespace Reference} +\hypertarget{namespacesearch__engine_1_1search__engine_1_1helper}{}\label{namespacesearch__engine_1_1search__engine_1_1helper}\index{search\_engine.search\_engine.helper@{search\_engine.search\_engine.helper}} +\doxysubsubsection*{Namespaces} +\begin{DoxyCompactItemize} +\item +namespace \mbox{\hyperlink{namespacesearch__engine_1_1search__engine_1_1helper_1_1converter}{converter}} +\end{DoxyCompactItemize} diff --git a/docs/latex/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.tex b/docs/latex/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.tex new file mode 100644 index 0000000..242a983 --- /dev/null +++ b/docs/latex/namespacesearch__engine_1_1search__engine_1_1helper_1_1converter.tex @@ -0,0 +1,7 @@ +\doxysection{search\+\_\+engine.\+search\+\_\+engine.\+helper.\+converter Namespace Reference} +\hypertarget{namespacesearch__engine_1_1search__engine_1_1helper_1_1converter}{}\label{namespacesearch__engine_1_1search__engine_1_1helper_1_1converter}\index{search\_engine.search\_engine.helper.converter@{search\_engine.search\_engine.helper.converter}} +\doxysubsubsection*{Classes} +\begin{DoxyCompactItemize} +\item +class \mbox{\hyperlink{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter}{String\+To\+Int\+Converter}} +\end{DoxyCompactItemize} diff --git a/docs/latex/refman.tex b/docs/latex/refman.tex index 04bc3bd..52387c1 100644 --- a/docs/latex/refman.tex +++ b/docs/latex/refman.tex @@ -209,6 +209,8 @@ \input{Chap_00_Architecture_documentation} \chapter{Namespace Index} \input{namespaces} +\chapter{Hierarchical Index} +\input{hierarchy} \chapter{Class Index} \input{annotated} \chapter{File Index} @@ -216,10 +218,19 @@ \chapter{File Index} \chapter{Namespace Documentation} \input{namespaceinverted__index} \input{namespacepage__rank} +\input{namespacesearch__engine} +\input{namespacesearch__engine_1_1search__engine} +\input{namespacesearch__engine_1_1search__engine_1_1crawler} +\input{namespacesearch__engine_1_1search__engine_1_1exceptions} +\input{namespacesearch__engine_1_1search__engine_1_1helper} +\input{namespacesearch__engine_1_1search__engine_1_1helper_1_1converter} \chapter{Class Documentation} +\input{classsearch__engine_1_1search__engine_1_1crawler_1_1Crawler} \input{structinverted__index_1_1docs} \input{classpage__rank_1_1Graph} \input{classHello} +\input{classsearch__engine_1_1search__engine_1_1helper_1_1converter_1_1StringToIntConverter} +\input{classsearch__engine_1_1search__engine_1_1exceptions_1_1UrlError} \chapter{File Documentation} \input{00__Mainpage_8dox} \input{01__Introduction_8dox} @@ -244,12 +255,19 @@ \chapter{File Documentation} \input{subtraction_8h_source} \input{sum_8h} \input{sum_8h_source} +\input{__hello_8cpp} +\input{__inverted__index_8cpp} \input{__page__rank_8cpp} \input{hello_8cpp} \input{inverted__index_8cpp} \input{page__rank_8cpp} \input{subtraction_8cpp} \input{sum_8cpp} +\input{crawler_8py} +\input{exceptions_8py} +\input{____init_____8py} +\input{helper_2____init_____8py} +\input{converter_8py} %--- End generated contents --- % Index \backmatter diff --git a/search_engine/crawler.py b/search_engine/crawler.py index 2561998..c964b97 100644 --- a/search_engine/crawler.py +++ b/search_engine/crawler.py @@ -10,23 +10,22 @@ class Crawler: """ - A web crawler that traverses a network of web pages, extracts links and paragraphs, + A web crawler that traverses a network of web pages, extracts links and paragraphs, and constructs a graph using the PageRank algorithm. - Parameters - ---------- - url_base : str - The base URL from which the crawler starts. - page_name : str - The initial page to start crawling. - remove_pages : list of str, optional (default=[]) - A list of pages to exclude from the crawl. - + This crawler starts from a given base URL and an initial page, and follows links within + the website to collect data such as links and paragraphs. It constructs a graph based on + the relationships between pages. + + @param url_base: The base URL from which the crawler starts. + @param page_name: The initial page to start crawling. + @param remove_pages: A list of pages to exclude from the crawl. (Optional, default is []) + Attributes ---------- graph : PyGraph A graph representation used for PageRank calculations. - + Examples -------- >>> crawler = Crawler('https://example.com', '/home') @@ -45,17 +44,13 @@ class Crawler: def __init__(self, url_base: str, page_name: str, initial_page: str, remove_pages: list[str] = [], test_mode:bool = False): """ - Initialize the Crawler with a base URL, the starting page, and optionally, + Initialize the Crawler with a base URL, the starting page, and optionally, a list of pages to exclude. - Parameters - ---------- - url_base : str - The base URL of the website to crawl. - page_name : str - The starting page to begin crawling. - remove_pages : list of str, optional - Pages to exclude from the crawl. + @param url_base: The base URL of the website to crawl. + @param page_name: The starting page to begin crawling. + @param remove_pages: Pages to exclude from the crawl (optional). + @param test_mode: Flag to activate the test mode for crawling. (default: False) """ self.url_base = url_base self.page_name = page_name @@ -67,53 +62,38 @@ def __init__(self, url_base: str, page_name: str, initial_page: str, remove_page # Initialize the graph for PageRank self.graph = PyGraph() self.converter = StringToIntConverter() - + def _get_links(self, current_page: str) -> list: """ Retrieve all links from the specified page. - Parameters - ---------- - current_page : str - The current page to fetch links from. - - Returns - ------- - links : list of str - A list of valid links found on the current page. - - Raises - ------ - UrlError - If the current page URL is invalid or inaccessible. + @param current_page: The current page to fetch links from. + + @return: A list of valid links found on the current page. + + @raises UrlError: If the current page URL is invalid or inaccessible. """ if current_page is None: raise UrlError() - + response = requests.get(self.url_base + self.page_name + current_page) if response.status_code == 200: soup = BeautifulSoup(response.content, 'html.parser') # Find all tags

paragraphs = soup.find_all('p') # Find links in tag

- links = [a.get('href') for p in paragraphs for a in p.find_all('a', href=True) + links = [a.get('href') for p in paragraphs for a in p.find_all('a', href=True) if a.get('href').startswith(self.page_name)] return links return [] - + def _get_paragraphs(self, current_page: str) -> list: """ Retrieve all paragraphs from the specified page. - Parameters - ---------- - current_page : str - The current page to fetch paragraphs from. - - Returns - ------- - paragraphs : list of str - A list of paragraphs' text found on the current page. + @param current_page: The current page to fetch paragraphs from. + + @return: A list of paragraphs' text found on the current page. """ response = requests.get(self.url_base + self.page_name + current_page) if response.status_code == 200: @@ -125,37 +105,28 @@ def _validate_url(self, url: str): """ Validate the format of the given URL. - Parameters - ---------- - url : str - The URL to validate. - - Raises - ------ - UrlError - If the URL is not valid. + @param url: The URL to validate. + + @raises UrlError: If the URL is not valid. """ if not re.match(self.REGEX, url): raise UrlError() - + def run(self, limit = 2): """ Run the crawler to collect links and paragraphs starting from the base page. It uses a queue to traverse the links in a breadth-first manner. - Returns - ------- - all_links : list of str - A list of all links found during the crawling process. - all_paragraphs : list of str - A list of all paragraphs found during the crawling process. + @param limit: The maximum number of pages to crawl in test mode. + + @return: A graph representation of the pages and their links. """ # Initialize queue with the starting page queue = deque([self.initial_page]) visited = set() # Track visited pages to avoid processing them multiple times all_links = [] # Store all the links found during crawling all_paragraphs = [] # Store all the paragraphs found during crawling - + run = True counter = 0 @@ -186,13 +157,13 @@ def run(self, limit = 2): # Add new links to the queue if they haven't been visited for link in links: if link not in visited and link not in queue and link not in self.remove_pages: - # Extrai a ultima página + # Extract the last part of the link as the next page next_page = link.split('/')[-1] next_page_int = self.converter.convert(next_page) # Make graph self.graph.add_edge(current_page_int, next_page_int) queue.append(next_page) - + # Only when test_mode is activated if self.test_mode: counter += 1 diff --git a/search_engine/exceptions.py b/search_engine/exceptions.py index 014c885..25267a5 100644 --- a/search_engine/exceptions.py +++ b/search_engine/exceptions.py @@ -1,5 +1,29 @@ class UrlError(ValueError): - """Raised when an invalid URL is provided.""" + """ + Exception raised when an invalid URL is provided. + + Inherits from the built-in `ValueError` class. + + Attributes + ---------- + message : str + The error message that describes the cause of the exception. + Defaults to "Invalid URL". + + Methods + ------- + __init__(self, message: str = "Invalid URL") + Initializes the exception with a custom message or a default message. + """ + def __init__(self, message="Invalid URL"): + """ + Initializes the UrlError exception with a custom error message. + + Parameters + ---------- + message : str, optional + The error message to describe the exception. Default is "Invalid URL". + """ self.message = message - super().__init__(self.message) \ No newline at end of file + super().__init__(self.message) diff --git a/search_engine/helper/converter.py b/search_engine/helper/converter.py index 798ab4c..cc1f981 100644 --- a/search_engine/helper/converter.py +++ b/search_engine/helper/converter.py @@ -1,5 +1,37 @@ class StringToIntConverter: + """ + A class that converts strings to integers. If a string has already been converted, + it returns the previously assigned integer. Otherwise, it assigns a new integer + to the string and returns it. + + Attributes + ---------- + string_to_int : dict + A dictionary mapping strings to their corresponding integers. + next_int : int + The next integer to be assigned to a string. + + Methods + ------- + __init__() + Initializes the converter with an empty dictionary and sets the next integer to 0. + convert(word: str) -> int + Converts a given string to an integer. If the string has been seen before, + it returns the corresponding integer, otherwise it assigns a new integer to the string. + """ + def __init__(self): + """ + Initializes the StringToIntConverter with an empty dictionary and sets the next integer + to 0 for string-to-integer mapping. + + Attributes + ---------- + string_to_int : dict + An empty dictionary to store the mapping of strings to integers. + next_int : int + Initialized to 0, it represents the next available integer to be assigned to a string. + """ self.string_to_int = {} self.next_int = 0 @@ -7,12 +39,12 @@ def convert(self, word: str) -> int: """ Convert a string to an integer. If the string has already been seen, return its corresponding integer. Otherwise, assign a new integer to it. - + Parameters ---------- word : str The string to be converted. - + Returns ------- int @@ -21,4 +53,4 @@ def convert(self, word: str) -> int: if word not in self.string_to_int: self.string_to_int[word] = self.next_int self.next_int += 1 - return self.string_to_int[word] \ No newline at end of file + return self.string_to_int[word]