Compare commits
No commits in common. "master" and "legacy_algo" have entirely different histories.
master...legacy_algo
.gitignore: 4 lines changed (vendored)

@@ -1,7 +1,3 @@
 __pycache__
 *.html
 .venv
-neuralWeights.json
-neuralWeights.json.*
-.imgLinkCache.json
-.idea
README.md

@@ -1,4 +1,4 @@
 # CaliGraph
 CaliGraph connects to the database of your local Calibre instance in order to recommend which unread books are likely to be enjoyed. The recommendations are displayed in a graph that explains each recommendation by showing correlations to previously read books, authors, recommendations by the same individuals, tags...
 
-![Screenshot](./Screenshot_README.png)
+![Screenshot](https://gitea.dominik.roth.ml/dodox/CaliGraph/raw/branch/master/Screenshot_README.png)
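The README's "connects to the database of your local Calibre instance" amounts to reading Calibre's SQLite metadata.db. Below is a minimal illustrative sketch of that step, not taken from caliGraph.py: the library path is an assumption, and only Calibre's standard books table is queried.

import sqlite3
from pathlib import Path

# Assumed default Calibre library location; adjust for your machine.
DB_PATH = Path.home() / "Calibre Library" / "metadata.db"

def list_books(db_path=DB_PATH):
    """Return (title, author_sort) pairs from Calibre's metadata.db."""
    con = sqlite3.connect(str(db_path))
    try:
        # 'books' is part of Calibre's standard schema.
        rows = con.execute(
            "SELECT title, author_sort FROM books ORDER BY title"
        ).fetchall()
    finally:
        con.close()
    return rows

if __name__ == "__main__":
    for title, author in list_books():
        print(title, "/", author)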
Screenshot_README.png: binary file not shown (before: 243 KiB, after: 428 KiB)
caliGraph.py: 1305 lines changed (diff suppressed because it is too large)
Binary file not shown (before: 2.5 MiB)
rec_dbs/mrb_db.csv: 3004 lines changed (diff suppressed because it is too large)

rec_dbs/tgb_1.csv: 2691 lines changed (diff suppressed because it is too large)

rec_dbs/tgb_2.csv: 1318 lines changed (diff suppressed because it is too large)
requirements.txt (file deleted)

@@ -1,14 +0,0 @@
-numpy
-scipy
-matplotlib
-networkx
-pyvis
-fuzzywuzzy
-rake_nltk
-ptpython
-requests
-pandas
-plotly
-wikipedia
-argcomplete
-pyzshcomplete
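The removed dependency list includes networkx and pyvis, which matches the README's interactive graph output (and the *.html entry in .gitignore). A hedged sketch of that rendering step follows; the node names and edge weights here are toy data, since the real correlation logic lives in caliGraph.py and is not shown in this diff.

import networkx as nx
from pyvis.network import Network

# Toy recommendation edges: (node, node, correlation strength). Illustrative only.
edges = [
    ("Unread Book A", "Read Book B", 0.8),
    ("Unread Book A", "Author X", 0.5),
    ("Read Book B", "Author X", 1.0),
]

g = nx.Graph()
for src, dst, weight in edges:
    g.add_edge(src, dst, weight=weight)

net = Network(height="600px", width="100%")
net.from_nx(g)                          # import the networkx graph into pyvis
net.save_graph("recommendations.html")  # write an interactive HTML file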
zSearch.py: 155 lines changed (whole file removed; its contents are reproduced below)

import requests
from bs4 import BeautifulSoup


class Search:

    def __init__(self):
        self.searchType = "general"
        self.searchOptions = {"e": "", "yearFrom": "", \
                              "yearTo": "", "language": "", \
                              "extension": "", "page": "1", \
                              "order": ""}
        self.searchResults = "books"
        self.input = ""

    def nextPage(self):
        '''Goes to next page'''
        self.searchOptions["page"] = str(int(self.searchOptions["page"]) + 1)

    def previousPage(self):
        '''Goes to previous page'''
        if self.searchOptions["page"] != "1":
            self.searchOptions["page"] = str(int(self.searchOptions["page"]) - 1)
        else:
            return 1

    def updateSearchOptions(self):
        '''Depending on searchType and searchResults, updates searchOptions
        appropriately
        '''
        if self.searchType == "general":
            self.searchOptions.pop("matchPhrase", None)
        else:
            self.searchOptions["matchPhrase"] = ""

        if self.searchResults == "books":
            self.searchOptions["language"] = ""
            self.searchOptions["extension"] = ""
        else:
            self.searchOptions.pop("language", None)
            self.searchOptions.pop("extension", None)

    def executeSearch(self):
        '''Executes get request and returns response'''
        if self.searchResults == "books":
            url = "http://b-ok.cc"
        else:
            url = "http://booksc.xyz"

        r = requests.get(url + "/s/" + self.input, params=self.searchOptions)
        return r

    def getResults(self):
        '''Fetches search results. Returns a list of books
        '''
        r = self.executeSearch()
        soup = BeautifulSoup(r.text, "html.parser")
        match = soup.find_all(class_="resItemBox")
        counter = 1
        results = []
        for e in match:
            title = e.find(itemprop="name")
            author = e.find(class_="authors")
            year = e.find(class_="bookProperty property_year")
            language = e.find(class_="bookProperty property_language")
            fileInfo = e.find(class_="bookProperty property__file")
            link = e.find("a", href=True)
            link = link["href"]

            if self.searchResults == "books":
                fullLink = "https://b-ok.cc" + link
            else:
                fullLink = "booksc.xyz" + link

            title = isNone(title)
            author = isNone(author)
            year = isNone(year)
            language = isNone(language)
            fileInfo = isNone(fileInfo)

            book = Book(title, author, year, language, fileInfo, fullLink)
            results += [book]

        return results

    def reset(self):
        '''Clears the search and resets to default options'''
        self.searchType = "general"
        self.searchOptions = {"e": "", "yearFrom": "", \
                              "yearTo": "", "language": "", \
                              "extension": "", "page": "1", \
                              "order": ""}
        self.searchResults = "books"
        self.input = ""


def isNone(e):
    if e != None:
        return "".join(e.text.splitlines())
    else:
        return ""


class Book:

    def __init__(self, title, author, year, language, fileInfo, link):
        self.title = title
        self.author = author
        self.year = year
        self.language = language
        self.fType, self.size = fileInfo.split(', ')
        self.link = link
        self.dlLink = None
        self.page = None

    def __repr__(self):
        return '<zBook: ' + str(self) + '>'

    def __str__(self):
        return " / ".join([self.title, self.author, self.year, \
                           self.language, self.fType, self.size])

    def getDetails(self):
        '''Returns more specific info about the book. The info is retrieved by the
        link attribute
        '''
        if self.page == None:
            self.page = requests.get(self.link).text

        soup = BeautifulSoup(self.page, "html.parser")
        # for some reason, bookProperty also shows properties from other books
        # the line below prevents this
        soup = soup.find(class_="row cardBooks")
        match = soup.find_all(class_="bookProperty")

        results = ""
        for e in match:
            results += "".join(e.text.splitlines())
            results += "\n"

        # this makes writing the category easier for some books
        results = results.replace("\\\\", " \\ ")
        return results

    def getDownloadURL(self):
        if self.dlLink == None:
            if self.page == None:
                self.page = requests.get(self.link).text
            soup = BeautifulSoup(self.page, "html.parser")
            self.dlLink = soup.find('a', 'btn btn-primary dlButton addDownloadedBook')['href']
        return 'https://b-ok.cc' + self.dlLink + '?dsource=recommend'

    def saveBook(self, path):
        r = requests.get(self.getDownloadURL(), allow_redirects=True)
        with open(path, 'wb') as f:
            f.write(r.content)
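For orientation, a short usage sketch of the removed module as reproduced above. This is illustrative only: the search term is a made-up example, and the scraped site may no longer respond.

from zSearch import Search

s = Search()
s.input = "example search term"   # query string lives on the instance
s.updateSearchOptions()           # sync options with searchType/searchResults
books = s.getResults()            # list of Book objects parsed from the results page

for b in books[:5]:
    print(b)                      # "title / author / year / language / type / size"

if books:
    books[0].saveBook("/tmp/book." + books[0].fType)  # download the first hit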