mirror of https://github.com/tiyn/beaker-blog
parent
a936fd5ee6
commit
8796169ff7
@ -0,0 +1,16 @@
|
|||||||
|
import os
|
||||||
|
|
||||||
|
from flask_wtf import CSRFProtect, FlaskForm
|
||||||
|
from wtforms import StringField, SubmitField, ValidationError, validators
|
||||||
|
|
||||||
|
|
||||||
|
def register_csrf(app):
    """
    Enable CSRF protection on the given application.

    The secret key is only set when the application does not already have
    one. In that case the ``SECRET_KEY`` environment variable is used and,
    if it is unset or empty, a random 32 byte key is generated.

    Parameters:
    app: application object; its ``secret_key`` attribute is read and
        possibly set, and it is handed to ``CSRFProtect.init_app``

    Returns:
    None
    """
    if not app.secret_key:
        # A purely random key differs between worker processes and between
        # restarts, which invalidates every token issued by another process.
        # Prefer a stable key from the environment and only fall back to a
        # random one when nothing else is configured.
        app.secret_key = os.environ.get("SECRET_KEY") or os.urandom(32)
    csrf = CSRFProtect()
    csrf.init_app(app)
|
||||||
|
|
||||||
|
|
||||||
|
class SearchForm(FlaskForm):
    """Form with a single required text field holding the search term."""

    query_str = StringField(
        label="Query",
        validators=[
            validators.DataRequired(message="Please enter the search term"),
        ],
    )
    # The submit field is intentionally disabled.
    # submit = SubmitField("Search")
|
@ -1,2 +1,7 @@
|
|||||||
Flask
|
Flask
|
||||||
Markdown
|
Markdown
|
||||||
|
Whoosh
|
||||||
|
WTForms
|
||||||
|
Flask_WTF
|
||||||
|
MarkupSafe
|
||||||
|
Font-Awesome-Flask
|
||||||
|
@ -0,0 +1,72 @@
|
|||||||
|
import os
|
||||||
|
|
||||||
|
from whoosh import scoring
|
||||||
|
from whoosh.fields import ID, TEXT, Schema
|
||||||
|
from whoosh.index import create_in, open_dir
|
||||||
|
from whoosh.qparser import QueryParser
|
||||||
|
|
||||||
|
import config
|
||||||
|
|
||||||
|
# Directory (relative path) in which the Whoosh index is created and opened.
INDEX_DIR = "indexdir"
|
||||||
|
# Number of hits search() asks for when the caller gives no explicit limit.
DEF_TOPN = 10
|
||||||
|
# Root directory whose files are indexed; taken from the project config.
ENTRY_DIR = config.ENTRY_DIR
|
||||||
|
|
||||||
|
|
||||||
|
def createSearchableData(root):
    """
    Build the search index from every file found below a directory.

    Schema definition: title (first line of the file, stored), path (file
    path as ID, stored), content (whole file text, indexed but not stored).

    source:
    https://appliedmachinelearning.blog/2018/07/31/developing-a-fast-indexing-and-full-text-search-engine-with-whoosh-a-pure-pythhon-library/

    Parameters:
    root (string): directory that is walked recursively for files to index

    Returns:
    None
    """
    schema = Schema(title=TEXT(stored=True), path=ID(stored=True), content=TEXT)
    # exist_ok avoids the check-then-create race of exists() followed by mkdir().
    os.makedirs(INDEX_DIR, exist_ok=True)
    index = create_in(INDEX_DIR, schema)
    # Used as a context manager the writer commits when the block finishes
    # and cancels (releasing its lock) when indexing raises.
    with index.writer() as writer:
        for dirpath, _, filenames in os.walk(root):
            for filename in filenames:
                path = os.path.join(dirpath, filename)
                # "with" closes the file even if reading or decoding fails.
                with open(path, encoding="utf-8") as entry:
                    # The title is kept exactly as read, including its
                    # trailing newline.
                    title = entry.readline()
                    text = title + entry.read()
                writer.add_document(title=title, path=path, content=text)
|
||||||
|
|
||||||
|
|
||||||
|
def search_times(query_str, topN):
    """
    Look up a term in the index and return at most a given number of hits.

    Parameters:
    query_str (string): term to search for
    topN (int): number of results to return

    Returns:
    list: one dict per hit with the keys "title", "path" and "match"
        (the score of the hit)
    """
    index = open_dir(INDEX_DIR)
    with index.searcher(weighting=scoring.BM25F) as searcher:
        parsed = QueryParser("content", index.schema).parse(query_str)
        hits = searcher.search(parsed, limit=topN)
        # The stored fields are copied out while the searcher is still open.
        found = [
            {"title": hit["title"], "path": hit["path"], "match": hit.score}
            for hit in hits
        ]
    return found
|
||||||
|
|
||||||
|
|
||||||
|
def search(query_str):
    """
    Look up a term in the index using the predefined result limit.

    Parameters:
    query_str (string): term to search for

    Returns:
    list: whatever search_times returns for DEF_TOPN results
    """
    limit = DEF_TOPN
    return search_times(query_str, limit)
|
||||||
|
|
||||||
|
|
||||||
|
# Module-level side effect: the index is built when this module is imported.
createSearchableData(ENTRY_DIR)
|
@ -0,0 +1,19 @@
|
|||||||
|
{% extends "template.html" %}
{% block content %}

<div class="container">
  <div class="search">
    <h1>{% if language=="de-de" %}Suche{% else %}Search{% endif %}</h1><br>
    <form class="search" action="{{ url_for('search') }}" method="post">
      {{ form.hidden_tag() }}
      {{ form.query_str }}
      {# form.submit is not rendered; the button below is written by hand so it can show an icon. #}
      <button id="submit" name="submit" type="submit" value="Search">{{ font_awesome.render_icon("fas fa-search") }}</button>
    </form>
    {# NOTE(review): autoescaping is off, so content is emitted as raw HTML. Confirm the view escapes any user-supplied text it puts in there. #}
    {% autoescape off %}
    {{ content }}
    {% endautoescape %}
  </div>
</div>
{% endblock %}
|
Loading…
Reference in new issue