diff options
Diffstat (limited to 'search/strus/README')
-rw-r--r-- | search/strus/README | 26 |
1 files changed, 26 insertions, 0 deletions
diff --git a/search/strus/README b/search/strus/README new file mode 100644 index 0000000..4f2ad15 --- /dev/null +++ b/search/strus/README @@ -0,0 +1,26 @@ +# Search index with strus + +# For now create an XML from the content, later have a directory iterator +# over 'content' and read TOML/YAML headers and markdown... + +# TODO: this becomes obsolete with a Hugo segmenter which understands +# YAML/TOML/JSON and Markdown: +# remarshal (https://github.com/dbohdan/remarshal) +# pandoc (http://pandoc.org/) +# client-side needs: +# https://github.com/fortnightlabs/snowball-js + +./create_xml.sh > posts.xml + +xmllint -noout posts.xml + +# test configuration of document analysis + +strusAnalyze document.ana posts.xml |& less + +# Create the strus search index: + +rm -rf storage +mkdir storage +strusCreate -s 'path=storage/wwwandreasbaumanncc; metadata=doclen UINT16, publish_date UINT16' +strusInsert -c 1000 -f 1 -t 1 -s "path=storage/wwwandreasbaumanncc" document.ana posts.xml |