1
0
mirror of https://github.com/thangisme/notes.git synced 2025-01-18 04:56:27 -05:00
notes/lib/tasks/search.rake

87 lines
4.3 KiB
Ruby
Raw Normal View History

2017-06-08 14:24:29 -04:00
namespace :search do
2017-06-09 09:43:20 -04:00
desc 'Generate the files needed for search functionality'
2017-06-08 14:24:29 -04:00
task :init do
2017-06-09 09:43:20 -04:00
puts 'Creating search data json file...'
2018-10-24 16:34:11 -04:00
mkdir_p 'assets/js'
2020-06-27 05:02:36 -04:00
touch 'assets/js/zzzz-search-data.json'
2018-10-23 13:09:23 -04:00
puts 'Done.'
2018-10-23 12:51:11 -04:00
puts 'Generating content...'
2020-06-27 05:02:36 -04:00
File.open('assets/js/zzzz-search-data.json', 'w') do |f|
2017-06-09 10:58:35 -04:00
f.puts '---
2020-06-27 05:02:36 -04:00
permalink: /assets/js/search-data.json
2017-06-09 10:58:35 -04:00
---
{
{%- assign i = 0 -%}
{%- assign pages_array = '' | split: '' -%}
2020-07-09 16:14:57 -04:00
{%- assign pages_array = pages_array | push: site.html_pages -%}
{%- if site.just_the_docs.collections -%}
{%- for collection_entry in site.just_the_docs.collections -%}
{%- assign collection_key = collection_entry[0] -%}
{%- assign collection_value = collection_entry[1] -%}
{%- assign collection = site[collection_key] -%}
{%- if collection_value.search_exclude != true -%}
{%- assign pages_array = pages_array | push: collection -%}
{%- endif -%}
2020-07-09 16:14:57 -04:00
{%- endfor -%}
{%- endif -%}
{%- for pages in pages_array -%}
{%- for page in pages -%}
2020-06-27 05:02:36 -04:00
{%- if page.title and page.search_exclude != true -%}
{%- assign page_content = page.content -%}
{%- assign heading_level = site.search.heading_level | default: 2 -%}
{%- for j in (2..heading_level) -%}
{%- assign tag = \'<h\' | append: j -%}
{%- assign closing_tag = \'</h\' | append: j -%}
{%- assign page_content = page_content | replace: tag, \'<h1\' | replace: closing_tag, \'</h1\' -%}
{%- endfor -%}
{%- assign parts = page_content | split: \'<h1\' -%}
{%- assign title_found = false -%}
2020-07-09 16:14:57 -04:00
{%- for part in parts offset: 1 -%}
2020-06-27 05:02:36 -04:00
{%- assign titleAndContent = part | split: \'</h1>\' -%}
{%- assign title = titleAndContent[0] | replace_first: \'>\', \'<h1>\' | split: \'<h1>\' -%}
{%- assign title = title[1] | strip_html -%}
{%- assign content = titleAndContent[1] -%}
{%- assign url = page.url -%}
{%- if title == page.title and parts[0] == \'\' -%}
{%- assign title_found = true -%}
{%- else -%}
{%- assign id = titleAndContent[0] -%}
{%- assign id = id | split: \'id="\' -%}
{%- if id.size == 2 -%}
{%- assign id = id[1] -%}
{%- assign id = id | split: \'"\' -%}
{%- assign id = id[0] -%}
{%- capture url -%}{{ url | append: \'#\' | append: id }}{%- endcapture -%}
{%- endif -%}
{%- endif -%}
{%- unless i == 0 -%},{%- endunless -%}
"{{ i }}": {
"doc": {{ page.title | jsonify }},
"title": {{ title | jsonify }},
"content": {{ content | replace: \'</h\', \' . </h\' | replace: \'<hr\', \' . <hr\' | replace: \'</p\', \' . </p\' | replace: \'<ul\', \' . <ul\' | replace: \'</ul\', \' . </ul\' | replace: \'<ol\', \' . <ol\' | replace: \'</ol\', \' . </ol\' | replace: \'</tr\', \' . </tr\' | replace: \'<li\', \' | <li\' | replace: \'</li\', \' | </li\' | replace: \'</td\', \' | </td\' | replace: \'<td\', \' | <td\' | replace: \'</th\', \' | </th\' | replace: \'<th\', \' | <th\' | strip_html | remove: \'Table of contents\' | normalize_whitespace | replace: \'. . .\', \'.\' | replace: \'. .\', \'.\' | replace: \'| |\', \'|\' | append: \' \' | jsonify }},
"url": "{{ url | relative_url }}",
"relUrl": "{{ url }}"
}
{%- assign i = i | plus: 1 -%}
{%- endfor -%}
{%- unless title_found -%}
{%- unless i == 0 -%},{%- endunless -%}
"{{ i }}": {
"doc": {{ page.title | jsonify }},
"title": {{ page.title | jsonify }},
"content": {{ parts[0] | replace: \'</h\', \' . </h\' | replace: \'<hr\', \' . <hr\' | replace: \'</p\', \' . </p\' | replace: \'<ul\', \' . <ul\' | replace: \'</ul\', \' . </ul\' | replace: \'<ol\', \' . <ol\' | replace: \'</ol\', \' . </ol\' | replace: \'</tr\', \' . </tr\' | replace: \'<li\', \' | <li\' | replace: \'</li\', \' | </li\' | replace: \'</td\', \' | </td\' | replace: \'<td\', \' | <td\' | replace: \'</th\', \' | </th\' | replace: \'<th\', \' | <th\' | strip_html | remove: \'Table of contents\' | normalize_whitespace | replace: \'. . .\', \'.\' | replace: \'. .\', \'.\' | replace: \'| |\', \'|\' | append: \' \' | jsonify }},
2020-06-26 06:41:50 -04:00
"url": "{{ page.url | relative_url }}",
"relUrl": "{{ page.url }}"
2020-06-27 05:02:36 -04:00
}
{%- assign i = i | plus: 1 -%}
{%- endunless -%}
{%- endif -%}
2020-07-09 16:14:57 -04:00
{%- endfor -%}
{%- endfor %}
2017-06-09 10:58:35 -04:00
}'
2017-06-08 14:24:29 -04:00
end
2018-10-23 12:51:11 -04:00
puts 'Done.'
2017-06-04 17:49:20 -04:00
end
2017-06-08 09:43:33 -04:00
end