diff --git a/configs/eggjs.json b/configs/eggjs.json index c562936c9..7077597c5 100644 --- a/configs/eggjs.json +++ b/configs/eggjs.json @@ -49,5 +49,5 @@ "328319625" ], "strip_chars": " .,;:#", - "nb_hits": 7209 + "nb_hits": 7346 } \ No newline at end of file diff --git a/configs/ethereal-react.json b/configs/ethereal-react.json new file mode 100644 index 000000000..f912fa543 --- /dev/null +++ b/configs/ethereal-react.json @@ -0,0 +1,47 @@ +{ + "index_name": "ethereal-react", + "start_urls": [ + "https://kesne.github.io/ethereal-react/" + ], + "sitemap_urls": [ + "https://kesne.github.io/ethereal-react/sitemap.xml" + ], + "sitemap_alternate_links": true, + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "(//ul[contains(@class,'menu__list')]//a[contains(@class, 'menu__link menu__link--sublist menu__link--active')]/text() | //nav[contains(@class, 'navbar')]//a[contains(@class, 'navbar__link--active')]/text())[last()]", + "type": "xpath", + "global": true, + "default_value": "Documentation" + }, + "lvl1": "header h1", + "lvl2": "article h2", + "lvl3": "article h3", + "lvl4": "article h4", + "lvl5": "article h5, article td:first-child", + "text": "article p, article li, article td:last-child" + }, + "strip_chars": " .,;:#", + "custom_settings": { + "separatorsToIndex": "_", + "attributesForFaceting": [ + "language", + "version", + "type", + "docusaurus_tag" + ], + "attributesToRetrieve": [ + "hierarchy", + "content", + "anchor", + "url", + "url_without_anchor", + "type" + ] + }, + "conversation_id": [ + "1659094726" + ], + "nb_hits": 402 +} \ No newline at end of file diff --git a/configs/evcc.json b/configs/evcc.json new file mode 100644 index 000000000..21e530282 --- /dev/null +++ b/configs/evcc.json @@ -0,0 +1,47 @@ +{ + "index_name": "evcc", + "start_urls": [ + "https://docs.evcc.io/" + ], + "sitemap_urls": [ + "https://docs.evcc.io/sitemap.xml" + ], + "sitemap_alternate_links": true, + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "(//ul[contains(@class,'menu__list')]//a[contains(@class, 'menu__link menu__link--sublist menu__link--active')]/text() | //nav[contains(@class, 'navbar')]//a[contains(@class, 'navbar__link--active')]/text())[last()]", + "type": "xpath", + "global": true, + "default_value": "Documentation" + }, + "lvl1": "header h1", + "lvl2": "article h2", + "lvl3": "article h3", + "lvl4": "article h4", + "lvl5": "article h5, article td:first-child", + "text": "article p, article li, article td:last-child" + }, + "strip_chars": " .,;:#", + "custom_settings": { + "separatorsToIndex": "_", + "attributesForFaceting": [ + "language", + "version", + "type", + "docusaurus_tag" + ], + "attributesToRetrieve": [ + "hierarchy", + "content", + "anchor", + "url", + "url_without_anchor", + "type" + ] + }, + "conversation_id": [ + "1648095467" + ], + "nb_hits": 295 +} \ No newline at end of file diff --git a/configs/icalendar.json b/configs/icalendar.json new file mode 100644 index 000000000..0a1343a4b --- /dev/null +++ b/configs/icalendar.json @@ -0,0 +1,27 @@ +{ + "index_name": "icalendar", + "start_urls": [ + "https://nystudio107.com/docs/icalendar/" + ], + "sitemap_urls": [ + "https://nystudio107.com/sitemap.xml" + ], + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "", + "global": true, + "default_value": "Documentation" + }, + "lvl1": "main h1", + "lvl2": "main h2", + "lvl3": "main h3", + "lvl4": "main h4", + "lvl5": "main h5", + "text": "main p, main li" + }, + "conversation_id": [ + "1663785710" + ], + "nb_hits": 41 +} \ No newline at end of file diff --git a/configs/labnotes.json b/configs/labnotes.json new file mode 100644 index 000000000..831c1eb4b --- /dev/null +++ b/configs/labnotes.json @@ -0,0 +1,25 @@ +{ + "index_name": "labnotes", + "start_urls": [ + "https://labnotes.org" + ], + "sitemap_urls": [ + "https://labnotes.org/sitemap.xml" + ], + "stop_urls": [ + "/page/" + ], + "selectors": { + "lvl0": "article h1", + "lvl1": "article h2", + "lvl2": "article h3", + "lvl3": "article h4", + "lvl4": "article h5", + "lvl5": "article h6", + "text": "article p, article li" + }, + "conversation_id": [ + "1649358329" + ], + "nb_hits": 27305 +} \ No newline at end of file diff --git a/configs/myparcelnl.json b/configs/myparcelnl.json new file mode 100644 index 000000000..0e905c2c2 --- /dev/null +++ b/configs/myparcelnl.json @@ -0,0 +1,40 @@ +{ + "index_name": "myparcelnl", + "start_urls": [ + "https://myparcelnl.github.io/sdk/" + ], + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "p.sidebar-heading.open", + "global": true, + "default_value": "Documentation" + }, + "lvl1": ".theme-default-content h1", + "lvl2": ".theme-default-content h2", + "lvl3": ".theme-default-content h3", + "lvl4": ".theme-default-content h4", + "lvl5": ".theme-default-content h5", + "text": ".theme-default-content p, .theme-default-content li", + "lang": { + "selector": "/html/@lang", + "type": "xpath", + "global": true, + "default_value": "en-US" + } + }, + "selectors_exclude": [ + ".table-of-contents" + ], + "strip_chars": " .,;:#", + "custom_settings": { + "attributesForFaceting": [ + "lang" + ] + }, + "conversation_id": [ + "1665893964" + ], + "scrape_start_urls": false, + "nb_hits": 192 +} \ No newline at end of file diff --git a/configs/odo.json b/configs/odo.json new file mode 100644 index 000000000..bd0fe66cd --- /dev/null +++ b/configs/odo.json @@ -0,0 +1,47 @@ +{ + "index_name": "odo", + "start_urls": [ + "https://odo.dev/" + ], + "sitemap_urls": [ + "https://odo.dev/sitemap.xml" + ], + "sitemap_alternate_links": true, + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "(//ul[contains(@class,'menu__list')]//a[contains(@class, 'menu__link menu__link--sublist menu__link--active')]/text() | //nav[contains(@class, 'navbar')]//a[contains(@class, 'navbar__link--active')]/text())[last()]", + "type": "xpath", + "global": true, + "default_value": "Documentation" + }, + "lvl1": "header h1", + "lvl2": "article h2", + "lvl3": "article h3", + "lvl4": "article h4", + "lvl5": "article h5, article td:first-child", + "text": "article p, article li, article td:last-child" + }, + "strip_chars": " .,;:#", + "custom_settings": { + "separatorsToIndex": "_", + "attributesForFaceting": [ + "language", + "version", + "type", + "docusaurus_tag" + ], + "attributesToRetrieve": [ + "hierarchy", + "content", + "anchor", + "url", + "url_without_anchor", + "type" + ] + }, + "conversation_id": [ + "1664715260" + ], + "nb_hits": 615 +} \ No newline at end of file diff --git a/configs/scala-cli.json b/configs/scala-cli.json new file mode 100644 index 000000000..fc24a1fdd --- /dev/null +++ b/configs/scala-cli.json @@ -0,0 +1,47 @@ +{ + "index_name": "scala-cli", + "start_urls": [ + "https://scala-cli.virtuslab.org/" + ], + "sitemap_urls": [ + "https://scala-cli.virtuslab.org/sitemap.xml" + ], + "sitemap_alternate_links": true, + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "(//ul[contains(@class,'menu__list')]//a[contains(@class, 'menu__link menu__link--sublist menu__link--active')]/text() | //nav[contains(@class, 'navbar')]//a[contains(@class, 'navbar__link--active')]/text())[last()]", + "type": "xpath", + "global": true, + "default_value": "Documentation" + }, + "lvl1": "header h1", + "lvl2": "article h2", + "lvl3": "article h3", + "lvl4": "article h4", + "lvl5": "article h5, article td:first-child", + "text": "article p, article li, article td:last-child" + }, + "strip_chars": " .,;:#", + "custom_settings": { + "separatorsToIndex": "_", + "attributesForFaceting": [ + "language", + "version", + "type", + "docusaurus_tag" + ], + "attributesToRetrieve": [ + "hierarchy", + "content", + "anchor", + "url", + "url_without_anchor", + "type" + ] + }, + "conversation_id": [ + "1661509029" + ], + "nb_hits": 1350 +} \ No newline at end of file diff --git a/configs/synapseML.json b/configs/synapseML.json new file mode 100644 index 000000000..39cd43617 --- /dev/null +++ b/configs/synapseML.json @@ -0,0 +1,47 @@ +{ + "index_name": "synapseML", + "start_urls": [ + "https://microsoft.github.io/SynapseML/" + ], + "sitemap_urls": [ + "https://microsoft.github.io/SynapseML/sitemap.xml" + ], + "sitemap_alternate_links": true, + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "(//ul[contains(@class,'menu__list')]//a[contains(@class, 'menu__link menu__link--sublist menu__link--active')]/text() | //nav[contains(@class, 'navbar')]//a[contains(@class, 'navbar__link--active')]/text())[last()]", + "type": "xpath", + "global": true, + "default_value": "Documentation" + }, + "lvl1": "header h1", + "lvl2": "article h2", + "lvl3": "article h3", + "lvl4": "article h4", + "lvl5": "article h5, article td:first-child", + "text": "article p, article li, article td:last-child" + }, + "strip_chars": " .,;:#", + "custom_settings": { + "separatorsToIndex": "_", + "attributesForFaceting": [ + "language", + "version", + "type", + "docusaurus_tag" + ], + "attributesToRetrieve": [ + "hierarchy", + "content", + "anchor", + "url", + "url_without_anchor", + "type" + ] + }, + "conversation_id": [ + "1667154862" + ], + "nb_hits": 3498 +} \ No newline at end of file diff --git a/configs/typescript-type-challenge.json b/configs/typescript-type-challenge.json new file mode 100644 index 000000000..975013916 --- /dev/null +++ b/configs/typescript-type-challenge.json @@ -0,0 +1,47 @@ +{ + "index_name": "typescript-type-challenge", + "start_urls": [ + "https://typescript-type-challenges-list.vercel.app/" + ], + "sitemap_urls": [ + "https://typescript-type-challenges-list.vercel.app/sitemap.xml" + ], + "sitemap_alternate_links": true, + "stop_urls": [], + "selectors": { + "lvl0": { + "selector": "(//ul[contains(@class,'menu__list')]//a[contains(@class, 'menu__link menu__link--sublist menu__link--active')]/text() | //nav[contains(@class, 'navbar')]//a[contains(@class, 'navbar__link--active')]/text())[last()]", + "type": "xpath", + "global": true, + "default_value": "Documentation" + }, + "lvl1": "header h1", + "lvl2": "article h2", + "lvl3": "article h3", + "lvl4": "article h4", + "lvl5": "article h5, article td:first-child", + "text": "article p, article li, article td:last-child" + }, + "strip_chars": " .,;:#", + "custom_settings": { + "separatorsToIndex": "_", + "attributesForFaceting": [ + "language", + "version", + "type", + "docusaurus_tag" + ], + "attributesToRetrieve": [ + "hierarchy", + "content", + "anchor", + "url", + "url_without_anchor", + "type" + ] + }, + "conversation_id": [ + "1655397738" + ], + "nb_hits": 202 +} \ No newline at end of file