/** * NavigatorPlugins.java * (C) 2016 by reger24; https://github.com/reger24 * * This is a part of YaCy, a peer-to-peer based web search engine * * LICENSE * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program. * If not, see . */ package net.yacy.search.navigator; import static net.yacy.search.query.SearchEvent.log; import java.util.Collections; import java.util.HashSet; import java.util.LinkedHashMap; import java.util.LinkedHashSet; import java.util.Locale; import java.util.Map; import java.util.Set; import java.util.TreeMap; import net.yacy.crawler.CrawlSwitchboard; import net.yacy.search.schema.CollectionSchema; /** * Class to create and manipulate search navigator plugin list */ public class NavigatorPlugins { /** * Separator for specific properties in each navigator configuration */ public static final String NAV_PROPS_CONFIG_SEPARATOR = ":"; /** * List of available navigators * @return Map key=navigatorCfgname, value=std.DisplayName */ static public Map listAvailable() { Map defaultnavplugins = new TreeMap(); defaultnavplugins.put("filetype", "Filetype"); defaultnavplugins.put("hosts", "Provider"); defaultnavplugins.put("language", "Language"); defaultnavplugins.put("authors", "Authors"); defaultnavplugins.put("collections", "Collection"); defaultnavplugins.put("namespace", "Wiki Name Space"); defaultnavplugins.put("year", "Year"); // defaultnavplugins.put("year:dates_in_content_dts:Event","Event"); defaultnavplugins.put("keywords", "Keywords"); return defaultnavplugins; } /** * @param navConfig a navigator configuration String * @return the name identifying the navigator, or null when navConfig is null */ public static final String getNavName(final String navConfig) { String name = navConfig; if(navConfig != null) { final int navConfigPopsIndex = navConfig.indexOf(NAV_PROPS_CONFIG_SEPARATOR); if(navConfigPopsIndex >= 0) { name = navConfig.substring(0, navConfigPopsIndex); } } return name; } /** * @param navName a navigator name * @return the default sort properties to apply for the given navigator */ public static final NavigatorSort getDefaultSort(final String navName) { if("year".equals(navName)) { return NavigatorSort.LABEL_DESC; } return NavigatorSort.COUNT_DESC; } /** *

* Parse a navigator configuration entry and return the sort properties to * apply. *

*

* Supported formats : *

    *
  • "navName" : descending sort by count values (except for the year navigator, where the default is by descending displayed labels)
  • *
  • "navName:count" : descending sort by count values
  • *
  • "navName:label" : ascending sort by displayed labels
  • *
  • "navName:count:asc" : ascending sort by count values
  • *
  • "navName:count:desc" : descending sort by count values
  • *
  • "navName:label:asc" : ascending sort by displayed labels
  • *
  • "navName:label:desc" : descending sort by displayed labels
  • *
*

* * @param navConfig a navigator configuration String * @return return the sort properties of the navigator */ public static final NavigatorSort parseNavSortConfig(final String navConfig) { return parseNavSortConfig(navConfig, getDefaultSort(getNavName(navConfig))); } /** *

* Parse a navigator configuration entry and return the sort properties to * apply. *

*

* Supported formats : *

    *
  • "navName" : apply provided default sort/li> *
  • "navName:count" : descending sort by count values
  • *
  • "navName:label" : ascending sort by displayed labels
  • *
  • "navName:count:asc" : ascending sort by count values
  • *
  • "navName:count:desc" : descending sort by count values
  • *
  • "navName:label:asc" : ascending sort by displayed labels
  • *
  • "navName:label:desc" : descending sort by displayed labels
  • *
*

* * @param navConfig a navigator configuration String * @param defaultSort the default sort properties to apply when the * configuration String does not specify sort properties * @return return the sort properties of the navigator */ public static final NavigatorSort parseNavSortConfig(final String navConfig, final NavigatorSort defaultSort) { if (navConfig == null) { return defaultSort; } final Set navProperties = new HashSet<>(); Collections.addAll(navProperties, navConfig.split(NAV_PROPS_CONFIG_SEPARATOR)); NavigatorSort sort = defaultSort; if (navProperties.contains(NavigatorSortType.LABEL.toString().toLowerCase(Locale.ROOT))) { sort = NavigatorSort.LABEL_ASC; // default label sort if (navProperties.contains(NavigatorSortDirection.DESC.toString().toLowerCase(Locale.ROOT))) { sort = NavigatorSort.LABEL_DESC; } } if (navProperties.contains(NavigatorSortType.COUNT.toString().toLowerCase(Locale.ROOT))) { sort = NavigatorSort.COUNT_DESC; // default count sort if (navProperties.contains(NavigatorSortDirection.ASC.toString().toLowerCase(Locale.ROOT))) { sort = NavigatorSort.COUNT_ASC; } } return sort; } /** * Creates map of active search navigators from navigator config strings * @param navConfigs navigator configuration strings * @return map key=navigatorname, value=navigator.plugin reference */ public static Map initFromCfgStrings(final Set navConfigs) { final LinkedHashMap navigatorPlugins = new LinkedHashMap<>(); if(navConfigs == null) { return navigatorPlugins; } for (final String navConfig : navConfigs) { final String navName = getNavName(navConfig); if ("authors".equals(navName)) { navigatorPlugins.put("authors", new StringNavigator("Authors", CollectionSchema.author_sxt, parseNavSortConfig(navConfig))); } else if ("collections".equals(navName)) { RestrictedStringNavigator tmpnav = new RestrictedStringNavigator("Collection", CollectionSchema.collection_sxt, parseNavSortConfig(navConfig)); // exclude default internal collection names tmpnav.addForbidden("dht"); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_AUTOCRAWL_DEEP); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_AUTOCRAWL_SHALLOW); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_PROXY); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_REMOTE); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_SNIPPET_LOCAL_TEXT); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_SNIPPET_GLOBAL_TEXT); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_GREEDY_LEARNING_TEXT); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_SNIPPET_LOCAL_MEDIA); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_SNIPPET_GLOBAL_MEDIA); tmpnav.addForbidden("robot_" + CrawlSwitchboard.CRAWL_PROFILE_SURROGATE); navigatorPlugins.put("collections", tmpnav); } else if ("filetype".equals(navName)) { navigatorPlugins.put("filetype", new FileTypeNavigator("Filetype", CollectionSchema.url_file_ext_s, parseNavSortConfig(navConfig))); } else if("hosts".equals(navName)) { navigatorPlugins.put("hosts", new HostNavigator("Provider", CollectionSchema.host_s, parseNavSortConfig(navConfig))); } else if ("language".equals(navName)) { navigatorPlugins.put("language", new LanguageNavigator("Language", parseNavSortConfig(navConfig))); } else if ("namespace".equals(navName)) { navigatorPlugins.put("namespace", new NameSpaceNavigator("Wiki Name Space", parseNavSortConfig(navConfig))); } else if ("year".equals(navName)) { // YearNavigator with possible def of :fieldname:title in configstring final LinkedHashSet navProperties = new LinkedHashSet<>(); Collections.addAll(navProperties, navConfig.split(NAV_PROPS_CONFIG_SEPARATOR)); /* Remove sort related properties */ for(final NavigatorSortType sortType : NavigatorSortType.values()) { navProperties.remove(sortType.toString().toLowerCase(Locale.ROOT)); } for(final NavigatorSortDirection sortDir : NavigatorSortDirection.values()) { navProperties.remove(sortDir.toString().toLowerCase(Locale.ROOT)); } final String[] navfielddef = navProperties.toArray(new String[navProperties.size()]); if (navfielddef.length > 1) { try { // year:fieldname:title CollectionSchema field = CollectionSchema.valueOf(navfielddef[1]); if (navfielddef.length > 2) { navigatorPlugins.put(navfielddef[1], new YearNavigator(navfielddef[2], field, parseNavSortConfig(navConfig))); } else { navigatorPlugins.put(navfielddef[1], new YearNavigator("Year-" + navfielddef[1], field, parseNavSortConfig(navConfig))); } } catch (final java.lang.IllegalArgumentException ex) { log.severe("wrong navigator name in config: \"" + navConfig + "\" " + ex.getMessage()); } } else { // "year" only use default last_modified navigatorPlugins.put("year", new YearNavigator("Year", CollectionSchema.last_modified, parseNavSortConfig(navConfig))); } } else if ("keywords".equals(navName)) { navigatorPlugins.put("keywords", new TokenizedStringNavigator("Keywords", CollectionSchema.keywords, parseNavSortConfig(navConfig))); } } return navigatorPlugins; } }