📄 keywordsearch.java
字号:
/* * $Id: KeywordSearch.java 5540 2005-08-13 20:48:15Z jonesde $ * * Copyright (c) 2001-2005 The Open For Business Project (www.ofbiz.org) * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included * in all copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. * IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY * CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT * OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR * THE USE OR OTHER DEALINGS IN THE SOFTWARE. */package org.ofbiz.product.product;import java.util.HashMap;import java.util.HashSet;import java.util.Iterator;import java.util.List;import java.util.Map;import java.util.Set;import java.util.StringTokenizer;import java.util.TreeSet;import org.ofbiz.base.util.Debug;import org.ofbiz.base.util.UtilMisc;import org.ofbiz.base.util.UtilProperties;import org.ofbiz.base.util.UtilValidate;import org.ofbiz.entity.GenericDelegator;import org.ofbiz.entity.GenericEntityException;import org.ofbiz.entity.GenericValue;/** * Does a product search by keyword using the PRODUCT_KEYWORD table. * <br/>Special thanks to Glen Thorne and the Weblogic Commerce Server for ideas. * * @author <a href="mailto:jonesde@ofbiz.org">David E. Jones</a> * @version $Rev: 5540 $ * @since 2.1 */public class KeywordSearch { public static final String module = KeywordSearch.class.getName(); public static Set thesaurusRelsToInclude = new HashSet(); public static Set thesaurusRelsForReplace = new HashSet(); static { thesaurusRelsToInclude.add("KWTR_UF"); thesaurusRelsToInclude.add("KWTR_USE"); thesaurusRelsToInclude.add("KWTR_CS"); thesaurusRelsToInclude.add("KWTR_NT"); thesaurusRelsToInclude.add("KWTR_BT"); thesaurusRelsToInclude.add("KWTR_RT"); thesaurusRelsForReplace.add("KWTR_USE"); thesaurusRelsForReplace.add("KWTR_CS"); } public static String getSeparators() { // String separators = ";: ,.!?\t\"\'\r\n\\/()[]{}*%<>-+_"; String seps = UtilProperties.getPropertyValue("prodsearch", "index.keyword.separators", ";: ,.!?\t\"\'\r\n\\/()[]{}*%<>-+_"); return seps; } public static String getStopWordBagOr() { return UtilProperties.getPropertyValue("prodsearch", "stop.word.bag.or"); } public static String getStopWordBagAnd() { return UtilProperties.getPropertyValue("prodsearch", "stop.word.bag.and"); } public static boolean getRemoveStems() { String removeStemsStr = UtilProperties.getPropertyValue("prodsearch", "remove.stems"); return "true".equals(removeStemsStr); } public static Set getStemSet() { String stemBag = UtilProperties.getPropertyValue("prodsearch", "stem.bag"); Set stemSet = new TreeSet(); if (UtilValidate.isNotEmpty(stemBag)) { String curToken; StringTokenizer tokenizer = new StringTokenizer(stemBag, ": "); while (tokenizer.hasMoreTokens()) { curToken = tokenizer.nextToken(); stemSet.add(curToken); } } return stemSet; } public static void processForKeywords(String str, Map keywords, boolean forSearch, boolean anyPrefix, boolean anySuffix, boolean isAnd) { String separators = getSeparators(); String stopWordBagOr = getStopWordBagOr(); String stopWordBagAnd = getStopWordBagAnd(); boolean removeStems = getRemoveStems(); Set stemSet = getStemSet(); processForKeywords(str, keywords, separators, stopWordBagAnd, stopWordBagOr, removeStems, stemSet, forSearch, anyPrefix, anySuffix, isAnd); } public static void processKeywordsForIndex(String str, Map keywords, String separators, String stopWordBagAnd, String stopWordBagOr, boolean removeStems, Set stemSet) { processForKeywords(str, keywords, separators, stopWordBagAnd, stopWordBagOr, removeStems, stemSet, false, false, false, false); } public static void processForKeywords(String str, Map keywords, String separators, String stopWordBagAnd, String stopWordBagOr, boolean removeStems, Set stemSet, boolean forSearch, boolean anyPrefix, boolean anySuffix, boolean isAnd) { Set keywordSet = makeKeywordSet(str, separators, forSearch); fixupKeywordSet(keywordSet, keywords, stopWordBagAnd, stopWordBagOr, removeStems, stemSet, forSearch, anyPrefix, anySuffix, isAnd); } public static void fixupKeywordSet(Set keywordSet, Map keywords, String stopWordBagAnd, String stopWordBagOr, boolean removeStems, Set stemSet, boolean forSearch, boolean anyPrefix, boolean anySuffix, boolean isAnd) { if (keywordSet == null) { return; } Iterator keywordIter = keywordSet.iterator(); while (keywordIter.hasNext()) { String token = (String) keywordIter.next(); // when cleaning up the tokens the ordering is inportant: check stop words, remove stems, then get rid of 1 character tokens (1 digit okay) // check stop words String colonToken = ":" + token + ":"; if (forSearch) { if ((isAnd && stopWordBagAnd.indexOf(colonToken) >= 0) || (!isAnd && stopWordBagOr.indexOf(colonToken) >= 0)) { continue; } } else { if (stopWordBagOr.indexOf(colonToken) >= 0 && stopWordBagAnd.indexOf(colonToken) >= 0) { continue; } } // remove stems if (removeStems) { Iterator stemIter = stemSet.iterator(); while (stemIter.hasNext()) { String stem = (String) stemIter.next(); if (token.endsWith(stem)) { token = token.substring(0, token.length() - stem.length()); } } } // get rid of all length 0 tokens now if (token.length() == 0) { continue; } // get rid of all length 1 character only tokens, pretty much useless if (token.length() == 1 && Character.isLetter(token.charAt(0))) { continue; } if (forSearch) { StringBuffer strSb = new StringBuffer(); if (anyPrefix) strSb.append('%'); strSb.append(token); if (anySuffix) strSb.append('%'); // replace all %% with % int dblPercIdx = -1; while ((dblPercIdx = strSb.indexOf("%%")) >= 0) { //Debug.logInfo("before strSb: " + strSb, module); strSb.replace(dblPercIdx, dblPercIdx+2, "%"); //Debug.logInfo("after strSb: " + strSb, module); } token = strSb.toString(); } // group by word, add up weight Long curWeight = (Long) keywords.get(token); if (curWeight == null) { keywords.put(token, new Long(1)); } else { keywords.put(token, new Long(curWeight.longValue() + 1)); } } } public static Set makeKeywordSet(String str, String separators, boolean forSearch) { if (separators == null) separators = getSeparators(); Set keywords = new TreeSet(); if (str.length() > 0) { if (forSearch) { // remove %_*? from separators if is for a search StringBuffer sb = new StringBuffer(separators); if (sb.indexOf("%") >= 0) sb.deleteCharAt(sb.indexOf("%")); if (sb.indexOf("_") >= 0) sb.deleteCharAt(sb.indexOf("_")); if (sb.indexOf("*") >= 0) sb.deleteCharAt(sb.indexOf("*")); if (sb.indexOf("?") >= 0) sb.deleteCharAt(sb.indexOf("?")); separators = sb.toString(); } StringTokenizer tokener = new StringTokenizer(str, separators, false); while (tokener.hasMoreTokens()) { // make sure it is lower case before doing anything else String token = tokener.nextToken().toLowerCase(); if (forSearch) { // these characters will only be present if it is for a search, ie not for indexing token = token.replace('*', '%'); token = token.replace('?', '_'); } keywords.add(token); } } return keywords; } public static Set fixKeywordsForSearch(Set keywordSet, boolean anyPrefix, boolean anySuffix, boolean removeStems, boolean isAnd) { Map keywords = new HashMap(); fixupKeywordSet(keywordSet, keywords, getStopWordBagAnd(), getStopWordBagOr(), removeStems, getStemSet(), true, anyPrefix, anySuffix, isAnd); return keywords.keySet(); } public static boolean expandKeywordForSearch(String enteredKeyword, Set addToSet, GenericDelegator delegator) { boolean replaceEnteredKeyword = false; try { List thesaurusList = delegator.findByAndCache("KeywordThesaurus", UtilMisc.toMap("enteredKeyword", enteredKeyword)); Iterator thesaurusIter = thesaurusList.iterator(); while (thesaurusIter.hasNext()) { GenericValue keywordThesaurus = (GenericValue) thesaurusIter.next(); String relationshipEnumId = (String) keywordThesaurus.get("relationshipEnumId"); if (thesaurusRelsToInclude.contains(relationshipEnumId)) { addToSet.addAll(makeKeywordSet(keywordThesaurus.getString("alternateKeyword"), null, true)); if (thesaurusRelsForReplace.contains(relationshipEnumId)) { replaceEnteredKeyword = true; } } } } catch (GenericEntityException e) { Debug.logError(e, "Error expanding entered keyword", module); } Debug.logInfo("Expanded keyword [" + enteredKeyword + "], got set: " + addToSet, module); return replaceEnteredKeyword; } public static void induceKeywords(GenericValue product) throws GenericEntityException { if (product == null) return; KeywordIndex.indexKeywords(product, false); } public static void induceKeywords(GenericValue product, boolean doAll) throws GenericEntityException { if (product == null) return; KeywordIndex.indexKeywords(product, doAll); }}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -