Implement trivial custom analyzer
This commit is contained in:
		
							parent
							
								
									6405617858
								
							
						
					
					
						commit
						c61932d99d
					
				| @ -7,8 +7,12 @@ import java.io.Reader; | |||||||
| import java.nio.file.Paths; | import java.nio.file.Paths; | ||||||
| import java.text.ParseException; | import java.text.ParseException; | ||||||
| import java.util.HashMap; | import java.util.HashMap; | ||||||
|  | import java.util.List; | ||||||
| import java.util.Map; | import java.util.Map; | ||||||
| import org.apache.lucene.analysis.Analyzer; | import org.apache.lucene.analysis.Analyzer; | ||||||
|  | import org.apache.lucene.analysis.core.WhitespaceAnalyzer; | ||||||
|  | import org.apache.lucene.analysis.en.EnglishAnalyzer; | ||||||
|  | import org.apache.lucene.analysis.miscellaneous.PerFieldAnalyzerWrapper; | ||||||
| import org.apache.lucene.analysis.standard.StandardAnalyzer; | import org.apache.lucene.analysis.standard.StandardAnalyzer; | ||||||
| import org.apache.lucene.document.Document; | import org.apache.lucene.document.Document; | ||||||
| import org.apache.lucene.index.IndexWriter; | import org.apache.lucene.index.IndexWriter; | ||||||
| @ -17,20 +21,29 @@ import org.apache.lucene.index.IndexWriterConfig.OpenMode; | |||||||
| import org.apache.lucene.store.Directory; | import org.apache.lucene.store.Directory; | ||||||
| import org.apache.lucene.store.FSDirectory; | import org.apache.lucene.store.FSDirectory; | ||||||
| import org.json.simple.JSONArray; | import org.json.simple.JSONArray; | ||||||
|  | import org.json.simple.JSONObject; | ||||||
| import org.json.simple.JSONValue; | import org.json.simple.JSONValue; | ||||||
| 
 | 
 | ||||||
| public class Indexer { | public class Indexer { | ||||||
|     IndexWriter index; |     IndexWriter index; | ||||||
|     String folderPath; |     String folderPath; | ||||||
|     Map<String, Analyzer> analyzerPerField; |     PerFieldAnalyzerWrapper customAnalyzer; | ||||||
| 
 | 
 | ||||||
|     Indexer(String folderPath) throws IOException, ParseException { |     Indexer(String folderPath) throws IOException, ParseException { | ||||||
|         this.folderPath = folderPath; |         this.folderPath = folderPath; | ||||||
|         analyzerPerField = new HashMap<>(); |         customAnalyzer = createAnalyzer(); | ||||||
|         createIndex(folderPath); |  | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     public JSONArray parseJSONFile(String filePath) throws IOException, ParseException { |     PerFieldAnalyzerWrapper createAnalyzer() { | ||||||
|  |         Map<String, Analyzer> analyzerPerField = new HashMap<>(); | ||||||
|  |         analyzerPerField.put("title", new EnglishAnalyzer()); | ||||||
|  |         analyzerPerField.put("abstract", new EnglishAnalyzer()); | ||||||
|  |         PerFieldAnalyzerWrapper customAnalyzer = new PerFieldAnalyzerWrapper(new WhitespaceAnalyzer(), | ||||||
|  |                 analyzerPerField); | ||||||
|  |         return customAnalyzer; | ||||||
|  |     } | ||||||
|  | 
 | ||||||
|  |     JSONArray parseJSONFile(String filePath) throws IOException, ParseException { | ||||||
|         InputStream jsonFile = getClass().getResourceAsStream(filePath); |         InputStream jsonFile = getClass().getResourceAsStream(filePath); | ||||||
|         Reader readerJson = new InputStreamReader(jsonFile); |         Reader readerJson = new InputStreamReader(jsonFile); | ||||||
|         Object fileObjects = JSONValue.parse(readerJson); |         Object fileObjects = JSONValue.parse(readerJson); | ||||||
| @ -38,25 +51,26 @@ public class Indexer { | |||||||
|         return arrayObjects; |         return arrayObjects; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     public void openIndex() throws IOException { |     void openIndex() throws IOException { | ||||||
|         Directory dir = FSDirectory.open(Paths.get(folderPath)); |         Directory dir = FSDirectory.open(Paths.get(folderPath)); | ||||||
|         Analyzer analyzer = new StandardAnalyzer(); |         IndexWriterConfig config = new IndexWriterConfig(customAnalyzer); | ||||||
|         IndexWriterConfig config = new IndexWriterConfig(analyzer); |  | ||||||
|         config.setOpenMode(OpenMode.CREATE_OR_APPEND); |         config.setOpenMode(OpenMode.CREATE_OR_APPEND); | ||||||
|         index = new IndexWriter(dir, config); |         index = new IndexWriter(dir, config); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     public void addDocuments(JSONArray jsonObjects) throws IOException { |     void addDocuments(JSONArray jsonObjects) throws IOException { | ||||||
|  |         for (JSONObject object : (List<JSONObject>) jsonObjects) { | ||||||
|             Document doc = new Document(); |             Document doc = new Document(); | ||||||
|             index.addDocument(doc); |             index.addDocument(doc); | ||||||
|         } |         } | ||||||
|  |     } | ||||||
| 
 | 
 | ||||||
|     public void commitChanges() throws IOException { |     void commitChanges() throws IOException { | ||||||
|         index.commit(); |         index.commit(); | ||||||
|         index.close(); |         index.close(); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     public void createIndex(String folderPath) throws IOException, ParseException { |     void createIndex() throws IOException, ParseException { | ||||||
|         JSONArray jsonObjects = parseJSONFile(folderPath); |         JSONArray jsonObjects = parseJSONFile(folderPath); | ||||||
|         openIndex(); |         openIndex(); | ||||||
|         addDocuments(jsonObjects); |         addDocuments(jsonObjects); | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user