Mercurial Hosting > junotu
view src/junotu/Database.java @ 67:3f0b4e44c6ef
Hide cards with specific tags from search results
For example board columns and board column cards.
author | Fox |
---|---|
date | Sat, 24 Dec 2022 01:27:22 +0100 |
parents | 4dd7d78e19a1 |
children | fc040f668d55 |
line wrap: on
line source
package junotu; import java.lang.RuntimeException; import java.io.IOException; import java.io.File; import java.util.Set; import org.apache.lucene.queryParser.ParseException; import org.apache.lucene.index.IndexWriter; import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.store.Directory; import org.apache.lucene.store.FSDirectory; import org.apache.lucene.analysis.standard.StandardAnalyzer; import org.apache.lucene.util.Version; import org.apache.lucene.document.Fieldable; import org.apache.lucene.document.Field; import org.apache.lucene.document.NumericField; import org.apache.lucene.document.Document; import org.apache.lucene.search.TopDocs; import org.apache.lucene.search.ScoreDoc; import org.apache.lucene.search.Sort; import org.apache.lucene.search.SortField; import org.apache.lucene.search.Query; import org.apache.lucene.search.TermQuery; import org.apache.lucene.search.WildcardQuery; import org.apache.lucene.search.BooleanQuery; import org.apache.lucene.search.MatchAllDocsQuery; import org.apache.lucene.search.NumericRangeQuery; import org.apache.lucene.queryParser.QueryParser; import org.apache.lucene.index.Term; import org.apache.lucene.search.BooleanClause; import junotu.Card; public class Database { public static final String DATABASE_DIRECTORY = "./database"; public static final Version LUCENE_VERSION = Version.LUCENE_30; private IndexWriter luceneWriter; private IndexSearcher luceneSearcher; private long highestIdentifier; private Query[] hideQueries; public Database() { try { Directory indexDirectory = FSDirectory.open( new File( DATABASE_DIRECTORY ) ); luceneWriter = new IndexWriter( indexDirectory, new StandardAnalyzer(LUCENE_VERSION), null, IndexWriter.MaxFieldLength.UNLIMITED ); luceneSearcher = new IndexSearcher( luceneWriter.getReader() ); /* Find highest unique identifier. */ TopDocs topDocuments = luceneSearcher.search( new MatchAllDocsQuery(), null, 1, new Sort( new SortField( Card.TAG_IDENTIFIER, SortField.LONG, true ) ) ); if( topDocuments.scoreDocs.length == 0 ) { highestIdentifier = 0; } else { /** TODO: Find a way to get NumericField from document. */ highestIdentifier = Long.valueOf( luceneSearcher.doc( topDocuments.scoreDocs[0].doc ).get( Card.TAG_IDENTIFIER ) ); } } catch( IOException e ) { /* Also catches CorruptIndexException from Lucene */ throw new RuntimeException(e); } hideQueries = new Query[Card.HIDE_TAGS.length+Card.HIDE_TAG_VALUES.length/2]; int pos = 0; for( int i = 0; i < Card.HIDE_TAGS.length; i++ ) { hideQueries[pos] = new WildcardQuery( new Term(Card.HIDE_TAGS[i], "*") ); pos += 1; } for( int i = 0; i < Card.HIDE_TAG_VALUES.length/2; i++ ) { hideQueries[pos] = new TermQuery( new Term(Card.HIDE_TAG_VALUES[i*2], Card.HIDE_TAG_VALUES[i*2+1]) ); pos += 1; } } public void databaseCommit() { System.out.print( "Saving database to disk..\n" ); try { luceneWriter.commit(); } catch( IOException e ) { throw new RuntimeException(e); } } private void searcherRefresh() { try { luceneSearcher = new IndexSearcher( luceneWriter.getReader() ); } catch( IOException e ) { throw new RuntimeException(e); } } private Document documentByIdentifier( long identifier ) { try { TopDocs topDocuments = luceneSearcher.search( NumericRangeQuery.newLongRange( Card.TAG_IDENTIFIER, identifier, identifier, true, true ), 1 ); if( topDocuments.scoreDocs.length == 0 ) { return null; } return luceneSearcher.doc( topDocuments.scoreDocs[0].doc ); } catch( IOException e ) { throw new RuntimeException(e); } } private Document cardToDocument( Card card ) { Document document = new Document(); String search = ""; for( String tag : card.tags.keySet() ) { Set<Object> values = card.tags.get( tag ); for( Object value : values ) { if( value == null ) { search += tag+" "; } else { search += tag+" "+value.toString()+" "; } if( value == null ) { if( !tag.equals("") ) { document.add( new Field( tag, "", Field.Store.YES, Field.Index.NOT_ANALYZED ) ); } } else if( value instanceof String ) { document.add( new Field( tag, (String)value, Field.Store.YES, Field.Index.ANALYZED ) ); } else if( value instanceof Number ) { NumericField field = new NumericField( tag, Field.Store.YES, true ); if( value instanceof Long ) { field.setLongValue( ((Long)value).longValue() ); } else { throw new RuntimeException( "Unknown tag number type." ); } document.add( field ); } } } document.add( new Field( Card.TAG_SEARCH, search, Field.Store.NO, Field.Index.ANALYZED ) ); return document; } private Card cardFromDocument( Document document ) { Card card = new Card(); for( Fieldable field : document.getFields() ) { /** TODO: Find how to get NumericField from document. */ String value = field.stringValue(); card.tagValueAdd( field.name(), value.equals("") ? null : value ); } card.tagValueSetOnly( Card.TAG_IDENTIFIER, Long.valueOf( document.get( Card.TAG_IDENTIFIER ) ) ); return card; } public long cardAdd( Card card ) { highestIdentifier++; card.tagValueSetOnly( Card.TAG_IDENTIFIER, new Long( highestIdentifier ) ); card.tagValueSetOnly( Card.TAG_LAST_EDIT, new Long( System.currentTimeMillis() ) ); try { luceneWriter.addDocument( cardToDocument( card ) ); } catch( IOException e ) { throw new RuntimeException(e); } System.out.print( "Added card with identifier "+Long.toString(highestIdentifier)+": '"+card.titleGet()+"'\n" ); searcherRefresh(); //luceneWriter.commit(); return highestIdentifier; } public void cardUpdate( Card card ) { TopDocs topDocuments; Query query = NumericRangeQuery.newLongRange( card.TAG_IDENTIFIER, card.identifierGet(), card.identifierGet(), true, true ); try { topDocuments = luceneSearcher.search( query, 1 ); } catch( IOException e ) { throw new RuntimeException(e); } if( topDocuments.scoreDocs.length == 0 ) { throw new RuntimeException( "Failed to update card with identifier "+Long.toString( card.identifierGet() )+", not found." ); } card.tagValueSetOnly( Card.TAG_LAST_EDIT, new Long( System.currentTimeMillis() ) ); int documentNumber = topDocuments.scoreDocs[0].doc; try { luceneWriter.deleteDocuments( query ); luceneWriter.addDocument( cardToDocument( card ) ); } catch( IOException e ) { throw new RuntimeException(e); } System.out.print( "Updated card with identifier "+Long.toString(card.identifierGet())+": '"+card.titleGet()+"'\n" ); searcherRefresh(); //luceneWriter.commit(); } public void cardDelete( Card card ) { cardDelete( card, false ); } public void cardDelete( Card card, boolean cautious ) { if( cautious ) { String tag; if( (tag = card.<String>tagGetAs(Card.TAG_BOARD_COLUMN_CARD)) != null && tag.equals(Card.VALUE_BOARD_COLUMN_CARD_ONLY) ) { //pass } else { return; /* Don't delete. */ } } String tag; Card[] cards; if( card.tagHas(Card.TAG_BOARD) ) { tag = card.<String>tagGetAsOr(Card.TAG_BOARD_COLUMNS, ""); cards = TagUtility.parseCardList(tag); for( int i = 0; i < cards.length; i++ ) { if( cards[i] == null ) { continue; } cardDelete( cards[i], false ); } } if( card.tagHas(Card.TAG_BOARD_COLUMN) ) { tag = card.<String>tagGetAsOr(Card.TAG_BOARD_COLUMN_CARDS, ""); cards = TagUtility.parseCardList(tag); for( int i = 0; i < cards.length; i++ ) { if( cards[i] == null ) { continue; } cardDelete( cards[i], true ); } } cardDeleteRaw(card.identifierGet()); } public void cardDeleteByIdentifier( long identifier ) { cardDeleteByIdentifier( identifier, false ); } public void cardDeleteByIdentifier( long identifier, boolean cautious ) { Card card = cardGetByIdentifier(identifier); if( card != null ) { cardDelete(card); } else { throw new RuntimeException( "Failed to delete card by identifier "+Long.toString(identifier)+", not found." ); } } public void cardDeleteRaw( long identifier ) { TopDocs topDocuments; Query query = NumericRangeQuery.newLongRange( Card.TAG_IDENTIFIER, identifier, identifier, true, true ); try { topDocuments = luceneSearcher.search( query, 1 ); } catch( IOException e ) { throw new RuntimeException(e); } if( topDocuments.scoreDocs.length == 0 ) { throw new RuntimeException( "Failed to delete card with identifier "+Long.toString( identifier )+", not found." ); } int documentNumber = topDocuments.scoreDocs[0].doc; try { luceneWriter.deleteDocuments( query ); } catch( IOException e ) { throw new RuntimeException(e); } System.out.print("Deleted card with identifier "+Long.toString(identifier)+"\n"); searcherRefresh(); } public Card cardGetByIdentifier( long identifier ) { Document document = documentByIdentifier( identifier ); if( document == null ) { return null; } return cardFromDocument( document ); } /** Return up to 'amount' of recently modified cards. */ public Card[] searchTopRecent( int amount ) { BooleanQuery finalQuery = new BooleanQuery(); finalQuery.add( new MatchAllDocsQuery(), BooleanClause.Occur.SHOULD ); for( int i = 0; i < hideQueries.length; i++ ) { finalQuery.add( hideQueries[i], BooleanClause.Occur.MUST_NOT ); } try { TopDocs topDocuments = luceneSearcher.search( finalQuery, null, amount, new Sort( new SortField( Card.TAG_LAST_EDIT, SortField.LONG, true ) ) ); Card[] cards = new Card[topDocuments.scoreDocs.length]; for( int i = 0; i < topDocuments.scoreDocs.length; i++ ) { Document document = luceneSearcher.doc( topDocuments.scoreDocs[i].doc ); cards[i] = cardFromDocument( document ); } return cards; } catch( IOException e ) { throw new RuntimeException(e); } } public Card[] searchSimple( String query ) { Query parsedQuery; BooleanQuery finalQuery; try { QueryParser queryParser = new QueryParser( LUCENE_VERSION, Card.TAG_SEARCH, new StandardAnalyzer(LUCENE_VERSION) ); queryParser.setAllowLeadingWildcard( true ); parsedQuery = queryParser.parse( query ); } catch( ParseException e ) { System.out.print( "Search query parsing exception, returning zero results: "+e.getMessage()+"\n" ); return new Card[0]; } finalQuery = new BooleanQuery(); finalQuery.add( parsedQuery, BooleanClause.Occur.SHOULD ); for( int i = 0; i < hideQueries.length; i++ ) { finalQuery.add( hideQueries[i], BooleanClause.Occur.MUST_NOT ); } try { TopDocs hits = luceneSearcher.search( finalQuery, 32 ); Card[] cards = new Card[hits.scoreDocs.length]; for( int i = 0; i < hits.scoreDocs.length; i++ ) { Document document = luceneSearcher.doc( hits.scoreDocs[i].doc ); cards[i] = cardFromDocument( document ); } return cards; } catch( IOException e ) { throw new RuntimeException(e); } } }