mirror of
				https://github.com/go-gitea/gitea.git
				synced 2025-10-27 00:23:41 +09:00 
			
		
		
		
	Make indexer code more reusable (#2590)
This commit is contained in:
		| @@ -9,6 +9,8 @@ import ( | ||||
| 	"strconv" | ||||
|  | ||||
| 	"github.com/blevesearch/bleve" | ||||
| 	"github.com/blevesearch/bleve/analysis/token/unicodenorm" | ||||
| 	"github.com/blevesearch/bleve/mapping" | ||||
| 	"github.com/blevesearch/bleve/search/query" | ||||
| ) | ||||
|  | ||||
| @@ -41,3 +43,50 @@ func newMatchPhraseQuery(matchPhrase, field, analyzer string) *query.MatchPhrase | ||||
| 	q.Analyzer = analyzer | ||||
| 	return q | ||||
| } | ||||
|  | ||||
| const unicodeNormalizeName = "unicodeNormalize" | ||||
|  | ||||
| func addUnicodeNormalizeTokenFilter(m *mapping.IndexMappingImpl) error { | ||||
| 	return m.AddCustomTokenFilter(unicodeNormalizeName, map[string]interface{}{ | ||||
| 		"type": unicodenorm.Name, | ||||
| 		"form": unicodenorm.NFC, | ||||
| 	}) | ||||
| } | ||||
|  | ||||
| // Update represents an update to an indexer | ||||
| type Update interface { | ||||
| 	addToBatch(batch *bleve.Batch) error | ||||
| } | ||||
|  | ||||
| const maxBatchSize = 16 | ||||
|  | ||||
| // Batch batch of indexer updates that automatically flushes once it | ||||
| // reaches a certain size | ||||
| type Batch struct { | ||||
| 	batch *bleve.Batch | ||||
| 	index bleve.Index | ||||
| } | ||||
|  | ||||
| // Add add update to batch, possibly flushing | ||||
| func (batch *Batch) Add(update Update) error { | ||||
| 	if err := update.addToBatch(batch.batch); err != nil { | ||||
| 		return err | ||||
| 	} | ||||
| 	return batch.flushIfFull() | ||||
| } | ||||
|  | ||||
| func (batch *Batch) flushIfFull() error { | ||||
| 	if batch.batch.Size() >= maxBatchSize { | ||||
| 		return batch.Flush() | ||||
| 	} | ||||
| 	return nil | ||||
| } | ||||
|  | ||||
| // Flush manually flush the batch, regardless of its size | ||||
| func (batch *Batch) Flush() error { | ||||
| 	if err := batch.index.Batch(batch.batch); err != nil { | ||||
| 		return err | ||||
| 	} | ||||
| 	batch.batch.Reset() | ||||
| 	return nil | ||||
| } | ||||
|   | ||||
| @@ -13,7 +13,6 @@ import ( | ||||
| 	"github.com/blevesearch/bleve" | ||||
| 	"github.com/blevesearch/bleve/analysis/analyzer/custom" | ||||
| 	"github.com/blevesearch/bleve/analysis/token/lowercase" | ||||
| 	"github.com/blevesearch/bleve/analysis/token/unicodenorm" | ||||
| 	"github.com/blevesearch/bleve/analysis/tokenizer/unicode" | ||||
| 	"github.com/blevesearch/bleve/index/upsidedown" | ||||
| ) | ||||
| @@ -35,6 +34,10 @@ type IssueIndexerUpdate struct { | ||||
| 	Data    *IssueIndexerData | ||||
| } | ||||
|  | ||||
| func (update IssueIndexerUpdate) addToBatch(batch *bleve.Batch) error { | ||||
| 	return batch.Index(indexerID(update.IssueID), update.Data) | ||||
| } | ||||
|  | ||||
| const issueIndexerAnalyzer = "issueIndexer" | ||||
|  | ||||
| // InitIssueIndexer initialize issue indexer | ||||
| @@ -74,17 +77,13 @@ func createIssueIndexer() error { | ||||
| 	docMapping.AddFieldMappingsAt("Content", textFieldMapping) | ||||
| 	docMapping.AddFieldMappingsAt("Comments", textFieldMapping) | ||||
|  | ||||
| 	const unicodeNormNFC = "unicodeNormNFC" | ||||
| 	if err := mapping.AddCustomTokenFilter(unicodeNormNFC, map[string]interface{}{ | ||||
| 		"type": unicodenorm.Name, | ||||
| 		"form": unicodenorm.NFC, | ||||
| 	}); err != nil { | ||||
| 	if err := addUnicodeNormalizeTokenFilter(mapping); err != nil { | ||||
| 		return err | ||||
| 	} else if err = mapping.AddCustomAnalyzer(issueIndexerAnalyzer, map[string]interface{}{ | ||||
| 		"type":          custom.Name, | ||||
| 		"char_filters":  []string{}, | ||||
| 		"tokenizer":     unicode.Name, | ||||
| 		"token_filters": []string{unicodeNormNFC, lowercase.Name}, | ||||
| 		"token_filters": []string{unicodeNormalizeName, lowercase.Name}, | ||||
| 	}); err != nil { | ||||
| 		return err | ||||
| 	} | ||||
| @@ -97,21 +96,12 @@ func createIssueIndexer() error { | ||||
| 	return err | ||||
| } | ||||
|  | ||||
| // UpdateIssue update the issue indexer | ||||
| func UpdateIssue(update IssueIndexerUpdate) error { | ||||
| 	return issueIndexer.Index(indexerID(update.IssueID), update.Data) | ||||
| } | ||||
|  | ||||
| // BatchUpdateIssues perform a batch update of the issue indexer | ||||
| func BatchUpdateIssues(updates ...IssueIndexerUpdate) error { | ||||
| 	batch := issueIndexer.NewBatch() | ||||
| 	for _, update := range updates { | ||||
| 		err := batch.Index(indexerID(update.IssueID), update.Data) | ||||
| 		if err != nil { | ||||
| 			return err | ||||
| 		} | ||||
| // IssueIndexerBatch batch to add updates to | ||||
| func IssueIndexerBatch() *Batch { | ||||
| 	return &Batch{ | ||||
| 		batch: issueIndexer.NewBatch(), | ||||
| 		index: issueIndexer, | ||||
| 	} | ||||
| 	return issueIndexer.Batch(batch) | ||||
| } | ||||
|  | ||||
| // SearchIssuesByKeyword searches for issues by given conditions. | ||||
|   | ||||
		Reference in New Issue
	
	Block a user