Платформа ЦРНП "Мирокод" для разработки проектов
https://git.mirocod.ru
You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
143 lines
4.3 KiB
143 lines
4.3 KiB
// Copyright 2017 The Gitea Authors. All rights reserved. |
|
// Use of this source code is governed by a MIT-style |
|
// license that can be found in the LICENSE file. |
|
|
|
package indexer |
|
|
|
import ( |
|
"os" |
|
|
|
"code.gitea.io/gitea/modules/log" |
|
"code.gitea.io/gitea/modules/setting" |
|
|
|
"github.com/blevesearch/bleve" |
|
"github.com/blevesearch/bleve/analysis/analyzer/custom" |
|
"github.com/blevesearch/bleve/analysis/token/lowercase" |
|
"github.com/blevesearch/bleve/analysis/token/unicodenorm" |
|
"github.com/blevesearch/bleve/analysis/tokenizer/unicode" |
|
) |
|
|
|
// issueIndexer (thread-safe) index for searching issues |
|
var issueIndexer bleve.Index |
|
|
|
// IssueIndexerData is the document stored in the issue indexer for one issue.
//
// The field names double as the bleve field names used by createIssueIndexer
// and SearchIssuesByKeyword, so they must not be renamed.
type IssueIndexerData struct {
	// RepoID is indexed as a numeric field and used to restrict a search
	// to a single repository.
	RepoID int64
	// Title is indexed as text and matched against the search keyword.
	Title string
	// Content is indexed as text and matched against the search keyword.
	Content string
	// Comments is indexed as text and matched against the search keyword.
	Comments []string
}
|
|
|
// IssueIndexerUpdate an update to the issue indexer |
|
type IssueIndexerUpdate struct { |
|
IssueID int64 |
|
Data *IssueIndexerData |
|
} |
|
|
|
// issueIndexerAnalyzer is the name under which the custom analyzer is
// registered in createIssueIndexer; the same name is passed to the phrase
// queries built in SearchIssuesByKeyword.
const issueIndexerAnalyzer = "issueIndexer"
|
|
|
// InitIssueIndexer initialize issue indexer |
|
func InitIssueIndexer(populateIndexer func() error) { |
|
_, err := os.Stat(setting.Indexer.IssuePath) |
|
if err != nil { |
|
if os.IsNotExist(err) { |
|
if err = createIssueIndexer(); err != nil { |
|
log.Fatal(4, "CreateIssuesIndexer: %v", err) |
|
} |
|
if err = populateIndexer(); err != nil { |
|
log.Fatal(4, "PopulateIssuesIndex: %v", err) |
|
} |
|
} else { |
|
log.Fatal(4, "InitIssuesIndexer: %v", err) |
|
} |
|
} else { |
|
issueIndexer, err = bleve.Open(setting.Indexer.IssuePath) |
|
if err != nil { |
|
log.Error(4, "Unable to open issues indexer (%s)."+ |
|
" If the error is due to incompatible versions, try deleting the indexer files;"+ |
|
" gitea will recreate them with the appropriate version the next time it runs."+ |
|
" Deleting the indexer files will not result in loss of data.", |
|
setting.Indexer.IssuePath) |
|
log.Fatal(4, "InitIssuesIndexer, open index: %v", err) |
|
} |
|
} |
|
} |
|
|
|
// createIssueIndexer create an issue indexer if one does not already exist |
|
func createIssueIndexer() error { |
|
mapping := bleve.NewIndexMapping() |
|
docMapping := bleve.NewDocumentMapping() |
|
|
|
docMapping.AddFieldMappingsAt("RepoID", bleve.NewNumericFieldMapping()) |
|
|
|
textFieldMapping := bleve.NewTextFieldMapping() |
|
docMapping.AddFieldMappingsAt("Title", textFieldMapping) |
|
docMapping.AddFieldMappingsAt("Content", textFieldMapping) |
|
docMapping.AddFieldMappingsAt("Comments", textFieldMapping) |
|
|
|
const unicodeNormNFC = "unicodeNormNFC" |
|
if err := mapping.AddCustomTokenFilter(unicodeNormNFC, map[string]interface{}{ |
|
"type": unicodenorm.Name, |
|
"form": unicodenorm.NFC, |
|
}); err != nil { |
|
return err |
|
} else if err = mapping.AddCustomAnalyzer(issueIndexerAnalyzer, map[string]interface{}{ |
|
"type": custom.Name, |
|
"char_filters": []string{}, |
|
"tokenizer": unicode.Name, |
|
"token_filters": []string{unicodeNormNFC, lowercase.Name}, |
|
}); err != nil { |
|
return err |
|
} |
|
|
|
mapping.DefaultAnalyzer = issueIndexerAnalyzer |
|
mapping.AddDocumentMapping("issues", docMapping) |
|
|
|
var err error |
|
issueIndexer, err = bleve.New(setting.Indexer.IssuePath, mapping) |
|
return err |
|
} |
|
|
|
// UpdateIssue update the issue indexer |
|
func UpdateIssue(update IssueIndexerUpdate) error { |
|
return issueIndexer.Index(indexerID(update.IssueID), update.Data) |
|
} |
|
|
|
// BatchUpdateIssues perform a batch update of the issue indexer |
|
func BatchUpdateIssues(updates ...IssueIndexerUpdate) error { |
|
batch := issueIndexer.NewBatch() |
|
for _, update := range updates { |
|
err := batch.Index(indexerID(update.IssueID), update.Data) |
|
if err != nil { |
|
return err |
|
} |
|
} |
|
return issueIndexer.Batch(batch) |
|
} |
|
|
|
// SearchIssuesByKeyword searches for issues by given conditions. |
|
// Returns the matching issue IDs |
|
func SearchIssuesByKeyword(repoID int64, keyword string) ([]int64, error) { |
|
indexerQuery := bleve.NewConjunctionQuery( |
|
numericEqualityQuery(repoID, "RepoID"), |
|
bleve.NewDisjunctionQuery( |
|
newMatchPhraseQuery(keyword, "Title", issueIndexerAnalyzer), |
|
newMatchPhraseQuery(keyword, "Content", issueIndexerAnalyzer), |
|
newMatchPhraseQuery(keyword, "Comments", issueIndexerAnalyzer), |
|
)) |
|
search := bleve.NewSearchRequestOptions(indexerQuery, 2147483647, 0, false) |
|
|
|
result, err := issueIndexer.Search(search) |
|
if err != nil { |
|
return nil, err |
|
} |
|
|
|
issueIDs := make([]int64, len(result.Hits)) |
|
for i, hit := range result.Hits { |
|
issueIDs[i], err = idOfIndexerID(hit.ID) |
|
if err != nil { |
|
return nil, err |
|
} |
|
} |
|
return issueIDs, nil |
|
}
|
|
|