dispatch/vendor/github.com/blevesearch/bleve/utils/bleve_index/main.go

116 lines
2.4 KiB
Go

// Copyright (c) 2014 Couchbase, Inc.
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file
// except in compliance with the License. You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
// Unless required by applicable law or agreed to in writing, software distributed under the
// License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
// either express or implied. See the License for the specific language governing permissions
// and limitations under the License.
package main
import (
"flag"
"io/ioutil"
"log"
"os"
"path/filepath"
"github.com/blevesearch/bleve"
)
var indexPath = flag.String("index", "", "index path")
var keepExt = flag.Bool("keepExt", false, "keep extension in doc id")
var keepDir = flag.Bool("keepDir", false, "keep dir in doc id")
func main() {
flag.Parse()
if *indexPath == "" {
log.Fatal("must specify index path")
}
// open the index
index, err := bleve.Open(*indexPath)
if err != nil {
log.Fatal(err)
}
defer func() {
cerr := index.Close()
if cerr != nil {
log.Fatalf("error closing index: %v", err)
}
}()
if flag.NArg() < 1 {
log.Fatal("must specify at least one path to index")
}
for file := range handleArgs(flag.Args()) {
// index the files
docID := file.filename
if !*keepDir {
_, docID = filepath.Split(docID)
}
if !*keepExt {
ext := filepath.Ext(docID)
docID = docID[0 : len(docID)-len(ext)]
}
log.Printf("Indexing: %s", docID)
err = index.Index(docID, file.contents)
if err != nil {
log.Fatal(err)
}
}
}
type file struct {
filename string
contents []byte
}
func handleArgs(args []string) chan file {
rv := make(chan file)
go func() {
for _, arg := range args {
arg = filepath.Clean(arg)
handleArgRecursive(arg, rv)
}
close(rv)
}()
return rv
}
func handleArgRecursive(arg string, results chan file) {
stat, err := os.Stat(arg)
if err != nil {
log.Print(err)
return
}
if stat.IsDir() {
// open the directory
dirEntries, err := ioutil.ReadDir(arg)
if err != nil {
log.Fatal(err)
}
// walk the directory entries
for _, dirEntry := range dirEntries {
handleArgRecursive(arg+string(os.PathSeparator)+dirEntry.Name(), results)
}
} else {
bytes, err := ioutil.ReadFile(arg)
if err != nil {
log.Fatal(err)
}
results <- file{
filename: arg,
contents: bytes,
}
}
}