Optimizations
Re-arrange some channels set all channels to a size of 1 Reset the image download buffer Allocate the correct slice size for the CV API Add a flag to only download the original image
This commit is contained in:
parent
8a9aec4884
commit
75d60339ee
@ -162,6 +162,7 @@ type Opts struct {
|
|||||||
APIKey string
|
APIKey string
|
||||||
path string
|
path string
|
||||||
thumbOnly bool
|
thumbOnly bool
|
||||||
|
originalOnly bool
|
||||||
hashDownloaded bool
|
hashDownloaded bool
|
||||||
keepDownloaded bool
|
keepDownloaded bool
|
||||||
}
|
}
|
||||||
@ -196,6 +197,7 @@ func main() {
|
|||||||
flag.StringVar(&opts.cv.APIKey, "cv-api-key", "", "API Key to use to access the ComicVine API")
|
flag.StringVar(&opts.cv.APIKey, "cv-api-key", "", "API Key to use to access the ComicVine API")
|
||||||
flag.StringVar(&opts.cv.path, "cv-path", "", fmt.Sprintf("Path to store ComicVine data in (default %v)", filepath.Join(wd, "comicvine")))
|
flag.StringVar(&opts.cv.path, "cv-path", "", fmt.Sprintf("Path to store ComicVine data in (default %v)", filepath.Join(wd, "comicvine")))
|
||||||
flag.BoolVar(&opts.cv.thumbOnly, "cv-thumb-only", true, "Only downloads the thumbnail image from comicvine, when false sets -only-hash-new-ids=false")
|
flag.BoolVar(&opts.cv.thumbOnly, "cv-thumb-only", true, "Only downloads the thumbnail image from comicvine, when false sets -only-hash-new-ids=false")
|
||||||
|
flag.BoolVar(&opts.cv.originalOnly, "cv-original-only", true, "Only downloads the original image from comicvine, when false sets -only-hash-new-ids=false")
|
||||||
flag.BoolVar(&opts.cv.hashDownloaded, "cv-hash-downloaded", true, "Hash already downloaded images")
|
flag.BoolVar(&opts.cv.hashDownloaded, "cv-hash-downloaded", true, "Hash already downloaded images")
|
||||||
flag.BoolVar(&opts.cv.keepDownloaded, "cv-keep-downloaded", true, "Keep downloaded images. When set to false does not ever write to the filesystem, a crash or exiting can mean some images need to be re-downloaded")
|
flag.BoolVar(&opts.cv.keepDownloaded, "cv-keep-downloaded", true, "Keep downloaded images. When set to false does not ever write to the filesystem, a crash or exiting can mean some images need to be re-downloaded")
|
||||||
flag.Parse()
|
flag.Parse()
|
||||||
@ -639,20 +641,10 @@ func (s *Server) DecodeHashes(format Format, hashes []byte) error {
|
|||||||
}
|
}
|
||||||
|
|
||||||
func (s *Server) HashLocalImages(opts Opts) {
|
func (s *Server) HashLocalImages(opts Opts) {
|
||||||
|
if opts.coverPath == "" {
|
||||||
|
return
|
||||||
|
}
|
||||||
go func() {
|
go func() {
|
||||||
alreadyQuit := false
|
|
||||||
if opts.coverPath == "" {
|
|
||||||
select {
|
|
||||||
case sig := <-s.signalQueue:
|
|
||||||
log.Printf("Signal: %v\n", sig)
|
|
||||||
s.cancel()
|
|
||||||
case <-s.Context.Done():
|
|
||||||
log.Println("Recieved quit")
|
|
||||||
}
|
|
||||||
err := s.httpServer.Shutdown(context.TODO())
|
|
||||||
log.Println("Err:", err)
|
|
||||||
return
|
|
||||||
}
|
|
||||||
log.Println("Hashing covers at ", opts.coverPath)
|
log.Println("Hashing covers at ", opts.coverPath)
|
||||||
start := time.Now()
|
start := time.Now()
|
||||||
err := filepath.WalkDir(opts.coverPath, func(path string, d fs.DirEntry, err error) error {
|
err := filepath.WalkDir(opts.coverPath, func(path string, d fs.DirEntry, err error) error {
|
||||||
@ -660,11 +652,6 @@ func (s *Server) HashLocalImages(opts Opts) {
|
|||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
select {
|
select {
|
||||||
case signal := <-s.signalQueue:
|
|
||||||
err = s.httpServer.Shutdown(context.TODO())
|
|
||||||
alreadyQuit = true
|
|
||||||
s.cancel()
|
|
||||||
return fmt.Errorf("signal: %v, %w", signal, err)
|
|
||||||
case <-s.Context.Done():
|
case <-s.Context.Done():
|
||||||
log.Println("Recieved quit")
|
log.Println("Recieved quit")
|
||||||
err = s.httpServer.Shutdown(context.TODO())
|
err = s.httpServer.Shutdown(context.TODO())
|
||||||
@ -680,16 +667,21 @@ func (s *Server) HashLocalImages(opts Opts) {
|
|||||||
})
|
})
|
||||||
elapsed := time.Since(start)
|
elapsed := time.Since(start)
|
||||||
log.Println("Err:", err, "local hashing took", elapsed)
|
log.Println("Err:", err, "local hashing took", elapsed)
|
||||||
|
|
||||||
sig := <-s.signalQueue
|
|
||||||
if !alreadyQuit {
|
|
||||||
s.cancel()
|
|
||||||
}
|
|
||||||
err = s.httpServer.Shutdown(context.TODO())
|
|
||||||
log.Printf("Signal: %v, error: %v", sig, err)
|
|
||||||
}()
|
}()
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func signalHandler(s *Server) {
|
||||||
|
select {
|
||||||
|
case sig := <-s.signalQueue:
|
||||||
|
log.Printf("Signal: %v\n", sig)
|
||||||
|
s.cancel()
|
||||||
|
case <-s.Context.Done():
|
||||||
|
log.Println("Recieved quit: Attempting to shutdown gracefully")
|
||||||
|
}
|
||||||
|
err := s.httpServer.Shutdown(context.TODO())
|
||||||
|
log.Println("Err:", err)
|
||||||
|
}
|
||||||
|
|
||||||
func initializeStorage(opts Opts) (ch.HashStorage, error) {
|
func initializeStorage(opts Opts) (ch.HashStorage, error) {
|
||||||
switch opts.storageType {
|
switch opts.storageType {
|
||||||
case Map:
|
case Map:
|
||||||
@ -787,6 +779,7 @@ func saveHashes(opts Opts, encodeHashes func(format Format) ([]byte, error)) {
|
|||||||
func downloadProcessor(chdb ch.CHDB, opts Opts, imagePaths chan cv.Download, server Server) {
|
func downloadProcessor(chdb ch.CHDB, opts Opts, imagePaths chan cv.Download, server Server) {
|
||||||
defer func() {
|
defer func() {
|
||||||
log.Println("Download Processor completed")
|
log.Println("Download Processor completed")
|
||||||
|
close(server.hashingQueue)
|
||||||
}()
|
}()
|
||||||
for path := range imagePaths {
|
for path := range imagePaths {
|
||||||
id := ch.ID{Domain: ch.ComicVine, ID: path.IssueID}
|
id := ch.ID{Domain: ch.ComicVine, ID: path.IssueID}
|
||||||
@ -831,12 +824,7 @@ func downloadProcessor(chdb ch.CHDB, opts Opts, imagePaths chan cv.Download, ser
|
|||||||
ID: id,
|
ID: id,
|
||||||
NewOnly: opts.onlyHashNewIDs,
|
NewOnly: opts.onlyHashNewIDs,
|
||||||
}
|
}
|
||||||
select {
|
server.hashingQueue <- im
|
||||||
case <-server.Context.Done():
|
|
||||||
log.Println("Recieved quit")
|
|
||||||
return
|
|
||||||
case server.hashingQueue <- im:
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -857,7 +845,7 @@ func startServer(opts Opts) {
|
|||||||
Context: ctx,
|
Context: ctx,
|
||||||
cancel: cancel,
|
cancel: cancel,
|
||||||
signalQueue: make(chan os.Signal, 1),
|
signalQueue: make(chan os.Signal, 1),
|
||||||
readerQueue: make(chan string, 100),
|
readerQueue: make(chan string, 1),
|
||||||
hashingQueue: make(chan ch.Im, 1),
|
hashingQueue: make(chan ch.Im, 1),
|
||||||
mappingQueue: make(chan ch.ImageHash, 1),
|
mappingQueue: make(chan ch.ImageHash, 1),
|
||||||
mux: mux,
|
mux: mux,
|
||||||
@ -912,7 +900,7 @@ func startServer(opts Opts) {
|
|||||||
|
|
||||||
log.Println("Init downloaders")
|
log.Println("Init downloaders")
|
||||||
dwg := sync.WaitGroup{}
|
dwg := sync.WaitGroup{}
|
||||||
finishedDownloadQueue := make(chan cv.Download, 10)
|
finishedDownloadQueue := make(chan cv.Download, 1)
|
||||||
go downloadProcessor(chdb, opts, finishedDownloadQueue, server)
|
go downloadProcessor(chdb, opts, finishedDownloadQueue, server)
|
||||||
|
|
||||||
if opts.cv.downloadCovers {
|
if opts.cv.downloadCovers {
|
||||||
@ -921,6 +909,9 @@ func startServer(opts Opts) {
|
|||||||
if opts.cv.thumbOnly {
|
if opts.cv.thumbOnly {
|
||||||
imageTypes = append(imageTypes, "thumb_url")
|
imageTypes = append(imageTypes, "thumb_url")
|
||||||
}
|
}
|
||||||
|
if opts.cv.originalOnly {
|
||||||
|
imageTypes = append(imageTypes, "original_url")
|
||||||
|
}
|
||||||
cvdownloader := cv.NewCVDownloader(server.Context, bufPool, chdb, opts.cv.path, opts.cv.APIKey, imageTypes, opts.cv.keepDownloaded, opts.cv.hashDownloaded, finishedDownloadQueue)
|
cvdownloader := cv.NewCVDownloader(server.Context, bufPool, chdb, opts.cv.path, opts.cv.APIKey, imageTypes, opts.cv.keepDownloaded, opts.cv.hashDownloaded, finishedDownloadQueue)
|
||||||
go func() {
|
go func() {
|
||||||
defer dwg.Done()
|
defer dwg.Done()
|
||||||
@ -937,6 +928,7 @@ func startServer(opts Opts) {
|
|||||||
}()
|
}()
|
||||||
}
|
}
|
||||||
|
|
||||||
|
go signalHandler(&server)
|
||||||
log.Println("Listening on ", server.httpServer.Addr)
|
log.Println("Listening on ", server.httpServer.Addr)
|
||||||
err = server.httpServer.ListenAndServe()
|
err = server.httpServer.ListenAndServe()
|
||||||
if err != nil {
|
if err != nil {
|
||||||
@ -950,9 +942,14 @@ func startServer(opts Opts) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
log.Println("waiting on downloaders")
|
log.Println("waiting on downloaders")
|
||||||
dwg.Wait() // Downloaders send to server.hashingQueue
|
dwg.Wait() // Downloaders send to finishedDownloadQueue which sends to server.hashingQueue
|
||||||
|
|
||||||
close(server.hashingQueue)
|
log.Println("waiting on downloader")
|
||||||
|
close(finishedDownloadQueue)
|
||||||
|
for range finishedDownloadQueue {
|
||||||
|
}
|
||||||
|
|
||||||
|
// close(server.hashingQueue) // Closed by downloadProcessor
|
||||||
log.Println("waiting on hashers")
|
log.Println("waiting on hashers")
|
||||||
hwg.Wait()
|
hwg.Wait()
|
||||||
for range server.hashingQueue {
|
for range server.hashingQueue {
|
||||||
@ -968,10 +965,6 @@ func startServer(opts Opts) {
|
|||||||
for range server.signalQueue {
|
for range server.signalQueue {
|
||||||
}
|
}
|
||||||
|
|
||||||
log.Println("waiting on downloader")
|
|
||||||
close(finishedDownloadQueue)
|
|
||||||
for range finishedDownloadQueue {
|
|
||||||
}
|
|
||||||
_ = chdb.Close()
|
_ = chdb.Close()
|
||||||
|
|
||||||
// server.EncodeHashes would normally need a read lock
|
// server.EncodeHashes would normally need a read lock
|
||||||
|
11
cv/cv.go
11
cv/cv.go
@ -108,7 +108,7 @@ func (c *CVDownloader) readJson() ([]*CVResult, error) {
|
|||||||
return issues, nil
|
return issues, nil
|
||||||
}
|
}
|
||||||
func (c *CVDownloader) loadIssues(file_entry fs.DirEntry) (*CVResult, error) {
|
func (c *CVDownloader) loadIssues(file_entry fs.DirEntry) (*CVResult, error) {
|
||||||
tmp := &CVResult{}
|
tmp := &CVResult{Results: make([]Issue, 0, 100)}
|
||||||
file, err := os.Open(filepath.Join(c.JSONPath, file_entry.Name()))
|
file, err := os.Open(filepath.Join(c.JSONPath, file_entry.Name()))
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return nil, err
|
return nil, err
|
||||||
@ -377,6 +377,7 @@ func (c *CVDownloader) start_downloader() {
|
|||||||
|
|
||||||
} else {
|
} else {
|
||||||
image := c.bufPool.Get().(*bytes.Buffer)
|
image := c.bufPool.Get().(*bytes.Buffer)
|
||||||
|
image.Reset()
|
||||||
log.Println("downloading", dl.dest)
|
log.Println("downloading", dl.dest)
|
||||||
_, err = io.Copy(image, resp.Body)
|
_, err = io.Copy(image, resp.Body)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
@ -574,10 +575,10 @@ func NewCVDownloader(ctx context.Context, bufPool *sync.Pool, chdb ch.CHDB, work
|
|||||||
JSONPath: filepath.Join(workPath, "_json"),
|
JSONPath: filepath.Join(workPath, "_json"),
|
||||||
ImagePath: filepath.Join(workPath, "_image"),
|
ImagePath: filepath.Join(workPath, "_image"),
|
||||||
APIKey: APIKey,
|
APIKey: APIKey,
|
||||||
downloadQueue: make(chan *CVResult, 1000), // This is just json it shouldn't take up much more than 122 MB
|
downloadQueue: make(chan *CVResult, 1), // This is just json it shouldn't take up much more than 122 MB
|
||||||
imageDownloads: make(chan download, 250), // These are just URLs should only take a few MB
|
imageDownloads: make(chan download, 1), // These are just URLs should only take a few MB
|
||||||
notFound: make(chan download, 100), // Same here
|
notFound: make(chan download, 1), // Same here
|
||||||
bufPool: bufPool, // Only used if keepDownloadedImages is false to save space on byte buffers. The buffers get sent back via finishedDownloadQueue
|
bufPool: bufPool, // Only used if keepDownloadedImages is false to save space on byte buffers. The buffers get sent back via finishedDownloadQueue
|
||||||
FinishedDownloadQueue: finishedDownloadQueue,
|
FinishedDownloadQueue: finishedDownloadQueue,
|
||||||
SendExistingImages: sendExistingImages,
|
SendExistingImages: sendExistingImages,
|
||||||
KeepDownloadedImages: keepDownloadedImages,
|
KeepDownloadedImages: keepDownloadedImages,
|
||||||
|
Loading…
Reference in New Issue
Block a user