mirror of
https://github.com/stashapp/stash.git
synced 2025-12-06 16:34:02 +01:00
* Push scrapeByURL into scrapers Replace ScrapePerfomerByURL, ScrapeMovie..., ... with ScrapeByURL in the scraperActionImpl interface. This allows us to delete a lot of repeated code in the scrapers and replace the central part with a switch on the scraper type. * Fold name scraping into one call Follow up on scraper refactoring. Name scrapers use the same code path. This allows us to restructure some code and kill some functions, adding variance to the name scraping code. It allows us to remove some code repetition as well. * Do not export loop refs. * Simplify fragment scraping Generalize fragment scrapers into ScrapeByFragment. This simplifies fragment code flows into a simpler pathing which should be easier to handle in the future. * Eliminate more context.TODO() In a number of cases, we have a context now. Use the context rather than TODO() for those cases in order to make those operations cancellable. * Pass the context for the stashbox scraper This removes all context.TODO() in the path of the stashbox scraper, and replaces it with the context that's present on each of the paths. * Pass the context into subscrapers Mostly a mechanical update, where we pass in the context for subscraping. This removes the final context.TODO() in the scraper code. * Warn on unknown fields from scripts A common mistake for new script writers are that they return fields not known to stash. For instance the name "description" is used rather than "details". Decode disallowing unknown fields. If this fails, use a tee-reader to fall back to the old behavior, but print a warning for the user in this case. Thus, we retain the old behavior, but print warnings for scripts which fails the more strict unknown-fields detection. * Nil-check before running the postprocessing chain Fixes panics when scraping returns nil values. * Lift nil-ness in post-postprocessing If the struct we are trying to post-process is nil, we shouldn't enter the postprocessing flow at all. Pass the struct as a value rather than a pointer, eliminating nil-checks as we go. Use the top-level postProcess call to make the nil-check and then abort there if the object we are looking at is nil. * Allow conversion routines to handle values If we have a non-pointer type in the interface, we should also convert those into ScrapedContent. Otherwise we get errors on deprecated functions.
373 lines
12 KiB
Go
373 lines
12 KiB
Go
package api
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"strconv"
|
|
|
|
"github.com/stashapp/stash/pkg/manager/config"
|
|
"github.com/stashapp/stash/pkg/models"
|
|
"github.com/stashapp/stash/pkg/scraper"
|
|
"github.com/stashapp/stash/pkg/scraper/stashbox"
|
|
)
|
|
|
|
func (r *queryResolver) ScrapeURL(ctx context.Context, url string, ty models.ScrapeContentType) (models.ScrapedContent, error) {
|
|
return r.scraperCache().ScrapeURL(ctx, url, ty)
|
|
}
|
|
|
|
// deprecated
|
|
func (r *queryResolver) ScrapeFreeonesPerformerList(ctx context.Context, query string) ([]string, error) {
|
|
content, err := r.scraperCache().ScrapeName(ctx, scraper.FreeonesScraperID, query, models.ScrapeContentTypePerformer)
|
|
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
performers, err := marshalScrapedPerformers(content)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
var ret []string
|
|
for _, p := range performers {
|
|
if p.Name != nil {
|
|
ret = append(ret, *p.Name)
|
|
}
|
|
}
|
|
|
|
return ret, nil
|
|
}
|
|
|
|
func (r *queryResolver) ListScrapers(ctx context.Context, types []models.ScrapeContentType) ([]*models.Scraper, error) {
|
|
return r.scraperCache().ListScrapers(types), nil
|
|
}
|
|
|
|
func (r *queryResolver) ListPerformerScrapers(ctx context.Context) ([]*models.Scraper, error) {
|
|
return r.scraperCache().ListScrapers([]models.ScrapeContentType{models.ScrapeContentTypePerformer}), nil
|
|
}
|
|
|
|
func (r *queryResolver) ListSceneScrapers(ctx context.Context) ([]*models.Scraper, error) {
|
|
return r.scraperCache().ListScrapers([]models.ScrapeContentType{models.ScrapeContentTypeScene}), nil
|
|
}
|
|
|
|
func (r *queryResolver) ListGalleryScrapers(ctx context.Context) ([]*models.Scraper, error) {
|
|
return r.scraperCache().ListScrapers([]models.ScrapeContentType{models.ScrapeContentTypeGallery}), nil
|
|
}
|
|
|
|
func (r *queryResolver) ListMovieScrapers(ctx context.Context) ([]*models.Scraper, error) {
|
|
return r.scraperCache().ListScrapers([]models.ScrapeContentType{models.ScrapeContentTypeMovie}), nil
|
|
}
|
|
|
|
func (r *queryResolver) ScrapePerformerList(ctx context.Context, scraperID string, query string) ([]*models.ScrapedPerformer, error) {
|
|
if query == "" {
|
|
return nil, nil
|
|
}
|
|
|
|
content, err := r.scraperCache().ScrapeName(ctx, scraperID, query, models.ScrapeContentTypePerformer)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedPerformers(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapePerformer(ctx context.Context, scraperID string, scrapedPerformer models.ScrapedPerformerInput) (*models.ScrapedPerformer, error) {
|
|
content, err := r.scraperCache().ScrapeFragment(ctx, scraperID, scraper.Input{Performer: &scrapedPerformer})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return marshalScrapedPerformer(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapePerformerURL(ctx context.Context, url string) (*models.ScrapedPerformer, error) {
|
|
content, err := r.scraperCache().ScrapeURL(ctx, url, models.ScrapeContentTypePerformer)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedPerformer(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeSceneQuery(ctx context.Context, scraperID string, query string) ([]*models.ScrapedScene, error) {
|
|
if query == "" {
|
|
return nil, nil
|
|
}
|
|
|
|
content, err := r.scraperCache().ScrapeName(ctx, scraperID, query, models.ScrapeContentTypeScene)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedScenes(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeScene(ctx context.Context, scraperID string, scene models.SceneUpdateInput) (*models.ScrapedScene, error) {
|
|
id, err := strconv.Atoi(scene.ID)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("%w: scene.ID is not an integer: '%s'", ErrInput, scene.ID)
|
|
}
|
|
|
|
content, err := r.scraperCache().ScrapeID(ctx, scraperID, id, models.ScrapeContentTypeScene)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedScene(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeSceneURL(ctx context.Context, url string) (*models.ScrapedScene, error) {
|
|
content, err := r.scraperCache().ScrapeURL(ctx, url, models.ScrapeContentTypeScene)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedScene(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeGallery(ctx context.Context, scraperID string, gallery models.GalleryUpdateInput) (*models.ScrapedGallery, error) {
|
|
id, err := strconv.Atoi(gallery.ID)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("%w: gallery id is not an integer: '%s'", ErrInput, gallery.ID)
|
|
}
|
|
|
|
content, err := r.scraperCache().ScrapeID(ctx, scraperID, id, models.ScrapeContentTypeGallery)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedGallery(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeGalleryURL(ctx context.Context, url string) (*models.ScrapedGallery, error) {
|
|
content, err := r.scraperCache().ScrapeURL(ctx, url, models.ScrapeContentTypeGallery)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedGallery(content)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeMovieURL(ctx context.Context, url string) (*models.ScrapedMovie, error) {
|
|
content, err := r.scraperCache().ScrapeURL(ctx, url, models.ScrapeContentTypeMovie)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedMovie(content)
|
|
}
|
|
|
|
func (r *queryResolver) QueryStashBoxScene(ctx context.Context, input models.StashBoxSceneQueryInput) ([]*models.ScrapedScene, error) {
|
|
boxes := config.GetInstance().GetStashBoxes()
|
|
|
|
if input.StashBoxIndex < 0 || input.StashBoxIndex >= len(boxes) {
|
|
return nil, fmt.Errorf("%w: invalid stash_box_index %d", ErrInput, input.StashBoxIndex)
|
|
}
|
|
|
|
client := stashbox.NewClient(*boxes[input.StashBoxIndex], r.txnManager)
|
|
|
|
if len(input.SceneIds) > 0 {
|
|
return client.FindStashBoxScenesByFingerprintsFlat(ctx, input.SceneIds)
|
|
}
|
|
|
|
if input.Q != nil {
|
|
return client.QueryStashBoxScene(ctx, *input.Q)
|
|
}
|
|
|
|
return nil, nil
|
|
}
|
|
|
|
func (r *queryResolver) QueryStashBoxPerformer(ctx context.Context, input models.StashBoxPerformerQueryInput) ([]*models.StashBoxPerformerQueryResult, error) {
|
|
boxes := config.GetInstance().GetStashBoxes()
|
|
|
|
if input.StashBoxIndex < 0 || input.StashBoxIndex >= len(boxes) {
|
|
return nil, fmt.Errorf("%w: invalid stash_box_index %d", ErrInput, input.StashBoxIndex)
|
|
}
|
|
|
|
client := stashbox.NewClient(*boxes[input.StashBoxIndex], r.txnManager)
|
|
|
|
if len(input.PerformerIds) > 0 {
|
|
return client.FindStashBoxPerformersByNames(ctx, input.PerformerIds)
|
|
}
|
|
|
|
if input.Q != nil {
|
|
return client.QueryStashBoxPerformer(ctx, *input.Q)
|
|
}
|
|
|
|
return nil, nil
|
|
}
|
|
|
|
func (r *queryResolver) getStashBoxClient(index int) (*stashbox.Client, error) {
|
|
boxes := config.GetInstance().GetStashBoxes()
|
|
|
|
if index < 0 || index >= len(boxes) {
|
|
return nil, fmt.Errorf("%w: invalid stash_box_index %d", ErrInput, index)
|
|
}
|
|
|
|
return stashbox.NewClient(*boxes[index], r.txnManager), nil
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeSingleScene(ctx context.Context, source models.ScraperSourceInput, input models.ScrapeSingleSceneInput) ([]*models.ScrapedScene, error) {
|
|
if source.ScraperID != nil {
|
|
var c models.ScrapedContent
|
|
var content []models.ScrapedContent
|
|
var err error
|
|
|
|
switch {
|
|
case input.SceneID != nil:
|
|
var sceneID int
|
|
sceneID, err = strconv.Atoi(*input.SceneID)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("%w: sceneID is not an integer: '%s'", ErrInput, *input.SceneID)
|
|
}
|
|
c, err = r.scraperCache().ScrapeID(ctx, *source.ScraperID, sceneID, models.ScrapeContentTypeScene)
|
|
content = []models.ScrapedContent{c}
|
|
case input.SceneInput != nil:
|
|
c, err = r.scraperCache().ScrapeFragment(ctx, *source.ScraperID, scraper.Input{Scene: input.SceneInput})
|
|
content = []models.ScrapedContent{c}
|
|
case input.Query != nil:
|
|
content, err = r.scraperCache().ScrapeName(ctx, *source.ScraperID, *input.Query, models.ScrapeContentTypeScene)
|
|
default:
|
|
err = fmt.Errorf("%w: scene_id, scene_input, or query must be set", ErrInput)
|
|
}
|
|
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedScenes(content)
|
|
} else if source.StashBoxIndex != nil {
|
|
client, err := r.getStashBoxClient(*source.StashBoxIndex)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if input.SceneID != nil {
|
|
return client.FindStashBoxScenesByFingerprintsFlat(ctx, []string{*input.SceneID})
|
|
} else if input.Query != nil {
|
|
return client.QueryStashBoxScene(ctx, *input.Query)
|
|
}
|
|
|
|
return nil, fmt.Errorf("%w: scene_id or query must be set", ErrInput)
|
|
}
|
|
|
|
return nil, fmt.Errorf("%w: scraper_id or stash_box_index must be set", ErrInput)
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeMultiScenes(ctx context.Context, source models.ScraperSourceInput, input models.ScrapeMultiScenesInput) ([][]*models.ScrapedScene, error) {
|
|
if source.ScraperID != nil {
|
|
return nil, ErrNotImplemented
|
|
} else if source.StashBoxIndex != nil {
|
|
client, err := r.getStashBoxClient(*source.StashBoxIndex)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return client.FindStashBoxScenesByFingerprints(ctx, input.SceneIds)
|
|
}
|
|
|
|
return nil, errors.New("scraper_id or stash_box_index must be set")
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeSinglePerformer(ctx context.Context, source models.ScraperSourceInput, input models.ScrapeSinglePerformerInput) ([]*models.ScrapedPerformer, error) {
|
|
if source.ScraperID != nil {
|
|
if input.PerformerInput != nil {
|
|
performer, err := r.scraperCache().ScrapeFragment(ctx, *source.ScraperID, scraper.Input{Performer: input.PerformerInput})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedPerformers([]models.ScrapedContent{performer})
|
|
}
|
|
|
|
if input.Query != nil {
|
|
content, err := r.scraperCache().ScrapeName(ctx, *source.ScraperID, *input.Query, models.ScrapeContentTypePerformer)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return marshalScrapedPerformers(content)
|
|
}
|
|
|
|
return nil, ErrNotImplemented
|
|
} else if source.StashBoxIndex != nil {
|
|
client, err := r.getStashBoxClient(*source.StashBoxIndex)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
var ret []*models.StashBoxPerformerQueryResult
|
|
switch {
|
|
case input.PerformerID != nil:
|
|
ret, err = client.FindStashBoxPerformersByNames(ctx, []string{*input.PerformerID})
|
|
case input.Query != nil:
|
|
ret, err = client.QueryStashBoxPerformer(ctx, *input.Query)
|
|
default:
|
|
return nil, ErrNotImplemented
|
|
}
|
|
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
if len(ret) > 0 {
|
|
return ret[0].Results, nil
|
|
}
|
|
|
|
return nil, nil
|
|
}
|
|
|
|
return nil, errors.New("scraper_id or stash_box_index must be set")
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeMultiPerformers(ctx context.Context, source models.ScraperSourceInput, input models.ScrapeMultiPerformersInput) ([][]*models.ScrapedPerformer, error) {
|
|
if source.ScraperID != nil {
|
|
return nil, ErrNotImplemented
|
|
} else if source.StashBoxIndex != nil {
|
|
client, err := r.getStashBoxClient(*source.StashBoxIndex)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return client.FindStashBoxPerformersByPerformerNames(ctx, input.PerformerIds)
|
|
}
|
|
|
|
return nil, errors.New("scraper_id or stash_box_index must be set")
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeSingleGallery(ctx context.Context, source models.ScraperSourceInput, input models.ScrapeSingleGalleryInput) ([]*models.ScrapedGallery, error) {
|
|
if source.StashBoxIndex != nil {
|
|
return nil, ErrNotSupported
|
|
}
|
|
|
|
if source.ScraperID == nil {
|
|
return nil, fmt.Errorf("%w: scraper_id must be set", ErrInput)
|
|
}
|
|
|
|
var c models.ScrapedContent
|
|
|
|
switch {
|
|
case input.GalleryID != nil:
|
|
galleryID, err := strconv.Atoi(*input.GalleryID)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("%w: gallery id is not an integer: '%s'", ErrInput, *input.GalleryID)
|
|
}
|
|
c, err = r.scraperCache().ScrapeID(ctx, *source.ScraperID, galleryID, models.ScrapeContentTypeGallery)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return marshalScrapedGalleries([]models.ScrapedContent{c})
|
|
case input.GalleryInput != nil:
|
|
c, err := r.scraperCache().ScrapeFragment(ctx, *source.ScraperID, scraper.Input{Gallery: input.GalleryInput})
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return marshalScrapedGalleries([]models.ScrapedContent{c})
|
|
default:
|
|
return nil, ErrNotImplemented
|
|
}
|
|
}
|
|
|
|
func (r *queryResolver) ScrapeSingleMovie(ctx context.Context, source models.ScraperSourceInput, input models.ScrapeSingleMovieInput) ([]*models.ScrapedMovie, error) {
|
|
return nil, ErrNotSupported
|
|
}
|