diff options
author | Martin Czygan <martin.czygan@gmail.com> | 2021-04-30 22:43:07 +0200 |
---|---|---|
committer | Martin Czygan <martin.czygan@gmail.com> | 2021-04-30 22:43:07 +0200 |
commit | 77ca4cd924993188e0e9f8dd072af9f173eaad91 (patch) | |
tree | 10ef046df67c459412bd272b263b8109cb80b455 /skate/cmd/skate-ref-to-release | |
parent | 403df865aa7f86ce10e19eb8a7ed67bf772c901b (diff) | |
download | refcat-77ca4cd924993188e0e9f8dd072af9f173eaad91.tar.gz refcat-77ca4cd924993188e0e9f8dd072af9f173eaad91.zip |
rename skate-ref-to-release to skate-conv
Diffstat (limited to 'skate/cmd/skate-ref-to-release')
-rw-r--r-- | skate/cmd/skate-ref-to-release/main.go | 81 |
1 files changed, 0 insertions, 81 deletions
```diff
diff --git a/skate/cmd/skate-ref-to-release/main.go b/skate/cmd/skate-ref-to-release/main.go
deleted file mode 100644
index d547e62..0000000
--- a/skate/cmd/skate-ref-to-release/main.go
+++ /dev/null
@@ -1,81 +0,0 @@
-// skate-ref-to-release converts a "ref" document to a "release" document.
-//
-package main
-
-import (
-	"flag"
-	"log"
-	"os"
-	"runtime"
-	"strings"
-
-	"git.archive.org/martin/cgraph/skate"
-	"github.com/miku/parallel"
-
-	json "github.com/segmentio/encoding/json"
-)
-
-var (
-	numWorkers = flag.Int("w", runtime.NumCPU(), "number of workers")
-	batchSize  = flag.Int("b", 100000, "batch size")
-	fromFormat = flag.String("f", "ref", "import data shape")
-
-	bytesNewline = []byte("\n")
-)
-
-func refToRelease(p []byte) ([]byte, error) {
-	var ref skate.Ref
-	if err := json.Unmarshal(p, &ref); err != nil {
-		return nil, err
-	}
-	release, err := skate.RefToRelease(&ref)
-	if err != nil {
-		return nil, err
-	}
-	release.Extra.Skate.Status = "ref" // means: converted from ref
-	release.Extra.Skate.Ref.Index = ref.Index
-	release.Extra.Skate.Ref.Key = ref.Key
-	b, err := json.Marshal(release)
-	b = append(b, bytesNewline...)
-	return b, err
-}
-
-func rgSitemapToRelease(p []byte) ([]byte, error) {
-	var (
-		s       skate.Sitemap
-		release skate.Release
-	)
-	if err := json.Unmarshal(p, &s); err != nil {
-		return nil, err
-	}
-	release.Title = s.Title
-	if len(s.URL) > 41 {
-		// XXX: A pseudo ident, maybe irritating.
-		release.Ident = strings.Split(s.URL[41:], "_")[0]
-	}
-	release.Extra.Skate.Status = "rg"
-	release.Extra.Skate.ResearchGate.URL = s.URL
-	b, err := json.Marshal(release)
-	b = append(b, bytesNewline...)
-	return b, err
-}
-
-func main() {
-	flag.Parse()
-	switch *fromFormat {
-	case "ref":
-		pp := parallel.NewProcessor(os.Stdin, os.Stdout, refToRelease)
-		pp.NumWorkers = *numWorkers
-		pp.BatchSize = *batchSize
-		if err := pp.Run(); err != nil {
-			log.Fatal(err)
-		}
-	case "rg":
-		pp := parallel.NewProcessor(os.Stdin, os.Stdout, rgSitemapToRelease)
-		pp.NumWorkers = *numWorkers
-		pp.BatchSize = *batchSize
-		if err := pp.Run(); err != nil {
-			log.Fatal(err)
-		}
-	}
-}
```