- Fix Nodes.First() panic on empty slice (return nil) - Fix ticker leak in archive.go (create once, defer Stop) - Fix cookie path matching for empty and root paths - Fix lost query params in google.go (u.Query().Set was discarded) - Fix type assertion panic in useragents.go - Fix dropped date parse error in powerball.go - Remove unreachable dead code in megamillions.go and powerball.go - Simplify document.go WaitForNetworkIdle, remove unused root field - Remove debug fmt.Println calls across codebase - Replace panic(err) with stderr+exit in all cmd/ programs - Fix duckduckgo cmd: remove useless defer, return error on bad safesearch - Fix archive cmd: ToConfig returns error instead of panicking - Add 39+ unit tests across 6 new test files - Add Gitea Actions CI workflow (build, test, vet in parallel) Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
81 lines
1.6 KiB
Go
81 lines
1.6 KiB
Go
package main
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"io"
|
|
"os"
|
|
|
|
"github.com/urfave/cli/v3"
|
|
|
|
"gitea.stevedudenhoeffer.com/steve/go-extractor"
|
|
"gitea.stevedudenhoeffer.com/steve/go-extractor/cmd/browser/pkg/browser"
|
|
)
|
|
|
|
func deferClose(cl io.Closer) {
|
|
_ = cl.Close()
|
|
}
|
|
func main() {
|
|
cmd := &cli.Command{
|
|
Name: "browser",
|
|
Flags: browser.Flags,
|
|
Usage: "<url>",
|
|
Action: func(ctx context.Context, cli *cli.Command) error {
|
|
target := cli.Args().First()
|
|
if target == "" {
|
|
return fmt.Errorf("no url specified")
|
|
}
|
|
|
|
b, err := browser.FromCommand(ctx, cli)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
defer deferClose(b)
|
|
|
|
// now open the user specified url
|
|
doc, err := b.Open(ctx, target, extractor.OpenPageOptions{})
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
defer deferClose(doc)
|
|
|
|
article, err := extractor.Readability(ctx, doc)
|
|
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
content := ""
|
|
|
|
if article.Content != "" {
|
|
|
|
if len(article.Content) > 32 {
|
|
content = article.Content[:32] + "..."
|
|
} else {
|
|
content = article.Content
|
|
}
|
|
}
|
|
|
|
fmt.Println("Title:", article.Title)
|
|
fmt.Println("Byline:", article.Byline)
|
|
fmt.Println("Site:", article.SiteName)
|
|
fmt.Println("Published:", article.PublishedTime)
|
|
fmt.Println("Excerpt:", article.Excerpt)
|
|
fmt.Println("Length:", article.Length)
|
|
fmt.Println("Lang:", article.Lang)
|
|
fmt.Println("Content:", content)
|
|
fmt.Println("TextContent:", article.TextContent)
|
|
return nil
|
|
},
|
|
}
|
|
|
|
err := cmd.Run(context.Background(), os.Args)
|
|
|
|
if err != nil {
|
|
fmt.Fprintf(os.Stderr, "error: %v\n", err)
|
|
os.Exit(1)
|
|
}
|
|
}
|