go/main.go

249 lines
5.9 KiB
Go
Raw Normal View History

package main
import (
"bytes"
2023-02-14 19:06:46 +00:00
"errors"
"fmt"
cp "github.com/otiai10/copy"
"os"
2023-02-04 01:39:51 +00:00
"path/filepath"
"strings"
"text/template"
"github.com/PuerkitoBio/goquery"
2022-08-30 21:52:53 +00:00
"github.com/avelino/awesome-go/pkg/slug"
)
// Link is one entry of a category list. makeObjByID builds it from a single
// `li` element of the rendered README.
type Link struct {
// Title is the text of the `a` element(s) found inside the list item.
Title string
// Url is the `href` attribute read from the list item's `a` element.
Url string
// Description is the full text of the list item (it therefore also contains
// the title text).
Description string
}
// Object describes one category of the list. makeObjByID builds it from a
// category header element; it is the data passed to the category template and
// (as map values) to the sitemap template.
type Object struct {
// Title is the text of the category header element.
Title string
// Slug is generated from the header text and is used as the name of the
// category's output directory.
Slug string
// Description is the text of the `p` element directly following the header.
Description string
// Items are the links collected from the lists that follow the header.
Items []Link
}
2023-02-14 17:58:36 +00:00
const (
	// readmePath is the source file the site is generated from.
	readmePath = "README.md"

	// outDir is the directory the generated site is written to.
	outDir = "out/" // NOTE: trailing slash is required
)

var (
	// staticFiles are copied 'as is' into the outDir directory.
	staticFiles = []string{
		"tmpl/assets",
		"tmpl/_redirects",
		"tmpl/robots.txt",
	}

	// Templates. They are parsed once, at package initialisation;
	// template.Must panics if a template file cannot be read or parsed.
	// TODO: embed
	tplIndex         = template.Must(template.ParseFiles("tmpl/tmpl.html"))
	tplCategoryIndex = template.Must(template.ParseFiles("tmpl/cat-tmpl.html"))
	tplSitemap       = template.Must(template.ParseFiles("tmpl/sitemap-tmpl.xml"))

	// Output files, both located directly inside outDir.
	outIndexFile   = filepath.Join(outDir, "index.html")
	outSitemapFile = filepath.Join(outDir, "sitemap.xml")
)
2023-02-04 01:39:51 +00:00
func main() {
2023-02-14 22:10:50 +00:00
if err := renderAll(); err != nil {
panic(err)
}
}
// FIXME: choose a better name
func renderAll() error {
2023-02-04 02:01:22 +00:00
// Cleanup and re-create output directory
{
if err := os.RemoveAll(outDir); err != nil {
2023-02-14 22:10:50 +00:00
return fmt.Errorf("unable to remove target dir: %w", err)
2023-02-04 02:01:22 +00:00
}
if err := mkdirAll(outDir); err != nil {
2023-02-14 22:10:50 +00:00
return fmt.Errorf("unable to create target dir: %w", err)
2023-02-04 02:01:22 +00:00
}
}
2023-02-14 21:55:56 +00:00
err := ConvertAndRenderIndex(readmePath, outIndexFile)
if err != nil {
2023-02-14 22:10:50 +00:00
return fmt.Errorf("unable to convert markdown to html: %w", err)
}
2023-02-04 01:39:51 +00:00
input, err := os.ReadFile(outIndexFile)
if err != nil {
2023-02-14 22:10:50 +00:00
return fmt.Errorf("unable to read converted html: %w", err)
}
2023-02-04 01:39:51 +00:00
2023-02-14 18:12:57 +00:00
query, err := goquery.NewDocumentFromReader(bytes.NewReader(input))
if err != nil {
2023-02-14 22:10:50 +00:00
return fmt.Errorf("unable to create goquery instance: %w", err)
}
2023-02-14 18:56:32 +00:00
objs := make(map[string]Object)
query.Find("body #contents").NextFiltered("ul").Find("ul").Each(func(_ int, s *goquery.Selection) {
s.Find("li a").Each(func(_ int, s *goquery.Selection) {
selector, exists := s.Attr("href")
if !exists {
return
}
2023-02-14 22:10:50 +00:00
2023-02-14 19:06:46 +00:00
obj, err := makeObjByID(selector, query.Find("body"))
if err != nil {
return
}
2023-02-14 19:06:46 +00:00
2023-02-14 18:56:32 +00:00
objs[selector] = *obj
})
})
2023-02-04 01:39:51 +00:00
if err := makeSiteStruct(objs); err != nil {
// FIXME: remove all panics
2023-02-14 22:10:50 +00:00
return fmt.Errorf("unable to render categories: %w", err)
2023-02-04 01:39:51 +00:00
}
changeLinksInIndex(string(input), query, objs)
makeSitemap(objs)
for _, srcFilename := range staticFiles {
dstFilename := filepath.Join(outDir, filepath.Base(srcFilename))
fmt.Printf("Copy static file: %s -> %s\n", srcFilename, dstFilename)
if err := cp.Copy(srcFilename, dstFilename); err != nil {
2023-02-14 22:10:50 +00:00
return fmt.Errorf("unable to copy static file `%s` to `%s`: %w", srcFilename, dstFilename, err)
}
}
2023-02-14 22:10:50 +00:00
return nil
}
2023-02-04 01:39:51 +00:00
// mkdirAll makes sure that path exists as a directory, creating it and any
// missing parents with mode 0o755.
//
// It returns nil when the directory already exists, and an error when the
// directory cannot be created, including when path exists but is not a
// directory.
func mkdirAll(path string) error {
	// os.MkdirAll already does nothing for an existing directory, so no
	// preliminary os.Stat is needed. A Stat-based shortcut would also report
	// success when path is a regular file.
	// FIXME: fix rights
	return os.MkdirAll(path, 0o755)
}
2023-02-14 18:56:32 +00:00
func makeSiteStruct(objs map[string]Object) error {
for _, obj := range objs {
categoryDir := filepath.Join(outDir, obj.Slug)
if err := mkdirAll(categoryDir); err != nil {
2023-02-04 01:39:51 +00:00
return err
}
// FIXME: embed templates
// FIXME: parse templates once at start
2023-02-14 17:50:14 +00:00
categoryIndexFilename := filepath.Join(categoryDir, "index.html")
f, err := os.Create(categoryIndexFilename)
if err != nil {
2023-02-04 01:39:51 +00:00
return err
}
2023-02-14 17:50:14 +00:00
fmt.Printf("Write category Index file: %s\n", categoryIndexFilename)
2023-02-14 18:12:57 +00:00
if err := tplCategoryIndex.Execute(f, obj); err != nil {
2023-02-04 01:39:51 +00:00
return err
}
}
2023-02-04 01:39:51 +00:00
return nil
}
2023-02-14 18:56:32 +00:00
func makeSitemap(objs map[string]Object) {
2023-02-14 17:50:14 +00:00
// FIXME: handle error
f, _ := os.Create(outSitemapFile)
2023-02-14 17:50:14 +00:00
fmt.Printf("Render Sitemap to: %s\n", outSitemapFile)
2023-02-14 18:12:57 +00:00
_ = tplSitemap.Execute(f, objs)
}
2023-02-14 19:06:46 +00:00
func makeObjByID(selector string, s *goquery.Selection) (*Object, error) {
var obj Object
var err error
2023-02-14 19:24:30 +00:00
s.Find(selector).Each(func(_ int, selCatHeader *goquery.Selection) {
selDescr := selCatHeader.NextFiltered("p")
// FIXME: bug. this would select links from all neighboring
// sub-categories until the next category. To prevent this we should
// find only first ul
ul := selCatHeader.NextFilteredUntil("ul", "h2")
2023-02-14 19:06:46 +00:00
var links []Link
2023-02-14 19:24:30 +00:00
ul.Find("li").Each(func(_ int, selLi *goquery.Selection) {
selLink := selLi.Find("a")
url, _ := selLink.Attr("href")
link := Link{
2023-02-14 19:24:30 +00:00
Title: selLink.Text(),
// FIXME: Title contains only title but description contains Title + description
Description: selLi.Text(),
Url: url,
}
links = append(links, link)
})
2023-02-14 19:06:46 +00:00
// FIXME: In this case we would have an empty category in main index.html with link to 404 page.
2022-08-30 14:21:44 +00:00
if len(links) == 0 {
2023-02-14 19:06:46 +00:00
err = errors.New("object has no links")
2022-08-30 14:21:44 +00:00
return
}
2023-02-14 19:06:46 +00:00
obj = Object{
2023-02-14 19:24:30 +00:00
Slug: slug.Generate(selCatHeader.Text()),
Title: selCatHeader.Text(),
Description: selDescr.Text(),
Items: links,
}
})
2023-02-14 19:06:46 +00:00
if err != nil {
return nil, fmt.Errorf("unable to build an object: %w", err)
}
return &obj, nil
}
2023-02-14 18:56:32 +00:00
func changeLinksInIndex(html string, query *goquery.Document, objs map[string]Object) {
query.Find("body #content ul li ul li a").Each(func(_ int, s *goquery.Selection) {
href, hrefExists := s.Attr("href")
if !hrefExists {
2023-02-14 18:46:53 +00:00
// FIXME: looks like is an error. Tag `a` in our case always
// should have `href` attr.
return
}
// do not replace links if no page has been created for it
_, objExists := objs[href]
if !objExists {
return
}
2023-02-14 18:46:53 +00:00
// FIXME: parse url
uri := strings.SplitAfter(href, "#")
if len(uri) >= 2 && uri[1] != "contents" {
2023-02-14 18:46:53 +00:00
// FIXME: use s.SetAttr
html = strings.ReplaceAll(
2023-02-14 18:46:53 +00:00
html,
fmt.Sprintf(`href="%s"`, href),
fmt.Sprintf(`href="%s"`, uri[1]),
)
}
})
2023-02-14 17:50:14 +00:00
fmt.Printf("Rewrite links in Index file: %s\n", outIndexFile)
_ = os.WriteFile(outIndexFile, []byte(html), 0644)
}