2019-05-27 18:01:53 +08:00
|
|
|
package webserver
|
|
|
|
|
|
|
|
import (
|
2019-08-05 19:26:37 +08:00
|
|
|
"bytes"
|
|
|
|
"compress/gzip"
|
2019-08-04 22:34:23 +08:00
|
|
|
"fmt"
|
|
|
|
"html/template"
|
2019-05-27 18:01:53 +08:00
|
|
|
"io"
|
|
|
|
"net/http"
|
2019-08-08 21:16:25 +08:00
|
|
|
nurl "net/url"
|
2019-05-27 18:01:53 +08:00
|
|
|
"os"
|
|
|
|
"path"
|
|
|
|
fp "path/filepath"
|
2019-08-04 22:34:23 +08:00
|
|
|
"strconv"
|
2019-05-27 18:01:53 +08:00
|
|
|
"strings"
|
|
|
|
|
2019-08-05 19:26:37 +08:00
|
|
|
"github.com/PuerkitoBio/goquery"
|
|
|
|
"github.com/go-shiori/shiori/pkg/warc"
|
2019-05-27 18:01:53 +08:00
|
|
|
"github.com/julienschmidt/httprouter"
|
|
|
|
)
|
|
|
|
|
|
|
|
// serveFile is handler for general file request
|
|
|
|
func (h *handler) serveFile(w http.ResponseWriter, r *http.Request, ps httprouter.Params) {
|
|
|
|
err := serveFile(w, r.URL.Path, true)
|
|
|
|
checkError(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// serveJsFile is handler for GET /js/*filepath
|
|
|
|
func (h *handler) serveJsFile(w http.ResponseWriter, r *http.Request, ps httprouter.Params) {
|
|
|
|
filePath := r.URL.Path
|
|
|
|
fileName := path.Base(filePath)
|
|
|
|
fileDir := path.Dir(filePath)
|
|
|
|
|
|
|
|
if developmentMode && fp.Ext(fileName) == ".js" && strings.HasSuffix(fileName, ".min.js") {
|
|
|
|
fileName = strings.TrimSuffix(fileName, ".min.js") + ".js"
|
|
|
|
filePath = path.Join(fileDir, fileName)
|
|
|
|
if assetExists(filePath) {
|
|
|
|
redirectPage(w, r, filePath)
|
2019-08-07 00:37:52 +08:00
|
|
|
return
|
2019-05-27 18:01:53 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
err := serveFile(w, r.URL.Path, true)
|
|
|
|
checkError(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// serveIndexPage is handler for GET /
|
|
|
|
func (h *handler) serveIndexPage(w http.ResponseWriter, r *http.Request, ps httprouter.Params) {
|
|
|
|
// Make sure session still valid
|
|
|
|
err := h.validateSession(r)
|
|
|
|
if err != nil {
|
2019-08-29 16:44:03 +08:00
|
|
|
redirectURL := createRedirectURL("/login", r.URL.String())
|
|
|
|
redirectPage(w, r, redirectURL)
|
2019-05-27 18:01:53 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
err = serveFile(w, "index.html", false)
|
|
|
|
checkError(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// serveLoginPage is handler for GET /login
|
|
|
|
func (h *handler) serveLoginPage(w http.ResponseWriter, r *http.Request, ps httprouter.Params) {
|
|
|
|
// Make sure session is not valid
|
|
|
|
err := h.validateSession(r)
|
|
|
|
if err == nil {
|
|
|
|
redirectPage(w, r, "/")
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
err = serveFile(w, "login.html", false)
|
|
|
|
checkError(err)
|
|
|
|
}
|
|
|
|
|
2019-08-04 22:34:23 +08:00
|
|
|
// serveBookmarkContent is handler for GET /bookmark/:id/content
|
|
|
|
func (h *handler) serveBookmarkContent(w http.ResponseWriter, r *http.Request, ps httprouter.Params) {
|
|
|
|
// Get bookmark ID from URL
|
|
|
|
strID := ps.ByName("id")
|
|
|
|
id, err := strconv.Atoi(strID)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
// Get bookmark in database
|
|
|
|
bookmark, exist := h.DB.GetBookmark(id, "")
|
|
|
|
if !exist {
|
|
|
|
panic(fmt.Errorf("Bookmark not found"))
|
|
|
|
}
|
|
|
|
|
2019-08-08 21:16:25 +08:00
|
|
|
// If it's not public, make sure session still valid
|
|
|
|
if bookmark.Public != 1 {
|
|
|
|
err = h.validateSession(r)
|
|
|
|
if err != nil {
|
2019-08-29 16:44:03 +08:00
|
|
|
redirectURL := createRedirectURL("/login", r.URL.String())
|
|
|
|
redirectPage(w, r, redirectURL)
|
2019-08-08 21:16:25 +08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-08-12 10:02:59 +08:00
|
|
|
// Check if it has archive.
|
2019-08-05 23:06:00 +08:00
|
|
|
archivePath := fp.Join(h.DataDir, "archive", strID)
|
|
|
|
if fileExists(archivePath) {
|
|
|
|
bookmark.HasArchive = true
|
2019-08-12 10:02:59 +08:00
|
|
|
|
|
|
|
// Open archive, look in cache first
|
|
|
|
var archive *warc.Archive
|
|
|
|
cacheData, found := h.ArchiveCache.Get(strID)
|
|
|
|
|
|
|
|
if found {
|
|
|
|
archive = cacheData.(*warc.Archive)
|
|
|
|
} else {
|
|
|
|
archivePath := fp.Join(h.DataDir, "archive", strID)
|
|
|
|
archive, err = warc.Open(archivePath)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
h.ArchiveCache.Set(strID, archive, 0)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Find all image and convert its source to use the archive URL.
|
|
|
|
createArchivalURL := func(archivalName string) string {
|
|
|
|
archivalURL := *r.URL
|
|
|
|
archivalURL.Path = path.Join("/", "bookmark", strID, "archive", archivalName)
|
|
|
|
return archivalURL.String()
|
|
|
|
}
|
|
|
|
|
|
|
|
buffer := strings.NewReader(bookmark.HTML)
|
|
|
|
doc, err := goquery.NewDocumentFromReader(buffer)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
doc.Find("img, picture, figure, source").Each(func(_ int, node *goquery.Selection) {
|
|
|
|
// Get the needed attributes
|
|
|
|
src, _ := node.Attr("src")
|
|
|
|
strSrcSets, _ := node.Attr("srcset")
|
|
|
|
|
|
|
|
// Convert `src` attributes
|
|
|
|
if src != "" {
|
|
|
|
archivalName := getArchivalName(src)
|
|
|
|
if archivalName != "" && archive.HasResource(archivalName) {
|
|
|
|
node.SetAttr("src", createArchivalURL(archivalName))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Split srcset by comma, then process it like any URLs
|
|
|
|
srcSets := strings.Split(strSrcSets, ",")
|
|
|
|
for i, srcSet := range srcSets {
|
|
|
|
srcSet = strings.TrimSpace(srcSet)
|
|
|
|
parts := strings.SplitN(srcSet, " ", 2)
|
|
|
|
if parts[0] == "" {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
archivalName := getArchivalName(parts[0])
|
|
|
|
if archivalName != "" && archive.HasResource(archivalName) {
|
|
|
|
archivalURL := createArchivalURL(archivalName)
|
|
|
|
srcSets[i] = strings.Replace(srcSets[i], parts[0], archivalURL, 1)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if len(srcSets) > 0 {
|
|
|
|
node.SetAttr("srcset", strings.Join(srcSets, ","))
|
|
|
|
}
|
|
|
|
})
|
|
|
|
|
|
|
|
bookmark.HTML, err = goquery.OuterHtml(doc.Selection)
|
|
|
|
checkError(err)
|
2019-08-05 23:06:00 +08:00
|
|
|
}
|
|
|
|
|
2019-08-04 22:34:23 +08:00
|
|
|
// Create template
|
|
|
|
funcMap := template.FuncMap{
|
|
|
|
"html": func(s string) template.HTML {
|
|
|
|
return template.HTML(s)
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
tplCache, err := createTemplate("content.html", funcMap)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
// Execute template
|
|
|
|
err = tplCache.Execute(w, &bookmark)
|
|
|
|
checkError(err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// serveThumbnailImage is handler for GET /bookmark/:id/thumb
|
2019-05-27 18:01:53 +08:00
|
|
|
func (h *handler) serveThumbnailImage(w http.ResponseWriter, r *http.Request, ps httprouter.Params) {
|
|
|
|
// Get bookmark ID from URL
|
|
|
|
id := ps.ByName("id")
|
|
|
|
|
|
|
|
// Open image
|
|
|
|
imgPath := fp.Join(h.DataDir, "thumb", id)
|
|
|
|
img, err := os.Open(imgPath)
|
|
|
|
checkError(err)
|
|
|
|
defer img.Close()
|
|
|
|
|
|
|
|
// Get image type from its 512 first bytes
|
|
|
|
buffer := make([]byte, 512)
|
|
|
|
_, err = img.Read(buffer)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
mimeType := http.DetectContentType(buffer)
|
|
|
|
w.Header().Set("Content-Type", mimeType)
|
|
|
|
|
2019-08-20 15:29:38 +08:00
|
|
|
// Set cache value
|
|
|
|
info, err := img.Stat()
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
etag := fmt.Sprintf(`W/"%x-%x"`, info.ModTime().Unix(), info.Size())
|
|
|
|
w.Header().Set("ETag", etag)
|
|
|
|
w.Header().Set("Cache-Control", "max-age=86400")
|
|
|
|
|
2019-05-27 18:01:53 +08:00
|
|
|
// Serve image
|
|
|
|
img.Seek(0, 0)
|
|
|
|
_, err = io.Copy(w, img)
|
|
|
|
checkError(err)
|
|
|
|
}
|
2019-08-05 19:26:37 +08:00
|
|
|
|
|
|
|
// serveBookmarkArchive is handler for GET /bookmark/:id/archive/*filepath
|
|
|
|
func (h *handler) serveBookmarkArchive(w http.ResponseWriter, r *http.Request, ps httprouter.Params) {
|
|
|
|
// Get parameter from URL
|
|
|
|
strID := ps.ByName("id")
|
|
|
|
resourcePath := ps.ByName("filepath")
|
|
|
|
resourcePath = strings.TrimPrefix(resourcePath, "/")
|
|
|
|
|
|
|
|
// Get bookmark from database
|
|
|
|
id, err := strconv.Atoi(strID)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
bookmark, exist := h.DB.GetBookmark(id, "")
|
|
|
|
if !exist {
|
|
|
|
panic(fmt.Errorf("Bookmark not found"))
|
|
|
|
}
|
|
|
|
|
2019-08-08 21:16:25 +08:00
|
|
|
// If it's not public, make sure session still valid
|
|
|
|
if bookmark.Public != 1 {
|
|
|
|
err = h.validateSession(r)
|
|
|
|
if err != nil {
|
|
|
|
urlQueries := nurl.Values{}
|
|
|
|
urlQueries.Set("dst", r.URL.Path)
|
|
|
|
|
|
|
|
redirectURL, _ := nurl.Parse("/login")
|
|
|
|
redirectURL.RawQuery = urlQueries.Encode()
|
|
|
|
|
|
|
|
redirectPage(w, r, redirectURL.String())
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-08-05 19:26:37 +08:00
|
|
|
// Open archive, look in cache first
|
|
|
|
var archive *warc.Archive
|
|
|
|
cacheData, found := h.ArchiveCache.Get(strID)
|
|
|
|
|
|
|
|
if found {
|
|
|
|
archive = cacheData.(*warc.Archive)
|
|
|
|
} else {
|
|
|
|
archivePath := fp.Join(h.DataDir, "archive", strID)
|
|
|
|
archive, err = warc.Open(archivePath)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
h.ArchiveCache.Set(strID, archive, 0)
|
|
|
|
}
|
|
|
|
|
|
|
|
content, contentType, err := archive.Read(resourcePath)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
// Set response header
|
|
|
|
w.Header().Set("Content-Encoding", "gzip")
|
|
|
|
w.Header().Set("Content-Type", contentType)
|
|
|
|
|
|
|
|
// If this is HTML and root, inject shiori header
|
|
|
|
if strings.Contains(strings.ToLower(contentType), "text/html") && resourcePath == "" {
|
|
|
|
// Extract gzip
|
|
|
|
buffer := bytes.NewBuffer(content)
|
|
|
|
gzipReader, err := gzip.NewReader(buffer)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
// Parse gzipped content
|
|
|
|
doc, err := goquery.NewDocumentFromReader(gzipReader)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
// Add Shiori overlay
|
2019-08-05 23:06:00 +08:00
|
|
|
tpl, err := template.New("archive").Parse(
|
2019-08-05 19:26:37 +08:00
|
|
|
`<div id="shiori-archive-header">
|
2019-08-05 23:06:00 +08:00
|
|
|
<p id="shiori-logo"><span>栞</span>shiori</p>
|
2019-08-05 19:26:37 +08:00
|
|
|
<div class="spacer"></div>
|
2019-08-05 23:06:00 +08:00
|
|
|
<a href="{{.URL}}" target="_blank">View Original</a>
|
|
|
|
{{if .HasContent}}
|
|
|
|
<a href="/bookmark/{{.ID}}/content">View Readable</a>
|
|
|
|
{{end}}
|
|
|
|
</div>`)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
tplOutput := bytes.NewBuffer(nil)
|
|
|
|
err = tpl.Execute(tplOutput, &bookmark)
|
|
|
|
checkError(err)
|
2019-08-05 19:26:37 +08:00
|
|
|
|
2019-08-06 09:45:39 +08:00
|
|
|
doc.Find("head").AppendHtml(`<link href="/css/source-sans-pro.min.css" rel="stylesheet">`)
|
2019-08-05 19:26:37 +08:00
|
|
|
doc.Find("head").AppendHtml(`<link href="/css/archive.css" rel="stylesheet">`)
|
2019-08-05 23:06:00 +08:00
|
|
|
doc.Find("body").PrependHtml(tplOutput.String())
|
2019-08-05 19:26:37 +08:00
|
|
|
|
|
|
|
// Revert back to HTML
|
|
|
|
outerHTML, err := goquery.OuterHtml(doc.Selection)
|
|
|
|
checkError(err)
|
|
|
|
|
|
|
|
// Gzip it again and send to response writer
|
|
|
|
gzipWriter := gzip.NewWriter(w)
|
|
|
|
gzipWriter.Write([]byte(outerHTML))
|
|
|
|
gzipWriter.Flush()
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Serve content
|
|
|
|
w.Write(content)
|
|
|
|
}
|