package cmd import ( "fmt" nurl "net/url" "os" "strconv" "strings" "time" "github.com/PuerkitoBio/goquery" "github.com/go-shiori/shiori/internal/model" "github.com/spf13/cobra" ) func importCmd() *cobra.Command { cmd := &cobra.Command{ Use: "import source-file", Short: "Import bookmarks from HTML file in Netscape Bookmark format", Args: cobra.ExactArgs(1), Run: importHandler, } cmd.Flags().BoolP("generate-tag", "t", false, "Auto generate tag from bookmark's category") return cmd } func importHandler(cmd *cobra.Command, args []string) { // Parse flags generateTag := cmd.Flags().Changed("generate-tag") // If user doesn't specify, ask if tag need to be generated if !generateTag { var submit string fmt.Print("Add parents folder as tag? (y/N): ") fmt.Scanln(&submit) generateTag = submit == "y" } // Prepare bookmark's ID bookID, err := DB.CreateNewID("bookmark") if err != nil { cError.Printf("Failed to create ID: %v\n", err) return } // Open bookmark's file srcFile, err := os.Open(args[0]) if err != nil { cError.Printf("Failed to open %s: %v\n", args[0], err) return } defer srcFile.Close() // Parse bookmark's file bookmarks := []model.Bookmark{} mapURL := make(map[string]struct{}) doc, err := goquery.NewDocumentFromReader(srcFile) if err != nil { cError.Printf("Failed to parse bookmark: %v\n", err) return } doc.Find("dt>a").Each(func(_ int, a *goquery.Selection) { // Get related elements dt := a.Parent() dl := dt.Parent() h3 := dl.Parent().Find("h3").First() // Get metadata title := a.Text() url, _ := a.Attr("href") strTags, _ := a.Attr("tags") strModified, _ := a.Attr("last_modified") intModified, _ := strconv.ParseInt(strModified, 10, 64) modified := time.Unix(intModified, 0) // Clean up URL by removing its fragment and UTM parameters tmp, err := nurl.Parse(url) if err != nil || tmp.Scheme == "" || tmp.Hostname() == "" { cError.Printf("Skip %s: URL is not valid\n", url) return } tmp.Fragment = "" clearUTMParams(tmp) url = tmp.String() // Check if the URL already exist before, both in bookmark // file or in database if _, exist := mapURL[url]; exist { cError.Printf("Skip %s: URL already exists\n", url) return } if _, exist := DB.GetBookmark(0, url); exist { cError.Printf("Skip %s: URL already exists\n", url) mapURL[url] = struct{}{} return } // Get bookmark tags tags := []model.Tag{} for _, strTag := range strings.Split(strTags, ",") { strTag = normalizeSpace(strTag) if strTag != "" { tags = append(tags, model.Tag{Name: strTag}) } } // Get category name for this bookmark // and add it as tags (if necessary) category := normalizeSpace(h3.Text()) if category != "" && generateTag { tags = append(tags, model.Tag{Name: category}) } // Add item to list bookmark := model.Bookmark{ ID: bookID, URL: url, Title: normalizeSpace(title), Modified: modified.Format("2006-01-02 15:04:05"), Tags: tags, } bookID++ mapURL[url] = struct{}{} bookmarks = append(bookmarks, bookmark) }) // Save bookmark to database bookmarks, err = DB.SaveBookmarks(bookmarks...) if err != nil { cError.Printf("Failed to save bookmarks: %v\n", err) return } // Print imported bookmark fmt.Println() printBookmarks(bookmarks...) }