623 lines
19 KiB
Go
623 lines
19 KiB
Go
package readlist
|
|
|
|
import (
|
|
"bytes"
|
|
"encoding/json"
|
|
"fmt"
|
|
"io"
|
|
"net/http"
|
|
"strings"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/go-shiori/go-readability"
|
|
"github.com/google/uuid"
|
|
"gorm.io/gorm"
|
|
"jaytaylor.com/html2text"
|
|
)
|
|
|
|
// ImportStatus represents the status of a Shiori import operation
|
|
type ImportStatus struct {
|
|
ID string `json:"id"`
|
|
TotalBookmarks int `json:"totalBookmarks"`
|
|
ImportedCount int `json:"importedCount"`
|
|
FailedCount int `json:"failedCount"`
|
|
InProgress bool `json:"inProgress"`
|
|
StartedAt time.Time `json:"startedAt"`
|
|
CompletedAt *time.Time `json:"completedAt"`
|
|
Error string `json:"error,omitempty"`
|
|
}
|
|
|
|
// Service handles read later operations
|
|
type Service struct {
|
|
db *gorm.DB
|
|
imports map[string]*ImportStatus
|
|
importsMutex sync.RWMutex
|
|
rateLimiter *time.Ticker // For rate limiting API calls
|
|
}
|
|
|
|
// NewService creates a new read later service
|
|
func NewService(db *gorm.DB) *Service {
|
|
return &Service{
|
|
db: db,
|
|
imports: make(map[string]*ImportStatus),
|
|
importsMutex: sync.RWMutex{},
|
|
rateLimiter: time.NewTicker(500 * time.Millisecond), // 500ms delay between requests
|
|
}
|
|
}
|
|
|
|
// Create adds a new URL to read later
|
|
func (s *Service) Create(url string) (*ReadLaterItem, error) {
|
|
item := &ReadLaterItem{
|
|
ID: uuid.New().String(),
|
|
URL: url,
|
|
CreatedAt: time.Now(),
|
|
UpdatedAt: time.Now(),
|
|
}
|
|
|
|
// Parse URL and extract content
|
|
if err := item.ParseURL(); err != nil {
|
|
return nil, fmt.Errorf("failed to parse URL: %w", err)
|
|
}
|
|
|
|
if err := s.db.Create(item).Error; err != nil {
|
|
return nil, fmt.Errorf("failed to create read later item: %w", err)
|
|
}
|
|
|
|
return item, nil
|
|
}
|
|
|
|
// Get retrieves a read later item by ID
|
|
func (s *Service) Get(id string) (*ReadLaterItem, error) {
|
|
var item ReadLaterItem
|
|
if err := s.db.First(&item, "id = ?", id).Error; err != nil {
|
|
if err == gorm.ErrRecordNotFound {
|
|
return nil, nil
|
|
}
|
|
return nil, fmt.Errorf("failed to get read later item: %w", err)
|
|
}
|
|
return &item, nil
|
|
}
|
|
|
|
// List retrieves all read later items
|
|
func (s *Service) List(includeArchived bool) ([]ReadLaterItem, error) {
|
|
var items []ReadLaterItem
|
|
query := s.db.Order("created_at desc")
|
|
|
|
if !includeArchived {
|
|
query = query.Where("archived_at IS NULL")
|
|
}
|
|
|
|
if err := query.Find(&items).Error; err != nil {
|
|
return nil, fmt.Errorf("failed to list read later items: %w", err)
|
|
}
|
|
return items, nil
|
|
}
|
|
|
|
// MarkRead marks an item as read
|
|
func (s *Service) MarkRead(id string) error {
|
|
now := time.Now()
|
|
if err := s.db.Model(&ReadLaterItem{}).
|
|
Where("id = ?", id).
|
|
Updates(map[string]interface{}{
|
|
"read_at": &now,
|
|
"updated_at": now,
|
|
}).Error; err != nil {
|
|
return fmt.Errorf("failed to mark item as read: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// Archive marks an item as archived
|
|
func (s *Service) Archive(id string) error {
|
|
now := time.Now()
|
|
if err := s.db.Model(&ReadLaterItem{}).
|
|
Where("id = ?", id).
|
|
Updates(map[string]interface{}{
|
|
"archived_at": &now,
|
|
"updated_at": now,
|
|
}).Error; err != nil {
|
|
return fmt.Errorf("failed to archive item: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// Unarchive removes the archived status from an item
|
|
func (s *Service) Unarchive(id string) error {
|
|
now := time.Now()
|
|
if err := s.db.Model(&ReadLaterItem{}).
|
|
Where("id = ?", id).
|
|
Updates(map[string]interface{}{
|
|
"archived_at": nil,
|
|
"updated_at": now,
|
|
}).Error; err != nil {
|
|
return fmt.Errorf("failed to unarchive item: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// Delete removes a read later item
|
|
func (s *Service) Delete(id string) error {
|
|
if err := s.db.Delete(&ReadLaterItem{}, "id = ?", id).Error; err != nil {
|
|
return fmt.Errorf("failed to delete read later item: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// Reset deletes all read later items (for testing)
|
|
func (s *Service) Reset() error {
|
|
if err := s.db.Session(&gorm.Session{AllowGlobalUpdate: true}).Delete(&ReadLaterItem{}).Error; err != nil {
|
|
return fmt.Errorf("failed to reset read later items: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// ShioriCredentials contains the credentials for connecting to a Shiori instance
|
|
type ShioriCredentials struct {
|
|
URL string `json:"url"`
|
|
Username string `json:"username"`
|
|
Password string `json:"password"`
|
|
}
|
|
|
|
// ShioriBookmark represents a bookmark in Shiori
|
|
type ShioriBookmark struct {
|
|
ID int `json:"id"`
|
|
URL string `json:"url"`
|
|
Title string `json:"title"`
|
|
Excerpt string `json:"excerpt"`
|
|
Author string `json:"author"`
|
|
Public int `json:"public"`
|
|
CreatedAt string `json:"createdAt"`
|
|
ModifiedAt string `json:"modifiedAt"`
|
|
Modified time.Time `json:"modified,omitempty"`
|
|
Content string `json:"content,omitempty"`
|
|
HTML string `json:"html,omitempty"`
|
|
ImageURL string `json:"imageURL,omitempty"`
|
|
HasContent bool `json:"hasContent"`
|
|
HasImage bool `json:"hasImage"`
|
|
HasArchive bool `json:"hasArchive,omitempty"`
|
|
HasEbook bool `json:"hasEbook,omitempty"`
|
|
CreateArchive bool `json:"create_archive,omitempty"`
|
|
CreateEbook bool `json:"create_ebook,omitempty"`
|
|
Tags json.RawMessage `json:"tags,omitempty"`
|
|
}
|
|
|
|
// ShioriLoginResponse represents the response from Shiori login API
|
|
type ShioriLoginResponse struct {
|
|
OK bool `json:"ok"`
|
|
Message struct {
|
|
Token string `json:"token"` // JWT token for bearer auth
|
|
Session string `json:"session"` // Session ID
|
|
Expires int64 `json:"expires"`
|
|
} `json:"message"`
|
|
}
|
|
|
|
// ShioriBookmarksResponse represents the response from Shiori bookmarks API
|
|
type ShioriBookmarksResponse struct {
|
|
Bookmarks []ShioriBookmark `json:"bookmarks"`
|
|
MaxPage int `json:"maxPage"`
|
|
Count int `json:"count"`
|
|
}
|
|
|
|
// ImportFromShiori imports bookmarks from a Shiori instance
|
|
// Returns the import ID which can be used to check the status
|
|
func (s *Service) ImportFromShiori(creds ShioriCredentials) (string, error) {
|
|
// For debugging
|
|
fmt.Printf("[DEBUG] Starting import from Shiori URL: %s\n", creds.URL)
|
|
|
|
// Create a new import status
|
|
importID := s.CreateImportStatus()
|
|
fmt.Printf("[DEBUG] Created import status with ID: %s\n", importID)
|
|
|
|
// Start the import process in a goroutine
|
|
go s.runShioriImport(importID, creds)
|
|
|
|
// Return the import ID so the caller can check the status
|
|
return importID, nil
|
|
}
|
|
|
|
// runShioriImport performs the actual import process in the background
|
|
func (s *Service) runShioriImport(importID string, creds ShioriCredentials) {
|
|
fmt.Printf("[DEBUG] Starting runShioriImport for ID: %s\n", importID)
|
|
|
|
// Define a helper function to mark import as failed
|
|
markFailed := func(err error) {
|
|
fmt.Printf("[DEBUG] Import failed: %v\n", err)
|
|
s.UpdateImportStatus(importID, func(status *ImportStatus) {
|
|
status.InProgress = false
|
|
status.Error = err.Error()
|
|
})
|
|
}
|
|
|
|
// Login to Shiori
|
|
fmt.Printf("[DEBUG] Attempting to login to Shiori at %s\n", creds.URL)
|
|
token, err := s.loginToShiori(creds)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] Login failed: %v\n", err)
|
|
markFailed(fmt.Errorf("failed to login to Shiori: %v", err))
|
|
return
|
|
}
|
|
fmt.Printf("[DEBUG] Login successful, token: %s...\n", token[:min(len(token), 10)])
|
|
|
|
// Fetch all bookmarks from Shiori with pagination
|
|
fmt.Printf("[DEBUG] Fetching bookmarks from Shiori\n")
|
|
allBookmarks, err := s.fetchShioriBookmarks(creds.URL, token)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] Fetching bookmarks failed: %v\n", err)
|
|
markFailed(fmt.Errorf("failed to fetch bookmarks: %v", err))
|
|
return
|
|
}
|
|
fmt.Printf("[DEBUG] Fetched %d bookmarks\n", len(allBookmarks))
|
|
|
|
// Setup counters
|
|
importedCount := 0
|
|
failedCount := 0
|
|
|
|
// Update status with total count
|
|
s.UpdateImportStatus(importID, func(status *ImportStatus) {
|
|
status.TotalBookmarks = len(allBookmarks)
|
|
})
|
|
fmt.Printf("[DEBUG] Updated import status with total count: %d\n", len(allBookmarks))
|
|
|
|
// Process each bookmark
|
|
for i, bookmark := range allBookmarks {
|
|
fmt.Printf("[DEBUG] Processing bookmark %d/%d: %s\n", i+1, len(allBookmarks), bookmark.URL)
|
|
<-s.rateLimiter.C // Apply rate limiting for processing each bookmark
|
|
|
|
// Create a ReadLaterItem from the bookmark
|
|
item := ReadLaterItem{
|
|
ID: uuid.New().String(),
|
|
URL: bookmark.URL,
|
|
Title: bookmark.Title,
|
|
Image: bookmark.ImageURL,
|
|
Description: bookmark.Excerpt,
|
|
Status: "unread",
|
|
Content: bookmark.Content,
|
|
CreatedAt: time.Now(),
|
|
UpdatedAt: time.Now(),
|
|
}
|
|
|
|
// If content is empty, try to fetch it
|
|
if item.Content == "" {
|
|
fmt.Printf("[DEBUG] Content empty, fetching from URL: %s\n", bookmark.URL)
|
|
article, err := readability.FromURL(bookmark.URL, 30*time.Second)
|
|
if err == nil && article.Content != "" {
|
|
item.Content = article.Content
|
|
|
|
// If description/excerpt is empty, use the beginning of the content
|
|
if item.Description == "" {
|
|
plainText, err := s.ConvertHTMLToText(article.Content)
|
|
if err == nil && plainText != "" {
|
|
// Use the first 150 characters as description
|
|
if len(plainText) > 150 {
|
|
item.Description = plainText[:150] + "..."
|
|
} else {
|
|
item.Description = plainText
|
|
}
|
|
}
|
|
}
|
|
|
|
// If title is empty, use article title
|
|
if item.Title == "" && article.Title != "" {
|
|
item.Title = article.Title
|
|
}
|
|
|
|
// If image is empty, use article image
|
|
if item.Image == "" && article.Image != "" {
|
|
item.Image = article.Image
|
|
}
|
|
} else if err != nil {
|
|
fmt.Printf("[DEBUG] Error fetching article content: %v\n", err)
|
|
}
|
|
} else if item.Description == "" { // Convert any existing HTML content to plain text for the description if needed
|
|
plainText, err := s.ConvertHTMLToText(item.Content)
|
|
if err == nil && plainText != "" {
|
|
// Use the first 150 characters as description
|
|
if len(plainText) > 150 {
|
|
item.Description = plainText[:150] + "..."
|
|
} else {
|
|
item.Description = plainText
|
|
}
|
|
} else if err != nil {
|
|
fmt.Printf("[DEBUG] Error converting HTML to text: %v\n", err)
|
|
}
|
|
}
|
|
|
|
// Ensure we have at least a basic title if it's still empty
|
|
if item.Title == "" {
|
|
item.Title = bookmark.URL
|
|
}
|
|
|
|
// Save the item to the database
|
|
fmt.Printf("[DEBUG] Saving item to database: %s\n", item.URL)
|
|
err = s.db.Create(&item).Error
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] Error saving item: %v\n", err)
|
|
failedCount++
|
|
} else {
|
|
importedCount++
|
|
}
|
|
|
|
// Update import status
|
|
s.UpdateImportStatus(importID, func(status *ImportStatus) {
|
|
status.ImportedCount = importedCount
|
|
status.FailedCount = failedCount
|
|
})
|
|
}
|
|
|
|
// Mark import as complete
|
|
fmt.Printf("[DEBUG] Import complete. Imported: %d, Failed: %d\n", importedCount, failedCount)
|
|
s.UpdateImportStatus(importID, func(status *ImportStatus) {
|
|
status.InProgress = false
|
|
completedAt := time.Now()
|
|
status.CompletedAt = &completedAt
|
|
})
|
|
}
|
|
|
|
// loginToShiori logs in to a Shiori instance and returns the session token
|
|
func (s *Service) loginToShiori(creds ShioriCredentials) (string, error) {
|
|
// Apply rate limiting
|
|
<-s.rateLimiter.C
|
|
|
|
fmt.Printf("[DEBUG] loginToShiori: Starting login to %s\n", creds.URL)
|
|
|
|
// Construct login URL
|
|
loginURL := fmt.Sprintf("%s/api/v1/auth/login", strings.TrimSuffix(creds.URL, "/"))
|
|
fmt.Printf("[DEBUG] loginToShiori: Login URL: %s\n", loginURL)
|
|
|
|
// Prepare login data
|
|
loginData := map[string]string{
|
|
"username": creds.Username,
|
|
"password": creds.Password,
|
|
}
|
|
|
|
// Convert login data to JSON
|
|
jsonData, err := json.Marshal(loginData)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] loginToShiori: Error marshaling login data: %v\n", err)
|
|
return "", fmt.Errorf("failed to marshal login data: %v", err)
|
|
}
|
|
|
|
// Create request
|
|
req, err := http.NewRequest("POST", loginURL, bytes.NewBuffer(jsonData))
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] loginToShiori: Error creating request: %v\n", err)
|
|
return "", fmt.Errorf("failed to create login request: %v", err)
|
|
}
|
|
|
|
// Set headers
|
|
req.Header.Set("Content-Type", "application/json")
|
|
|
|
// Send request
|
|
fmt.Printf("[DEBUG] loginToShiori: Sending login request\n")
|
|
client := &http.Client{}
|
|
resp, err := client.Do(req)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] loginToShiori: Error sending request: %v\n", err)
|
|
return "", fmt.Errorf("failed to send login request: %v", err)
|
|
}
|
|
defer func() {
|
|
if err := resp.Body.Close(); err != nil {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Error closing response body: %v\n", err)
|
|
}
|
|
}()
|
|
|
|
// Check response status
|
|
fmt.Printf("[DEBUG] loginToShiori: Response status: %s\n", resp.Status)
|
|
if resp.StatusCode != http.StatusOK {
|
|
// Read the error response body
|
|
errBody, _ := io.ReadAll(resp.Body)
|
|
fmt.Printf("[DEBUG] loginToShiori: Error response body: %s\n", string(errBody))
|
|
return "", fmt.Errorf("login failed with status code: %d", resp.StatusCode)
|
|
}
|
|
|
|
// Read response body
|
|
bodyBytes, err := io.ReadAll(resp.Body)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] loginToShiori: Error reading response body: %v\n", err)
|
|
return "", fmt.Errorf("failed to read login response: %v", err)
|
|
}
|
|
|
|
// Print response body for debugging
|
|
fmt.Printf("[DEBUG] loginToShiori: Response body: %s\n", string(bodyBytes))
|
|
|
|
// We need to re-create the reader since we consumed it
|
|
resp.Body = io.NopCloser(bytes.NewBuffer(bodyBytes))
|
|
|
|
// Parse response
|
|
var loginResp ShioriLoginResponse
|
|
if err := json.NewDecoder(resp.Body).Decode(&loginResp); err != nil {
|
|
fmt.Printf("[DEBUG] loginToShiori: Error parsing response: %v\n", err)
|
|
return "", fmt.Errorf("failed to parse login response: %v", err)
|
|
}
|
|
|
|
// Extract token
|
|
token := loginResp.Message.Token
|
|
fmt.Printf("[DEBUG] loginToShiori: Successfully logged in, token length: %d\n", len(token))
|
|
|
|
return token, nil
|
|
}
|
|
|
|
// fetchShioriBookmarks retrieves bookmarks from a Shiori instance using the session token
|
|
func (s *Service) fetchShioriBookmarks(baseURL, session string) ([]ShioriBookmark, error) {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Starting fetching bookmarks from %s\n", baseURL)
|
|
// Apply rate limiting
|
|
<-s.rateLimiter.C
|
|
|
|
// Ensure baseURL doesn't have a trailing slash
|
|
baseURL = strings.TrimSuffix(baseURL, "/")
|
|
|
|
// Initialize results
|
|
allBookmarks := []ShioriBookmark{}
|
|
|
|
// Start with page 1
|
|
page := 1
|
|
maxPage := 1 // Will be updated from the first response
|
|
|
|
for page <= maxPage {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Fetching page %d of %d\n", page, maxPage)
|
|
|
|
// Construct URL for the current page - fixing the API endpoint path
|
|
url := fmt.Sprintf("%s/api/bookmarks?page=%d", baseURL, page)
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Request URL for page %d: %s\n", page, url)
|
|
|
|
// Create request
|
|
req, err := http.NewRequest("GET", url, nil)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Error creating request for page %d: %v\n", page, err)
|
|
return nil, fmt.Errorf("failed to create request: %v", err)
|
|
}
|
|
|
|
// Set headers
|
|
req.Header.Set("Content-Type", "application/json")
|
|
req.Header.Set("Authorization", fmt.Sprintf("Bearer %s", session))
|
|
|
|
// Send request
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Sending request for page %d\n", page)
|
|
client := &http.Client{}
|
|
resp, err := client.Do(req)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Error sending request for page %d: %v\n", page, err)
|
|
return nil, fmt.Errorf("failed to send request: %v", err)
|
|
}
|
|
defer func() {
|
|
if err := resp.Body.Close(); err != nil {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Error closing response body: %v\n", err)
|
|
}
|
|
}()
|
|
|
|
// Check response
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Response status for page %d: %s\n", page, resp.Status)
|
|
if resp.StatusCode != http.StatusOK {
|
|
// Read the error response body
|
|
errBody, _ := io.ReadAll(resp.Body)
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Error response body for page %d: %s\n", page, string(errBody))
|
|
return nil, fmt.Errorf("request failed with status code: %d", resp.StatusCode)
|
|
}
|
|
|
|
// Read response body
|
|
bodyBytes, err := io.ReadAll(resp.Body)
|
|
if err != nil {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Error reading response body for page %d: %v\n", page, err)
|
|
return nil, fmt.Errorf("failed to read response: %v", err)
|
|
}
|
|
|
|
// Print the first 200 characters of response for debugging
|
|
previewText := string(bodyBytes)
|
|
if len(previewText) > 200 {
|
|
previewText = previewText[:200] + "..."
|
|
}
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Response body preview for page %d: %s\n", page, previewText)
|
|
|
|
// We need to re-create the reader since we consumed it
|
|
resp.Body = io.NopCloser(bytes.NewBuffer(bodyBytes))
|
|
|
|
// Parse response
|
|
var bookmarksResp ShioriBookmarksResponse
|
|
if err := json.NewDecoder(resp.Body).Decode(&bookmarksResp); err != nil {
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Error parsing response for page %d: %v\n", page, err)
|
|
return nil, fmt.Errorf("failed to parse response: %v", err)
|
|
}
|
|
|
|
// Update maxPage from the response (only on first page)
|
|
if page == 1 {
|
|
maxPage = bookmarksResp.MaxPage
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Updated max page to %d\n", maxPage)
|
|
}
|
|
|
|
// Add bookmarks from this page to results
|
|
allBookmarks = append(allBookmarks, bookmarksResp.Bookmarks...)
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Added %d bookmarks from page %d, total so far: %d\n",
|
|
len(bookmarksResp.Bookmarks), page, len(allBookmarks))
|
|
|
|
// Move to next page
|
|
page++
|
|
|
|
// Apply rate limiting before next request (if there is one)
|
|
if page <= maxPage {
|
|
<-s.rateLimiter.C
|
|
}
|
|
}
|
|
|
|
fmt.Printf("[DEBUG] fetchShioriBookmarks: Completed, fetched %d bookmarks total\n", len(allBookmarks))
|
|
return allBookmarks, nil
|
|
}
|
|
|
|
// CreateImportStatus initializes a new import status and returns its ID
|
|
func (s *Service) CreateImportStatus() string {
|
|
id := uuid.New().String()
|
|
status := &ImportStatus{
|
|
ID: id,
|
|
InProgress: true,
|
|
StartedAt: time.Now(),
|
|
ImportedCount: 0,
|
|
FailedCount: 0,
|
|
}
|
|
|
|
s.importsMutex.Lock()
|
|
s.imports[id] = status
|
|
s.importsMutex.Unlock()
|
|
|
|
return id
|
|
}
|
|
|
|
// UpdateImportStatus updates the status of an import operation
|
|
func (s *Service) UpdateImportStatus(id string, update func(*ImportStatus)) {
|
|
s.importsMutex.Lock()
|
|
defer s.importsMutex.Unlock()
|
|
|
|
if status, exists := s.imports[id]; exists {
|
|
update(status)
|
|
}
|
|
}
|
|
|
|
// GetImportStatus retrieves the status of an import operation
|
|
func (s *Service) GetImportStatus(id string) (*ImportStatus, bool) {
|
|
s.importsMutex.RLock()
|
|
defer s.importsMutex.RUnlock()
|
|
|
|
status, exists := s.imports[id]
|
|
return status, exists
|
|
}
|
|
|
|
// CleanupOldImports removes completed import statuses older than a day
|
|
func (s *Service) CleanupOldImports() {
|
|
s.importsMutex.Lock()
|
|
defer s.importsMutex.Unlock()
|
|
|
|
cutoff := time.Now().Add(-24 * time.Hour)
|
|
|
|
for id, status := range s.imports {
|
|
if !status.InProgress && status.CompletedAt != nil && status.CompletedAt.Before(cutoff) {
|
|
delete(s.imports, id)
|
|
}
|
|
}
|
|
}
|
|
|
|
// ConvertHTMLToText converts HTML content to plain text
|
|
// This is useful when we need to extract text from HTML for searching or displaying in non-HTML contexts
|
|
func (s *Service) ConvertHTMLToText(htmlContent string) (string, error) {
|
|
if htmlContent == "" {
|
|
return "", nil
|
|
}
|
|
|
|
// Convert HTML to plain text
|
|
text, err := html2text.FromString(htmlContent, html2text.Options{
|
|
PrettyTables: true,
|
|
OmitLinks: false,
|
|
})
|
|
|
|
if err != nil {
|
|
return "", err
|
|
}
|
|
|
|
return text, nil
|
|
}
|
|
|
|
// Add helper function for safe string slicing
|
|
func min(a, b int) int {
|
|
if a < b {
|
|
return a
|
|
}
|
|
return b
|
|
}
|