kjanat
diff --git a/‎.github/workflows/ci.yml‎
Lines changed: 31 additions & 0 deletions b/‎.github/workflows/ci.yml‎
Lines changed: 31 additions & 0 deletions
diff --git a/‎internal/exporters/docx.go‎
Lines changed: 196 additions & 0 deletions b/‎internal/exporters/docx.go‎
Lines changed: 196 additions & 0 deletions
diff --git a/‎internal/exporters/factory.go‎
Lines changed: 63 additions & 0 deletions b/‎internal/exporters/factory.go‎
Lines changed: 63 additions & 0 deletions
@@ -105,6 +105,11 @@ jobs:
       - name: Run tests
         run: go test -v ./...
 
+      # Installs the `upx` packer via apt so that the later
+      # "Compress binaries with UPX" step can invoke it.
+      - name: Install UPX
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y upx
+
       - name: Build binaries
         run: |
           # Set the build time environment variable
@@ -121,6 +126,32 @@ jobs:
             --verbose \
             -ldflags "-s -w -X github.com/kjanat/articulate-parser/internal/version.Version=${{ github.ref_name }} -X github.com/kjanat/articulate-parser/internal/version.BuildTime=$BUILD_TIME -X github.com/kjanat/articulate-parser/internal/version.GitCommit=${{ github.sha }}"
 
+      # Shrinks the built binaries in build/ with UPX and prints the directory
+      # listing before and after. Binaries whose name contains "darwin" are
+      # skipped, and a UPX failure on any single binary only logs a warning,
+      # so the uncompressed file is kept and the loop continues.
+      - name: Compress binaries with UPX
+        run: |
+          echo "Compressing binaries with UPX..."
+          cd build/
+          
+          # Get original sizes
+          echo "Original sizes:"
+          ls -lah
+          echo ""
+          
+          # Compress all binaries except Darwin (macOS) binaries as UPX doesn't work well with recent macOS versions
+          for binary in articulate-parser-*; do
+            if [[ "$binary" == *"darwin"* ]]; then
+              echo "Skipping UPX compression for $binary (macOS compatibility)"
+            else
+              echo "Compressing $binary..."
+              upx --best --lzma "$binary" || {
+                echo "Warning: UPX compression failed for $binary, keeping original"
+              }
+            fi
+          done
+          
+          echo ""
+          echo "Final sizes:"
+          ls -lah
+
       - name: Upload a Build Artifact
         uses: actions/upload-artifact@v4
         with:
 
@@ -0,0 +1,196 @@
+// Package exporters provides implementations of the Exporter interface
+// for converting Articulate Rise courses into various file formats.
+package exporters
+
+import (
+	"fmt"
+	"strings"
+
+	"github.com/kjanat/articulate-parser/internal/interfaces"
+	"github.com/kjanat/articulate-parser/internal/models"
+	"github.com/kjanat/articulate-parser/internal/services"
+	"github.com/unidoc/unioffice/document"
+)
+
+// DocxExporter implements the Exporter interface for DOCX format.
+// It writes course data (title, description, lessons, items and sub-items)
+// into a Microsoft Word document built with the unioffice/document package.
+// Instances are created with NewDocxExporter.
+type DocxExporter struct {
+	// htmlCleaner processes HTML-bearing fields (descriptions, headings,
+	// paragraphs, answer titles, feedback) through CleanHTML before the
+	// result is added to the document as text.
+	htmlCleaner *services.HTMLCleaner
+}
+
+// NewDocxExporter builds a DOCX exporter around the supplied HTML cleaner.
+// The cleaner is stored on the exporter and used whenever HTML-bearing
+// course fields are written to the document.
+//
+// Parameters:
+//   - htmlCleaner: Service for cleaning HTML content in course data
+//
+// Returns:
+//   - A DocxExporter exposed through the Exporter interface
+func NewDocxExporter(htmlCleaner *services.HTMLCleaner) interfaces.Exporter {
+	exporter := new(DocxExporter)
+	exporter.htmlCleaner = htmlCleaner
+	return exporter
+}
+
+// Export exports the course to a DOCX file.
+// It builds a Word document containing the course title (bold, size 16),
+// the cleaned course description when one is present, and every lesson,
+// then saves the document to outputPath.
+//
+// If outputPath does not already end in ".docx" (compared case-insensitively)
+// the extension is appended. This method does not itself create parent
+// directories; the path is handed to SaveToFile as-is.
+//
+// Parameters:
+//   - course: The course data model to export; must not be nil
+//   - outputPath: The file path where the DOCX content will be written
+//
+// Returns:
+//   - An error if course is nil or if saving the document fails; a save
+//     failure wraps the underlying error and names the target path
+func (e *DocxExporter) Export(course *models.Course, outputPath string) error {
+	// Report a nil course as an error instead of panicking on the first field access.
+	if course == nil {
+		return fmt.Errorf("exporting docx: course is nil")
+	}
+
+	doc := document.New()
+
+	// Add title
+	titlePara := doc.AddParagraph()
+	titleRun := titlePara.AddRun()
+	titleRun.AddText(course.Course.Title)
+	titleRun.Properties().SetBold(true)
+	titleRun.Properties().SetSize(16)
+
+	// Add description if available
+	if course.Course.Description != "" {
+		descPara := doc.AddParagraph()
+		descRun := descPara.AddRun()
+		cleanDesc := e.htmlCleaner.CleanHTML(course.Course.Description)
+		descRun.AddText(cleanDesc)
+	}
+
+	// Add each lesson
+	for _, lesson := range course.Course.Lessons {
+		e.exportLesson(doc, &lesson)
+	}
+
+	// Append the .docx extension unless the path already carries it.
+	if !strings.HasSuffix(strings.ToLower(outputPath), ".docx") {
+		outputPath += ".docx"
+	}
+
+	// Wrap the save error so callers can see which path failed while still
+	// being able to inspect the underlying cause with errors.Is / errors.As.
+	if err := doc.SaveToFile(outputPath); err != nil {
+		return fmt.Errorf("saving docx to %q: %w", outputPath, err)
+	}
+	return nil
+}
+
+// exportLesson appends one lesson to the document.
+// It writes a bold, size-14 "Lesson: <title>" heading, then the cleaned
+// lesson description when it is non-empty, and finally every item of the lesson.
+//
+// Parameters:
+//   - doc: The Word document being created
+//   - lesson: The lesson data model to export
+func (e *DocxExporter) exportLesson(doc *document.Document, lesson *models.Lesson) {
+	// Lesson heading
+	headingPara := doc.AddParagraph()
+	headingRun := headingPara.AddRun()
+	headingRun.AddText(fmt.Sprintf("Lesson: %s", lesson.Title))
+	headingProps := headingRun.Properties()
+	headingProps.SetBold(true)
+	headingProps.SetSize(14)
+
+	// Optional description paragraph
+	if rawDesc := lesson.Description; rawDesc != "" {
+		para := doc.AddParagraph()
+		run := para.AddRun()
+		run.AddText(e.htmlCleaner.CleanHTML(rawDesc))
+	}
+
+	// Items belonging to this lesson
+	for _, entry := range lesson.Items {
+		e.exportItem(doc, &entry)
+	}
+}
+
+// exportItem appends one item to the document.
+// When the item has a type, the title-cased type is written as a bold,
+// size-12 heading; every sub-item of the item is then exported in order.
+//
+// Parameters:
+//   - doc: The Word document being created
+//   - item: The item data model to export
+func (e *DocxExporter) exportItem(doc *document.Document, item *models.Item) {
+	// Heading derived from the item type
+	if kind := item.Type; kind != "" {
+		para := doc.AddParagraph()
+		run := para.AddRun()
+		// NOTE(review): strings.Title is deprecated since Go 1.18; kept here
+		// to preserve the exact heading text.
+		run.AddText(strings.Title(kind))
+		props := run.Properties()
+		props.SetBold(true)
+		props.SetSize(12)
+	}
+
+	// Nested sub-items
+	for _, child := range item.Items {
+		e.exportSubItem(doc, &child)
+	}
+}
+
+// exportSubItem appends one sub-item to the document.
+// Each non-empty component gets its own paragraph, in this order: title
+// (bold), heading (bold, cleaned), paragraph content (cleaned), a bold
+// "Answers:" label followed by the numbered answers (correct ones marked
+// with "✓"), and feedback (italic, cleaned). Text is indented with leading
+// spaces.
+//
+// Parameters:
+//   - doc: The Word document being created
+//   - subItem: The sub-item data model to export
+func (e *DocxExporter) exportSubItem(doc *document.Document, subItem *models.SubItem) {
+	// writeLine appends a paragraph holding a single run of text, bold on request.
+	writeLine := func(text string, bold bool) {
+		para := doc.AddParagraph()
+		run := para.AddRun()
+		run.AddText(text)
+		if bold {
+			run.Properties().SetBold(true)
+		}
+	}
+
+	// Title (indented, bold)
+	if subItem.Title != "" {
+		writeLine("  "+subItem.Title, true)
+	}
+
+	// Heading (indented, bold)
+	if subItem.Heading != "" {
+		writeLine("  "+e.htmlCleaner.CleanHTML(subItem.Heading), true)
+	}
+
+	// Paragraph content (indented)
+	if subItem.Paragraph != "" {
+		writeLine("  "+e.htmlCleaner.CleanHTML(subItem.Paragraph), false)
+	}
+
+	// Answers, present when the sub-item is a question
+	if len(subItem.Answers) > 0 {
+		writeLine("  Answers:", true)
+
+		for idx, ans := range subItem.Answers {
+			marker := ""
+			if ans.Correct {
+				marker = "✓ "
+			}
+			numbered := fmt.Sprintf("    %d. ", idx+1) + marker
+			writeLine(numbered+e.htmlCleaner.CleanHTML(ans.Title), false)
+		}
+	}
+
+	// Feedback (indented, italic)
+	if subItem.Feedback != "" {
+		para := doc.AddParagraph()
+		run := para.AddRun()
+		run.AddText("  Feedback: " + e.htmlCleaner.CleanHTML(subItem.Feedback))
+		run.Properties().SetItalic(true)
+	}
+}
+
+// GetSupportedFormat returns the format name this exporter supports.
+//
+// Returns:
+//   - A string representing the supported format ("docx")
+func (e *DocxExporter) GetSupportedFormat() string {
+	return "docx"
+}
@@ -0,0 +1,63 @@
+// Package exporters provides implementations of the Exporter interface
+// for converting Articulate Rise courses into various file formats.
+package exporters
+
+import (
+	"fmt"
+	"strings"
+
+	"github.com/kjanat/articulate-parser/internal/interfaces"
+	"github.com/kjanat/articulate-parser/internal/services"
+)
+
+// Factory implements the ExporterFactory interface.
+// It creates appropriate exporter instances based on the requested format
+// and hands each of them the same HTMLCleaner. Instances are created with
+// NewFactory.
+type Factory struct {
+	// htmlCleaner is passed to every exporter this factory constructs
+	htmlCleaner *services.HTMLCleaner
+}
+
+// NewFactory builds an exporter factory.
+// The given HTMLCleaner is stored and handed to every exporter the
+// factory creates.
+//
+// Parameters:
+//   - htmlCleaner: Service for cleaning HTML content in course data
+//
+// Returns:
+//   - A Factory exposed through the ExporterFactory interface
+func NewFactory(htmlCleaner *services.HTMLCleaner) interfaces.ExporterFactory {
+	factory := new(Factory)
+	factory.htmlCleaner = htmlCleaner
+	return factory
+}
+
+// CreateExporter returns the exporter matching the requested format.
+// The format is lower-cased before matching, so lookups are
+// case-insensitive. "markdown" and "md" select the Markdown exporter;
+// "docx" and "word" select the DOCX exporter.
+//
+// Parameters:
+//   - format: The desired export format (e.g., "markdown", "docx")
+//
+// Returns:
+//   - An implementation of the Exporter interface if the format is supported
+//   - An error naming the format, as originally given, if it is not supported
+func (f *Factory) CreateExporter(format string) (interfaces.Exporter, error) {
+	name := strings.ToLower(format)
+
+	if name == "markdown" || name == "md" {
+		return NewMarkdownExporter(f.htmlCleaner), nil
+	}
+	if name == "docx" || name == "word" {
+		return NewDocxExporter(f.htmlCleaner), nil
+	}
+
+	return nil, fmt.Errorf("unsupported export format: %s", format)
+}
+
+// GetSupportedFormats lists every format name accepted by the factory,
+// covering the primary names and their aliases. A fresh slice is
+// returned on each call.
+//
+// Returns:
+//   - A string slice containing "markdown", "md", "docx" and "word"
+func (f *Factory) GetSupportedFormats() []string {
+	formats := make([]string, 0, 4)
+	formats = append(formats, "markdown", "md", "docx", "word")
+	return formats
+}