wordpress-mobile
diff --git a/‎Modules/Package.swift‎
Lines changed: 5 additions & 1 deletion b/‎Modules/Package.swift‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎Modules/Sources/WordPressIntelligence/IntelligenceService.swift‎
Lines changed: 134 additions & 0 deletions b/‎Modules/Sources/WordPressIntelligence/IntelligenceService.swift‎
Lines changed: 134 additions & 0 deletions
diff --git a/‎Modules/Sources/WordPressIntelligence/Parameters/MediaMetadata.swift‎
Lines changed: 38 additions & 0 deletions b/‎Modules/Sources/WordPressIntelligence/Parameters/MediaMetadata.swift‎
Lines changed: 38 additions & 0 deletions
diff --git a/‎Modules/Sources/WordPressIntelligence/UseCases/ImageAltTextGenerator.swift‎
Lines changed: 196 additions & 0 deletions b/‎Modules/Sources/WordPressIntelligence/UseCases/ImageAltTextGenerator.swift‎
Lines changed: 196 additions & 0 deletions
@@ -256,7 +256,11 @@ let package = Package(
         .testTarget(name: "WordPressSharedObjCTests", dependencies: [.target(name: "WordPressShared"), .target(name: "WordPressTesting")], swiftSettings: [.swiftLanguageMode(.v5)]),
         .testTarget(name: "WordPressUIUnitTests", dependencies: [.target(name: "WordPressUI")], swiftSettings: [.swiftLanguageMode(.v5)]),
         .testTarget(name: "WordPressCoreTests", dependencies: [.target(name: "WordPressCore")]),
-        .testTarget(name: "WordPressIntelligenceTests", dependencies: [.target(name: "WordPressIntelligence")])
+        .testTarget(
+            name: "WordPressIntelligenceTests",
+            dependencies: [.target(name: "WordPressIntelligence")],
+            resources: [.process("Resources")]
+        )
     ]
 )
 
 
@@ -1,6 +1,9 @@
 import Foundation
 import FoundationModels
 import NaturalLanguage
+import Vision
+import UIKit
+import WordPressShared
 
 public enum IntelligenceService {
     /// Maximum context size for language model sessions (in tokens).
@@ -62,4 +65,135 @@ public enum IntelligenceService {
 
         return languageCode.rawValue
     }
+
+    /// Analyzes an image using the Vision framework and summarizes the findings as text.
+    ///
+    /// All requests are submitted in a single `perform` call. Each request that yields
+    /// something reportable adds one segment to the summary:
+    /// - `Scene`: labels from the first five classifications with confidence above 30%
+    /// - `Subjects` / `Additional subjects`: detected faces and people
+    /// - `Animals`: recognized animals with confidence above 50%
+    /// - `Key regions`: the number of salient objects
+    /// - `Composition`: the horizon angle, only when it is tilted by more than 5°
+    /// - `Text`: recognized text, truncated to 100 characters
+    /// - `Codes`: the symbologies of detected barcodes and QR codes
+    ///
+    /// - Parameter cgImage: The image to analyze
+    /// - Returns: The segments joined with `"; "`, or `"Image analyzed"` if there are none
+    /// - Throws: If performing the Vision requests fails
+    @available(iOS 26, *)
+    public static func analyzeImage(_ cgImage: CGImage) async throws -> String {
+        let startTime = CFAbsoluteTimeGetCurrent()
+
+        var descriptions: [String] = []
+
+        // Create all analysis requests
+        let classifyRequest = VNClassifyImageRequest()
+        let textRequest = VNRecognizeTextRequest()
+        textRequest.recognitionLevel = .accurate
+
+        let faceRequest = VNDetectFaceRectanglesRequest()
+        let humanRequest = VNDetectHumanRectanglesRequest()
+        let animalRequest = VNRecognizeAnimalsRequest()
+        let saliencyRequest = VNGenerateAttentionBasedSaliencyImageRequest()
+        let horizonRequest = VNDetectHorizonRequest()
+        let barcodeRequest = VNDetectBarcodesRequest()
+
+        // Perform all requests
+        let handler = VNImageRequestHandler(cgImage: cgImage, options: [:])
+        try handler.perform([
+            classifyRequest,
+            textRequest,
+            faceRequest,
+            humanRequest,
+            animalRequest,
+            saliencyRequest,
+            horizonRequest,
+            barcodeRequest
+        ])
+
+        // 1. Scene/Object Classification
+        if let classifications = classifyRequest.results?.prefix(5) {
+            let labels = classifications
+                .filter { $0.confidence > 0.3 }
+                .map { "\($0.identifier.replacingOccurrences(of: "_", with: " ")) (\(Int($0.confidence * 100))%)" }
+            if !labels.isEmpty {
+                descriptions.append("Scene: \(labels.joined(separator: ", "))")
+            }
+        }
+
+        // 2. Subjects - Faces
+        // A missing result and an empty result both mean that no faces are reported.
+        let faceCount = faceRequest.results?.count ?? 0
+        if faceCount > 0 {
+            let faceDesc = faceCount == 1 ? "1 face" : "\(faceCount) faces"
+            descriptions.append("Subjects: \(faceDesc) detected")
+        }
+
+        // 3. Subjects - Humans (full body)
+        if let humanObservations = humanRequest.results, !humanObservations.isEmpty {
+            let humanCount = humanObservations.count
+            let humanDesc = humanCount == 1 ? "1 person" : "\(humanCount) people"
+
+            if faceCount == 0 {
+                // No face segment was written, so people are the primary subjects.
+                descriptions.append("Subjects: \(humanDesc) detected")
+            } else if humanCount > faceCount {
+                // Faces were already mentioned; only add people when there are more of them.
+                descriptions.append("Additional subjects: \(humanDesc) visible")
+            }
+        }
+
+        // 4. Animals
+        if let animalObservations = animalRequest.results, !animalObservations.isEmpty {
+            let animals = animalObservations
+                .filter { $0.confidence > 0.5 }
+                .compactMap { observation -> String? in
+                    guard let label = observation.labels.first else { return nil }
+                    return "\(label.identifier) (\(Int(label.confidence * 100))%)"
+                }
+            if !animals.isEmpty {
+                descriptions.append("Animals: \(animals.joined(separator: ", "))")
+            }
+        }
+
+        // 5. Saliency (regions of interest)
+        if let saliencyObservations = saliencyRequest.results as? [VNSaliencyImageObservation],
+           let observation = saliencyObservations.first,
+           let salientObjects = observation.salientObjects, !salientObjects.isEmpty {
+            descriptions.append("Key regions: \(salientObjects.count) area\(salientObjects.count == 1 ? "" : "s") of interest")
+        }
+
+        // 6. Horizon detection (indicates landscape/orientation)
+        if let horizon = horizonRequest.results?.first {
+            // Vision reports the angle in radians; convert to degrees for the summary.
+            let angle = horizon.angle * 180 / .pi
+            if abs(angle) > 5 { // Only mention if horizon is noticeably tilted
+                descriptions.append("Composition: horizon at \(Int(angle))° angle")
+            }
+        }
+
+        // 7. Text content
+        if let textObservations = textRequest.results, !textObservations.isEmpty {
+            let text = textObservations
+                .compactMap { $0.topCandidates(1).first?.string }
+                .joined(separator: " ")
+            if !text.isEmpty {
+                // Cap the recognized text so a text-heavy image cannot dominate the summary.
+                let truncatedText = String(text.prefix(100))
+                descriptions.append("Text: \"\(truncatedText)\(text.count > 100 ? "..." : "")\"")
+            }
+        }
+
+        // 8. Barcodes/QR codes
+        if let barcodeObservations = barcodeRequest.results, !barcodeObservations.isEmpty {
+            // `rawValue` is non-optional, so every observation contributes one entry.
+            let barcodeTypes = barcodeObservations.map { $0.symbology.rawValue }
+            descriptions.append("Codes: \(barcodeTypes.joined(separator: ", "))")
+        }
+
+        let description = descriptions.isEmpty
+            ? "Image analyzed"
+            : descriptions.joined(separator: "; ")
+
+        WPLogInfo("IntelligenceService.analyzeImage executed in \((CFAbsoluteTimeGetCurrent() - startTime) * 1000) ms")
+
+        return description
+    }
 }
@@ -0,0 +1,38 @@
+import Foundation
+
+/// Metadata for generating alt text and captions for media items.
+///
+/// Every field is optional. The type is an immutable value made up of strings only,
+/// and it declares `Sendable` explicitly so it can be handed to the async generation
+/// APIs from any isolation domain.
+public struct MediaMetadata: Sendable {
+    /// The file name of the media item.
+    public let filename: String?
+    /// The title of the media item.
+    public let title: String?
+    /// The caption of the media item.
+    public let caption: String?
+    /// The description of the media item.
+    public let description: String?
+    /// The existing alt text of the media item.
+    public let altText: String?
+    /// The file type or extension of the media item.
+    public let fileType: String?
+    /// The dimensions of the media item, as text.
+    public let dimensions: String?
+    /// A textual summary of the visual content of the image.
+    public let imageAnalysis: String?
+
+    /// Creates metadata; any field that is omitted is `nil`.
+    public init(
+        filename: String? = nil,
+        title: String? = nil,
+        caption: String? = nil,
+        description: String? = nil,
+        altText: String? = nil,
+        fileType: String? = nil,
+        dimensions: String? = nil,
+        imageAnalysis: String? = nil
+    ) {
+        self.filename = filename
+        self.title = title
+        self.caption = caption
+        self.description = description
+        self.altText = altText
+        self.fileType = fileType
+        self.dimensions = dimensions
+        self.imageAnalysis = imageAnalysis
+    }
+
+    /// `true` when at least one field holds a non-empty string.
+    var hasContent: Bool {
+        return [filename, title, caption, description, altText, fileType, dimensions, imageAnalysis]
+            .contains(where: { !($0?.isEmpty ?? true) })
+    }
+}
@@ -0,0 +1,196 @@
+import Foundation
+import FoundationModels
+import UIKit
+import WordPressShared
+
+/// Alt text generation for media items.
+///
+/// Generates concise, descriptive, and accessible alt text for images based on
+/// visual analysis and available metadata.
+///
+/// Example usage:
+/// ```swift
+/// let generator = ImageAltTextGenerator()
+/// let altText = try await generator.generate(metadata: metadata)
+/// ```
+@available(iOS 26, *)
+public struct ImageAltTextGenerator {
+    /// Options passed to the language model session with every request.
+    public var options: GenerationOptions
+
+    /// Creates a generator.
+    ///
+    /// - Parameter options: Generation options; defaults to a temperature of 0.7
+    public init(options: GenerationOptions = GenerationOptions(temperature: 0.7)) {
+        self.options = options
+    }
+
+    /// Generates alt text for a media item.
+    ///
+    /// - Parameter metadata: The media metadata to use for generation
+    /// - Returns: Generated alt text, trimmed of surrounding whitespace and newlines
+    /// - Throws: An `NSError` (domain `IntelligenceService`, code `-1`) if none of the
+    ///   fields used in the prompt has a value, or any error thrown by the session
+    public func generate(metadata: MediaMetadata) async throws -> String {
+        // `hasContent` also counts `altText`, which the prompt never includes, so
+        // additionally require at least one line of prompt context. Otherwise the
+        // model would be asked to describe an image it knows nothing about.
+        guard metadata.hasContent, !contextLines(for: metadata).isEmpty else {
+            throw NSError(domain: "IntelligenceService", code: -1, userInfo: [
+                NSLocalizedDescriptionKey: "Insufficient metadata to generate alt text. Please add a filename, title, or description first."
+            ])
+        }
+
+        let startTime = CFAbsoluteTimeGetCurrent()
+        let session = makeSession()
+        let prompt = makePrompt(metadata: metadata)
+
+        let response = try await session.respond(to: prompt, options: options)
+
+        WPLogInfo("ImageAltTextGenerator executed in \((CFAbsoluteTimeGetCurrent() - startTime) * 1000) ms")
+
+        return response.content.trimmingCharacters(in: .whitespacesAndNewlines)
+    }
+
+    /// Generates alt text for an image with automatic Vision analysis.
+    ///
+    /// The image is analyzed with `IntelligenceService.analyzeImage(_:)` and the result
+    /// replaces whatever `imageAnalysis` the supplied metadata carried.
+    ///
+    /// - Parameters:
+    ///   - cgImage: The image to analyze and generate alt text for
+    ///   - metadata: Additional metadata (filename, title, etc.). The imageAnalysis field will be populated automatically.
+    /// - Returns: Generated alt text
+    /// - Throws: If image analysis or generation fails
+    public func generate(cgImage: CGImage, metadata: MediaMetadata = MediaMetadata()) async throws -> String {
+        let imageAnalysis = try await IntelligenceService.analyzeImage(cgImage)
+
+        let metadataWithAnalysis = MediaMetadata(
+            filename: metadata.filename,
+            title: metadata.title,
+            caption: metadata.caption,
+            description: metadata.description,
+            altText: metadata.altText,
+            fileType: metadata.fileType,
+            dimensions: metadata.dimensions,
+            imageAnalysis: imageAnalysis
+        )
+
+        return try await generate(metadata: metadataWithAnalysis)
+    }
+
+    /// Generates alt text for a `UIImage` with automatic Vision analysis.
+    ///
+    /// - Parameters:
+    ///   - image: The UIImage to analyze and generate alt text for
+    ///   - metadata: Additional metadata (filename, title, etc.). The imageAnalysis field will be populated automatically.
+    /// - Returns: Generated alt text
+    /// - Throws: An `NSError` (code `-2`) if the image has no `cgImage`, or if analysis/generation fails
+    public func generate(image: UIImage, metadata: MediaMetadata = MediaMetadata()) async throws -> String {
+        guard let cgImage = image.cgImage else {
+            throw NSError(domain: "IntelligenceService", code: -2, userInfo: [
+                NSLocalizedDescriptionKey: "Unable to convert UIImage to CGImage"
+            ])
+        }
+        return try await generate(cgImage: cgImage, metadata: metadata)
+    }
+
+    /// Generates alt text for encoded image data with automatic Vision analysis.
+    ///
+    /// - Parameters:
+    ///   - imageData: The image data to analyze and generate alt text for
+    ///   - metadata: Additional metadata (filename, title, etc.). The imageAnalysis field will be populated automatically.
+    /// - Returns: Generated alt text
+    /// - Throws: An `NSError` (code `-3`) if the data cannot be decoded into a `UIImage`, or if analysis/generation fails
+    public func generate(imageData: Data, metadata: MediaMetadata = MediaMetadata()) async throws -> String {
+        guard let image = UIImage(data: imageData) else {
+            throw NSError(domain: "IntelligenceService", code: -3, userInfo: [
+                NSLocalizedDescriptionKey: "Unable to create UIImage from data"
+            ])
+        }
+        return try await generate(image: image, metadata: metadata)
+    }
+
+    // MARK: - Session & Prompt Building
+
+    /// Creates a language model session configured for alt text generation.
+    ///
+    /// - Returns: Configured session with instructions
+    public func makeSession() -> LanguageModelSession {
+        LanguageModelSession(
+            model: .init(guardrails: .permissiveContentTransformations),
+            instructions: Self.instructions
+        )
+    }
+
+    /// Instructions for the language model on how to generate alt text.
+    public static var instructions: String {
+        """
+        You are helping a WordPress user generate alt text for an image.
+        Alt text should be concise, descriptive, and accessible for screen readers.
+
+        **Parameters**
+        - IMAGE_ANALYSIS: Visual analysis of the actual image content (MOST IMPORTANT)
+        - FILENAME: the image filename
+        - FILE_TYPE: the file type/extension
+        - DIMENSIONS: the image dimensions
+        - TITLE: the image title (if available)
+        - CAPTION: the image caption (if available)
+        - DESCRIPTION: the image description (if available)
+
+        **Requirements**
+        - Generate concise alt text (1-2 sentences, max 125 characters)
+        - Prioritize IMAGE_ANALYSIS when describing what's in the image
+        - Focus on what the image depicts, not decorative elements
+        - Use simple, clear language
+        - Do not include phrases like "image of" or "picture of"
+        - Only output the alt text, nothing else
+        """
+    }
+
+    /// Builds the prompt for generating alt text.
+    ///
+    /// Each non-empty metadata field that the instructions describe becomes one
+    /// `LABEL: 'value'` line, in the same order as in the instructions.
+    ///
+    /// - Parameter metadata: The media metadata
+    /// - Returns: Formatted prompt string ready for the language model
+    public func makePrompt(metadata: MediaMetadata) -> String {
+        let context = contextLines(for: metadata).joined(separator: "\n")
+
+        return """
+        Generate alt text for an image with the following information:
+
+        \(context)
+        """
+    }
+
+    /// Returns one `LABEL: 'value'` line per non-empty field that the prompt uses.
+    private func contextLines(for metadata: MediaMetadata) -> [String] {
+        let fields: [(label: String, value: String?)] = [
+            ("IMAGE_ANALYSIS", metadata.imageAnalysis),
+            ("FILENAME", metadata.filename),
+            ("FILE_TYPE", metadata.fileType),
+            ("DIMENSIONS", metadata.dimensions),
+            ("TITLE", metadata.title),
+            ("CAPTION", metadata.caption),
+            ("DESCRIPTION", metadata.description)
+        ]
+
+        return fields.compactMap { field in
+            guard let value = field.value, !value.isEmpty else { return nil }
+            return "\(field.label): '\(value)'"
+        }
+    }
+}
+
+@available(iOS 26, *)
+extension IntelligenceService {
+    /// Generates alt text for a media item based on available metadata.
+    ///
+    /// NOTE(review): the rest of the visible `IntelligenceService` API is `static` and
+    /// is called on the type. If the enum declares no cases, this instance method
+    /// cannot be reached; prefer the static overload with the same name.
+    ///
+    /// - Parameter metadata: The media metadata to use for generation
+    /// - Returns: Generated alt text
+    /// - Throws: If metadata is insufficient or generation fails
+    public func generateAltText(metadata: MediaMetadata) async throws -> String {
+        try await ImageAltTextGenerator().generate(metadata: metadata)
+    }
+
+    /// Generates alt text for a media item based on available metadata.
+    ///
+    /// Static counterpart of the instance method, callable as
+    /// `IntelligenceService.generateAltText(metadata:)`. It uses an
+    /// `ImageAltTextGenerator` with its default options.
+    ///
+    /// - Parameter metadata: The media metadata to use for generation
+    /// - Returns: Generated alt text
+    /// - Throws: If metadata is insufficient or generation fails
+    public static func generateAltText(metadata: MediaMetadata) async throws -> String {
+        try await ImageAltTextGenerator().generate(metadata: metadata)
+    }
+}
Original file line number	Diff line number	Diff line change
`@@ -256,7 +256,11 @@ let package = Package(`
`256`	`256`	`.testTarget(name: "WordPressSharedObjCTests", dependencies: [.target(name: "WordPressShared"), .target(name: "WordPressTesting")], swiftSettings: [.swiftLanguageMode(.v5)]),`
`257`	`257`	`.testTarget(name: "WordPressUIUnitTests", dependencies: [.target(name: "WordPressUI")], swiftSettings: [.swiftLanguageMode(.v5)]),`
`258`	`258`	`.testTarget(name: "WordPressCoreTests", dependencies: [.target(name: "WordPressCore")]),`
`259`		`- .testTarget(name: "WordPressIntelligenceTests", dependencies: [.target(name: "WordPressIntelligence")])`
	`259`	`+ .testTarget(`
	`260`	`+ name: "WordPressIntelligenceTests",`
	`261`	`+ dependencies: [.target(name: "WordPressIntelligence")],`
	`262`	`+ resources: [.process("Resources")]`
	`263`	`+ )`
`260`	`264`	`]`
`261`	`265`	`)`
`262`	`266`