import SwiftUI
import RealityKit
import Vision
import ARKit
import CoreML
import QuartzCore

/// Immersive visionOS scene: streams frames from the device's main camera,
/// runs YOLOv3 object detection on each frame, and renders a translucent
/// green bounding-box panel in world space for every detected object.
struct ImmersiveView: View {
    @State private var arkitSession: ARKitSession?
    @State private var detectionResults: [VNRecognizedObjectObservation] = []
    @State private var contentEntity = Entity()
    @State private var boundingBoxEntities: [UUID: ModelEntity] = [:]
    @State private var worldTrackingProvider = WorldTrackingProvider()
    @State private var cameraFrameProvider: CameraFrameProvider?
    @State private var isTrackingReady = false

    /// Vision wrapper around YOLOv3, built once and reused.
    /// The original implementation constructed a new `VNCoreMLModel` for every
    /// camera frame; model loading is expensive and dominated per-frame cost.
    private static let objectDetectionModel: VNCoreMLModel? =
        try? VNCoreMLModel(for: YOLOv3().model)

    var body: some View {
        RealityView { content in
            print("🎥 Initializing RealityKit scene...")

            // Red sphere as a fixed visual reference point in front of the user.
            // Materials are passed at init instead of poked through `model?.materials`.
            let testSphere = ModelEntity(
                mesh: .generateSphere(radius: 0.5),
                materials: [SimpleMaterial(color: .red, isMetallic: false)]
            )
            testSphere.position = [0, 0.5, -2.0] // Further in front of camera
            content.add(testSphere)
            content.add(contentEntity)

            Task { await setupARKitSession() }
        } update: { content in
            Task { @MainActor in
                if isTrackingReady {
                    await updateBoundingBoxes()
                }
            }
        }
    }

    // MARK: - Setup ARKit & Camera Frame Provider

    /// Starts the ARKit session with camera-frame and world-tracking providers,
    /// waits (up to ~5 s) for tracking to come up, then consumes the camera
    /// frame stream and feeds each left-eye sample to the detector.
    private func setupARKitSession() async {
        do {
            guard CameraFrameProvider.isSupported else {
                print("🚨 CameraFrameProvider is not supported on this device.")
                return
            }

            let cameraProvider = CameraFrameProvider()
            let session = ARKitSession()

            // Recreate the provider so a stale one from a previous run is never reused.
            worldTrackingProvider = WorldTrackingProvider()
            try await session.run([cameraProvider, worldTrackingProvider])

            self.arkitSession = session
            self.cameraFrameProvider = cameraProvider
            print("✅ ARKit Session started. Waiting for world tracking to initialize...")

            // Poll until the provider reports it is running. The previous check
            // inspected a non-existent `allAnchors` property; `state` is the
            // documented readiness signal for a DataProvider.
            for _ in 0..<5 {
                try await Task.sleep(nanoseconds: 1_000_000_000) // Wait 1 second
                if worldTrackingProvider.state == .running {
                    self.isTrackingReady = true
                    print("✅ World Tracking is now ready!")
                    break
                }
                print("⏳ Waiting for world tracking to initialize...")
            }

            guard self.isTrackingReady else {
                print("🚨 World tracking failed to initialize.")
                return
            }

            // Pick the highest-resolution format offered by the left main camera.
            let formats = CameraVideoFormat.supportedVideoFormats(for: .main, cameraPositions: [.left])
            let highResolutionFormat = formats.max { $0.frameSize.height < $1.frameSize.height }

            guard let highResolutionFormat,
                  let cameraFrameUpdates = cameraProvider.cameraFrameUpdates(for: highResolutionFormat) else {
                print("🚨 Failed to get camera frame updates.")
                return
            }

            print("🎥 Camera processing started.")
            for await cameraFrame in cameraFrameUpdates {
                if let sample = cameraFrame.sample(for: .left) {
                    print("📷 Captured frame from main camera")
                    processFrame(sample.pixelBuffer)
                }
            }
        } catch {
            print("🚨 Error initializing ARKit session: \(error)")
        }
    }

    // MARK: - Process Frame with YOLOv3

    /// Runs YOLOv3 on one camera frame and publishes the detections on the
    /// main queue so the SwiftUI @State is only mutated on the main thread.
    private func processFrame(_ pixelBuffer: CVPixelBuffer) {
        // Use the cached model instead of reloading it for every frame.
        guard let model = Self.objectDetectionModel else {
            print("🚨 Failed to load YOLOv3 model.")
            return
        }

        let request = VNCoreMLRequest(model: model) { request, _ in
            guard let results = request.results as? [VNRecognizedObjectObservation] else {
                print("🚨 No objects detected.")
                return
            }
            DispatchQueue.main.async {
                self.detectionResults = results
                print("🔍 Detected \(results.count) object(s)")
                for result in results {
                    if let label = result.labels.first {
                        print("🛑 Object: \(label.identifier) | Confidence: \(label.confidence * 100)%")
                    }
                }
            }
        }

        let handler = VNImageRequestHandler(cvPixelBuffer: pixelBuffer)
        do {
            try handler.perform([request])
        } catch {
            print("🚨 Error performing object detection: \(error)")
        }
    }

    // MARK: - Update Bounding Boxes in World Space

    /// Reconciles the on-screen bounding boxes with the latest detections:
    /// removes boxes whose observation disappeared, adds boxes for new ones.
    ///
    /// NOTE(review): `VNObservation.uuid` is unique per observation and each
    /// frame yields fresh observations, so in practice every box is torn down
    /// and re-added per frame. Persisting boxes across frames would need
    /// Vision tracking requests or label-based matching — TODO confirm intent.
    private func updateBoundingBoxes() async {
        guard isTrackingReady else {
            print("🚨 World tracking is not ready yet.")
            return
        }

        // Use the device (camera) pose. The previous code read
        // `allAnchors?.last?.originFromAnchorTransform`, but WorldTrackingProvider
        // has no `allAnchors`, and a world anchor's transform is not the camera's.
        guard let deviceAnchor = worldTrackingProvider.queryDeviceAnchor(atTimestamp: CACurrentMediaTime()) else {
            print("⏳ Waiting for a valid camera transform...")
            return
        }
        let cameraTransform = deviceAnchor.originFromAnchorTransform

        let currentIds = Set(detectionResults.map { $0.uuid })
        print("📡 Updating bounding boxes (\(currentIds.count) detected objects).")

        // Remove boxes for observations that are no longer present.
        boundingBoxEntities.keys.filter { !currentIds.contains($0) }
            .forEach { id in
                print("❌ Removing outdated bounding box: \(id)")
                boundingBoxEntities[id]?.removeFromParent()
                boundingBoxEntities.removeValue(forKey: id)
            }

        // Create (or refresh) a box for every current observation.
        for observation in detectionResults {
            if let entity = await createOrUpdateBoundingBox(for: observation, cameraTransform: cameraTransform) {
                if boundingBoxEntities[observation.uuid] == nil {
                    contentEntity.addChild(entity)
                    boundingBoxEntities[observation.uuid] = entity
                    print("✅ Added bounding box for detected object: \(observation.labels.first?.identifier ?? "Unknown")")
                }
            }
        }
    }

    // MARK: - Convert Bounding Box to World Space

    /// Projects a normalized Vision bounding box into world space at a fixed
    /// assumed depth and returns a translucent panel entity sized to match.
    ///
    /// - Parameters:
    ///   - observation: The detection whose box should be visualized.
    ///   - cameraTransform: Origin-from-device transform of the camera pose.
    /// - Returns: The existing entity for this observation (updated in place)
    ///   or a freshly created one.
    private func createOrUpdateBoundingBox(for observation: VNRecognizedObjectObservation,
                                           cameraTransform: simd_float4x4) async -> ModelEntity? {
        let boundingBox = observation.boundingBox
        let entity = boundingBoxEntities[observation.uuid] ?? ModelEntity()

        // Depth is a fixed guess; no per-object depth data is available here.
        let estimatedDepth: Float = 1.5
        let cameraPosition = cameraTransform.columns.3

        // Vision's boundingBox is normalized with origin at the bottom-left,
        // so the y offset is flipped relative to screen coordinates.
        let worldPosition = SIMD3(
            x: Float(boundingBox.midX - 0.5) * estimatedDepth + cameraPosition.x,
            y: Float(0.5 - boundingBox.midY) * estimatedDepth + cameraPosition.y,
            z: -estimatedDepth + cameraPosition.z
        )

        let boxSize = Float(min(boundingBox.width, boundingBox.height)) * estimatedDepth
        let newMesh = MeshResource.generateBox(width: boxSize, height: boxSize, depth: 0.02)
        let material = UnlitMaterial(color: .green.withAlphaComponent(0.5))

        entity.model = ModelComponent(mesh: newMesh, materials: [material])
        entity.position = worldPosition

        print("📌 Bounding box position: \(entity.position)")
        return entity
    }
}