Zoom iOS 转录例子

news2024/9/21 22:34:31

一、在zoom marketplace创建通用app,zoom-recall 详见Zoom会议机器人转写例子-CSDN博客

二、mac下按照Xcode,创建APP项目meetingbot4ios

三、本实用的SDK为MobileRTC,即Meeting SDK的iOS版本

四、依赖如下:

MobileRTC和CryptoSwift

五、所有代码如下(meetingbot4iosApp.swift):

import SwiftUI
import MobileRTC
import CryptoSwift

@main
struct MeetingBot: App {
    @UIApplicationDelegateAdaptor(AppDelegate.self) var appDelegate
    @StateObject private var meetingInfo = MeetingInfo()
    
    var body: some Scene {
        WindowGroup {
            ContentView(meetingInfo: meetingInfo, appDelegate: appDelegate)
        }
    }
}

struct ZoomMeetingView: UIViewRepresentable {
    func makeUIView(context: Context) -> UIView {
        let view = MobileRTC.shared().getMeetingService()?.meetingView() ?? UIView()
        if view.subviews.isEmpty {
            print("Meeting view is empty")
        } else {
            print("Meeting view has subviews")
        }
        return view
    }

    func updateUIView(_ uiView: UIView, context: Context) {
        // Update the view if needed
    }
}

class MeetingInfo: ObservableObject {
    @Published var meetingUrl: String = "https://us05web.zoom.us/j/81334539494?pwd=sf96p7am967Oc3GI39J1yLWSPa6WnS.1"
}

struct ContentView: View {
    @ObservedObject var meetingInfo: MeetingInfo
    @ObservedObject var appDelegate: AppDelegate
    
    init(meetingInfo: MeetingInfo, appDelegate: AppDelegate) {
        self.meetingInfo = meetingInfo
        self.appDelegate = appDelegate
        self.appDelegate.meetingInfo = meetingInfo
    }
    var body: some View {
        VStack {
            TextField("Enter Meeting URL", text: $meetingInfo.meetingUrl)
                .textFieldStyle(RoundedBorderTextFieldStyle())
                .padding()
            // 显示会议状态
            Text("Meeting State: \(appDelegate.meetingState)")
                .padding()
            Button(action: {
                // Trigger initialization with the entered meeting URL
                self.appDelegate.initializeMobileRTCWithMeetingUrl(meetingInfo.meetingUrl)
                
            }) {
                Text("Join Meeting")
            }
            .padding()
            Button(action: {
                appDelegate.toggleRecording()
            }) {
                Text(appDelegate.recordingState == "stopped" ? "Start Recording" : "Stop Recording")
            }
            .padding()

            Text(appDelegate.transcriptText)
                .padding()

            ScrollView {
                Text(appDelegate.transcript.joined(separator: "\n"))
                    .padding()
            }
        }
    }
}

class AppDelegate: NSObject, UIApplicationDelegate, ObservableObject, MobileRTCAuthDelegate, MobileRTCMeetingServiceDelegate {
    @Published var meetingNumber: String?
    @Published var password: String?
    @Published var recordingState: String = "stopped"
    @Published var transcript: [String] = []
    @Published var botId: String?
    @Published var meetingState: String = "Not Joined" // 新增会议状态属性
    @Published var transcriptText = "Loading..."
    var meetingInfo: MeetingInfo?
    var window: UIWindow?
    private var refreshTimer: Timer?
    private var ZM_CLIENT_ID = ""
    private var ZM_CLIENT_SECRET = ""
    private var recallApiKey = ""
    private var WEBHOOK_SECRET=""
    private var PUBLIC_URL=""

    func application(_ application: UIApplication, didFinishLaunchingWithOptions launchOptions: [UIApplication.LaunchOptionsKey : Any]? = nil) -> Bool {
        // Initialize MobileRTC SDK
        let context = MobileRTCSDKInitContext()
        context.domain = "zoom.us"
        context.enableLog = true

        let success = MobileRTC.shared().initialize(context)
        if success {
            print("MobileRTC SDK initialized successfully")
        } else {
            print("Failed to initialize MobileRTC SDK")
        }

        return true
    }

    func initializeMobileRTCWithMeetingUrl(_ meetingUrl: String) {
        // Parse meeting URL
        guard let (meetingNumber, password) = parseMeetingUrl(meetingUrl) else {
            print("Failed to parse meeting URL")
            return
        }

        self.meetingNumber = meetingNumber
        self.password = password

        // Generate JWT
        guard let jwt = generateSDKJWT(meetingNumber: meetingNumber, role: 0, expirationSeconds: 3600) else {
            print("Failed to generate JWT")
            return
        }

        // Set up the Zoom SDK with JWT
        let authService = MobileRTC.shared().getAuthService()
        authService?.delegate = self
        authService?.jwtToken = jwt
        authService?.sdkAuth()
    }

    private func parseMeetingUrl(_ link: String) -> (String, String)? {
        // 查找会议号和密码
        let meetingNumberPattern = "/j/(\\d+)"
        let passwordPattern = "pwd=([^&]+)"
        
        // 使用正则表达式来匹配会议号
        if let meetingNumberRange = link.range(of: meetingNumberPattern, options: .regularExpression) {
            let meetingNumberSubstring = link[meetingNumberRange]
            let meetingNumber = meetingNumberSubstring.replacingOccurrences(of: "/j/", with: "")
            
            // 使用正则表达式来匹配密码
            if let passwordRange = link.range(of: passwordPattern, options: .regularExpression) {
                let passwordSubstring = link[passwordRange]
                let password = passwordSubstring.replacingOccurrences(of: "pwd=", with: "")
                print(meetingNumber, password)
                return (meetingNumber, password)
            }
        }
        
        return nil
    }

    private func generateSDKJWT(meetingNumber: String, role: Int, expirationSeconds: Int?) -> String? {
        let iat = Int(Date().timeIntervalSince1970)
        let exp = expirationSeconds != nil ? iat + expirationSeconds! : iat + 60 * 60 * 2

        let header = ["alg": "HS256", "typ": "JWT"]
        let payload: [String: Any] = [
            "appKey": ZM_CLIENT_ID,
            "sdkKey": ZM_CLIENT_ID,
            "mn": meetingNumber,
            "role": role,
            "iat": iat,
            "exp": exp,
            "tokenExp": exp
        ]

        guard let headerData = try? JSONSerialization.data(withJSONObject: header, options: []),
              let payloadData = try? JSONSerialization.data(withJSONObject: payload, options: []) else {
            return nil
        }

        let headerBase64 = headerData.base64EncodedString().replacingOccurrences(of: "=", with: "").replacingOccurrences(of: "+", with: "-").replacingOccurrences(of: "/", with: "_")
        let payloadBase64 = payloadData.base64EncodedString().replacingOccurrences(of: "=", with: "").replacingOccurrences(of: "+", with: "-").replacingOccurrences(of: "/", with: "_")

        let toSign = "\(headerBase64).\(payloadBase64)"
        guard let hmac = try? HMAC(key: ZM_CLIENT_SECRET.bytes, variant: .sha256).authenticate(toSign.bytes) else {
            return nil
        }

        let signatureBase64 = hmac.toBase64().replacingOccurrences(of: "=", with: "").replacingOccurrences(of: "+", with: "-").replacingOccurrences(of: "/", with: "_")
        let jwt = "\(toSign).\(signatureBase64)"

        return jwt
    }

    // MobileRTCAuthDelegate
    func onMobileRTCAuthReturn(_ returnValue: MobileRTCAuthError) {
        if returnValue == .success {
            print("Zoom SDK authentication successful")
            joinMeeting()
        } else {
            print("Zoom SDK authentication failed with error: \(returnValue)")
        }
    }

    // MobileRTCMeetingServiceDelegate
    func onMeetingStateChange(_ state: MobileRTCMeetingState) {
        let stateValue = state.rawValue
        print("Meeting state changed: \(stateValue)")
        
        switch stateValue {
        case 1:
            meetingState = "Connecting to Meeting Server"
        case 3:
            meetingState = "Promoting Participant to Host"
        case 4:
            meetingState = "Demoting Host to Participant"
        case 5:
            meetingState = "Disconnecting from Meeting"
        case 6:
            meetingState = "Reconnecting to Meeting"
        case 7:
            meetingState = "Connection Failed"
        case 10:
            meetingState = "Meeting Locked"
        case 12:
            meetingState = "Participant in Waiting Room"
        default:
            meetingState = "Other Meeting State"
        }
        // Update the ZoomMeetingView based on the meeting state
        DispatchQueue.main.async {
            self.objectWillChange.send()
        }
    }

    private func joinMeeting() {
        guard let meetingNumber = self.meetingNumber, let password = self.password else {
            print("Meeting number or password is missing")
            return
        }

        let meetingService = MobileRTC.shared().getMeetingService()
        meetingService?.delegate = self

        let joinParam = MobileRTCMeetingJoinParam()
        joinParam.meetingNumber = meetingNumber
        joinParam.password = password
        joinParam.userName = "iOS User"
        joinParam.noAudio = true
        joinParam.noVideo = false

        let result = meetingService?.joinMeeting(with: joinParam)
        if result == .success {
            print("Joining meeting...")
        } else {
            print("Failed to join meeting with error: \(result ?? .unknown)")
        }
    }

    func toggleRecording() {
        if recordingState == "stopped" {
            startRecording()
        } else {
            stopRecording()
        }
    }

    func startRecording() {
        recordingState = "starting"

        guard let meetingUrl = URL(string: meetingInfo?.meetingUrl ?? "") else {
            print("Invalid meeting URL.")
            return
        }

        let url = "https://us-west-2.recall.ai/api/v1/bot"
        var request = URLRequest(url: URL(string: url)!)
        request.httpMethod = "POST"
        request.addValue("Token \(recallApiKey)", forHTTPHeaderField: "Authorization")
        request.addValue("application/json", forHTTPHeaderField: "Content-Type")

        let body: [String: Any] = [
            "bot_name": "meeetingbot",
            "meeting_url": meetingUrl.absoluteString,
            "transcription_options": [
                "provider": "assembly_ai"
            ],
            "real_time_transcription": [
                "destination_url": PUBLIC_URL+"/webhook/transcription?secret="+WEBHOOK_SECRET,
                "partial_results": true
            ],
            "zoom": [
                "request_recording_permission_on_host_join": true,
                "require_recording_permission": true
            ]
        ]

        request.httpBody = try? JSONSerialization.data(withJSONObject: body, options: .prettyPrinted)

        let task = URLSession.shared.dataTask(with: request) { data, response, error in
            guard let data = data, error == nil else {
                print("Error: \(error?.localizedDescription ?? "Unknown error")")
                return
            }

            if let httpResponse = response as? HTTPURLResponse {
                if httpResponse.statusCode <= 299 {
                    let bot = try? JSONDecoder().decode(BotResponse.self, from: data)
                    DispatchQueue.main.async {
                        self.botId = bot?.id
                        self.recordingState = "bot-joining"
                        print("startRecording:",self.botId)
                        print("stopRecording:",self.recordingState)
                        // 启动定时器
                        self.refreshTimer = Timer.scheduledTimer(withTimeInterval: 1.0, repeats: true) { _ in
                            self.fetchTranscript()
                        }
                    }
                } else {
                    DispatchQueue.main.async {
                        self.recordingState = "error"
                        print("startRecording:",self.recordingState)
                        print("startRecording:",httpResponse.statusCode)
                    }
                }
            }
        }

        task.resume()
    }

    func stopRecording() {
        guard let botId = botId else {
            print("No botId to stop recording")
            // 恢复到 startRecording 的状态或提供适当的错误处理
            DispatchQueue.main.async {
                self.recordingState = "stopped"
                print("stopRecording: No botId, resetting to stopped state")
            }
            return
        }

        recordingState = "stopping"

        let url = "https://us-west-2.recall.ai/api/v1/bot/\(botId)/leave_call"
        var request = URLRequest(url: URL(string: url)!)
        request.httpMethod = "POST"
        request.addValue("Token \(recallApiKey)", forHTTPHeaderField: "Authorization")
        request.addValue("application/json", forHTTPHeaderField: "Content-Type")

        let task = URLSession.shared.dataTask(with: request) { data, response, error in
            guard let _ = data, error == nil else {
                print("Error: \(error?.localizedDescription ?? "Unknown error")")
                return
            }

            if let httpResponse = response as? HTTPURLResponse {
                if httpResponse.statusCode <= 299 {
                    DispatchQueue.main.async {
                        self.recordingState = "bot-leaving"
                        self.recordingState = "stopped"
                        print("stopRecording:",self.recordingState)
                        // 停止定时器
                        self.refreshTimer?.invalidate()
                        self.refreshTimer = nil
                    }
                } else {
                    DispatchQueue.main.async {
                        self.recordingState = "error"
                        print("stopRecording:",self.recordingState)
                        print("stopRecording:",httpResponse.statusCode)
                    }
                }
            }
        }

        task.resume()
    }

    func fetchTranscript() {
            guard let botId = botId else {
                print("No botId to fetchTranscript")
                return
            }
            let url = "https://us-west-2.recall.ai/api/v1/bot/\(botId)/transcript/?enhanced_diarization=true"
            var request = URLRequest(url: URL(string: url)!)
            request.httpMethod = "GET"
            request.addValue("Token \(recallApiKey)", forHTTPHeaderField: "Authorization")
            request.addValue("application/json", forHTTPHeaderField: "Content-Type")

            URLSession.shared.dataTask(with: request) { data, response, error in
                if let error = error {
                    self.updateTranscriptText(text: "Error: \(error.localizedDescription)")
                    return
                }

                guard let data = data else {
                    self.updateTranscriptText(text: "No data received")
                    return
                }

                do {
                    let transcripts = try JSONDecoder().decode([Transcript].self, from: data)
                    var transcriptText = ""
                    for transcript in transcripts {
                        transcriptText += "Speaker: \(transcript.speaker)\n"
                        for word in transcript.words {
                            transcriptText += "\(word.text) "
                        }
                        transcriptText += "\n"
                    }
                    self.updateTranscriptText(text: transcriptText)
                } catch {
                    self.updateTranscriptText(text: "Decoding error: \(error.localizedDescription)")
                }
            }.resume()
        }

        func updateTranscriptText(text: String) {
            DispatchQueue.main.async {
                self.transcriptText = text
            }
        }
    }

    // 定义 JSON 数据的结构
    struct Transcript: Codable {
        let words: [Word]
        let speaker: String
        let speaker_id: Int
        let language: String?
    }

    struct Word: Codable {
        let text: String
        let start_timestamp: Double
        let end_timestamp: Double
        let language: String?
        let confidence: Double?
    }

    struct BotResponse: Codable {
        let id: String
    }

六、在远程(海外)启动zoom客户端新建一个会议

七、复制会议地址

八、运行ios程序,输入会议地址,加入会议,开始转录(最终效果)

九、由于本机远程重定向了语音,所以iOS User的语音没有打开(会导致程序崩溃)。

本文来自互联网用户投稿,该文观点仅代表作者本人,不代表本站立场。本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。如若转载,请注明出处:http://www.coloradmin.cn/o/2079047.html

如若内容造成侵权/违法违规/事实不符,请联系多彩编程网进行投诉反馈,一经查实,立即删除!

相关文章

Swift-UITableView列表动态设置高度,根据不同的内容长度,设置heightForRowAt

此篇文章主要阐述如何利用swift语言&#xff0c;实现返回内容不同长度文本的高度&#xff0c;比如第一个列表文字1行&#xff0c;只需要50像素高度&#xff0c;第二个列表文字超出了1行&#xff0c;如2行&#xff0c;那么就自动调整这个单元文本的高度&#xff1b; 用MVC实现&…

给房子“养老”,你准备好了吗?

文&#xff5c;琥珀食酒社 作者 | 积溪 真崩不住了啊 一觉醒来 朋友圈被房屋养老金刷屏了 有人说买房如买“爹”&#xff0c;真的好费钱 有的说咱自己的养老还没着落呢 未来还得给房子养老&#xff1f; 当然&#xff0c;这事已经被辟谣了 说公共账户不需要咱老百姓额外…

力扣经典题目之->相同的树(递归判断两颗二叉树是否相同)

一&#xff1a;题目 二&#xff1a;代码 三&#xff1a;递归展开 第一种模型&#xff1a; 递归展开图&#xff1a; 左&#xff1a; 右&#xff1a; 第二种模型及其递归展开图&#xff1a; 解释&#xff1a; 递归思路即&#xff1a;根相同&#xff0c;左子树相同&#xff0c;…

cdga|制造业、工程设计行业、创投行业的数据治理痛点与解决方案

在当今数字化时代&#xff0c;数据已成为企业核心资产&#xff0c;数据治理成为推动企业数字化转型和高质量发展的关键。然而&#xff0c;不同行业在数据治理过程中面临着不同的痛点与挑战。 今天小编来和大家聊聊制造业、工程设计行业、创投行业的数据治理痛点进行详细分析&a…

【java计算机毕设】网上商城MySQL springcloud vue HTML maven项目设计源码带项目报告PPT 前后端可分离也可不分离

目录 1项目功能 2项目介绍 3项目地址 1项目功能 【java计算机毕设】网上商城MySQL springcloud vue HTML maven项目设计源码带项目报告PPT 前后端可分离也可不分离 2项目介绍 系统功能&#xff1a; 网上商城包括管理员、用户两种角色。 管理员功能包括个人中心模块用于修改…

Java | Leetcode Java题解之第375题猜数字大小II

题目&#xff1a; 题解&#xff1a; class Solution {public int getMoneyAmount(int n) {int[][] f new int[n 1][n 1];for (int i n - 1; i > 1; i--) {for (int j i 1; j < n; j) {f[i][j] j f[i][j - 1];for (int k i; k < j; k) {f[i][j] Math.min(f[…

leetcode 560 和为k 的子数组

leetcode 560 和为k 的子数组 正文一般解法字典方法 正文 一般解法 class Solution:def subarraySum(self, nums: List[int], k: int) -> int:number 0for i in range(len(nums)):for j in range(i , len(nums)):if sum(nums[i:j 1]) k:number 1return number上述方法虽…

北斗卫星导航系统的应用落地,改变未来出行方式

近年来&#xff0c;随着北斗卫星导航系统在全球范围内的部署和完善&#xff0c;它的应用范围不断扩大&#xff0c;正逐渐成为数字化出行时代的重要基础设施。从智能导航到车联网&#xff0c;从航空导航到陆地测绘&#xff0c;北斗卫星导航系统的应用正在深入各个领域&#xff0…

视频单条剪、脚本靠手写?云微客开启海量视频时代

老板们注意了&#xff0c;现在已不再是视频单条剪&#xff0c;脚本靠手写的时代&#xff01;在这个信息爆炸的时代&#xff0c;短视频已经成为了现代信息传播和娱乐消费的重要载体&#xff0c;那么我们该如何高效、快速地制作出大量高质量的短视频内容呢&#xff1f;这就需要云…

TRIZ理论在手术机器人功能区设计中的应用

TRIZ&#xff0c;全称为“Theory of Inventive Problem Solving”&#xff0c;是一套系统化地分析和解决复杂问题的理论工具。它不仅能够预测技术系统的发展趋势&#xff0c;还能提供一套高效的问题解决策略&#xff0c;帮助设计师突破思维定势&#xff0c;实现突破性创新。在手…

视频转换成MP3怎么转?这里有快速转换通道

视频转换成MP3怎么转&#xff1f;在数字化时代&#xff0c;视频和音频内容无处不在&#xff0c;我们时常需要将视频中的音频提取出来&#xff0c;以便在特定场合下单独播放或编辑。将视频转换成MP3音频格式是一种常见且实用的需求。为了帮助你轻松实现这一操作&#xff0c;本文…

openlayers10+vue3+ts

在 Vue 3 应用程序中使用 Vite 工具链和 OpenLayers10 创建一个简单的地图实例&#xff0c;并实现一些基础的地图交互功能。 Demo 地图初始化 底图加载与切换 GeoJSON 数据的加载与导出 绘制功能 轨迹回放功能 使用 VectorLayer postrender 实现丝滑的轨迹运动效果。

基于Java的音乐网站与分享平台

你好&#xff0c;我是音乐技术爱好者&#xff0c;专注于音乐与技术的结合。如需交流或合作&#xff0c;请联系我。 开发语言&#xff1a;Java 数据库&#xff1a;MySQL 技术&#xff1a;Java语言&#xff0c;Spring Boot框架&#xff0c;B/S架构 工具&#xff1a;Eclipse&a…

007、架构_MDS

​架构 什么是元数据 什么是元数据 元数据又称中介数据、中继数据,为描述数据的数据,主要是描述数据属性的信息,用来支持如指示存储位置、历史数据、资源查找、文件记录等功能;GoldenDB 数据库元数据大致分为两类: 数据字典:库、表、字段属性信息、视图、函数、存储过程属…

【数据结构-前缀异或】力扣1310. 子数组异或查询

有一个正整数数组 arr&#xff0c;现给你一个对应的查询数组 queries&#xff0c;其中 queries[i] [Li, Ri]。 对于每个查询 i&#xff0c;请你计算从 Li 到 Ri 的 XOR 值&#xff08;即 arr[Li] xor arr[Li1] xor … xor arr[Ri]&#xff09;作为本次查询的结果。 并返回一…

SpringBoot2:依赖管理与自动配置

一、依赖管理 什么叫依赖管理&#xff1f; 我们做过Maven项目的&#xff0c;都知道pom.xml的作用。里面配置了一大堆的包依赖。 所以&#xff0c;SpringBoot的依赖管理&#xff0c;意思就是&#xff0c;我们用SpringBoot开发web应用&#xff0c;那么&#xff0c;相关的依赖包&…

添加专辑失败,获取 userId 为空

文章目录 1、debug发现问题2、发现 userId 为空3、GuiGuAspect4、GuiGuLogin 1、debug发现问题 2、发现 userId 为空 点击 getUserId() 进入方法内部 package com.atguigu.tingshu.common.util;/*** 获取当前用户信息帮助类*/ public class AuthContextHolder {private stati…

【Python】copy()浅拷贝与深拷贝

前言 由于python关于传参的方面和C语言有些出入&#xff0c;对于先学C在学Python的可能需要做些笔记&#xff0c;比如Python中def传参是直接传址&#xff0c;而不是传值创建局部变量等等...而到了copy函数感觉又是个新概念... 1. copy介绍 1.1 copy() 浅拷贝 Python 的 cop…

如何解决 Compute 节点上的内存溢出(OOM)问题

内存溢出&#xff08;Out-of-memory&#xff09;是数据处理系统中常见的问题&#xff0c;本文将分析 OOM 的各种原因并提供有效的解决方法。 RisingWave 使用像 AWS S3 这样的共享存储&#xff0c;并将 Compute 节点的内存用作缓存以增强流处理性能。缓存以 Least Recently Us…

最新盘点!推荐10款简单易用的进销存软件!

本文将会盘点10款比较简单的进销存软件&#xff1a; 简道云、秦丝生意通、管家婆、金蝶精斗云、用友 T、百胜软件、速达软件、商陆花、Zoho Inventory、QuickBooks。 进销存软件就如同企业的得力助手。它能把企业的进货、销售和库存管理得妥妥当当&#xff0c;让企业清楚地掌握…