In Faster Whisper Serverless, how to get transcribe result?

In python code, I sent request :

   # S3 bucket and key for the audio file
    s3 = boto3.client('s3')
    # RunPog API configuration

    presigned_url = s3.generate_presigned_url(
        'get_object',
        Params={'Bucket': BUCKET_NAME, 'Key': av_path},
        ExpiresIn=3600  # valid for 1 hour
    )

    print(presigned_url)

    payload = {
        "input": {
            "audio_base64": presigned_url,
            "model": "large-v3",
            "language": "en",
            "beam_size": 5,
            "vad_filter": True
        }
    }

    headers = {
        "Authorization": f"Bearer {RUNPOD_API_KEY}",
        "Content-Type": "application/json"
    }

    start_time = time.time()
    response = requests.post(
        f"https://api.runpod.ai/v2/{ENDPOINT_ID}/run",
        json=payload,
        headers=headers
    )
    job = response.json()
    print(f"Response data: {job}")
    job_id = job.get("id")
    print(f"Submitted job: {job_id}")

    # Step 2: Poll until complete
    status_url = f"https://api.runpod.ai/v2/{ENDPOINT_ID}/status/{job_id}"
    while True:
        time.sleep(3)
        status_response = requests.get(status_url, headers=headers)
        status = status_response.json()
        if status["status"] == "COMPLETED":
            break
        elif status["status"] == "FAILED":
            raise Exception("Transcription job failed.")
        else:
            print(f"Job status: {status}")
#            print(f"Job status: {status['status']}")

   # S3 bucket and key for the audio file
    s3 = boto3.client('s3')
    # RunPog API configuration

    presigned_url = s3.generate_presigned_url(
        'get_object',
        Params={'Bucket': BUCKET_NAME, 'Key': av_path},
        ExpiresIn=3600  # valid for 1 hour
    )

    print(presigned_url)

    payload = {
        "input": {
            "audio_base64": presigned_url,
            "model": "large-v3",
            "language": "en",
            "beam_size": 5,
            "vad_filter": True
        }
    }

    headers = {
        "Authorization": f"Bearer {RUNPOD_API_KEY}",
        "Content-Type": "application/json"
    }

    start_time = time.time()
    response = requests.post(
        f"https://api.runpod.ai/v2/{ENDPOINT_ID}/run",
        json=payload,
        headers=headers
    )
    job = response.json()
    print(f"Response data: {job}")
    job_id = job.get("id")
    print(f"Submitted job: {job_id}")

    # Step 2: Poll until complete
    status_url = f"https://api.runpod.ai/v2/{ENDPOINT_ID}/status/{job_id}"
    while True:
        time.sleep(3)
        status_response = requests.get(status_url, headers=headers)
        status = status_response.json()
        if status["status"] == "COMPLETED":
            break
        elif status["status"] == "FAILED":
            raise Exception("Transcription job failed.")
        else:
            print(f"Job status: {status}")
#            print(f"Job status: {status['status']}")

I am always get status data:

Status:  {'delayTime': 1164, 'executionTime': 40, 'id': '2db7b7e9-707d-4e52-86c7-4313c968dec5-e1', 'status': 'COMPLETED', 'workerId': 'r1de9b8p7btmh1'}

Status:  {'delayTime': 1164, 'executionTime': 40, 'id': '2db7b7e9-707d-4e52-86c7-4313c968dec5-e1', 'status': 'COMPLETED', 'workerId': 'r1de9b8p7btmh1'}

There is no transcript data. How to get it? I don't see any document. Please help!

Runpod•9mo ago•

13 replies

nqcuong

In Faster Whisper Serverless, how to get transcribe result?

In python code, I sent request :

   # S3 bucket and key for the audio file
    s3 = boto3.client('s3')
    # RunPog API configuration

    presigned_url = s3.generate_presigned_url(
        'get_object',
        Params={'Bucket': BUCKET_NAME, 'Key': av_path},
        ExpiresIn=3600  # valid for 1 hour
    )

    print(presigned_url)

    payload = {
        "input": {
            "audio_base64": presigned_url,
            "model": "large-v3",
            "language": "en",
            "beam_size": 5,
            "vad_filter": True
        }
    }

    headers = {
        "Authorization": f"Bearer {RUNPOD_API_KEY}",
        "Content-Type": "application/json"
    }

    start_time = time.time()
    response = requests.post(
        f"https://api.runpod.ai/v2/{ENDPOINT_ID}/run",
        json=payload,
        headers=headers
    )
    job = response.json()
    print(f"Response data: {job}")
    job_id = job.get("id")
    print(f"Submitted job: {job_id}")

    # Step 2: Poll until complete
    status_url = f"https://api.runpod.ai/v2/{ENDPOINT_ID}/status/{job_id}"
    while True:
        time.sleep(3)
        status_response = requests.get(status_url, headers=headers)
        status = status_response.json()
        if status["status"] == "COMPLETED":
            break
        elif status["status"] == "FAILED":
            raise Exception("Transcription job failed.")
        else:
            print(f"Job status: {status}")
#            print(f"Job status: {status['status']}")

   # S3 bucket and key for the audio file
    s3 = boto3.client('s3')
    # RunPog API configuration

    presigned_url = s3.generate_presigned_url(
        'get_object',
        Params={'Bucket': BUCKET_NAME, 'Key': av_path},
        ExpiresIn=3600  # valid for 1 hour
    )

    print(presigned_url)

    payload = {
        "input": {
            "audio_base64": presigned_url,
            "model": "large-v3",
            "language": "en",
            "beam_size": 5,
            "vad_filter": True
        }
    }

    headers = {
        "Authorization": f"Bearer {RUNPOD_API_KEY}",
        "Content-Type": "application/json"
    }

    start_time = time.time()
    response = requests.post(
        f"https://api.runpod.ai/v2/{ENDPOINT_ID}/run",
        json=payload,
        headers=headers
    )
    job = response.json()
    print(f"Response data: {job}")
    job_id = job.get("id")
    print(f"Submitted job: {job_id}")

    # Step 2: Poll until complete
    status_url = f"https://api.runpod.ai/v2/{ENDPOINT_ID}/status/{job_id}"
    while True:
        time.sleep(3)
        status_response = requests.get(status_url, headers=headers)
        status = status_response.json()
        if status["status"] == "COMPLETED":
            break
        elif status["status"] == "FAILED":
            raise Exception("Transcription job failed.")
        else:
            print(f"Job status: {status}")
#            print(f"Job status: {status['status']}")

I am always get status data:

Status:  {'delayTime': 1164, 'executionTime': 40, 'id': '2db7b7e9-707d-4e52-86c7-4313c968dec5-e1', 'status': 'COMPLETED', 'workerId': 'r1de9b8p7btmh1'}

Status:  {'delayTime': 1164, 'executionTime': 40, 'id': '2db7b7e9-707d-4e52-86c7-4313c968dec5-e1', 'status': 'COMPLETED', 'workerId': 'r1de9b8p7btmh1'}

There is no transcript data. How to get it? I don't see any document. Please help!

In Faster Whisper Serverless, how to get transcribe result?

Similar Threads

In Faster Whisper Serverless, how to get transcribe result?

Similar Threads

Similar Threads

Similar Threads