transcribe_wavs/transcribe.py

import requests
import argparse
import psycopg2
import json
import os
from dotenv import load_dotenv

load_dotenv()
db_host = os.getenv('DB_HOST')
db_name = os.getenv('DB_NAME')
db_user = os.getenv('DB_USER')
db_password = os.getenv('DB_PASSWORD')
openai_api_key = os.getenv('OPENAI_API_KEY')

# Set up the database connection
conn = psycopg2.connect(
     host=       db_host
    ,database=   db_name
    ,user=       db_user
    ,password=   db_password
    ,connect_timeout = 120
)

# Define the API endpoint and headers
url = 'https://api.openai.com/v1/audio/translations'
headers = {
    'Authorization': f'Bearer {openai_api_key}'
}
params = {
    'model': 'whisper-1',
    'response_format': 'vtt'
}
data = {
    'model': 'whisper-1'
}

# Parse command-line arguments
parser = argparse.ArgumentParser()
parser.add_argument('dir_path', help='path to directory containing audio files to transcribe')
args = parser.parse_args()

# Define the audio file to be transcribed
for file_name in os.listdir(args.dir_path):
    if file_name.endswith('.wav'):
        file_path = os.path.join(args.dir_path, file_name)
        file_name = os.path.basename(file_path)
        file_date = file_name[:10]

        # Check if there is a row in the database with a matching filename
        cur = conn.cursor()
        cur.execute("SELECT COUNT(*) FROM rlarp.thirtysec WHERE filename = %s", (file_name,))
        count = cur.fetchone()[0]
        cur.close()
        if count > 0:
            print(f"Skipping {file_name} (already processed)")
            continue

        # Send the transcription request and retrieve the results
        audio_file = open(file_path, 'rb')
        response = requests.post(url, headers=headers, params=params, data=data, files={'file': audio_file})
        transcript = response.text

        print(response.text)

        # Insert the JSON summary into the database
        cur = conn.cursor()
        cur.execute("INSERT INTO rlarp.thirtysec (filename, mdate, message) VALUES (%s, %s, %s);", (file_name, file_date, response.text))
        conn.commit()
        cur.close()

#close db connection
conn.close()
python script to read wav files, call openai api, and write contents to database 2023-03-27 11:27:12 -04:00			`import requests`
make target folder an argument 2023-03-27 11:34:47 -04:00			`import argparse`
python script to read wav files, call openai api, and write contents to database 2023-03-27 11:27:12 -04:00			`import psycopg2`
			`import json`
			`import os`
			`from dotenv import load_dotenv`

			`load_dotenv()`
			`db_host = os.getenv('DB_HOST')`
			`db_name = os.getenv('DB_NAME')`
			`db_user = os.getenv('DB_USER')`
			`db_password = os.getenv('DB_PASSWORD')`
			`openai_api_key = os.getenv('OPENAI_API_KEY')`

			`# Set up the database connection`
			`conn = psycopg2.connect(`
			`host= db_host`
			`,database= db_name`
			`,user= db_user`
			`,password= db_password`
			`,connect_timeout = 120`
			`)`

			`# Define the API endpoint and headers`
			`url = 'https://api.openai.com/v1/audio/translations'`
			`headers = {`
			`'Authorization': f'Bearer {openai_api_key}'`
			`}`
			`params = {`
			`'model': 'whisper-1',`
			`'response_format': 'vtt'`
			`}`
			`data = {`
			`'model': 'whisper-1'`
			`}`

make target folder an argument 2023-03-27 11:34:47 -04:00			`# Parse command-line arguments`
			`parser = argparse.ArgumentParser()`
			`parser.add_argument('dir_path', help='path to directory containing audio files to transcribe')`
			`args = parser.parse_args()`

python script to read wav files, call openai api, and write contents to database 2023-03-27 11:27:12 -04:00			`# Define the audio file to be transcribed`
make target folder an argument 2023-03-27 11:34:47 -04:00			`for file_name in os.listdir(args.dir_path):`
python script to read wav files, call openai api, and write contents to database 2023-03-27 11:27:12 -04:00			`if file_name.endswith('.wav'):`
make target folder an argument 2023-03-27 11:34:47 -04:00			`file_path = os.path.join(args.dir_path, file_name)`
python script to read wav files, call openai api, and write contents to database 2023-03-27 11:27:12 -04:00			`file_name = os.path.basename(file_path)`
			`file_date = file_name[:10]`

			`# Check if there is a row in the database with a matching filename`
			`cur = conn.cursor()`
			`cur.execute("SELECT COUNT(*) FROM rlarp.thirtysec WHERE filename = %s", (file_name,))`
			`count = cur.fetchone()[0]`
			`cur.close()`
			`if count > 0:`
			`print(f"Skipping {file_name} (already processed)")`
			`continue`

			`# Send the transcription request and retrieve the results`
			`audio_file = open(file_path, 'rb')`
			`response = requests.post(url, headers=headers, params=params, data=data, files={'file': audio_file})`
			`transcript = response.text`

			`print(response.text)`

			`# Insert the JSON summary into the database`
			`cur = conn.cursor()`
			`cur.execute("INSERT INTO rlarp.thirtysec (filename, mdate, message) VALUES (%s, %s, %s);", (file_name, file_date, response.text))`
			`conn.commit()`
			`cur.close()`

			`#close db connection`
			`conn.close()`