jarvis-server-v2/jarvis/api.py

import json
import tempfile
from threading import Lock

import requests
from flask import Flask, request, jsonify
from flask_socketio import SocketIO, emit, join_room, leave_room, \
    rooms
from pywhispercpp.model import Model

from jarvis.skills.intent_services import intent_manager

# Set this variable to "threading", "eventlet" or "gevent" to test the
# different async modes, or leave it set to None for the application to choose
# the best option based on installed packages.
async_mode = None

# Flask application and the Socket.IO server wrapped around it; both are
# created at import time and shared by every handler in this module.
app = Flask(__name__)
# NOTE(review): hard-coded placeholder secret -- presumably this should be
# loaded from configuration before any real deployment; confirm.
app.config['SECRET_KEY'] = 'secret!'
socketio = SocketIO(app, async_mode=async_mode)
# `thread` and `thread_lock` are not read or reassigned by any code visible in
# this file. NOTE(review): possibly leftovers from a background-task example;
# verify before removing.
thread = None
thread_lock = Lock()
# Speech-to-text model used by whisper_cpp_stt(); constructed once when the
# module is imported. 'small' is presumably the model size name -- confirm
# against the pywhispercpp documentation.
model = Model('small')


@app.route('/')
def index():
    """Serve the plain-text greeting returned at the API root."""
    greeting = "Welcome to Jarvis Server API !"
    return greeting


@socketio.event
def process_message(message):
    """Handle a ``process_message`` Socket.IO event.

    ``message`` is a JSON string whose decoded object provides ``uuid`` (used
    as the room identifier) and ``data`` (the text to process). The text is
    passed to the intent manager and then emitted to the room as a Jarvis
    message.
    """
    payload = json.loads(message)

    room_id = payload['uuid']
    print("New PROCESS request from room " + room_id)

    text = payload['data']
    print("Message : " + text)
    # TODO: maybe implement grammar check ?

    intent_manager.recognise(text, room_id)

    # The received text itself is what gets sent back to the room.
    send_jarvis_message_to_room(text, room_id)


@socketio.event
def join(message):
    """Handle a ``join`` Socket.IO event.

    ``message`` is a JSON string; the ``uuid`` field of the decoded object
    names the room the calling client is added to.
    """
    room_id = json.loads(message)['uuid']
    print("New client joined room " + room_id)
    join_room(room_id)


@socketio.event
def leave(message):
    """Handle a ``leave`` Socket.IO event.

    Removes the calling client from the room named by the payload's ``uuid``
    field, then replies with a ``my_response`` event listing the rooms the
    client is still in.

    ``message`` may be a JSON string (the format the ``join`` and
    ``process_message`` handlers decode) or an already-decoded mapping.
    """
    # The sibling handlers receive JSON text; indexing a raw string with
    # 'uuid' would raise TypeError, so decode it first when needed.
    if isinstance(message, (str, bytes, bytearray)):
        message = json.loads(message)

    leave_room(message['uuid'])
    emit('my_response', 'In rooms: ' + ', '.join(rooms()))


@socketio.event
def connect():
    """Acknowledge a new Socket.IO connection.

    Replies to the connecting client with a ``my_response`` event carrying
    ``{'data': 'Connected', 'count': 0}``.
    """
    # The former `global thread` declaration was dropped: the name was never
    # read or assigned in this handler.
    emit('my_response', {'data': 'Connected', 'count': 0})


def send_user_message_to_room(text, room_id):
    """Emit ``text`` to the room ``room_id`` as a ``message_from_user`` event.

    The event payload carries the text under ``data`` and the room identifier
    under ``uuid``.
    """
    payload = {'data': text, "uuid": room_id}
    socketio.emit('message_from_user', payload, to=room_id)


def send_jarvis_message_to_room(text, room_id):
    """Emit ``text`` to the room ``room_id`` as a ``message_from_jarvis`` event.

    The event payload carries the text under ``data`` and the room identifier
    under ``uuid``.
    """
    payload = {'data': text, "uuid": room_id}
    socketio.emit('message_from_jarvis', payload, to=room_id)


# Audio file (e.g. .wav) request
@app.route("/get_text_from_audio", methods=['POST'])
def get_text_from_audio():
    """Transcribe the audio sent in the POST body and return the text.

    The raw request body is written to a named temporary file whose path is
    handed to ``whisper_cpp_stt``.

    Returns:
        A dict with the transcription under ``data`` and the literal string
        ``"null"`` under ``uuid``.
    """
    print("[" + request.remote_addr + "] - New STT request")

    # The context manager closes (and thereby removes) the temporary file even
    # if transcription raises.
    with tempfile.NamedTemporaryFile(prefix='jarvis-audio_', suffix='_client') as audio_temp_file:
        audio_temp_file.write(request.data)
        # The transcriber opens the file by path, so the buffered bytes must
        # be flushed to disk first; otherwise it may see a truncated file.
        audio_temp_file.flush()

        # Alternative remote backend: whisper_stt(audio_temp_file.name)
        text = whisper_cpp_stt(audio_temp_file.name)

    print(text)

    return {"data": text, "uuid": "null"}


"""
@app.route("/process_text", methods=['POST'])
def process_text():
    print("[" + request.remote_addr + "] - New TXT request")

    text = request.values['text']

    answer = intent_manager.recognise(text, request.headers.get('Client-Ip'), request.headers.get('Client-Port'))

    return {"transcription": text, "answer": answer}"""


# send request to whisper-asr server (docker)
def whisper_stt(audio_file):
    """Transcribe ``audio_file`` by posting it to the remote whisper ASR endpoint.

    Args:
        audio_file: Path of the audio file to upload.

    Returns:
        The value of the ``text`` field of the JSON response.

    Raises:
        requests.HTTPError: If the server answers with an error status.
    """
    headers = {
        'accept': 'application/json',
        # 'Content-Type': 'multipart/form-data',
    }

    params = {
        'task': 'transcribe',
        # TODO: add to config
        'language': 'fr',
        'output': 'json',
    }

    # Open the upload inside a context manager so the handle is always
    # closed, including when the request itself fails.
    with open(audio_file, 'rb') as audio_stream:
        # TODO: add to config
        response = requests.post(
            'https://whisper.broillet.ch/asr',
            params=params,
            headers=headers,
            files={'audio_file': audio_stream},
        )

    # Surface HTTP failures directly instead of as a confusing JSON decoding
    # or missing-key error further down.
    response.raise_for_status()
    return json.loads(response.text)['text']


def whisper_cpp_stt(audio_file):
    """Transcribe ``audio_file`` with the module-level whisper model.

    Args:
        audio_file: Path of the audio file handed to ``model.transcribe``.

    Returns:
        The text of every returned segment, each followed by a single space
        (so a non-empty result ends with a trailing space).
    """
    segments = model.transcribe(audio_file, speed_up=False, translate=False)

    # Merge all segments into one string.
    return ''.join(segment.text + ' ' for segment in segments)


def start_server():
    """Run the Socket.IO server on all interfaces, port 6000."""
    run_options = {
        'host': '0.0.0.0',
        'port': 6000,
        'allow_unsafe_werkzeug': True,
    }
    socketio.run(app, **run_options)
Base 2022-11-28 21:56:08 +01:00			`import json`
			`import tempfile`
websockets stuff 2022-12-02 15:45:17 +01:00			`from threading import Lock`
Base 2022-11-28 21:56:08 +01:00
			`import requests`
added whisper cpp 2023-03-14 21:42:14 +01:00			`from flask import Flask, request, jsonify`
websockets stuff 2022-12-02 15:45:17 +01:00			`from flask_socketio import SocketIO, emit, join_room, leave_room, \`
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`rooms`
added whisper cpp 2023-03-14 21:42:14 +01:00			`from pywhispercpp.model import Model`
Base 2022-11-28 21:56:08 +01:00
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`from jarvis.skills.intent_services import intent_manager`
websockets stuff 2022-12-02 15:45:17 +01:00
			`# Set this variable to "threading", "eventlet" or "gevent" to test the`
			`# different async modes, or leave it set to None for the application to choose`
			`# the best option based on installed packages.`
			`async_mode = None`
started re-implementing old intent system 2022-12-01 16:06:23 +01:00
Base 2022-11-28 21:56:08 +01:00			`app = Flask(__name__)`
websockets stuff 2022-12-02 15:45:17 +01:00			`app.config['SECRET_KEY'] = 'secret!'`
			`socketio = SocketIO(app, async_mode=async_mode)`
			`thread = None`
			`thread_lock = Lock()`
added whisper cpp 2023-03-14 21:42:14 +01:00			`model = Model('small')`
websockets stuff 2022-12-02 15:45:17 +01:00

			`@app.route('/')`
			`def index():`
			`return "Welcome to Jarvis Server API !"`


			`@socketio.event`
			`def process_message(message):`
			`message = json.loads(message)`
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`print("New PROCESS request from room " + message['uuid'])`
websockets stuff 2022-12-02 15:45:17 +01:00
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`print("Message : " + message['data'])`
			`# TODO: maybe implement grammar check ?`
websockets stuff 2022-12-02 15:45:17 +01:00
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`intent_manager.recognise(message['data'], message['uuid'])`
websockets stuff 2022-12-02 15:45:17 +01:00
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`send_jarvis_message_to_room(message['data'], message['uuid'])`
websockets stuff 2022-12-02 15:45:17 +01:00

			`@socketio.event`
			`def join(message):`
			`message = json.loads(message)`
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`print("New client joined room " + message['uuid'])`
websockets stuff 2022-12-02 15:45:17 +01:00			`join_room(message['uuid'])`


			`@socketio.event`
			`def leave(message):`
			`leave_room(message['uuid'])`
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`emit('my_response', 'In rooms: ' + ', '.join(rooms()))`
websockets stuff 2022-12-02 15:45:17 +01:00

			`@socketio.event`
			`def connect():`
			`global thread`
			`emit('my_response', {'data': 'Connected', 'count': 0})`


			`def send_user_message_to_room(text, room_id):`
			`socketio.emit('message_from_user', {'data': text, "uuid": room_id}, to=room_id)`


			`def send_jarvis_message_to_room(text, room_id):`
			`socketio.emit('message_from_jarvis', {'data': text, "uuid": room_id}, to=room_id)`
Base 2022-11-28 21:56:08 +01:00

			`# .WAV (i.e.) FILE REQUEST`
websockets stuff 2022-12-02 15:45:17 +01:00			`@app.route("/get_text_from_audio", methods=['POST'])`
			`def get_text_from_audio():`
Base 2022-11-28 21:56:08 +01:00			`print("[" + request.remote_addr + "] - New STT request")`

			`audio_temp_file = tempfile.NamedTemporaryFile(prefix='jarvis-audio_', suffix='_client')`
			`audio_temp_file.write(request.data)`

added whisper cpp 2023-03-14 21:42:14 +01:00			`# text = whisper_stt(audio_temp_file.name)`
			`text = whisper_cpp_stt(audio_temp_file.name)`
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00			`print(text)`
started re-implementing old intent system 2022-12-01 16:06:23 +01:00
websockets stuff 2022-12-02 15:45:17 +01:00			`return {"data": text, "uuid": "null"}`
started re-implementing old intent system 2022-12-01 16:06:23 +01:00
remade the skill system and implemented test skill 2022-12-04 15:27:45 +01:00
websockets stuff 2022-12-02 15:45:17 +01:00			`"""`
started re-implementing old intent system 2022-12-01 16:06:23 +01:00			`@app.route("/process_text", methods=['POST'])`
			`def process_text():`
			`print("[" + request.remote_addr + "] - New TXT request")`

			`text = request.values['text']`

			`answer = intent_manager.recognise(text, request.headers.get('Client-Ip'), request.headers.get('Client-Port'))`

websockets stuff 2022-12-02 15:45:17 +01:00			`return {"transcription": text, "answer": answer}"""`
Base 2022-11-28 21:56:08 +01:00

			`# send request to whisper-asr server (docker)`
websockets stuff 2022-12-02 15:45:17 +01:00			`def whisper_stt(audio_file):`
Base 2022-11-28 21:56:08 +01:00			`headers = {`
			`'accept': 'application/json',`
			`# 'Content-Type': 'multipart/form-data',`
			`}`

			`params = {`
			`'task': 'transcribe',`
			`# TODO: add to config`
			`'language': 'fr',`
			`'output': 'json',`
			`}`

			`files = {`
			`'audio_file': open(audio_file, 'rb'),`
			`}`

			`# TODO: add to config`
corrected url 2022-11-28 22:15:09 +01:00			`response = requests.post('https://whisper.broillet.ch/asr', params=params, headers=headers, files=files)`
Base 2022-11-28 21:56:08 +01:00			`return json.loads(response.text)['text']`


added whisper cpp 2023-03-14 21:42:14 +01:00			`def whisper_cpp_stt(audio_file):`
			`segments = model.transcribe(audio_file, speed_up=False, translate=False)`

			`# combines all segments in one string`
			`text = ''`
			`for segment in segments:`
			`text += segment.text + ' '`

			`return text`


Base 2022-11-28 21:56:08 +01:00			`def start_server():`
websockets stuff 2022-12-02 15:45:17 +01:00			`socketio.run(app, host='0.0.0.0', port=6000, allow_unsafe_werkzeug=True)`