Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Serval App MVP #192

Merged
merged 15 commits into from
Oct 24, 2023
Merged
Show file tree
Hide file tree
Changes from 10 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
13 changes: 13 additions & 0 deletions samples/ServalApp/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
### Running the Serval App
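Before running the app, verify that both `SERVAL_APP_EMAIL_PASSWORD` and `SERVAL_APP_PASSCODE` are set appropriately (`serval_app.py` reads `SERVAL_APP_EMAIL_PASSWORD` from the environment). The background email thread additionally needs `SERVAL_AUTH_URL`, `SERVAL_CLIENT_ID`, and `SERVAL_CLIENT_SECRET` in the environment to obtain its own access token.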
Then, run:
```
streamlit run serval_app.py
```

### Regenerating the Python Client
When the Serval API is updated, use the tool [swagger-to](https://pypi.org/project/swagger-to/) to generate a new `serval_client_module.py` using the following command:
```
swagger_to_py_client.py --swagger_path path/to/swagger.json --outpath serval_client_module.py
```
Note: You may need to delete the authorization-related elements of the "swagger.json" before generating.
Binary file added samples/ServalApp/builds.db
Binary file not shown.
30 changes: 30 additions & 0 deletions samples/ServalApp/db.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,30 @@
from sqlalchemy.orm import declarative_base
from sqlalchemy import Column, MetaData, String, Enum, create_engine
import enum

class State(enum.Enum):
    """Build states that can be stored in the ``state`` column of ``builds``."""

    Pending = 0
    Active = 1
    Completed = 2
    Faulted = 3

# Table registry for this module; clear_and_regenerate_tables() drops and
# recreates everything registered on it.
metadata = MetaData()
# Declarative base tied to that registry; the ORM models below derive from it.
Base = declarative_base(metadata=metadata)

class Build(Base):
    """ORM row describing one translation build tracked by the app.

    ``build_id`` and ``engine_id`` together form the primary key. ``email``
    is the address that receives notifications about the build, ``state`` is
    a ``State`` member and ``corpus_id`` names the corpus the build was
    started for.
    """

    __tablename__ = "builds"

    build_id = Column("build_id", String, primary_key=True)
    engine_id = Column("engine_id", String, primary_key=True)
    email = Column("email", String)
    state = Column("state", Enum(State))
    corpus_id = Column("corpus_id", String)

    def __str__(self):
        """Render the row as the ``str()`` of a plain dict of its columns."""
        as_dict = {
            'build_id': self.build_id,
            'engine_id': self.engine_id,
            'email': self.email,
            'state': self.state,
            'corpus_id': self.corpus_id,
        }
        return str(as_dict)

    def __repr__(self):
        """Use the same text as ``__str__`` so log output is uniform."""
        return self.__str__()
def clear_and_regenerate_tables(db_url="sqlite:///builds.db"):
    """Drop every table registered on ``metadata`` and create it again.

    All rows stored in those tables are lost.

    Args:
        db_url: SQLAlchemy database URL to operate on. Defaults to the
            SQLite file used by the app.
    """
    engine = create_engine(db_url)
    try:
        metadata.drop_all(bind=engine)
        metadata.create_all(bind=engine)
    finally:
        # The engine is private to this call; release its pooled connections
        # instead of leaving them open until garbage collection.
        engine.dispose()
166 changes: 166 additions & 0 deletions samples/ServalApp/serval_app.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,166 @@
import streamlit as st
from streamlit.runtime.scriptrunner import add_script_run_ctx
from serval_client_module import *
from serval_auth_module import *
from sqlalchemy import create_engine
from sqlalchemy.orm import sessionmaker
from db import Build
from time import sleep
from threading import Thread
import os
from db import Build, State
from serval_email_module import ServalAppEmailServer
import re

def send_emails():
    """Poll Serval for every tracked build and email the owner on changes.

    Intended to run in a background thread. Every five minutes each row of
    the ``builds`` table is compared with the state reported by the Serval
    API:

    * a locally ``Pending`` build that Serval reports as "Active" triggers a
      "started" email and is stored as ``State.Active``;
    * "Completed" triggers an email carrying the pretranslations and removes
      the row;
    * "Faulted" and "Canceled" trigger a "faulted" email carrying the build
      message and remove the row;
    * any other state is only logged.

    The email password is read from ``SERVAL_APP_EMAIL_PASSWORD``. Any
    exception ends the loop; it is printed and
    ``st.session_state['background_process_has_started']`` is reset so that a
    later script run can start the thread again.
    """
    engine = create_engine("sqlite:///builds.db")
    Session = sessionmaker(bind=engine)
    session = Session()
    try:
        def started(build: Build, email_server: ServalAppEmailServer, data=None):
            print(f"\tStarted {build}")
            email_server.send_build_started_email(build.email)
            # Update the tracked row in place rather than deleting it and
            # inserting a copy with the same primary key.
            build.state = State.Active

        def faulted(build: Build, email_server: ServalAppEmailServer, data=None):
            print(f"\tFaulted {build}")
            session.delete(build)
            email_server.send_build_faulted_email(build.email, error=data)

        def completed(build: Build, email_server: ServalAppEmailServer, data=None):
            print(f"\tCompleted {build}")
            session.delete(build)
            pretranslations = client.translation_engines_get_all_pretranslations(build.engine_id, build.corpus_id)
            # One line per pretranslation: "ref1|ref2<TAB>translation".
            lines = [
                f"{'|'.join(pretranslation.refs)}\t{pretranslation.translation}"
                for pretranslation in pretranslations
            ]
            email_server.send_build_completed_email(build.email, '\n'.join(lines))

        def update(build: Build, email_server: ServalAppEmailServer, data=None):
            print(f"\tUpdated {build}")

        serval_auth = ServalBearerAuth()
        client = RemoteCaller(url_prefix="https://prod.serval-api.org", auth=serval_auth)
        # Remote state name -> handler; states not listed fall back to update().
        responses = {"Completed": completed, "Faulted": faulted, "Canceled": faulted}

        def get_update(build: Build, email_server: ServalAppEmailServer):
            build_update = client.translation_engines_get_build(id=build.engine_id, build_id=build.build_id)
            if build.state == State.Pending and build_update.state == "Active":
                started(build, email_server)
            else:
                handler = responses.get(build_update.state, update)
                handler(build, email_server, build_update.message)
            session.commit()

        def send_updates(email_server: ServalAppEmailServer):
            print("Checking for updates...")
            with session.no_autoflush:
                builds = session.query(Build).all()
                for build in builds:
                    try:
                        get_update(build, email_server)
                    except Exception as e:
                        print(f"\tFailed to update {build} because of exception {e}")
                        # Bare raise keeps the original traceback intact.
                        raise

        with ServalAppEmailServer(os.environ.get('SERVAL_APP_EMAIL_PASSWORD')) as email_server:
            while True:
                send_updates(email_server)
                sleep(300)  # Once every five minutes...
    except Exception as e:
        print(e)
        st.session_state['background_process_has_started'] = False
    finally:
        # The loop above only ends through an exception; release the database
        # resources this thread owns before it exits.
        session.close()
        engine.dispose()

# Start the polling thread at most once per server process.
# st.session_state is separate for every browser session, so a flag stored
# there cannot prevent a second session from starting a second poller (and
# therefore duplicate emails). A named thread can be looked up process-wide.
import threading  # only `Thread` is imported at the top of this file

CRON_THREAD_NAME = "serval-app-email-cron"
# threading.enumerate() lists only threads that are currently alive, so a
# poller that died is no longer found and gets restarted here.
cron_is_running = any(worker.name == CRON_THREAD_NAME for worker in threading.enumerate())
if not cron_is_running:
    cron_thread = Thread(target=send_emails, name=CRON_THREAD_NAME)
    add_script_run_ctx(cron_thread)
    cron_thread.start()
# Kept in sync because send_emails() resets this flag when it stops.
st.session_state['background_process_has_started'] = True

# Authorization gate. Until st.session_state['authorized'] is truthy the
# credential form is rendered; afterwards the stored credentials are exchanged
# for a token by constructing ServalBearerAuth.
serval_auth = None
if not st.session_state.get('authorized',False):
with st.form(key="Authorization Form"):
st.session_state['client_id'] = st.text_input(label='Client ID')
st.session_state['client_secret'] = st.text_input(label='Client Secret', type='password')
# Submitting only marks the session as authorized and reruns the script; the
# credentials themselves are checked on that rerun, in the else branch.
if st.form_submit_button("Authorize"):
st.session_state['authorized'] = True
st.rerun()
# This flag is set by the else branch when the previous attempt was rejected.
if st.session_state.get('authorization_failure', False):
st.error('Invalid credentials. Please check your credentials.')
else:
try:
# An empty field is replaced by "<invalid>" because ServalBearerAuth treats ""
# as "read this value from the environment instead".
serval_auth = ServalBearerAuth(client_id=st.session_state['client_id'] if st.session_state['client_id'] != "" else "<invalid>", client_secret=st.session_state['client_secret'] if st.session_state['client_secret'] != "" else "<invalid>")
except ValueError:
# ServalBearerAuth raises ValueError when no token could be fetched: record
# the failure and rerun so the form is shown again with the error message.
st.session_state['authorized'] = False
st.session_state['authorization_failure'] = True
st.rerun()
# Serval API client and a SQLAlchemy session on the local builds database;
# both are used by submit() and already_active_build_for().
# NOTE(review): if these lines run outside the else branch, serval_auth is
# still None here for visitors who have not authorized yet — confirm nesting.
client = RemoteCaller(url_prefix="https://prod.serval-api.org",auth=serval_auth)
engine = create_engine("sqlite:///builds.db")
Session = sessionmaker(bind=engine)
session = Session()

def submit():
    """Create an engine and corpus from the form input and start a build.

    Reads the languages, uploaded files and email address from
    ``st.session_state``, then, in order: creates an Nmt translation engine,
    uploads the source and target files, adds a corpus pairing them, starts a
    build that pretranslates that corpus, and records the build in the local
    ``builds`` table.

    At least one source file must have been uploaded.
    """
    form = st.session_state
    source_uploads = form['source_files']
    target_uploads = form['target_files']

    def is_zip(upload):
        # Uploads ending in ".zip" are sent as Paratext, everything else as Text.
        return upload.name.endswith('.zip')

    def create_data_files(uploads):
        # Upload each file and return the decoded API responses, in order.
        return [
            json.loads(client.data_files_create(upload, format="Paratext" if is_zip(upload) else "Text"))
            for upload in uploads
        ]

    def corpus_file_configs(created_files, uploads):
        # The upload's file name doubles as the text id.
        return [
            TranslationCorpusFileConfig(file_id=created['id'], text_id=upload.name)
            for created, upload in zip(created_files, uploads)
        ]

    engine_config = TranslationEngineConfig(
        source_language=form['source_language'],
        target_language=form['target_language'],
        type='Nmt',
        name=f'serval_app_engine:{form["email"]}',
    )
    engine = json.loads(client.translation_engines_create(engine_config))

    source_files = create_data_files(source_uploads)
    target_files = create_data_files(target_uploads)

    corpus_config = TranslationCorpusConfig(
        source_files=corpus_file_configs(source_files, source_uploads),
        target_files=corpus_file_configs(target_files, target_uploads),
        source_language=form['source_language'],
        target_language=form['target_language'],
    )
    corpus = json.loads(client.translation_engines_add_corpus(engine['id'], corpus_config))

    # The first source upload decides: a zip gets an empty text id list,
    # otherwise every source file name is listed.
    if is_zip(source_uploads[0]):
        text_ids = []
    else:
        text_ids = [upload.name for upload in source_uploads]
    build_config = TranslationBuildConfig(
        pretranslate=[PretranslateCorpusConfig(corpus_id=corpus["id"], text_ids=text_ids)],
        options="{\"max_steps\":10}",
    )
    build = json.loads(client.translation_engines_start_build(engine['id'], build_config))

    tracked_build = Build(
        build_id=build['id'],
        engine_id=engine['id'],
        email=form['email'],
        state=build['state'],
        corpus_id=corpus['id'],
    )
    session.add(tracked_build)
    session.commit()

def already_active_build_for(email: str):
    """Return True when the local builds table already has a row for ``email``.

    Args:
        email: Address to look up in the ``email`` column.

    Returns:
        bool: whether at least one tracked build belongs to that address.
    """
    # Only existence matters, so fetch at most one row instead of all of them.
    return session.query(Build).where(Build.email == email).first() is not None

# Neural machine translation request form. Every widget value is copied into
# st.session_state; validation messages are only rendered on a rerun that
# follows a rejected submission (tried_to_submit).
st.subheader("Neural Machine Translation")

tried_to_submit = st.session_state.get('tried_to_submit', False)
with st.form(key="NmtTranslationForm"):
st.session_state['source_language'] = st.text_input(label="Source language tag*", placeholder="en")
if st.session_state.get('source_language','') == '' and tried_to_submit:
st.error("Please enter a source language tag before submitting", icon='⬆️')

st.session_state['source_files'] = st.file_uploader(label="Source File(s)", accept_multiple_files=True)
if len(st.session_state.get('source_files',[])) == 0 and tried_to_submit:
st.error("Please upload a source file before submitting", icon='⬆️')
if len(st.session_state.get('source_files',[])) > 1:
st.warning('Please note that source and target text files will be paired together by file name', icon='💡')

st.session_state['target_language'] = st.text_input(label="Target language tag*", placeholder="es")
if st.session_state.get('target_language','') == '' and tried_to_submit:
st.error("Please enter a target language tag before submitting", icon='⬆️')

# Target files get no "missing file" error, unlike source files.
st.session_state['target_files'] = st.file_uploader(label="Target File(s)", accept_multiple_files=True)
if len(st.session_state.get('target_files',[])) > 1:
st.warning('Please note that source and target text files will be paired together by file name', icon='💡')

# NOTE(review): the placeholder below looks like an email-obfuscation artifact
# rather than a sample address — confirm the intended text.
st.session_state['email'] = st.text_input(label="Email", placeholder="[email protected]")
if st.session_state.get('email','') == '' and tried_to_submit:
st.error("Please enter an email address", icon='⬆️')
elif not re.match(r"^\S+@\S+\.\S+$", st.session_state['email']) and tried_to_submit:
st.error("Please enter a valid email address", icon='⬆️')
# Blank the stored address so the submit handler below treats it as missing.
st.session_state['email'] = ''
# Summary error for the rejected submission; the text is stored by the submit
# handler below, with a generic fallback when none was stored.
if tried_to_submit:
st.error(st.session_state.get('error',"Something went wrong. Please try again in a moment."))
if st.form_submit_button("Generate translations"):
# Only one tracked build per email address is allowed at a time.
if already_active_build_for(st.session_state['email']):
st.session_state['tried_to_submit'] = True
# NOTE(review): the message below contains a typo ("an a").
st.session_state['error'] = "There is already an a pending or active build associated with this email address. Please wait for the previous build to finish."
st.rerun()
# Required inputs: both language tags, at least one source file and an email.
elif st.session_state['source_language'] != '' and st.session_state['target_language'] != '' and len(st.session_state['source_files']) > 0 and st.session_state['email'] != '':
with st.spinner():
submit()
st.session_state['tried_to_submit'] = False
st.toast("Translations are on their way! You'll receive an email when your translation job has begun.")
# Presumably keeps the toast visible before the rerun redraws the page — confirm.
sleep(4)
st.rerun()
else:
st.session_state['tried_to_submit'] = True
st.session_state['error'] = "Some required fields were left blank. Please fill in all fields above"
st.rerun()
# NOTE(review): "\*" is an invalid escape sequence in a non-raw string literal;
# Python keeps the backslash but newer versions warn about it.
st.markdown("<sub>\* Use IETF tags if possible. See [here](https://en.wikipedia.org/wiki/IETF_language_tag) for more information on IETF tags.</sub>", unsafe_allow_html=True)
41 changes: 41 additions & 0 deletions samples/ServalApp/serval_auth_module.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,41 @@
import requests
import json
import os
import time

class ServalBearerAuth(requests.auth.AuthBase):
    """``requests`` auth hook that adds a bearer token to outgoing requests.

    A token is fetched from ``$SERVAL_AUTH_URL/oauth/token`` with the
    client-credentials grant when the object is created, and fetched again
    once the current token is more than twenty minutes old.

    Args:
        client_id: Client id; an empty string means "use the
            ``SERVAL_CLIENT_ID`` environment variable".
        client_secret: Client secret; an empty string means "use the
            ``SERVAL_CLIENT_SECRET`` environment variable".

    Raises:
        AssertionError: the client id, client secret or ``SERVAL_AUTH_URL``
            is not available.
        ValueError: no token could be retrieved from the auth server.
    """

    # Age, in seconds, after which the current token is replaced.
    _TOKEN_MAX_AGE_SECONDS = 20 * 60
    # Upper bound, in seconds, for one request to the auth server, so a
    # stalled server cannot block the caller forever.
    _REQUEST_TIMEOUT_SECONDS = 30

    def __init__(self, client_id="", client_secret=""):
        # The assertions keep raising AssertionError, as callers have always
        # seen for missing configuration; only the messages are new.
        self.__client_id = client_id if client_id != "" else os.environ.get("SERVAL_CLIENT_ID")
        assert self.__client_id is not None, "No client id given and SERVAL_CLIENT_ID is not set"
        self.__client_secret = client_secret if client_secret != "" else os.environ.get("SERVAL_CLIENT_SECRET")
        assert self.__client_secret is not None, "No client secret given and SERVAL_CLIENT_SECRET is not set"
        self.__auth_url = os.environ.get("SERVAL_AUTH_URL")
        assert self.__auth_url is not None, "SERVAL_AUTH_URL is not set"
        self.__last_time_fetched = 0.0
        self.update_token()

    def __call__(self, r):
        """Attach the bearer token to request ``r``, refreshing it if stale."""
        if time.time() - self.__last_time_fetched > self._TOKEN_MAX_AGE_SECONDS:
            self.update_token()
        r.headers["authorization"] = "Bearer " + self.token
        return r

    def update_token(self):
        """Fetch a new access token and store it in ``self.token``.

        Raises:
            ValueError: the request failed or the response carried no
                ``access_token``.
        """
        data = {
            "client_id": f"{self.__client_id}",
            "client_secret": f"{self.__client_secret}",
            "audience": "https://machine.sil.org",
            "grant_type": "client_credentials",
        }

        encoded_data = json.dumps(data).encode('utf-8')
        r = None
        try:
            r = requests.post(
                url=f'{self.__auth_url}/oauth/token',
                data=encoded_data,
                headers={"content-type": "application/json"},
                timeout=self._REQUEST_TIMEOUT_SECONDS,
            )
            self.token = r.json()['access_token']
        except Exception as e:
            raise ValueError(f"Token cannot be None. Failed to retrieve token from auth server; responded with {r.status_code if r is not None else '<unknown>'}. Original exception: {e}") from e
        # Restart the age clock on every successful fetch. It used to be set
        # only in __init__, so after twenty minutes every request refetched.
        self.__last_time_fetched = time.time()

Loading