# coding=utf-8 # Copyright 2023 The GIRT Authors. # Lint as: python3 # This space is built based on AMR-KELEG/ALDi and cis-lmu/GlotLID space. # GIRT Space from transformers import AutoTokenizer, AutoModelForSeq2SeqLM import streamlit as st import pandas as pd import base64 @st.cache_data def render_svg(svg): """Renders the given svg string.""" b64 = base64.b64encode(svg.encode("utf-8")).decode("utf-8") html = rf'

' c = st.container() c.write(html, unsafe_allow_html=True) @st.cache_resource def load_model(model_name): model = AutoModelForSeq2SeqLM.from_pretrained(model_name) return model @st.cache_resource def load_tokenizer(model_name): tokenizer = AutoTokenizer.from_pretrained(model_name) return tokenizer with st.spinner(text="Please wait while the model is loading...."): model = load_model('nafisehNik/girt-t5-base') tokenizer = load_tokenizer('nafisehNik/girt-t5-base') def create_instruction(name, about, title, labels, assignees, headline_type, headline, summary): val_list = [name, about, title, labels, assignees, headline_type, headline] val_list = ['<|MASK|>' if not element else element for element in val_list] if not summary: summary = '<|EMPTY|>' instruction = f'name: {value_list[0]}\nabout: {value_list[1]}\ntitle: {value_list[2]}\nlabels: {value_list[3]}\nassignees: {value_list[4]}\nheadlines_type: {value_list[5]}\nheadlines: {value_list[6]}\nsummary: {summary}' return instruction def compute(sample, top_p, top_k, do_sample, max_length, min_length): inputs = tokenizer(sample, return_tensors="pt").to('cpu') outputs = model.generate( **inputs, min_length= min_length, max_length=max_length, do_sample=do_sample, top_p=top_p, top_k=top_k).to('cpu') generated_texts = tokenizer.batch_decode(outputs, skip_special_tokens=False) generated_text = generated_texts[0] replace_dict = { '\n ': '\n', '': '', ' ': '', '': '', '': '' } postprocess_text = generated_text for key, value in replace_dict.items(): postprocess_text = postprocess_text.replace(key, value) return postprocess_text st.markdown("[![Duplicate Space](https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABAAAAAQCAYAAAAf8/9hAAAAAXNSR0IArs4c6QAAAP5JREFUOE+lk7FqAkEURY+ltunEgFXS2sZGIbXfEPdLlnxJyDdYB62sbbUKpLbVNhyYFzbrrA74YJlh9r079973psed0cvUD4A+4HoCjsA85X0Dfn/RBLBgBDxnQPfAEJgBY+A9gALA4tcbamSzS4xq4FOQAJgCDwV2CPKV8tZAJcAjMMkUe1vX+U+SMhfAJEHasQIWmXNN3abzDwHUrgcRGmYcgKe0bxrblHEB4E/pndMazNpSZGcsZdBlYJcEL9Afo75molJyM2FxmPgmgPqlWNLGfwZGG6UiyEvLzHYDmoPkDDiNm9JR9uboiONcBXrpY1qmgs21x1QwyZcpvxt9NS09PlsPAAAAAElFTkSuQmCC&logoWidth=14)](https://huggingface.co/spaces/nafisehNik/girt-space?duplicate=true)") render_svg(open("assets/logo.svg").read()) st.markdown( """