basedon_user.py

import streamlit as st
import numpy as np 
import pandas as pd
import plotly.express as px
from plotly.graph_objs import *
import plotly.graph_objects as go
import plotly as py
import plotly.io as pio
import pickle
from sklearn.feature_extraction.text import CountVectorizer, TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity
pio.renderers.default = 'chrome'
st.set_option('deprecation.showPyplotGlobalUse', False)
#st.set_page_config(layout="wide")

#st.title('Recommended for you!')
st.markdown(' <p align="center" class="big-font">  <b>Authorship Attribution <u> 🌟 T5 🇸🇦</b>   </p>', unsafe_allow_html=True)	


st.markdown("""
<style>
.big-font {
    font-size:50px !important;
}
</style>
""", unsafe_allow_html=True)


st.markdown("""
إسناد التأليف العربي هو مهمة البحث عن مؤلف المستند. لتحقيق هذا الغرض ، يقارن المرء نص الاستعلام بنموذج المؤلف المرشح ويحدد احتمال نموذج الاستعلام.

Arabic authorship attribution is the task of finding the author of a document.
To achieve this purpose, one compares a query text with a model of the candidate author and determines the likelihood of the model for the query.
	""")
st.write('---')

st.subheader('Check author of a document | ابحث عن المؤلف الحقيقي ')

#raw_text = st.text_area("Authorship Attribution Check","Enter Text Here")
max_lengthy = st.slider('Maximum words length (words)', min_value=30, max_value=512, value=60, step=10)

#num_beamer = st.slider('Speed vs quality of summary (1 is fastest)', min_value=1, max_value=8, value=4, step=1)

text = st.text_area('ادخل النص (maximum 512 words):', height=300) 

submit = st.button('افحص')
st.write('Note: The model is heavy more than 3GB of training, and it might not show results on time as we are hosing on free space!')

# if submit:

#     st.subheader("Results:")

#     with st.spinner(text="This may take a moment..."):

#         summWords = sum2(text, max_length=max_lengthy, min_length=15, num_beams=num_beamer, do_sample=True, early_stopping=True, repetition_penalty=1.5, length_penalty=1.5)

#     text2 =summWords[0]["summary_text"]

#     st.write(text2)
#input = st.text_area("Enter Input Data :")
#output = input.upper() # final_result_from_processing_the_input

#Xvalue=" Author:  ابن أمير حاج | Book:  التقرير والتحبير |  Confidence: 0.8255385 "
cc = st.text_area(label="Output Data:",value="",  height=90)
		

df1 = pd.read_pickle('df.pkl')
cosin = pd.read_pickle('cosine.pkl')


st.write('---')
if st.checkbox("Show orignal dataframe | عرض جميع الكتب الموجودة بنظام التوصية"):
	dataframe=df1
	#dataframe.drop('Unnamed: 0', axis=1, inplace=True)
	dataframe


st.sidebar.header('نظام التوصية')
name = st.sidebar.text_input(''' ادخل اسم الكتاب''')
st.sidebar.write(''' Our Books Collections Below:''')
st.sidebar.write(''' 
مجموعات كتبنا أدناه''')

st.sidebar.table(df1["BookTitle"])

st.write('---')

st.subheader('Your Selected Book Title Details | تفاصيل عنوان الكتاب المختار ')
books = df1[(df1["BookTitle"] == name)]
           #& (reviews["Polarity"] == "Positive")].reset_index(drop=True)
st.write(books)
           
st.write('---')

#st.write(cosin.to_numpy()) 
cosine= cosin.to_numpy()

@st.cache(allow_output_mutation=True)
def get_title_from_index(Index):
    return df1[df1.index == Index]["BookTitle"].values[0]
def get_index_from_title(BookTitle):
    return df1[df1.BookTitle == BookTitle]["index"].values[0]

def get_recommendations(book):
    book_index = get_index_from_title(book)
    similar_books = list(enumerate(cosine[book_index]))
    sortedbooks = sorted(similar_books, key = lambda x:x[1], reverse=True)[1:]
    i = 0
    for book in sortedbooks:
        st.write(" Title: "+ get_title_from_index(book[0]) + " ♦️ "  + " Author: " + df1.author[df1["index"] == book[0]])
      
        i = i+1
        if i>10:
            break
   
#df1.BookTitle[df1["index"] == book[0]]  
st.subheader('💡 Your Recommended Books | كتبك الموصى بها ')
try:
	st.write(get_recommendations(name))
except:
        st.error("🔴 Please make sure that you only enter a name of your book | يرجى التأكد من إدخال اسم كتابك فقط")
        st.stop()

st.write('---')

st.header('Books in Recommnder System')

fig = px.bar(df1, y='author' , x='text_length', color='author',color_discrete_sequence=px.colors.diverging.Geyser,orientation='h', height=600, width=900)
    
fig.update_xaxes(showgrid=False)
fig.update_yaxes(showgrid=True)
    
    
fig.update_layout(template="plotly_white",xaxis_showgrid=False, yaxis_showgrid=False)
    
fig.update_traces( marker_line_color='rgb(8,48,107)',
                  marker_line_width=2, opacity=0.6)
    
fig.update_layout(showlegend=True, title="عدد كلمات الكتب",
xaxis_title="طول النص",
yaxis_title="اسم المؤلف وعدد كتبة")

    
fig.update_xaxes(showline=True, linewidth=1, linecolor='black')
fig.update_yaxes(showline=True, linewidth=1, linecolor='black')
                               
#st.table(get_recommendations(name))

st.plotly_chart(fig)


st.write('---')
st.write('## Contact Our Group')


st.write("""
[Authorship Attribution](https://github.com/A-safarji) - feel free to contact!
""")