File size: 2,224 Bytes
da92bd2 f2ea73e da92bd2 53e8d3f da92bd2 5de2897 da92bd2 f2ea73e 5de2897 f2ea73e da92bd2 f2ea73e da92bd2 f2ea73e da92bd2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 |
import gradio as gr
from collections import Counter
import string
import csv
import io
def process_text(text, sorting_option):
# Remove punctuation from the input text
translator = str.maketrans('', '', string.punctuation)
text = text.translate(translator)
words = text.split()
# Count word frequencies
word_counts = Counter(words)
# Sort words based on the selected option
if sorting_option == 'alphabetically':
sorted_words = sorted(word_counts.items(), key=lambda x: x[0])
elif sorting_option == 'by_frequency':
sorted_words = sorted(word_counts.items(), key=lambda x: x[1], reverse=True)
else:
sorted_words = word_counts.items()
# Get the top 5 words with their frequencies
top_5_words = sorted_words
# Format the top 5 words and frequencies as an HTML table
table_html = "<table style='width:100%'><tr><th>Index</th><th>Word</th><th>Frequency</th></tr>"
for index, (word, freq) in enumerate(top_5_words, start=1):
table_html += f"<tr><td>{index}</td><td>{word}</td><td>{freq}</td></tr>"
table_html += "</table>"
# Create a CSV file
csv_data = [["Index", "Word", "Frequency"]]
for index, (word, freq) in enumerate(top_5_words, start=1):
csv_data.append([index, word, freq])
# Write CSV data to a string buffer
csv_buffer = io.StringIO()
csv_writer = csv.writer(csv_buffer)
csv_writer.writerows(csv_data)
csv_buffer.seek(0)
# Create a download link for the CSV file
csv_download_link = f"<a href='data:application/csv;charset=utf-8,{csv_buffer.getvalue()}' download='word_frequencies.csv'>Download CSV</a>"
# Wrap the table in a div with a fixed height and scrolling
div_with_scroll = f"<div style='height: 200px; overflow-y: scroll;'>{table_html}</div>"
return div_with_scroll, csv_download_link
iface = gr.Interface(
fn=process_text,
inputs=[gr.Textbox("text", label="Paste Text Here"),
gr.Radio(["alphabetically", "by_frequency", "none"], label="Select Sorting Option")],
outputs=[gr.HTML(label="Top 5 Words with Frequencies"), gr.HTML(label="Download CSV")]
)
iface.launch(share=True)
|