Spaces:
Running
Running
Ilia Azizi
commited on
Commit
·
2b90e9b
1
Parent(s):
2e11edb
Update app styling
Browse files- app.py +120 -47
- requirements.txt +7 -5
app.py
CHANGED
@@ -1,92 +1,165 @@
|
|
1 |
-
#
|
2 |
from transformers import pipeline
|
3 |
import gradio as gr
|
4 |
import torch
|
5 |
import re
|
6 |
|
7 |
-
|
8 |
-
# function modified for the demo
|
9 |
-
def get_native_feature_demo(language, input_description, target_feature, question, return_numbers = True):
|
10 |
task = 'question-answering'
|
11 |
french_model = 'AgentPublic/camembert-base-squadFR-fquad-piaf'
|
12 |
english_model = 'deepset/roberta-base-squad2'
|
|
|
13 |
if language == "French":
|
14 |
model = pipeline(task, model=french_model, tokenizer=french_model)
|
15 |
else:
|
16 |
model = pipeline(task, model=english_model, tokenizer=english_model)
|
|
|
17 |
answer = model({
|
18 |
'question': question,
|
19 |
'context': input_description
|
20 |
})
|
|
|
21 |
if target_feature == "price":
|
22 |
-
# price median
|
23 |
reference_target_value = 1650
|
24 |
else:
|
25 |
-
# living space median
|
26 |
reference_target_value = 85
|
|
|
27 |
try:
|
28 |
if return_numbers:
|
29 |
-
nums = re.findall(r"\d*\.\d+|\d+\,\d+|\d{1,3}'[\d{3}']+\d{1,3}\.?\d*|(?<!m)\d+",answer['answer'])
|
30 |
-
nums = [re.sub("
|
31 |
-
# turn every number into float
|
32 |
if len(nums) > 1:
|
33 |
nums = [float(x) for x in nums]
|
34 |
answer_processed = min(nums, key=lambda x:abs(x-reference_target_value))
|
35 |
elif len(nums) == 1:
|
36 |
answer_processed = float(''.join(nums))
|
|
|
|
|
37 |
else:
|
38 |
-
|
39 |
-
|
|
|
40 |
answer_full = answer['answer']
|
41 |
score = answer['score']
|
42 |
-
return ('%f' % answer_processed).rstrip('0').rstrip('.'), score, answer_full
|
43 |
except:
|
44 |
return "No answer!", None, None
|
45 |
|
46 |
-
|
47 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
48 |
title = "Extract relevant features from Real Estate Descriptions!"
|
49 |
|
50 |
description = """
|
51 |
-
<
|
52 |
-
<
|
53 |
-
|
54 |
-
|
55 |
-
|
|
|
|
|
56 |
</div>
|
57 |
"""
|
58 |
-
article = """
|
59 |
-
<center>
|
60 |
|
61 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
62 |
|
63 |
-
|
64 |
-
|
|
|
|
|
|
|
|
|
|
|
65 |
|
66 |
-
|
67 |
-
|
|
|
|
|
|
|
68 |
|
69 |
-
|
|
|
|
|
|
|
70 |
|
71 |
-
|
72 |
-
|
73 |
-
|
74 |
-
|
|
|
75 |
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
|
80 |
-
|
81 |
-
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
-
|
90 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
91 |
|
92 |
-
|
|
|
|
1 |
+
# app.py
|
2 |
from transformers import pipeline
|
3 |
import gradio as gr
|
4 |
import torch
|
5 |
import re
|
6 |
|
7 |
+
def get_native_feature_demo(language, input_description, target_feature, question, return_numbers=True):
|
|
|
|
|
8 |
task = 'question-answering'
|
9 |
french_model = 'AgentPublic/camembert-base-squadFR-fquad-piaf'
|
10 |
english_model = 'deepset/roberta-base-squad2'
|
11 |
+
|
12 |
if language == "French":
|
13 |
model = pipeline(task, model=french_model, tokenizer=french_model)
|
14 |
else:
|
15 |
model = pipeline(task, model=english_model, tokenizer=english_model)
|
16 |
+
|
17 |
answer = model({
|
18 |
'question': question,
|
19 |
'context': input_description
|
20 |
})
|
21 |
+
|
22 |
if target_feature == "price":
|
|
|
23 |
reference_target_value = 1650
|
24 |
else:
|
|
|
25 |
reference_target_value = 85
|
26 |
+
|
27 |
try:
|
28 |
if return_numbers:
|
29 |
+
nums = re.findall(r"\d*\.\d+|\d+\,\d+|\d{1,3}'[\d{3}']+\d{1,3}\.?\d*|(?<!m)\d+", answer['answer'])
|
30 |
+
nums = [re.sub(r",|'", "", num) for num in nums] # Fixed escape sequence
|
|
|
31 |
if len(nums) > 1:
|
32 |
nums = [float(x) for x in nums]
|
33 |
answer_processed = min(nums, key=lambda x:abs(x-reference_target_value))
|
34 |
elif len(nums) == 1:
|
35 |
answer_processed = float(''.join(nums))
|
36 |
+
else:
|
37 |
+
return "No numbers found!", None, None
|
38 |
else:
|
39 |
+
answer_processed = answer['answer']
|
40 |
+
|
41 |
+
answer_processed = round(float(answer_processed), 2)
|
42 |
answer_full = answer['answer']
|
43 |
score = answer['score']
|
44 |
+
return ('%f' % answer_processed).rstrip('0').rstrip('.'), f"{score:.4f}", answer_full
|
45 |
except:
|
46 |
return "No answer!", None, None
|
47 |
|
48 |
+
# Example data
|
49 |
+
french_example = """ Venez découvrir votre futur appartement lors des portes ouvertes Quai Ouest à Renens le samedi 6 mars de 9h00 à 12h00. Afin de respecter les mesures de sécurité, merci d'inscrire une personne par tranche horaire. Merci de laisser vos coordonnées (nom, email et téléphone) afin que l'on puisse vous joindre pour confirmer le rendez-vous et l'adresse. Lorsque vous entrer votre nom pour vous inscrire, merci d'indiquer également l'appartement que vous souhaitez visiter (n° ou nombre de pièces). En cas d'intérêt, merci de venir avec un dossier complet : - 3 dernières fiches de salaire - Extrait de l'office des poursuites - Copie carte d'identité ou permis de séjour - Copie de votre police d'assurance RC (responsabilité civile) et ménage Un formulaire de location sera à disposition sur place. Pour en savoir plus: https://quai-ouest.ch/location/logements\nINSCRIPTIONS : https://doodle.com/poll/5cvrqyt2ueaah3su?utm_source=poll&utm_medium=link\nNouvelle promotion de 89 logements en location idéalement située à la Gare de Renens, Quai Ouest ouvrira ses bras aux futurs locataires avec plusieurs options de logements, commerces et bureaux.\nCe magnifique appartement de 4.5 pièces se situe au 3° étage et a été construit avec de très beaux matériaux et se compose comme suit:\nSpacieux séjour de 40m2\nSuite parentale de 23.9m2 avec salle de douche italienne attenante\nDeux chambres à coucher d'environ 13m2 chacune\nRaccordement pour colonne de lavage\nUne salle de bains/WC\nCuisine ouverte avec îlot central et entièrement agencée avec lave-vaisselle\nStores électriques\nEntrée avec armoires murales\nLoyer net : CHF 2'600 .-\nCharges: CHF 320.-\nTotal: CHF 2'920.-\nAdresse: Place de la Gare à 1020 Renens\nPlus d'informations sur www.quai-ouest.ch/location/logements ainsi que chez Omnia Immobilier"""
|
50 |
+
|
51 |
+
english_example = """Come and discover your future apartment at the Quai Ouest open house in Renens on Saturday, March 6th, from 9:00 am to 12:00 pm. In order to respect the security measures, please register one person per hour. Please leave your contact details (name, email and telephone) so that you can be reached to confirm the appointment and address. When entering your name to register, please also indicate the apartment you wish to visit (no or number of rooms). In case of interest, please come with a complete file: - 3 last salary slips - Excerpt from the prosecution office - Copy of identity card or residence permit - Copy of your insurance policy RC (civil liability) and household A rental form will be available on site. For more information: https://quai-ouest.ch/rental/housing INSCRIPTIONS: https://doodle.com/poll/5cvrqyt2ueaah3su?utm_source=poll&utm_medium=link New promotion of 89 rental units ideally located at the Gare de Renens, several new housing options. This magnificent 4.5-room apartment is located on the 3rd floor and has been built with beautiful materials and consists as follows: Spacious living room of 40m2 Master suite of 23.9m2 with adjoining Italian shower room Two bedrooms of about 13m2 each Wash-column connection A bathroom/WC Open kitchen with central island and fully arranged with dishwasher Electric stores Entrance with wall cabinets Net rent: CHF 2'600 .- Charges: CHF 320.- Total: CHF 2'920.- Address: Place de la Gare à 1020 Renens More information on www.quai-ouest.ch/location/housing as well as at Omnia Immobilier"""
|
52 |
+
|
53 |
+
examples = [
|
54 |
+
["French", french_example, 'price', "Combien payez-vous de loyer?"],
|
55 |
+
["French", french_example, 'living_space', "Quelle est la surface en m2?"],
|
56 |
+
["English", english_example, 'price', "How much is the rent?"],
|
57 |
+
["English", english_example, 'living_space', "How large is the surface?"]
|
58 |
+
]
|
59 |
+
|
60 |
+
# Define the parameters
|
61 |
title = "Extract relevant features from Real Estate Descriptions!"
|
62 |
|
63 |
description = """
|
64 |
+
<div style="margin-bottom: 1.5rem;">
|
65 |
+
<div style="display: flex; justify-content: center; margin-bottom: 1.5rem">
|
66 |
+
<img src="https://teara.govt.nz/files/c-21363-atl.jpg" width="300px" alt="Real Estate Image" style="border-radius: 8px;"/>
|
67 |
+
</div>
|
68 |
+
<div style="text-align: justify">
|
69 |
+
Features with missing instances can negatively impact the performance of machine learning models. Information Extraction (IE) can improve the availability of tabular data by identifying relevant information from unstructured textual descriptions. This project demonstrated the application of IE on descriptions of online real estate listings, whereby the required missing values are retrieved from the text. Inspired by question-answering tasks, the aim was to recover these values by asking a set of questions. We tested two ways to achieve this goal. The first one focuses on a model specific to the language of the description (French) to perform IE, while the second translates the descriptions into English before IE. The project compared the performance of both approaches while delivering insights on how the formulation of the questions can impact the effectiveness of Q&A models.
|
70 |
+
</div>
|
71 |
</div>
|
72 |
"""
|
|
|
|
|
73 |
|
74 |
+
css = """
|
75 |
+
/* Comprehensive table text alignment */
|
76 |
+
.table-wrap table td,
|
77 |
+
.table-wrap table td div,
|
78 |
+
.table-wrap table td p,
|
79 |
+
.examples-table td,
|
80 |
+
.examples-table td div,
|
81 |
+
.examples-table td p,
|
82 |
+
.prose td,
|
83 |
+
.prose td div,
|
84 |
+
.prose td p {
|
85 |
+
text-align: left !important;
|
86 |
+
white-space: pre-wrap !important;
|
87 |
+
word-break: break-word !important;
|
88 |
+
}
|
89 |
|
90 |
+
/* Ensure specific targeting of the real estate description column */
|
91 |
+
.table-wrap table td:nth-child(2),
|
92 |
+
.table-wrap table td:nth-child(2) div,
|
93 |
+
.table-wrap table td:nth-child(2) p {
|
94 |
+
text-align: left !important;
|
95 |
+
padding: 8px !important;
|
96 |
+
}
|
97 |
|
98 |
+
/* Additional styling for better readability */
|
99 |
+
.table-wrap table {
|
100 |
+
width: 100% !important;
|
101 |
+
table-layout: fixed !important;
|
102 |
+
}
|
103 |
|
104 |
+
.table-wrap table td {
|
105 |
+
vertical-align: top !important;
|
106 |
+
}
|
107 |
+
"""
|
108 |
|
109 |
+
article = """
|
110 |
+
<div style="text-align: center; margin-top: 1.5rem;">
|
111 |
+
Created by <a href="https://iliaazizi.netlify.app/" target="_blank" style="color: #2563eb;">Ilia Azizi</a> 2022
|
112 |
+
</div>
|
113 |
+
"""
|
114 |
|
115 |
+
# Create the Gradio interface
|
116 |
+
with gr.Blocks(title=title, css=css) as demo:
|
117 |
+
gr.HTML(description)
|
118 |
+
|
119 |
+
with gr.Row():
|
120 |
+
with gr.Column():
|
121 |
+
language = gr.Radio(
|
122 |
+
choices=["French", "English"],
|
123 |
+
label="Language",
|
124 |
+
value="French"
|
125 |
+
)
|
126 |
+
target_feature = gr.Dropdown(
|
127 |
+
choices=["price", "living_space"],
|
128 |
+
label="Target Feature",
|
129 |
+
value="price"
|
130 |
+
)
|
131 |
+
question = gr.Textbox(
|
132 |
+
lines=2,
|
133 |
+
label="Question",
|
134 |
+
placeholder="Ask to retrieve a feature."
|
135 |
+
)
|
136 |
+
input_description = gr.Textbox(
|
137 |
+
lines=10,
|
138 |
+
label="Real Estate Description",
|
139 |
+
placeholder="Type a real estate description here."
|
140 |
+
)
|
141 |
+
submit_btn = gr.Button("Extract Feature", variant="primary")
|
142 |
+
|
143 |
+
with gr.Column():
|
144 |
+
extracted_feature = gr.Textbox(label="Extracted Feature")
|
145 |
+
prediction_prob = gr.Textbox(label="Probability of the prediction")
|
146 |
+
full_answer = gr.Textbox(label="Full Q&A answer")
|
147 |
+
|
148 |
+
gr.Examples(
|
149 |
+
examples=examples,
|
150 |
+
inputs=[language, input_description, target_feature, question],
|
151 |
+
outputs=[extracted_feature, prediction_prob, full_answer],
|
152 |
+
fn=get_native_feature_demo,
|
153 |
+
cache_examples=True
|
154 |
+
)
|
155 |
+
|
156 |
+
gr.HTML(article)
|
157 |
+
|
158 |
+
submit_btn.click(
|
159 |
+
fn=get_native_feature_demo,
|
160 |
+
inputs=[language, input_description, target_feature, question],
|
161 |
+
outputs=[extracted_feature, prediction_prob, full_answer]
|
162 |
+
)
|
163 |
|
164 |
+
if __name__ == "__main__":
|
165 |
+
demo.launch()
|
requirements.txt
CHANGED
@@ -1,5 +1,7 @@
|
|
1 |
-
|
2 |
-
torch
|
3 |
-
|
4 |
-
|
5 |
-
sentencepiece
|
|
|
|
|
|
1 |
+
gradio>=4.12.0
|
2 |
+
torch>=2.0.0
|
3 |
+
transformers>=4.36.0
|
4 |
+
protobuf>=4.25.1
|
5 |
+
sentencepiece>=0.1.99
|
6 |
+
tokenizers>=0.15.0
|
7 |
+
sacremoses>=0.1.1
|