Spaces:
Runtime error
Runtime error
More examples, polish interface
Browse files
app.py
CHANGED
@@ -14,7 +14,6 @@ LaBSE correctly recognizes that "poisson" means fish and that the fish label is
|
|
14 |
|
15 |
The similarity between the text and the labels is measured using cosine distance (1 - cosine similarity).
|
16 |
This means that smaller values indicate a higher similarity.
|
17 |
-
I'll have to find out how to change that at some point.
|
18 |
"""
|
19 |
|
20 |
model = SentenceTransformer('sentence-transformers/LaBSE')
|
@@ -27,8 +26,9 @@ def zero_shot(doc, candidates):
|
|
27 |
query_embedding = embeddings[0]
|
28 |
candidate_embeddings = embeddings[1:]
|
29 |
distances = scipy.spatial.distance.cdist([query_embedding], candidate_embeddings, "cosine")[0]
|
|
|
30 |
results = zip(given_labels, distances)
|
31 |
-
results = sorted(results, key=lambda x: x[1], reverse=
|
32 |
return results
|
33 |
|
34 |
#create input and output objects
|
@@ -37,10 +37,11 @@ input1 = gr.Textbox(label="Text")
|
|
37 |
#input object 2
|
38 |
input2 = gr.Textbox(label="Labels")
|
39 |
#output object
|
40 |
-
# output = gr.Label(label="Output")
|
41 |
output = gr.Dataframe(type='array', headers=['Label', 'Distance'], label="Output")
|
42 |
#example object
|
43 |
examples = [
|
|
|
|
|
44 |
["poisson", "jam, milk, fish, eggs, poison"],
|
45 |
["TDC A/S provides communications and entertainment solutions in Denmark. It operates through Nuuday and TDC NET segments. The company designs, builds, and operates broadband and mobile networks; and provides technical support to customers and networks. It offers services, such as landline voice, TV and streaming, broadband, Internet and network, mobility, and other services. The company provides its products and services under the YouSee, Hiper, Telmore, Blockbuster, TDC Business, TDC Erhverv, Fullrate, NetDesign, and Relatel brands. It serves consumer and business customers. The company was founded in 1882 and is based in Copenhagen, Denmark. TDC A/S is a subsidiary of DK Telekommunikation ApS.", "Diversified Telecommunication Services, Wireless Telecommunication Services, Media, Entertainment, Interactive Media and Services"],
|
46 |
["Giddy Inc., doing business as Boxed Wholesale, offers online wholesale and retailing services. The company provides cleaning and laundry, kitchen, paper, skin care, hair care, and grocery products. Additionally, it offers diapers and organic products. Giddy Inc. was founded in 2013 and is based in Edison, New Jersey.", "Food and Staples Retailing, Beverages, Food Products, Household Products, Personal Products, Tobacco"],
|
|
|
14 |
|
15 |
The similarity between the text and the labels is measured using cosine distance (1 - cosine similarity).
|
16 |
This means that smaller values indicate a higher similarity.
|
|
|
17 |
"""
|
18 |
|
19 |
model = SentenceTransformer('sentence-transformers/LaBSE')
|
|
|
26 |
query_embedding = embeddings[0]
|
27 |
candidate_embeddings = embeddings[1:]
|
28 |
distances = scipy.spatial.distance.cdist([query_embedding], candidate_embeddings, "cosine")[0]
|
29 |
+
distances = [round(x, 3) for x in distances]
|
30 |
results = zip(given_labels, distances)
|
31 |
+
results = sorted(results, key=lambda x: x[1], reverse=False)
|
32 |
return results
|
33 |
|
34 |
#create input and output objects
|
|
|
37 |
#input object 2
|
38 |
input2 = gr.Textbox(label="Labels")
|
39 |
#output object
|
|
|
40 |
output = gr.Dataframe(type='array', headers=['Label', 'Distance'], label="Output")
|
41 |
#example object
|
42 |
examples = [
|
43 |
+
["Eco-friendly Hydrogen: The clean fuel of the future Germany is promoting the use of #eco-friendly hydrogen in the fight against climate change. Hydrogen can replace fossil fuels in virtually every situation, in an engine or fuel cell!", "renewable", "politics", "emission", "temperature", "emergency", "advertisment"],
|
44 |
+
["I like to eat salmon.", "fish, meat, vegetable"],
|
45 |
["poisson", "jam, milk, fish, eggs, poison"],
|
46 |
["TDC A/S provides communications and entertainment solutions in Denmark. It operates through Nuuday and TDC NET segments. The company designs, builds, and operates broadband and mobile networks; and provides technical support to customers and networks. It offers services, such as landline voice, TV and streaming, broadband, Internet and network, mobility, and other services. The company provides its products and services under the YouSee, Hiper, Telmore, Blockbuster, TDC Business, TDC Erhverv, Fullrate, NetDesign, and Relatel brands. It serves consumer and business customers. The company was founded in 1882 and is based in Copenhagen, Denmark. TDC A/S is a subsidiary of DK Telekommunikation ApS.", "Diversified Telecommunication Services, Wireless Telecommunication Services, Media, Entertainment, Interactive Media and Services"],
|
47 |
["Giddy Inc., doing business as Boxed Wholesale, offers online wholesale and retailing services. The company provides cleaning and laundry, kitchen, paper, skin care, hair care, and grocery products. Additionally, it offers diapers and organic products. Giddy Inc. was founded in 2013 and is based in Edison, New Jersey.", "Food and Staples Retailing, Beverages, Food Products, Household Products, Personal Products, Tobacco"],
|