Spaces:

engajify
/

test_1

Sleeping

App Files Files Community

engajify committed on May 28, 2024

Commit

73a0a63

verified ·

1 Parent(s): 2d286d6

Upload 5 files

Browse files

Files changed (5) hide show

F50xXeBbcAA0IIx.jpeg +0 -0
README.md +18 -3
app.py +107 -0
gitattributes +35 -0
requirements.txt +5 -0

F50xXeBbcAA0IIx.jpeg ADDED Viewed

README.md CHANGED Viewed

@@ -1,12 +1,27 @@
 ---
-title: Test 1
-emoji: 🦀
-colorFrom: indigo
 colorTo: pink
 sdk: gradio
 sdk_version: 4.31.5
 app_file: app.py
 pinned: false
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: Action Detection In Images
+emoji: 😻
+colorFrom: blue
 colorTo: pink
 sdk: gradio
 sdk_version: 4.31.5
 app_file: app.py
 pinned: false
+license: mit
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+# General Action Classifier
+This is a Gradio interface that allows users to upload an image and specify candidate labels to check if a certain action is present in the image. The app uses a CLIP-ViT model to classify the image based on the provided labels.
+## How to Use
+1. Upload an image.
+2. Enter candidate labels separated by commas.
+3. The app will classify the image and display the results.
+## Example
+For instance, to check if a person is holding a beverage, you can enter labels like: "human with beverage, human, beverage".

app.py ADDED Viewed

	@@ -0,0 +1,107 @@

+import gradio as gr
+from PIL import ImageFilter, Image
+from transformers import AutoModelForZeroShotImageClassification, AutoProcessor
+import torch
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# Initialize the CLIP-ViT model
+checkpoint = "openai/clip-vit-large-patch14-336"
+model = AutoModelForZeroShotImageClassification.from_pretrained(checkpoint)
+model = model.to(device)
+processor = AutoProcessor.from_pretrained(checkpoint)
+def classify_image(image, candidate_labels):
+    messages = []
+    candidate_labels = [label.strip() for label in candidate_labels.split(",") if label.strip()] + ["other"]
+    if len(candidate_labels) == 1:
+        candidate_labels.append("other")
+    # Blur the image
+    image = image.filter(ImageFilter.GaussianBlur(radius=5))
+    # Process the image and candidate labels
+    inputs = processor(images=image, text=candidate_labels, return_tensors="pt", padding=True)
+    inputs = {key: val.to(device) for key, val in inputs.items()}
+    # Get model's output
+    with torch.no_grad():
+        outputs = model(**inputs)
+    logits = outputs.logits_per_image[0]
+    probs = logits.softmax(dim=-1).cpu().numpy()
+    # Organize results
+    results = [
+        {"score": float(score), "label": candidate_label}
+        for score, candidate_label in sorted(zip(probs, candidate_labels), key=lambda x: -x[0])
+    ]
+    # Convert results to list of lists for Dataframe
+    results_for_df = [[res['label'], res['score']] for res in results]
+    # Decision-making logic
+    top_label = results[0]["label"]
+    second_label = results[1]["label"] if len(results) > 1 else "None"
+    # Add messages to understand the scores
+    messages.append(f"Top label: {top_label} with score: {results[0]['score']:.2f}")
+    messages.append(f"Second label: {second_label} with score: {results[1]['score']:.2f}" if len(results) > 1 else "")
+    # Example decision logic for specific scenarios (can be customized further)
+    if top_label == candidate_labels[0] and results[0]["score"] >= 0.58 and second_label != "other":
+        messages.append("Triggered the new 0.58 check!")
+        result = True
+    elif top_label == candidate_labels[0] and second_label in candidate_labels[:-1] and (results[0]['score'] + results[1]['score']) >= 0.90:
+        messages.append("Triggered the 90% combined check!")
+        result = True
+    elif top_label == candidate_labels[1] and second_label == candidate_labels[0] and (results[0]['score'] + results[1]['score']) >= 0.95:
+        messages.append("Triggered the 90% reverse order check!")
+        result = True
+    else:
+        result = False
+    return result, top_label, results_for_df, messages
+# Default values
+default_labels = "human with beverage,human,beverage"
+default_image_path = "F50xXeBbcAA0IIx.jpeg"
+# Load default image
+default_image = Image.open(default_image_path)
+iface = gr.Interface(
+    fn=classify_image,
+    inputs=[
+        gr.Image(type="pil", label="Upload an Image", value=default_image),
+        gr.Textbox(label="Candidate Labels (comma separated)", value=default_labels)
+    ],
+    outputs=[
+        gr.Label(label="Result"),
+        gr.Textbox(label="Top Label"),
+        gr.Dataframe(headers=["Label", "Score"], label="Details"),
+        gr.Textbox(label="Messages")
+    ],
+    title="General Action Classifier",
+    description="""
+    **Instructions:**
+    1. **Upload an Image**: Drag and drop an image or click to upload an image file. A default image is provided.
+    2. **Enter Candidate Labels**:
+       - Provide candidate labels separated by commas.
+       - For example: `human with beverage,human,beverage`
+       - The label "other" will automatically be added to the list of candidate labels.
+       - You can enter just one label, and "other" will still be added automatically. Default labels are provided.
+    3. **View Results**:
+       - The result will indicate whether the specified action (top label) is present in the image.
+       - Detailed scores for each label will be displayed in a table.
+       - Additional messages explaining the decision process will also be shown.
+    """
+)
+if __name__ == "__main__":
+    iface.launch()

gitattributes ADDED Viewed

	@@ -0,0 +1,35 @@

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+gradio
+transformers
+torch
+pillow
+requests