Upload 2 files
- app.py +174 -0
- requirements.txt +7 -0
app.py
ADDED
@@ -0,0 +1,174 @@
import os
from huggingface_hub import login
import gradio as gr
from PIL import Image
from transformers import AutoProcessor, AutoModelForImageTextToText, pipeline
import torch
import spaces

# Collect the PIL images referenced in a chat-style message list
def process_vision_info(messages: list[dict]) -> list[Image.Image]:
    image_inputs = []
    for msg in messages:
        content = msg.get("content", [])
        if not isinstance(content, list):
            content = [content]
        for element in content:
            if isinstance(element, dict) and ("image" in element or element.get("type") == "image"):
                image = element.get("image")
                if image is not None:
                    image_inputs.append(image.convert("RGB"))
    return image_inputs

# Load image model and processor on CPU
def load_image_model():
    model_name = "JoannaKOKO/Gemma3-4b_tarot"
    model = AutoModelForImageTextToText.from_pretrained(
        model_name,
        device_map="cpu",
        torch_dtype=torch.bfloat16,
        attn_implementation="eager",
    )
    processor = AutoProcessor.from_pretrained(model_name)
    return processor, model

# Load text model on CPU
def load_text_model():
    return pipeline(
        "text-generation",
        model="tarotscientist/llama-2-7b-tarotreader",
        device=-1  # Force CPU
    )

# Generate card description with ZeroGPU
@spaces.GPU
def generate_description(sample, model, processor):
    # Move the image model to GPU for this call
    model.to('cuda')
    system_message = 'You are a Tarot Card Identifier providing the card names and whether they are in upright or reversed position.'
    messages = [
        {"role": "system", "content": [{"type": "text", "text": system_message}]},
        {"role": "user", "content": [
            {"type": "image", "image": sample["image"]},
            {"type": "text", "text": sample["prompt"]},
        ]},
    ]
    text = processor.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
    image_inputs = process_vision_info(messages)
    inputs = processor(text=[text], images=image_inputs, padding=True, return_tensors="pt")
    inputs = inputs.to("cuda")
    stop_token_ids = [processor.tokenizer.eos_token_id, processor.tokenizer.convert_tokens_to_ids("<end_of_turn>")]
    generated_ids = model.generate(
        **inputs,
        max_new_tokens=256,
        top_p=1.0,
        do_sample=True,
        temperature=0.8,
        eos_token_id=stop_token_ids,
        disable_compile=True
    )
    # Strip the prompt tokens so only the generated answer is decoded
    generated_ids_trimmed = [out_ids[len(in_ids):] for in_ids, out_ids in zip(inputs.input_ids, generated_ids)]
    output_text = processor.batch_decode(
        generated_ids_trimmed,
        skip_special_tokens=True,
        clean_up_tokenization_spaces=False
    )
    return output_text[0]

# Generate tarot interpretation with the text model
@spaces.GPU
def generate_interpretation(question, cards, model):
    prompt = f"""Analyze this tarot reading for the question: {question}

Cards:
1. Reason: {cards[0]}
2. Result: {cards[1]}
3. Recommendation: {cards[2]}
Provide a professional interpretation covering:
- Individual card meanings in their positions
- Combined message and symbolism
- Practical advice
- Potential outcomes"""
    # Run the text-generation pipeline (loaded on CPU; @spaces.GPU only reserves the ZeroGPU slot for this call)
    response = model(prompt, max_length=1000, temperature=0.8, top_p=0.95)[0]['generated_text']
    return response

def main():
    """
    Main function to set up and launch the Gradio tarot reading application.
    Handles authentication, model loading, and interface creation.
    """
    # Authenticate with Hugging Face
    hf_token = os.environ.get("HF_TOKEN")
    if not hf_token:
        raise ValueError("HF_TOKEN not found in environment variables!")
    login(token=hf_token)

    # Load models on CPU
    image_processor, image_model = load_image_model()
    text_model = load_text_model()

    # Define the tarot processing function
    def process_tarot(question, reason_img, result_img, recommendation_img):
        """
        Process the user's question and tarot card images to generate a reading.
        Uses loaded models for card identification and interpretation.
        """
        try:
            # Validate image uploads
            if any(img is None for img in [reason_img, result_img, recommendation_img]):
                return "Please upload all three cards!"

            # Generate a description for each card with the image model
            cards = []
            for img in [reason_img, result_img, recommendation_img]:
                sample = {
                    "prompt": "Please tell me the name of the tarot card in this image, and specify 'reversed' if it is.",
                    "image": img.convert("RGB")
                }
                card = generate_description(sample, image_model, image_processor)
                cards.append(card)
            output = "### Identifying Card Names...\n"

            # Generate the full interpretation with the text model
            interpretation = generate_interpretation(question, cards, text_model)

            # Format the output
            output += "### Card Analysis\n"
            for i, card in enumerate(cards, 1):
                output += f"**Position {i}:** {card}\n\n"
            output += "### Full Interpretation\n"
            output += interpretation
            output += "\n\n**Reading complete! Reflect on these insights.**"
            return output
        except Exception as e:
            return f"Error in reading: {str(e)}"

    # Set up the Gradio interface
    with gr.Blocks() as demo:
        gr.Markdown("# 🔮 Advanced Tarot Reader")
        gr.Markdown("### Professional-grade AI Tarot Analysis")
        question = gr.Textbox(
            label="Your Question",
            placeholder="Enter your question for the cards...",
            lines=3
        )
        with gr.Row():
            reason_img = gr.Image(label="Reason Card", type="pil")
            result_img = gr.Image(label="Result Card", type="pil")
            recommendation_img = gr.Image(label="Recommendation Card", type="pil")
        submit_btn = gr.Button("Perform Reading")
        output = gr.Markdown()

        # Connect the button to the processing function
        submit_btn.click(
            fn=process_tarot,
            inputs=[question, reason_img, result_img, recommendation_img],
            outputs=output
        )

    # Launch the application (no share=True for Hugging Face Spaces)
    demo.launch()

# Entry point of the script
if __name__ == "__main__":
    main()
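The file above wires everything through Gradio, but the card-identification step can be exercised on its own. The following is a minimal, hypothetical smoke test that is not part of this commit: it assumes app.py is importable, the `spaces` package is installed (outside a ZeroGPU Space its GPU decorator should simply run the wrapped function), a CUDA device is available for the `model.to('cuda')` call, `HF_TOKEN` is set if the checkpoints are gated, and `card.jpg` is a local photo of a single tarot card.

import os
from huggingface_hub import login
from PIL import Image
from app import load_image_model, generate_description

# Log in only if the checkpoints require authentication (hypothetical local run)
login(token=os.environ["HF_TOKEN"])

processor, model = load_image_model()
sample = {
    "prompt": "Please tell me the name of the tarot card in this image, and specify 'reversed' if it is.",
    "image": Image.open("card.jpg").convert("RGB"),
}
print(generate_description(sample, model, processor))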
requirements.txt
ADDED
@@ -0,0 +1,7 @@
torch
git+https://github.com/huggingface/transformers.git
pillow
gradio
accelerate>=0.26.0
peft
huggingface_hub
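One note on dependencies: app.py imports `spaces` for the `@spaces.GPU` decorator, which is not listed above. On Hugging Face ZeroGPU Spaces the package is typically provided by the runtime, but a local run would likely also need `pip install spaces`, plus an `HF_TOKEN` environment variable (or Space secret) for the `login()` call in `main()`.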