import torch
from peft import PeftModel, PeftConfig
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
import gradio as gr
import spaces
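
# Gradio Space exposing a code-review assistant built on the
# rootxhacker/CodeAstra-7B LoRA adapter, loaded in 4-bit on top of its base model.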

# PEFT adapter to load; its config records which base model it was trained on
peft_model_id = "rootxhacker/CodeAstra-7B"
config = PeftConfig.from_pretrained(peft_model_id)

# Function to move tensors to CPU
def to_cpu(obj):
    if isinstance(obj, torch.Tensor):
        return obj.cpu()
    elif isinstance(obj, list):
        return [to_cpu(item) for item in obj]
    elif isinstance(obj, tuple):
        return tuple(to_cpu(item) for item in obj)
    elif isinstance(obj, dict):
        return {key: to_cpu(value) for key, value in obj.items()}
    return obj

# Load the base model in 4-bit (bitsandbytes quantization via an explicit config,
# which is the current idiom; the bare load_in_4bit kwarg is deprecated)
model = AutoModelForCausalLM.from_pretrained(
    config.base_model_name_or_path,
    return_dict=True,
    quantization_config=BitsAndBytesConfig(load_in_4bit=True),
    device_map='auto'
)
tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)

# Attach the LoRA adapter weights to the quantized base model
model = PeftModel.from_pretrained(model, peft_model_id)
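# Inference only: eval() disables dropout in the adapter layers
model.eval()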

@spaces.GPU()
def get_completion(query, model, tokenizer):
    try:
        # The quantized model is already placed by device_map='auto', and
        # 4-bit bitsandbytes models cannot be moved with .cuda()/.cpu(),
        # so only the inputs are moved to the model's device.
        inputs = tokenizer(query, return_tensors="pt").to(model.device)
        with torch.no_grad():
            outputs = model.generate(**inputs, max_new_tokens=1024, do_sample=True, temperature=0.7)
        # Move outputs to CPU before decoding
        outputs = to_cpu(outputs)
        return tokenizer.decode(outputs[0], skip_special_tokens=True)
    except Exception as e:
        return f"An error occurred: {str(e)}"
    finally:
        # Release cached GPU memory between requests (no-op if CUDA is uninitialized)
        torch.cuda.empty_cache()
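
# Purely illustrative: the helper can also be called directly, bypassing Gradio:
#   print(get_completion("def add(a, b): return a + b", model, tokenizer))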
        

@spaces.GPU()
def code_review(code_to_analyze):
    # Two-step prompt (understand the code, then hunt for vulnerabilities);
    # it contains no worked examples, so it is not a few-shot prompt
    two_step_prompt = f"""First, understand the given code:
Analyze the purpose, functionality, input sources, output destinations, and logical flow of the code. Identify any security-sensitive operations.

Now, review the following code:

{code_to_analyze}

Provide a brief understanding of the code.

Second, correlate the context with the input code and find vulnerabilities:
Based on your understanding of the code, identify potential security issues, logic vulnerabilities, and areas for improvement. Consider common vulnerabilities, possible misuse, input handling, and use of security functions.

Now, for the same code:

{code_to_analyze}

Provide a detailed review including:
1. Potential security issues
2. Potential logic vulnerabilities
3. Suggestions for improvement

Start each section with its number and title."""

    full_response = get_completion(two_step_prompt, model, tokenizer)
    
    # Return the full response without any processing
    return full_response

# Create Gradio interface
iface = gr.Interface(
    fn=code_review,
    inputs=gr.Textbox(lines=10, label="Enter code to analyze"),
    outputs=gr.Textbox(label="Code Review Result"),
    title="Code Review Expert",
    description="This tool analyzes code for potential security flaws, logic vulnerabilities, and provides guidance on secure coding practices."
)

# Launch the Gradio app
iface.launch()
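
# Note: outside a Hugging Face ZeroGPU Space, the `spaces` import and the
# @spaces.GPU() decorators can be dropped; iface.launch(share=True) would
# additionally create a temporary public link.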