AIRider
/

Ko-Llama3-Luxia-8B-Q4_K_M-GGUF

Text Generation

Inference Endpoints

Model card Files Files and versions Community

AIRider committed on May 30, 2024

Commit

b2835cd

·

verified ·

1 Parent(s): 63c0bf4

Update handler.py

Files changed (1) hide show

handler.py +6 -24

handler.py CHANGED Viewed

@@ -1,26 +1,8 @@
-# handler.py
-import torch
-from transformers import AutoModelForSequenceClassification, AutoTokenizer
-def handle(request):
-    # 모델 로드
-    model = AutoModelForSequenceClassification.from_pretrained("AIRider/Ko-Llama3-Luxia-8B-Q4_K_M-GGUF")
-    tokenizer = AutoTokenizer.from_pretrained("AIRider/Ko-Llama3-Luxia-8B-Q4_K_M-GGUF")
-    # 입력 데이터 처리
-    input_text = request.inputs["text"]
-    inputs = tokenizer.encode_plus(
-        input_text,
-        add_special_tokens=True,
-        max_length=512,
-        return_attention_mask=True,
-        return_tensors="pt",
-    )
-    # 모델 추론
-    outputs = model(inputs["input_ids"], attention_mask=inputs["attention_mask"])
-    logits = outputs.logits
-    # 결과 반환
-    result = torch.argmax(logits).item()
-    return {"result": result}

+from huggingfacehub import HuggingfaceHubModelregistry
+from transformers import AutoModelorSequenceClassification
+# AIRider/Ko-Llama3-Luxia-8B-Q4_K_M-GGUF 모델을 로드합니다
+model = AutoModelorSequenceClassification.frompretrained("AIRider/Ko-Llama3-Luxia-8B-Q4_K_M-GGUF")
+# HuggingfaceHubModelregistry를 사용하여 모델을 등록합니다
+HuggingfaceHubModelregistry.register(model)