Update app.py
app.py CHANGED
@@ -8,7 +8,7 @@ import numpy as np
 from pypdf import PdfReader
 from gradio_pdf import PDF
 from transformers import pipeline
-
+
 
 
 title = "Mistral-7B-Instruct-GGUF Run On CPU-Basic Free Hardware"
@@ -30,15 +30,15 @@ model_name = "SmolLM-1.7B-Instruct.Q2_K.gguf"
 hf_hub_download(repo_id="mradermacher/SmolLM-1.7B-Instruct-GGUF", filename=model_name, local_dir=model_path, local_dir_use_symlinks=False)
 """
 
-
+
 import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer
 
 
-model_name = "
+model_name = "microsoft/Phi-3.5-mini-instructe"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.
-
+model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.int8, device_map="auto")
+
 print("Start the model init process")
 """model = model = GPT4All(model_name, model_path, allow_download = False, device="cpu")
 
@@ -49,10 +49,7 @@ model._is_chat_session_activated = False
 
 max_new_tokens = 2048"""
 
-transformers = import_transformers_js()
-pipeline = transformers.pipeline
 
-pipe = pipeline('text-generation', 'Xenova/distilgpt2')
 
 model_kwargs = {'device': 'cpu'}
 encode_kwargs = {'normalize_embeddings': False}
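
The third hunk removes the client-side transformers.js setup (import_transformers_js and the Xenova/distilgpt2 pipe) while the server-side from transformers import pipeline from the first hunk stays. If generation is meant to move onto the model loaded above, a sketch of the server-side equivalent, with model and tokenizer reused from the diff; max_new_tokens=2048 mirrors the commented-out GPT4All block, and the prompt string is a placeholder:

from transformers import pipeline

# Reuse the model and tokenizer initialized above instead of downloading a second copy.
pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)

# Phi-3.5 is an instruct model, so format the input with its chat template.
prompt = tokenizer.apply_chat_template(
    [{"role": "user", "content": "Give a one-sentence summary of this PDF."}],
    tokenize=False,
    add_generation_prompt=True,
)
out = pipe(prompt, max_new_tokens=2048, return_full_text=False)
print(out[0]["generated_text"])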
|