ga89tiy committed on
Commit ca57734 · 1 Parent(s): d9d891d
README.md CHANGED
@@ -57,7 +57,8 @@ from LLAVA_Biovil.llava.model.builder import load_pretrained_model
 from LLAVA_Biovil.llava.conversation import SeparatorStyle, conv_vicuna_v1
 
 from LLAVA_Biovil.llava.constants import IMAGE_TOKEN_INDEX
-from utils import create_chest_xray_transform_for_inference
+from utils import create_chest_xray_transform_for_inference, init_chexpert_predictor
+
 
 def load_model_from_huggingface(repo_id):
     # Download model files
@@ -67,18 +68,31 @@ def load_model_from_huggingface(repo_id):
     tokenizer, model, image_processor, context_len = load_pretrained_model(model_path, model_base='liuhaotian/llava-v1.5-7b',
                                                                            model_name="llava-v1.5-7b-task-lora_radialog_instruct_llava_biovil_unfrozen_2e-5_5epochs_v5_checkpoint-21000", load_8bit=False, load_4bit=False)
 
+
     return tokenizer, model, image_processor, context_len
 
-tokenizer, model, image_processor, context_len = load_model_from_huggingface(repo_id="Chantal/RaDialog-interactive-radiology-report-generation")
 
 
 if __name__ == '__main__':
-    # config = None
-    # model_path = "/home/guests/chantal_pellegrini/RaDialog_LLaVA/LLAVA/checkpoints/llava-v1.5-7b-task-lora_radialog_instruct_llava_biovil_unfrozen_2e-5_5epochs_v5/checkpoint-21000" #TODO hardcoded in huggingface repo probably
-    # model_name = get_model_name_from_path(model_path)
+    sample_img_path = "https://openi.nlm.nih.gov/imgs/512/10/10/CXR10_IM-0002-2001.png?keywords=Calcified%20Granuloma" #TODO find good image
+
+    response = requests.get(sample_img_path)
+    image = Image.open(io.BytesIO(response.content))
+    image = remap_to_uint8(np.array(image))
+    image = Image.fromarray(image).convert("L")
+
+    tokenizer, model, image_processor, context_len = load_model_from_huggingface(repo_id="Chantal/RaDialog-interactive-radiology-report-generation")
+    cp_model, cp_class_names, cp_transforms = init_chexpert_predictor()
+
     model.config.tokenizer_padding_side = "left"
 
-    findings = "edema, pleural effusion" #TODO should these come from chexpert classifier? Or not needed for this demo/test?
+    cp_image = cp_transforms(image)
+    logits = cp_model(cp_image[None].half().cuda())
+    preds_probs = torch.sigmoid(logits)
+    preds = preds_probs > 0.5
+    pred = preds[0].cpu().numpy()
+    findings = cp_class_names[pred].tolist()
+    findings = ', '.join(findings).lower().strip()
 
     conv = conv_vicuna_v1.copy()
     REPORT_GEN_PROMPT = f"<image>. Predicted Findings: {findings}. You are to act as a radiologist and write the finding section of a chest x-ray radiology report for this X-ray image and the given predicted findings. Write in the style of a radiologist, write one fluent text without enumeration, be concise and don't provide explanations or reasons."
@@ -89,12 +103,6 @@ if __name__ == '__main__':
 
     # get the image
    vis_transforms_biovil = create_chest_xray_transform_for_inference(512, center_crop_size=448)
-    sample_img_path = "https://openi.nlm.nih.gov/imgs/512/10/10/CXR10_IM-0002-2001.png?keywords=Calcified%20Granuloma" #TODO find good image
-
-    response = requests.get(sample_img_path)
-    image = Image.open(io.BytesIO(response.content))
-    image = remap_to_uint8(np.array(image))
-    image = Image.fromarray(image).convert("L")
     image_tensor = vis_transforms_biovil(image).unsqueeze(0)
 
     image_tensor = image_tensor.to(model.device, dtype=torch.bfloat16)
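The change above replaces the hard-coded `findings` string with labels thresholded from a CheXpert-style multi-label classifier. Below is a minimal sketch of just that thresholding step, with a dummy linear model and made-up class names standing in for the repo's `init_chexpert_predictor()` (whose internals are not part of this diff):

```python
import numpy as np
import torch

# Dummy stand-ins for the classifier and class names returned by
# init_chexpert_predictor(); the real ones live in the repo's utils module.
cp_class_names = np.array(["Cardiomegaly", "Edema", "Pleural Effusion", "Pneumonia"])
cp_model = torch.nn.Linear(448 * 448, len(cp_class_names))

cp_image = torch.randn(448 * 448)     # placeholder for the transformed X-ray
logits = cp_model(cp_image[None])     # shape: (1, num_classes)
preds_probs = torch.sigmoid(logits)   # independent per-label probabilities
preds = preds_probs > 0.5             # multi-label threshold, as in the diff
pred = preds[0].cpu().numpy()         # boolean mask over class names
findings = ', '.join(cp_class_names[pred].tolist()).lower().strip()
print(findings)                       # e.g. "edema, pleural effusion"
```

Because each label gets an independent sigmoid, any subset of findings can fire; an empty string just means no label crossed the 0.5 threshold.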
simple_test.py → example_code.py RENAMED
@@ -22,7 +22,7 @@ def load_model_from_huggingface(repo_id):
     model_path = Path(model_path)
 
     tokenizer, model, image_processor, context_len = load_pretrained_model(model_path, model_base='liuhaotian/llava-v1.5-7b',
-                                                                           model_name="llava-v1.5-7b-task-lora_radialog_instruct_llava_biovil_unfrozen_2e-5_5epochs_v5_checkpoint-21000", load_8bit=False, load_4bit=False)
+                                                                           model_name="llava-v1.5-7b-task-lora_radialog_instruct_llava_biovil_unfrozen_2e-5_5epochs_v5_checkpoint-21000", load_8bit=False, $
 
 
     return tokenizer, model, image_processor, context_len
@@ -30,10 +30,7 @@ def load_model_from_huggingface(repo_id):
 
 
 if __name__ == '__main__':
-    # config = None
-    # model_path = "/home/guests/chantal_pellegrini/RaDialog_LLaVA/LLAVA/checkpoints/llava-v1.5-7b-task-lora_radialog_instruct_llava_biovil_unfrozen_2e-5_5epochs_v5/checkpoint-21000" #TODO hardcoded in huggingface repo probably
-    # model_name = get_model_name_from_path(model_path)
-    sample_img_path = "https://openi.nlm.nih.gov/imgs/512/10/10/CXR10_IM-0002-2001.png?keywords=Calcified%20Granuloma" #TODO find good image
+    sample_img_path = "https://openi.nlm.nih.gov/imgs/512/294/3502/CXR3502_IM-1707-1001.png?keywords=Surgical%20Instruments,Cardiomegaly,Pulmonary%20Congestion,Diaphragm"
 
     response = requests.get(sample_img_path)
     image = Image.open(io.BytesIO(response.content))
@@ -54,7 +51,7 @@ if __name__ == '__main__':
     findings = ', '.join(findings).lower().strip()
 
     conv = conv_vicuna_v1.copy()
-    REPORT_GEN_PROMPT = f"<image>. Predicted Findings: {findings}. You are to act as a radiologist and write the finding section of a chest x-ray radiology report for this X-ray image and the given predicted findings. Write in the style of a radiologist, write one fluent text without enumeration, be concise and don't provide explanations or reasons."
+    REPORT_GEN_PROMPT = f"<image>. Predicted Findings: {findings}. You are to act as a radiologist and write the finding section of a chest x-ray radiology report for this X-ray image and the given predi$
     print("USER: ", REPORT_GEN_PROMPT)
     conv.append_message("USER", REPORT_GEN_PROMPT)
     conv.append_message("ASSISTANT", None)
@@ -85,6 +82,27 @@ if __name__ == '__main__':
     pred = tokenizer.decode(output_ids[0, input_ids.shape[1]:]).strip().replace("</s>", "")
     print("ASSISTANT: ", pred)
 
+    # add prediction to conversation
+    conv.messages.pop()
+    conv.append_message("ASSISTANT", pred)
+    stop_str = conv.sep if conv.sep_style != SeparatorStyle.TWO else conv.sep2
+    stopping_criteria = KeywordsStoppingCriteria([stop_str], tokenizer, input_ids)
+
+    # generate a report
+    with torch.inference_mode():
+        output_ids = model.generate(
+            input_ids,
+            images=image_tensor,
+            do_sample=False,
+            use_cache=True,
+            max_new_tokens=300,
+            stopping_criteria=[stopping_criteria],
+            pad_token_id=tokenizer.pad_token_id
+        )
+
+    pred = tokenizer.decode(output_ids[0, input_ids.shape[1]:]).strip().replace("</s>", "")
+    print("ASSISTANT: ", pred)
+
     # add prediction to conversation
     conv.messages.pop()
     conv.append_message("ASSISTANT", pred)
@@ -108,4 +126,3 @@ if __name__ == '__main__':
 
     pred = tokenizer.decode(output_ids[0, input_ids.shape[1]:]).strip().replace("</s>", "")
     print("ASSISTANT: ", pred)
-
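The block added here duplicates the generate → decode → append cycle, giving the demo conversation an extra assistant turn: the `None` assistant placeholder is popped, the decoded reply is stored, and generation runs again (the added block appears to reuse the original `input_ids` rather than re-tokenizing the grown conversation). Below is a schematic sketch of that conversation bookkeeping, with stubs in place of the real LLaVA `conv_vicuna_v1` object and `model.generate`/`tokenizer.decode` calls:

```python
# Schematic multi-turn loop mirroring the pattern in example_code.py;
# fake_generate stands in for tokenize -> model.generate -> decode.
class Conversation:
    def __init__(self):
        self.messages = []

    def append_message(self, role, text):
        self.messages.append([role, text])

def fake_generate(messages):
    # Placeholder for the real generation call on the serialized prompt.
    return f"(reply to turn {sum(1 for role, _ in messages if role == 'USER')})"

conv = Conversation()
for user_msg in ["Write the findings section.", "Is there pleural effusion?"]:
    conv.append_message("USER", user_msg)
    conv.append_message("ASSISTANT", None)   # placeholder while generating
    pred = fake_generate(conv.messages)
    conv.messages.pop()                      # drop the None placeholder...
    conv.append_message("ASSISTANT", pred)   # ...and store the decoded reply
    print("ASSISTANT:", pred)
```

In an interactive loop one would rebuild `input_ids` from the updated conversation before each `generate` call, so every turn conditions on the full history.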
 
requirements.txt ADDED
@@ -0,0 +1,10 @@
+accelerate==0.21.0
+huggingface-hub==0.19.4
+timm==0.6.13
+transformers==4.31.0
+scikit-image==0.18.1
+peft==0.4.0
+pytorch_lightning==1.6.5
+chardet
+scikit-learn==1.2.2
+sentencepiece==0.1.99
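Every pin except `chardet` is exact. A small sanity check, assuming only the Python standard library, that compares installed versions against these pins before running `example_code.py`:

```python
from importlib import metadata

# Pins copied from requirements.txt; chardet is intentionally unpinned.
PINS = {
    "accelerate": "0.21.0",
    "huggingface-hub": "0.19.4",
    "timm": "0.6.13",
    "transformers": "4.31.0",
    "scikit-image": "0.18.1",
    "peft": "0.4.0",
    "pytorch_lightning": "1.6.5",
    "scikit-learn": "1.2.2",
    "sentencepiece": "0.1.99",
}

for pkg, want in PINS.items():
    try:
        have = metadata.version(pkg)
    except metadata.PackageNotFoundError:
        print(f"{pkg}: NOT INSTALLED (want {want})")
        continue
    print(f"{pkg}: {have}", "ok" if have == want else f"MISMATCH (want {want})")
```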
requirements.txt.py DELETED
File without changes